RubyGems - json_schema - Versions diffs - 0.0.7 - Mend

json_schema 0.0.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

data/README.md +36 -0
data/lib/json_pointer.rb +7 -0
data/lib/json_pointer/evaluator.rb +75 -0
data/lib/json_reference.rb +39 -0
data/lib/json_schema.rb +27 -0
data/lib/json_schema/parser.rb +296 -0
data/lib/json_schema/reference_expander.rb +156 -0
data/lib/json_schema/schema.rb +155 -0
data/lib/json_schema/schema_error.rb +25 -0
data/lib/json_schema/validator.rb +405 -0
data/test/data_scaffold.rb +238 -0
data/test/json_pointer/evaluator_test.rb +60 -0
data/test/json_schema/parser_test.rb +230 -0
data/test/json_schema/reference_expander_test.rb +149 -0
data/test/json_schema/validator_test.rb +606 -0
data/test/json_schema_test.rb +67 -0
data/test/test_helper.rb +4 -0
metadata +64 -0

data/README.md ADDED Viewed

@@ -0,0 +1,36 @@
+# json_schema
+A JSON Schema V4 and Hyperschema V4 parser and validator.
+``` ruby
+require "json"
+require "json_schema"
+# parse the schema
+schema_data = JSON.parse(File.read("schema.json"))
+schema = JsonSchema.parse!(schema_data)
+# validate some data
+data = JSON.parse(File.read("data.json"))
+schema.validate!(data)
+# iterate through hyperschema links
+schema.links.each do |link|
+  puts "#{link.method} #{link.href}"
+end
+```
+## Development
+Run the test suite with:
+```
+rake
+```
+Or run specific suites or tests with:
+```
+ruby -Ilib -Itest test/json_schema/validator_test.rb
+ruby -Ilib -Itest test/json_schema/validator_test.rb -n /anyOf/
+```

data/lib/json_pointer.rb ADDED Viewed

@@ -0,0 +1,7 @@
+require_relative "json_pointer/evaluator"
+module JsonPointer
+  def self.evaluate(data, path)
+    Evaluator.new(data).evaluate(path)
+  end
+end

data/lib/json_pointer/evaluator.rb ADDED Viewed

@@ -0,0 +1,75 @@
+module JsonPointer
+  class Evaluator
+    def initialize(data)
+      @data = data
+    end
+    def evaluate(original_path)
+      path = original_path
+      # the leading # can either be included or not
+      path = path[1..-1] if path[0] == "#"
+      # special case on "" or presumably "#"
+      if path.empty?
+        return @data
+      end
+      if path[0] != "/"
+        raise %{Path must begin with a leading "/": #{original_path}.}
+      end
+      path_parts = split(path)
+      evaluate_segment(@data, path_parts)
+    end
+    private
+    def evaluate_segment(data, path_parts)
+      if path_parts.empty?
+        data
+      elsif data == nil
+        # spec doesn't define how to handle this, so we'll return `nil`
+        nil
+      else
+        key = transform_key(path_parts.shift)
+        if data.is_a?(Array)
+          unless key =~ /^\d+$/
+            raise %{Key operating on an array must be a digit or "-": #{key}.}
+          end
+          evaluate_segment(data[key.to_i], path_parts)
+        else
+          evaluate_segment(data[key], path_parts)
+        end
+      end
+    end
+    # custom split method to account for blank segments
+    def split(path)
+      parts = []
+      last_index = 0
+      while index = path.index("/", last_index)
+        if index == last_index
+          parts << ""
+        else
+          parts << path[last_index...index]
+        end
+        last_index = index + 1
+      end
+      # and also get that last segment
+      parts << path[last_index..-1]
+      # it should begin with a blank segment from the leading "/"; kill that
+      parts.shift
+      parts
+    end
+    def transform_key(key)
+      # ~ has special meaning to JSON pointer to allow keys containing "/", so
+      # perform some transformations first as defined by the spec
+      # first as defined by the spec
+      key = key.gsub('~1', '/')
+      key = key.gsub('~0', '~')
+      key
+    end
+  end
+end

data/lib/json_reference.rb ADDED Viewed

@@ -0,0 +1,39 @@
+require "json_pointer"
+require "uri"
+module JsonReference
+  class Reference
+    attr_accessor :pointer
+    attr_accessor :uri
+    def initialize(ref)
+      # given a simple fragment without '#', resolve as a JSON Pointer only as
+      # per spec
+      if ref.include?("#")
+        uri, @pointer = ref.split('#')
+        if uri && !uri.empty?
+          @uri = URI.parse(uri)
+        end
+      else
+        @pointer = ref
+      end
+      # normalize pointers by prepending "#"
+      @pointer = "#" + @pointer
+    end
+    # Given the document addressed by #uri, resolves the JSON Pointer part of
+    # the reference.
+    def resolve_pointer(data)
+      JsonPointer.evaluate(data, @pointer)
+    end
+    def to_s
+      if @uri
+        "#{@uri.to_s}#{@pointer}"
+      else
+        @pointer
+      end
+    end
+  end
+end

data/lib/json_schema.rb ADDED Viewed

@@ -0,0 +1,27 @@
+require_relative "json_schema/parser"
+require_relative "json_schema/reference_expander"
+require_relative "json_schema/schema"
+require_relative "json_schema/schema_error"
+require_relative "json_schema/validator"
+module JsonSchema
+  def self.parse(data)
+    parser = Parser.new
+    if schema = parser.parse(data)
+      valid, errors = schema.expand_references
+      if valid
+        [schema, nil]
+      else
+        [nil, errors]
+      end
+    else
+      [nil, parser.errors]
+    end
+  end
+  def self.parse!(data)
+    schema = Parser.new.parse!(data)
+    schema.expand_references!
+    schema
+  end
+end

data/lib/json_schema/parser.rb ADDED Viewed

@@ -0,0 +1,296 @@
+require "json_reference"
+module JsonSchema
+  class Parser
+    ALLOWED_TYPES = %w{any array boolean integer number null object string}
+    BOOLEAN = [FalseClass, TrueClass]
+    FRIENDLY_TYPES = {
+      Array      => "array",
+      FalseClass => "boolean",
+      Float      => "number",
+      Hash       => "object",
+      Integer    => "integer",
+      NilClass   => "null",
+      String     => "string",
+      TrueClass  => "boolean",
+    }
+    attr_accessor :errors
+    # Basic parsing of a schema. May return a malformed schema! (Use `#parse!`
+    # to raise errors instead).
+    def parse(data, parent = nil)
+      # while #parse_data is recursed into for many schemas over the same
+      # object, the @errors array is an instance-wide accumulator
+      @errors = []
+      schema = parse_data(data, parent)
+      if @errors.count == 0
+        schema
+      else
+        nil
+      end
+    end
+    def parse!(data, parent = nil)
+      schema = parse(data, parent)
+      if !schema
+        raise SchemaError.aggregate(@errors)
+      end
+      schema
+    end
+    private
+    def build_uri(id, parent_uri)
+      # kill any trailing slashes
+      if id
+        id = id.chomp("/")
+      end
+      # if id is missing, it's defined as its parent schema's URI
+      if id.nil?
+        parent_uri
+      # if id is defined as absolute, the schema's URI stays absolute
+      elsif id[0] == "/"
+        id
+      # otherwise build it according to the parent's URI
+      else
+        # make sure we don't end up with duplicate slashes
+        parent_uri = parent_uri.chomp("/")
+        parent_uri + "/" + id
+      end
+    end
+    def parse_all_of(schema)
+      if schema.all_of && schema.all_of.is_a?(Array)
+        schema.all_of = schema.all_of.map { |s| parse_data(s, schema) }
+      end
+    end
+    def parse_any_of(schema)
+      if schema.any_of && schema.any_of.is_a?(Array)
+        schema.any_of = schema.any_of.map { |s| parse_data(s, schema) }
+      end
+    end
+    def parse_one_of(schema)
+      if schema.one_of && schema.one_of.is_a?(Array)
+        schema.one_of = schema.one_of.map { |s| parse_data(s, schema) }
+      end
+    end
+    def parse_data(data, parent = nil)
+      schema = Schema.new
+      if !data.is_a?(Hash)
+        # it would be nice to make this message more specific/nicer (at best it
+        # points to the wrong schema)
+        message = %{Expected schema; value was: #{data.inspect}.}
+        @errors << SchemaError.new(parent, message)
+      elsif ref = data["$ref"]
+        schema.reference = JsonReference::Reference.new(ref)
+      else
+        schema = parse_schema(data, parent)
+      end
+      schema.parent = parent
+      schema
+    end
+    def parse_definitions(schema)
+      if schema.definitions && schema.definitions.is_a?(Hash)
+        # leave the original data reference intact
+        schema.definitions = schema.definitions.dup
+        schema.definitions.each do |key, definition|
+          subschema = parse_data(definition, schema)
+          schema.definitions[key] = subschema
+        end
+      end
+    end
+    def parse_dependencies(schema)
+      if schema.dependencies && schema.dependencies.is_a?(Hash)
+        # leave the original data reference intact
+        schema.dependencies = schema.dependencies.dup
+        schema.dependencies.each do |k, s|
+          # may be Array, String (simple dependencies), or Hash (schema
+          # dependency)
+          if s.is_a?(Hash)
+            schema.dependencies[k] = parse_data(s, schema)
+          elsif s.is_a?(String)
+            # just normalize all simple dependencies to arrays
+            schema.dependencies[k] = [s]
+          end
+        end
+      end
+    end
+    def parse_items(schema)
+      if schema.items
+        # tuple validation: an array of schemas
+        if schema.items.is_a?(Array)
+          schema.items = schema.items.map { |s| parse_data(s, schema) }
+        # list validation: a single schema
+        else
+          schema.items = parse_data(schema.items, schema)
+        end
+      end
+    end
+    def parse_links(schema)
+      if schema.links
+        schema.links = schema.links.map { |l|
+          link             = Schema::Link.new
+          link.parent      = schema
+          link.description = l["description"]
+          link.href        = l["href"]
+          link.method      = l["method"] ? l["method"].downcase.to_sym : nil
+          link.rel         = l["rel"]
+          link.title       = l["title"]
+          if l["schema"]
+            link.schema = parse_data(l["schema"], schema)
+          end
+          link
+        }
+      end
+    end
+    def parse_media(schema)
+      if data = schema.media
+        schema.media = Schema::Media.new
+        schema.media.binary_encoding = data["binaryEncoding"]
+        schema.media.type            = data["type"]
+      end
+    end
+    def parse_not(schema)
+      if schema.not && schema.not.is_a?(Hash)
+        schema.not = parse_data(schema.not, schema)
+      end
+    end
+    def parse_pattern_properties(schema)
+      if schema.pattern_properties && schema.pattern_properties.is_a?(Hash)
+        # leave the original data reference intact
+        properties = schema.pattern_properties.dup
+        properties = properties.map do |k, s|
+          [Regexp.new(k), parse_data(s, schema)]
+        end
+        schema.pattern_properties = Hash[*properties.flatten]
+      end
+    end
+    def parse_properties(schema)
+      # leave the original data reference intact
+      schema.properties = schema.properties.dup
+      if schema.properties && schema.properties.is_a?(Hash)
+        schema.properties.each do |key, definition|
+          subschema = parse_data(definition, schema)
+          schema.properties[key] = subschema
+        end
+      end
+    end
+    # Builds a Schema from a raw schema object. Each known field is read
+    # through #validate_type, which returns nil and appends to @errors when the
+    # value has the wrong type, so a badly typed field ends up nil (or the
+    # `||` default next to it). Afterwards the parse_* helpers replace nested
+    # raw values with parsed subschemas.
+    #
+    # data   - the raw schema object; stored on the schema as `data`.
+    # parent - the enclosing Schema, or nil for the root.
+    #
+    # Returns the new Schema.
+    def parse_schema(data, parent = nil)
+      schema = Schema.new
+      schema.data        = data
+      schema.id          = validate_type(schema, [String], "id")
+      # build URI early so we can reference it in errors
+      # (a schema without a parent gets the URI "/")
+      schema.uri = parent ?  build_uri(schema.id, parent.uri) : "/"
+      schema.title       = validate_type(schema, [String], "title")
+      schema.description = validate_type(schema, [String], "description")
+      # "default" is copied as-is, without a type check
+      schema.default     = schema.data["default"]
+      # validation: any
+      schema.all_of        = validate_type(schema, [Array], "allOf") || []
+      schema.any_of        = validate_type(schema, [Array], "anyOf") || []
+      schema.definitions   = validate_type(schema, [Hash], "definitions") || {}
+      schema.enum          = validate_type(schema, [Array], "enum")
+      schema.one_of        = validate_type(schema, [Array], "oneOf") || []
+      schema.not           = validate_type(schema, [Hash], "not")
+      schema.type          = validate_type(schema, [Array, String], "type")
+      # normalize a single type name to a one-element array
+      schema.type          = [schema.type] if schema.type.is_a?(String)
+      validate_known_type!(schema)
+      # validation: array
+      schema.additional_items = validate_type(schema, BOOLEAN, "additionalItems")
+      schema.items            = validate_type(schema, [Array, Hash], "items")
+      schema.max_items        = validate_type(schema, [Integer], "maxItems")
+      schema.min_items        = validate_type(schema, [Integer], "minItems")
+      schema.unique_items     = validate_type(schema, BOOLEAN, "uniqueItems")
+      # validation: number/integer
+      schema.max           = validate_type(schema, [Float, Integer], "maximum")
+      schema.max_exclusive = validate_type(schema, BOOLEAN, "exclusiveMaximum")
+      schema.min           = validate_type(schema, [Float, Integer], "minimum")
+      schema.min_exclusive = validate_type(schema, BOOLEAN, "exclusiveMinimum")
+      schema.multiple_of   = validate_type(schema, [Float, Integer], "multipleOf")
+      # validation: object
+      schema.additional_properties =
+        validate_type(schema, BOOLEAN, "additionalProperties")
+      schema.dependencies       = validate_type(schema, [Hash], "dependencies") || {}
+      schema.max_properties     = validate_type(schema, [Integer], "maxProperties")
+      schema.min_properties     = validate_type(schema, [Integer], "minProperties")
+      schema.pattern_properties = validate_type(schema, [Hash], "patternProperties") || {}
+      schema.properties         = validate_type(schema, [Hash], "properties") || {}
+      schema.required           = validate_type(schema, [Array], "required")
+      # validation: string
+      schema.format     = validate_type(schema, [String], "format")
+      schema.max_length = validate_type(schema, [Integer], "maxLength")
+      schema.min_length = validate_type(schema, [Integer], "minLength")
+      schema.pattern    = validate_type(schema, [String], "pattern")
+      # NOTE(review): there is no rescue here, so an invalid pattern raises
+      # RegexpError instead of being added to @errors
+      schema.pattern    = Regexp.new(schema.pattern) if schema.pattern
+      # hyperschema
+      schema.links      = validate_type(schema, [Array], "links")
+      schema.media      = validate_type(schema, [Hash], "media")
+      schema.path_start = validate_type(schema, [String], "pathStart")
+      schema.read_only  = validate_type(schema, BOOLEAN, "readOnly")
+      # second pass: swap the raw nested values assigned above for parsed
+      # subschemas / link / media objects
+      parse_all_of(schema)
+      parse_any_of(schema)
+      parse_one_of(schema)
+      parse_definitions(schema)
+      parse_dependencies(schema)
+      parse_items(schema)
+      parse_links(schema)
+      parse_media(schema)
+      parse_not(schema)
+      parse_pattern_properties(schema)
+      parse_properties(schema)
+      schema
+    end
+    def validate_known_type!(schema)
+      if schema.type
+        if !(bad_types = schema.type - ALLOWED_TYPES).empty?
+          message = %{Unknown types: #{bad_types.sort.join(", ")}.}
+          @errors << SchemaError.new(schema, message)
+        end
+      end
+    end
+    def validate_type(schema, types, field)
+      friendly_types =
+        types.map { |t| FRIENDLY_TYPES[t] || t }.sort.uniq.join("/")
+      value = schema.data[field]
+      if !value.nil? && !types.any? { |t| value.is_a?(t) }
+        message = %{Expected "#{field}" to be of type "#{friendly_types}"; value was: #{value.inspect}.}
+        @errors << SchemaError.new(schema, message)
+        nil
+      else
+        value
+      end
+    end
+  end
+end