RubyGems - json-ld - Versions diffs - 0.1.0 → 0.1.2 - Mend

json-ld 0.1.0 → 0.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

data/History.markdown +15 -0
data/README.markdown +199 -3
data/VERSION +1 -1
data/lib/json/ld.rb +44 -4
data/lib/json/ld/api.rb +220 -224
data/lib/json/ld/compact.rb +126 -0
data/lib/json/ld/evaluation_context.rb +428 -204
data/lib/json/ld/expand.rb +185 -0
data/lib/json/ld/extensions.rb +34 -7
data/lib/json/ld/format.rb +2 -17
data/lib/json/ld/frame.rb +452 -0
data/lib/json/ld/from_rdf.rb +166 -0
data/lib/json/ld/reader.rb +7 -231
data/lib/json/ld/to_rdf.rb +181 -0
data/lib/json/ld/utils.rb +97 -0
data/lib/json/ld/writer.rb +33 -471
metadata +51 -34
data/lib/json/ld/normalize.rb +0 -120

data/lib/json/ld/utils.rb ADDED

@@ -0,0 +1,97 @@
+module JSON::LD
+  module Utils
+    ##
+    # Is value a subject? A value is a subject if
+    # * it is a Hash
+    # * it is not a @value, @set or @list
+    # * it has more than 1 key or any key is not @id
+    # @param [Object] value
+    # @return [Boolean]
+    def subject?(value)
+      value.is_a?(Hash) &&
+        (value.keys & %w(@value @list @set)).empty? &&
+        !(value.keys - ['@id']).empty?
+    end
+    ##
+    # Is value a subject reference?
+    # @param [Object] value
+    # @return [Boolean]
+    def subject_reference?(value)
+      value.is_a?(Hash) && value.keys == %w(@id)
+    end
+    ##
+    # Is value a blank node? Value is a blank node
+    #
+    # @param [Object] value
+    # @return [Boolean]
+    def blank_node?(value)
+      (subject?(value) || subject_reference?(value)) && value.fetch('@id', '_:')[0,2] == '_:'
+    end
+    ##
+    # Is value an expaned @list?
+    #
+    # @param [Object] value
+    # @return [Boolean]
+    def list?(value)
+      value.is_a?(Hash) && value.keys == %w(@list)
+    end
+    private
+    # Add debug event to debug array, if specified
+    #
+    # @param [String] message
+    # @yieldreturn [String] appended to message, to allow for lazy-evaulation of message
+    def debug(*args)
+      return unless ::JSON::LD.debug? || @options[:debug]
+      list = args
+      list << yield if block_given?
+      message = " " * (@depth || 0) * 2 + (list.empty? ? "" : list.join(": "))
+      puts message if JSON::LD::debug?
+      @options[:debug] << message if @options[:debug].is_a?(Array)
+    end
+    # Increase depth around a method invocation
+    def depth(options = {})
+      old_depth = @depth || 0
+      @depth = (options[:depth] || old_depth) + 1
+      ret = yield
+      @depth = old_depth
+      ret
+    end
+  end
+  ##
+  # Utility class for mapping old blank node identifiers, or unnamed blank
+  # nodes to new identifiers
+  class BlankNodeNamer < Hash
+    # @param [String] prefix
+    def initialize(prefix)
+      @prefix = "_:#{prefix}0"
+      super
+    end
+    ##
+    # Get a new mapped name for `old`
+    #
+    # @param [String] old
+    # @return [String]
+    def get_name(old)
+      if old && self.has_key?(old)
+        self[old]
+      elsif old
+        self[old] = @prefix.dup
+        @prefix.succ!
+        self[old]
+      else
+        # Not referenced, just return a new unique value
+        cur = @prefix.dup
+        @prefix.succ!
+        cur
+      end
+    end
+  end
+end

data/lib/json/ld/writer.rb CHANGED

@@ -51,6 +51,7 @@ module JSON::LD
   # @see http://json-ld.org/spec/ED/20110507/#the-normalization-algorithm
   # @author [Gregg Kellogg](http://greggkellogg.net/)
   class Writer < RDF::Writer
+    include Utils
     format Format
     # @attr [RDF::Graph] Graph of statements serialized
@@ -60,13 +61,9 @@ module JSON::LD
     attr :context
     ##
-    # Return the pre-serialized Hash before turning into JSON
-    #
-    # @return [Hash]
-    def self.hash(*args, &block)
-      hash = Hash.new
-      self.new(hash, *args, &block)
-      hash
+    # Override normal symbol generation
+    def self.to_sym
+      :jsonld
     end
     ##
@@ -80,33 +77,22 @@ module JSON::LD
     #   the encoding to use on the output stream (Ruby 1.9+)
     # @option options [Boolean]  :canonicalize (false)
     #   whether to canonicalize literals when serializing
-    # @option options [Hash]     :prefixes     (Hash.new)
+    # @option options [Hash]     :prefixes     (Hash.ordered)
     #   the prefix mappings to use (not supported by all writers)
     # @option options [Boolean]  :standard_prefixes   (false)
     #   Add standard prefixes to @prefixes, if necessary.
-    # @option options [IO, Array, Hash, String, EvaluationContext]     :context     (Hash.new)
+    # @option options [IO, Array, Hash, String, EvaluationContext]     :context     (Hash.ordered)
     #   context to use when serializing. Constructed context for native serialization.
-    # @option options [Boolean] :automatic (true)
-    #   Automatically create context coercions and generate compacted form
-    # @option options [Boolean] :expand (false)
-    #   Output document in [expanded form](http://json-ld.org/spec/latest/json-ld-api/#expansion)
-    # @option options [Boolean] :compact (false)
-    #   Output document in [compacted form](http://json-ld.org/spec/latest/json-ld-api/#compaction).
-    #   Requires a referenced evaluation context
-    # @option options [Boolean] :normalize (false)
-    #   Output document in [normalized form](http://json-ld.org/spec/latest/json-ld-api/#normalization)
-    # @option options [IO, Array, Hash, String] :frame
-    #   Output document in [framed form](http://json-ld.org/spec/latest/json-ld-api/#framing)
-    #   using the referenced document as a frame.
     # @yield  [writer] `self`
     # @yieldparam  [RDF::Writer] writer
     # @yieldreturn [void]
     # @yield  [writer]
     # @yieldparam [RDF::Writer] writer
     def initialize(output = $stdout, options = {}, &block)
+      options[:base_uri] ||= options[:base] if options.has_key?(:base)
+      options[:base] ||= options[:base_uri] if options.has_key?(:base_uri)
       super do
         @graph = RDF::Graph.new
-        @options[:automatic] = true unless [:automatic, :expand, :compact, :frame, :normalize].any? {|k| options.has_key?(k)}
         if block_given?
           case block.arity
@@ -128,7 +114,7 @@ module JSON::LD
     end
     ##
-    # Addes a statement to be serialized
+    # Adds a statement to be serialized
     # @param  [RDF::Statement] statement
     # @return [void]
     def write_statement(statement)
@@ -148,464 +134,40 @@ module JSON::LD
     end
     ##
-    # Outputs the Serialized JSON-LD representation of all stored triples.
+    # Outputs the Serialized JSON-LD representation of all stored statements.
+    #
+    # If provided a context or prefixes, we'll create a context
+    # and use it to compact the output. Otherwise, we return un-compacted JSON-LD
     #
     # @return [void]
     # @see    #write_triple
     def write_epilogue
       @debug = @options[:debug]
-      reset
-      raise RDF::WriterError, "Compaction requres a context" if @options[:compact] && !@options[:context]
-      @context = EvaluationContext.new(@options)
-      @context = @context.parse(@options[:context]) if @options[:context]
-      @context.language = @options[:language] if @options[:language]
-      @context.lists.each {|p| @list_range[p] = true}
-      debug {"\nserialize: graph: #{@graph.size}"}
-      debug {"=> options: #{@options.reject {|k,v| k == :debug}.inspect}"}
-      debug {"=> context: #{@context.inspect}"}
-      preprocess
-      # Update prefix mappings to those defined in context
-      @options[:prefixes] = {}
-      @context.iri_to_term.each_pair do |iri, term|
-        debug {"add prefix #{term.inspect} for #{iri}"}
-        prefix(term, iri)  # Define for output
-      end
-      # Don't generate context for expanded or normalized output
-      json_hash = (@options[:expand] || @options[:normalize]) ? Hash.new : context.serialize(:depth => @depth)
-      elements = []
-      order_subjects.each do |subject|
-        unless is_done?(subject)
-          elements << subject(subject, json_hash)
-        end
-      end
-      return if elements.empty?
-      # If there are more than one top-level subjects, place in an array form
-      if elements.length == 1 && elements.first.is_a?(Hash)
-        json_hash.merge!(elements.first)
-      else
-        json_hash['@id'] = elements
-      end
-      if @output.is_a?(Hash)
-        @output.merge!(json_hash)
-      else
-        json_state = if @options[:normalize]
-          # Normalization uses a compressed form
-          JSON::State.new(
-            :indent       => "",
-            :space        => "",
-            :space_before => "",
-            :object_nl    => "",
-            :array_nl     => ""
-          )
-        else
-          JSON::State.new(
-            :indent       => "  ",
-            :space        => " ",
-            :space_before => "",
-            :object_nl    => "\n",
-            :array_nl     => "\n"
-          )
-        end
-        @output.write(json_hash.to_json(json_state))
-      end
-    end
-    ##
-    # Returns the representation of a IRI reference.
-    #
-    # Spec confusion: should a subject IRI be normalized?
-    #
-    # @param  [RDF::URI] value
-    # @param  [Hash{Symbol => Object}] options
-    # @option options [:subject, :predicate, :object] position
-    #   Useful when determining how to serialize.
-    # @option options [RDF::URI] property
-    #   Property for object reference, which can be used to return bare strings
-    # @return [Object]
-    def format_iri(value, options = {})
-      debug {"format_iri(#{options.inspect}, #{value.inspect})"}
-      result = context.compact_iri(value, {:depth => @depth}.merge(options))
-      unless options[:position] != :object || iri_range?(options[:property])
-        result = {"@id" => result}
-      end
-      debug {"=> #{result.inspect}"}
-      result
-    end
-    ##
-    # @param  [RDF::Node] value
-    # @param  [Hash{Symbol => Object}] options
-    # @return [String]
-    # @raise  [NotImplementedError] unless implemented in subclass
-    # @see {#format\_iri}
-    def format_node(value, options = {})
-      format_iri(value, options)
-    end
-    ##
-    # Returns the representation of a literal.
-    #
-    # @param  [RDF::Literal, String, #to_s] literal
-    # @param  [Hash{Symbol => Object}] options
-    # @option options [RDF::URI] property
-    #   Property referencing literal for type coercion
-    # @return [Object]
-    def format_literal(literal, options = {})
-      debug {"format_literal(#{options.inspect}, #{literal.inspect})"}
-      value = Hash.new
-      value['@literal'] = literal.value
-      value['@type'] = literal.datatype.to_s if literal.has_datatype?
-      value['@language'] = literal.language.to_s if literal.has_language?
-      result = case literal
-      when RDF::Literal::Boolean, RDF::Literal::Integer, RDF::Literal::Double
-        literal.object
-      else
-        context.compact_value(options[:property], value, {:depth => @depth}.merge(options))
-      end
-      debug {"=> #{result.inspect}"}
-      result
-    end
-    ##
-    # Serialize an RDF list
-    #
-    # @param [RDF::URI] object
-    # @param  [Hash{Symbol => Object}] options
-    # @option options [RDF::URI] property
-    #   Property referencing literal for type and list coercion
-    # @return [Hash{"@list" => Array<Object>}]
-    def format_list(object, options = {})
-      predicate = options[:property]
-      list = RDF::List.new(object, @graph)
-      ary = []
-      debug {"format_list(#{list.inspect}, #{predicate})"}
-      depth do
-        list.each_statement do |st|
-          next unless st.predicate == RDF.first
-          debug {" format_list this: #{st.subject} first: #{st.object}"}
-          ary << if predicate || st.object.literal?
-            property(predicate, st.object)
-          else
-            subject(st.object)
-          end
-          subject_done(st.subject)
-        end
-      end
-      # Returns
-      ary = {'@list' => ary} unless predicate && list_range?(predicate)
-      debug {"format_list => #{ary.inspect}"}
-      ary
-    end
-    private
-    # Perform any preprocessing of statements required
-    def preprocess
-      @graph.each {|statement| preprocess_statement(statement)}
-    end
-    # Perform any statement preprocessing required. This is used to perform reference counts and determine required
-    # prefixes.
-    #
-    # @param [Statement] statement
-    def preprocess_statement(statement)
-      debug {"preprocess: #{statement.inspect}"}
-      references = ref_count(statement.object) + 1
-      @references[statement.object] = references
-      @subjects[statement.subject] = true
-      depth do
-        # Pre-fetch qnames, to fill prefixes
-        format_iri(statement.subject, :position => :subject)
-        format_iri(statement.predicate, :position => :predicate)
-        # To figure out coercion requirements
-        if statement.object.literal?
-          format_literal(statement.object, :property => statement.predicate)
-          datatype_range?(statement.predicate)
-        else
-          format_iri(statement.object, :position => :object)
-          iri_range?(statement.predicate)
-        end
-        list_range?(statement.predicate)
-      end
-      @references[statement.predicate] = ref_count(statement.predicate) + 1
-    end
-    # Serialize a subject
-    # Option contains referencing property, if this is recursive
-    # @return [Hash]
-    def subject(subject, options = {})
-      defn = Hash.new
-      raise RDF::WriterError, "Illegal use of subject #{subject.inspect}, not supported" unless subject.resource?
-      subject_done(subject)
-      properties = @graph.properties(subject)
-      debug {"subject: #{subject.inspect}, props: #{properties.inspect}"}
-      @graph.query(:subject => subject).each do |st|
-        raise RDF::WriterError, "Illegal use of predicate #{st.predicate.inspect}, not supported in RDF/XML" unless st.predicate.uri?
-      end
-      if subject.node? && ref_count(subject) > (options[:property] ? 1 : 0) && options[:expand]
-        raise RDF::WriterError, "Can't serialize named node when normalizing"
-      end
-      # Subject may be a list
-      if is_valid_list?(subject)
-        debug "subject is a list"
-        defn['@id'] = format_list(subject)
-        properties.delete(RDF.first.to_s)
-        properties.delete(RDF.rest.to_s)
-        # Special case, if there are no properties, then we can just serialize the list itself
-        return defn if properties.empty?
-      elsif subject.uri? || ref_count(subject) > 1
-        debug "subject is an iri or it's a node referenced multiple times"
-        # Don't need to set subject if it's a Node without references
-        defn['@id'] = format_iri(subject, :position => :subject)
-      else
-        debug "subject is an unreferenced BNode"
-      end
-      prop_list = order_properties(properties)
-      debug {"=> property order: #{prop_list.inspect}"}
-      prop_list.each do |prop|
-        predicate = RDF::URI.intern(prop)
-        p_iri = format_iri(predicate, :position => :predicate)
-        depth do
-          defn[p_iri] = property(predicate, properties[prop])
-          debug {"prop(#{p_iri}) => #{properties[prop]} => #{defn[p_iri].inspect}"}
-        end
-      end
-      debug {"subject: #{subject} has defn: #{defn.inspect}"}
-      defn
-    end
-    ##
-    # Serialize objects for a property
-    #
-    # Spec confusion: sorting of multi-valued properties not adequately specified.
-    #
-    # @param [RDF::URI] predicate
-    # @param [Array<RDF::URI>, RDF::URI] objects
-    # @param [Hash{Symbol => Object}] options
-    # @return [Array, Hash, Object]
-    def property(predicate, objects, options = {})
-      objects = objects.first if objects.is_a?(Array) && objects.length == 1
-      case objects
-      when Array
-        objects.sort_by(&:to_s).map {|o| property(predicate, o, options)}
-      when RDF::Literal
-        format_literal(objects, options.merge(:property => predicate))
-      else
-        if is_valid_list?(objects)
-          format_list(objects, :property => predicate)
-        elsif is_done?(objects) || !@subjects.include?(objects)
-          format_iri(objects, :position => :object, :property => predicate)
-        else
-          subject(objects, :property => predicate)
-        end
-      end
-    end
-    ##
-    # Take a hash from predicate IRIs to lists of values.
-    # Sort the lists of values.  Return a sorted list of properties.
-    # @param [Hash{String => Array<Resource>}] properties A hash of Property to Resource mappings
-    # @return [Array<String>}] Ordered list of properties.
-    def order_properties(properties)
-      # Make sorted list of properties
-      prop_list = []
-      properties.keys.sort do |a, b|
-        format_iri(a, :position => :predicate) <=> format_iri(b, :position => :predicate)
-      end.each do |prop|
-        prop_list << prop.to_s
-      end
-      prop_list
-    end
-    # Order subjects for output. Override this to output subjects in another order.
-    #
-    # @return [Array<Resource>] Ordered list of subjects
-    def order_subjects
-      seen = {}
-      subjects = []
-      return @subjects.keys.sort do |a,b|
-        format_iri(a, :position => :subject) <=> format_iri(b, :position => :subject)
-      end unless @options[:automatic]
-      # Sort subjects by resources over bnodes, ref_counts and the subject URI itself
-      recursable = @subjects.keys.
-        select {|s| !seen.include?(s)}.
-        map {|r| [r.is_a?(RDF::Node) ? 1 : 0, ref_count(r), r]}.
-        sort
-      subjects += recursable.map{|r| r.last}
-    end
-    # Return the number of times this node has been referenced in the object position
-    # @return [Integer]
-    def ref_count(node)
-      @references.fetch(node, 0)
-    end
-    ##
-    # Does predicate have a range of IRI?
-    # @param [RDF::URI] predicate
-    # @return [Boolean]
-    def iri_range?(predicate)
-      return false if predicate.nil? || [RDF.first, RDF.rest].include?(predicate) || @options[:expand]
-      return true if predicate == RDF.type
-      unless context.coerce(predicate)
-        not_iri = !@options[:automatic]
-        #debug {"  (automatic) = #{(!not_iri).inspect}"}
-        # Any literal object makes it not so
-        not_iri ||= @graph.query(:predicate => predicate).to_a.any? do |st|
-          l = RDF::List.new(st.object, @graph)
-          #debug {"  o.literal? #{st.object.literal?.inspect}"}
-          #debug {"  l.valid? #{l.valid?.inspect}"}
-          #debug {"  l.any.valid? #{l.to_a.any?(&:literal?).inspect}"}
-          st.object.literal? || (l.valid? && l.to_a.any?(&:literal?))
-        end
-        #debug {"  (literal) = #{(!not_iri).inspect}"}
-        # FIXME: detect when values are all represented through chaining
-        context.coerce(predicate, not_iri ? false : '@id')
+      # Turn graph into a triple array
+      statements = @graph.each_statement.to_a
+      debug("writer") { "serialize #{statements.length} statements, #{@options.inspect}"}
+      result = API.fromRDF(statements, nil, @options)
+      # If we were provided a context, or prefixes, use them to compact the output
+      context = RDF::Util::File.open_file(@options[:context]) if @options[:context].is_a?(String)
+      context ||= @options[:context]
+      context ||= if @options[:prefixes] || @options[:language] || @options[:standard_prefixes]
+        ctx = EvaluationContext.new(@options)
+        ctx.language = @options[:language] if @options[:language]
+        @options[:prefixes].each do |prefix, iri|
+          ctx.set_mapping(prefix, iri) if prefix && iri
+        end if @options[:prefixes]
+        ctx
       end
-      debug {"iri_range(#{predicate}) = #{context.coerce(predicate).inspect}"}
-      context.coerce(predicate) == '@id'
-    end
-    ##
-    # Does predicate have a range of specific typed literal?
-    # @param [RDF::URI] predicate
-    # @return [Boolean]
-    def datatype_range?(predicate)
-      unless context.coerce(predicate)
-        # objects of all statements with the predicate must be literal
-        # and have the same non-nil datatype
-        dt = nil
-        if @options[:automatic]
-          @graph.query(:predicate => predicate) do |st|
-            debug {"datatype_range? literal? #{st.object.literal?.inspect} dt? #{(st.object.literal? && st.object.has_datatype?).inspect}"}
-            if st.object.literal? && st.object.has_datatype?
-              dt = st.object.datatype.to_s if dt.nil?
-              debug {"=> dt: #{st.object.datatype}"}
-              dt = false unless dt == st.object.datatype.to_s
-            else
-              dt = false
-            end
-          end
-          # Cause necessary prefixes to be output
-          format_iri(dt, :position => :datatype) if dt && !NATIVE_DATATYPES.include?(dt.to_s)
-          debug {"range(#{predicate}) = #{dt.inspect}"}
-        else
-          dt = false
-        end
-        context.coerce(predicate, dt)
+      # Perform compaction, if we have a context
+      if context
+        debug("writer") { "compact result"}
+        result = API.compact(result, context, nil, @options)
       end
-      context.coerce(predicate)
-    end
-    ##
-    # Is every use of the predicate an RDF Collection?
-    #
-    # @param [RDF::URI] predicate
-    # @return [Boolean]
-    def list_range?(predicate)
-      return false if [RDF.first, RDF.rest].include?(predicate)
-      unless @list_range.include?(predicate.to_s)
-        # objects of all statements with the predicate must be a list
-        @list_range[predicate.to_s] = if @options[:automatic]
-          @graph.query(:predicate => predicate).to_a.all? do |st|
-            is_valid_list?(st.object)
-          end
-        else
-          false
-        end
-        context.list(predicate, true) if @list_range[predicate.to_s]
-        debug {"list(#{predicate}) = #{@list_range[predicate.to_s].inspect}"}
-      end
-      @list_range[predicate.to_s]
-    end
-    # Reset internal helper instance variables
-    def reset
-      @depth = 0
-      @references = {}
-      @serialized = {}
-      @subjects = {}
-      @list_range = {}
-    end
-    # Checks if l is a valid RDF list, i.e. no nodes have other properties.
-    def is_valid_list?(l)
-      #debug {"is_valid_list: #{l.inspect}"}
-      return RDF::List.new(l, @graph).valid?
-    end
-    def is_done?(subject)
-      @serialized.include?(subject)
-    end
-    # Mark a subject as done.
-    def subject_done(subject)
-      @serialized[subject] = true
-    end
-    # Add debug event to debug array, if specified
-    #
-    # @param [String] message
-    # @yieldreturn [String] appended to message, to allow for lazy-evaulation of message
-    def debug(*args)
-      return unless ::JSON::LD.debug? || @options[:debug]
-      message = " " * @depth * 2 + (args.empty? ? "" : args.join(": "))
-      message += yield if block_given?
-      puts message if JSON::LD::debug?
-      @options[:debug] << message if @options[:debug].is_a?(Array)
-    end
-    # Increase depth around a method invocation
-    def depth
-      @depth += 1
-      ret = yield
-      @depth -= 1
-      ret
+      @output.write(result.to_json(JSON_STATE))
     end
   end
 end