RubyGems - active-fedora - Versions diffs - 3.0.7 → 3.1.0.pre1 - Mend

active-fedora 3.0.7 → 3.1.0.pre1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (67)

data/.rvmrc +1 -1
data/Gemfile.lock +39 -10
data/History.txt +0 -4
data/active-fedora.gemspec +4 -3
data/lib/active_fedora.rb +9 -9
data/lib/active_fedora/base.rb +92 -163
data/lib/active_fedora/datastream.rb +59 -60
data/lib/active_fedora/datastream_hash.rb +18 -0
data/lib/active_fedora/metadata_datastream.rb +3 -2
data/lib/active_fedora/metadata_datastream_helper.rb +3 -15
data/lib/active_fedora/model.rb +3 -3
data/lib/active_fedora/nokogiri_datastream.rb +305 -302
data/lib/active_fedora/qualified_dublin_core_datastream.rb +24 -19
data/lib/active_fedora/rels_ext_datastream.rb +39 -37
data/lib/active_fedora/rubydora_connection.rb +40 -0
data/lib/active_fedora/semantic_node.rb +1 -1
data/lib/active_fedora/solr_service.rb +1 -1
data/lib/active_fedora/version.rb +1 -1
data/lib/ruby-fedora.rb +0 -8
data/lib/tasks/active_fedora.rake +14 -9
data/lib/tasks/active_fedora_dev.rake +23 -40
data/spec/integration/base_loader_spec.rb +4 -21
data/spec/integration/base_spec.rb +300 -310
data/spec/integration/bug_spec.rb +9 -10
data/spec/integration/datastream_spec.rb +12 -12
data/spec/integration/metadata_datastream_helper_spec.rb +7 -10
data/spec/integration/model_spec.rb +3 -2
data/spec/integration/rels_ext_datastream_spec.rb +9 -15
data/spec/spec_helper.rb +2 -29
data/spec/unit/active_fedora_spec.rb +5 -5
data/spec/unit/base_cma_spec.rb +0 -7
data/spec/unit/base_datastream_management_spec.rb +8 -67
data/spec/unit/base_delegate_spec.rb +26 -9
data/spec/unit/base_extra_spec.rb +5 -3
data/spec/unit/base_file_management_spec.rb +10 -17
data/spec/unit/base_named_datastream_spec.rb +76 -199
data/spec/unit/base_spec.rb +152 -69
data/spec/unit/content_model_spec.rb +1 -1
data/spec/unit/datastream_concurrency_spec.rb +5 -4
data/spec/unit/datastream_spec.rb +28 -48
data/spec/unit/has_many_collection_spec.rb +2 -0
data/spec/unit/inheritance_spec.rb +6 -6
data/spec/unit/metadata_datastream_spec.rb +12 -28
data/spec/unit/model_spec.rb +10 -10
data/spec/unit/nokogiri_datastream_spec.rb +31 -33
data/spec/unit/qualified_dublin_core_datastream_spec.rb +15 -15
data/spec/unit/rels_ext_datastream_spec.rb +35 -29
data/spec/unit/rubydora_connection_spec.rb +26 -0
data/spec/unit/semantic_node_spec.rb +12 -17
data/spec/unit/solr_config_options_spec.rb +13 -14
data/spec/unit/solr_service_spec.rb +14 -17
metadata +59 -55
data/lib/fedora/base.rb +0 -38
data/lib/fedora/connection.rb +0 -218
data/lib/fedora/datastream.rb +0 -67
data/lib/fedora/fedora_object.rb +0 -161
data/lib/fedora/formats.rb +0 -30
data/lib/fedora/generic_search.rb +0 -71
data/lib/fedora/repository.rb +0 -298
data/spec/integration/datastreams_crud_spec.rb +0 -208
data/spec/integration/fedora_object_spec.rb +0 -77
data/spec/integration/repository_spec.rb +0 -301
data/spec/integration/rf_fedora_object_spec.rb +0 -95
data/spec/unit/connection_spec.rb +0 -25
data/spec/unit/fedora_object_spec.rb +0 -74
data/spec/unit/repository_spec.rb +0 -143
data/spec/unit/rf_datastream_spec.rb +0 -63

data/lib/active_fedora/datastream.rb CHANGED

@@ -1,63 +1,54 @@
-require 'fedora/datastream'
 module ActiveFedora
   #This class represents a Fedora datastream
-  class Datastream < Fedora::Datastream
+  class Datastream < Rubydora::Datastream
     attr_accessor :dirty, :last_modified, :fields
-    def initialize(attrs = {})
+    def initialize(digital_object, dsid, exists_in_fedora=false )
       @fields={}
       @dirty = false
-      super
+      super(digital_object, dsid)
     end
-    #Return the xml content representing this Datastream from Fedora
-    def content
-      result = Fedora::Repository.instance.fetch_custom(self.attributes[:pid], "datastreams/#{self.dsid}/content")
-      return result
-    end
+    # #Return the xml content representing this Datastream from Fedora
+    # def content
+    #   result = Fedora::Repository.instance.fetch_custom(self.attributes[:pid], "datastreams/#{self.dsid}/content")
+    #   return result
+    # end
     #set this Datastream's content
     def content=(content)
-      self.blob = content
+      super
       self.dirty = true
     end
-    def self.delete(parent_pid, dsid)
-      Fedora::Repository.instance.delete("%s/datastreams/%s"%[parent_pid, dsid])
-    end
+    # def self.delete(parent_pid, dsid)
+    #   Fedora::Repository.instance.delete("%s/datastreams/%s"%[parent_pid, dsid])
+    # end
-    def delete
-      self.class.delete(self.pid, self.dsid)
-    end
+    # def delete
+    #   self.class.delete(self.pid, self.dsid)
+    # end
-    #get this datastreams identifier
-    def pid
-      self.attributes[:pid]
-    end
+    # #get this datastreams identifier
+    # def pid
+    #   self.attributes[:pid]
+    # end
-    #set this datastreams parent identifier
-    def pid=(pid)
-      self.attributes[:pid] = pid
-    end
+    # #set this datastreams parent identifier
+    # def pid=(pid)
+    #   self.attributes[:pid] = pid
+    # end
-    #set this datastreams identifier (note: sets both dsID and dsid)
-    def dsid=(dsid)
-      self.attributes[:dsID] = dsid
-      self.attributes[:dsid] = dsid
-    end
+    # #set this datastreams identifier (note: sets both dsID and dsid)
+    # def dsid=(dsid)
+    #   self.attributes[:dsID] = dsid
+    #   self.attributes[:dsid] = dsid
+    # end
     def size
-      if !self.attributes.fetch(:dsSize,nil)
-        if self.new_object?
-          self.attributes[:dsSize]=nil
-        else
-          attrs = XmlSimple.xml_in(Fedora::Repository.instance.fetch_custom(self.pid,"datastreams/#{self.dsid}"))
-          self.attributes[:dsSize]=attrs["dsSize"].first
-        end
-      end
-      self.attributes[:dsSize]
+      self.profile['dsSize']
     end
     #compatibility method for rails' url generators. This method will
@@ -69,14 +60,19 @@ module ActiveFedora
     # Test whether this datastream been modified since it was last saved?
     def dirty?
-      @dirty
+      @dirty || changed?
+    end
+    def new_object?
+      new?
     end
     # Save the datastream into fedora.
     # Also triggers {#before_save} and {#after_save} callbacks
     def save
       before_save
-      result = Fedora::Repository.instance.save(self)
+      raise "No content #{dsid}" if @content.nil?
+      result = super
       after_save
       result
     end
@@ -86,6 +82,9 @@ module ActiveFedora
       #check_concurrency
     end
+    # serializes any changed data into the content field
+    def serialize!
+    end
     # Populate a Datastream object based on the "datastream" node from a FOXML file
     # @param [ActiveFedora::Datastream] tmpl the Datastream object that you are building
     # @param [Nokogiri::XML::Node] node the "foxml:datastream" node from a FOXML file
@@ -102,26 +101,26 @@ module ActiveFedora
     # returns a datetime in the standard W3C DateTime Format.
     # ie 2008-10-17T00:17:18.194Z
-    def last_modified_in_repository
-      # A hack to get around the fact that you can't call getDatastreamHistory
-      # or API-M getDatasreams on Fedora 3.0 REST API
-      # grabs the CREATED attribute off of the last foxml:datastreamVersion
-      # within the appropriate datastream node in the objectXML
-      if self.pid != nil
-        object_xml = Fedora::FedoraObject.object_xml(self.pid).gsub("\n     ","")
-        datastream_xml = REXML::Document.new(object_xml).root.elements["foxml:datastream[@ID='#{self.dsid}']"]
-        if datastream_xml.length > 3
-          datastream_xml.elements.each do |el|
-            logger.debug el.inspect
-          end
-        end
-        datastream_xml.elements[datastream_xml.length - 2].attributes["CREATED"]
-      else
-        return nil
-      end
-    end
+    # def last_modified_in_repository
+    #   # A hack to get around the fact that you can't call getDatastreamHistory
+    #   # or API-M getDatasreams on Fedora 3.0 REST API
+    #   # grabs the CREATED attribute off of the last foxml:datastreamVersion
+    #   # within the appropriate datastream node in the objectXML
+    #   if self.pid != nil
+    #     object_xml = Fedora::FedoraObject.object_xml(self.pid).gsub("\n     ","")
+    #     datastream_xml = REXML::Document.new(object_xml).root.elements["foxml:datastream[@ID='#{self.dsid}']"]
+    #
+    #     if datastream_xml.length > 3
+    #       datastream_xml.elements.each do |el|
+    #         logger.debug el.inspect
+    #       end
+    #     end
+    #
+    #     datastream_xml.elements[datastream_xml.length - 2].attributes["CREATED"]
+    #   else
+    #     return nil
+    #   end
+    # end
     def check_concurrency # :nodoc:
       return true

data/lib/active_fedora/datastream_hash.rb ADDED

@@ -0,0 +1,18 @@
+module ActiveFedora
+  class DatastreamHash < Hash
+    def initialize (obj)
+      @obj = obj
+      super()
+    end
+    def [] (key)
+      if key == 'DC' && !has_key?(key)
+        ds = Datastream.new(@obj.inner_object, key, true)
+        ds.content
+        self[key] = ds
+      end
+      super
+    end
+  end
+end

data/lib/active_fedora/metadata_datastream.rb CHANGED

@@ -133,8 +133,9 @@ module ActiveFedora
     # Populate a MetadataDatastream object based on the "datastream" node from a FOXML file
     # @param [ActiveFedora::Datastream] tmpl the Datastream object that you are building
     # @param [Nokogiri::XML::Node] node the "foxml:datastream" node from a FOXML file.  Assumes that the content of this datastream is that of an ActiveFedora MetadataDatastream (<fields>...</fields>)
-    def self.from_xml(tmpl, node) # :nodoc:
-      node.xpath("./foxml:datastreamVersion[last()]/foxml:xmlContent/fields/node()").each do |f|
+    def self.from_xml(xml, tmpl) # :nodoc:
+      node = Nokogiri::XML::Document.parse(xml)
+      node.xpath("fields/node()").each do |f|
           tmpl.send("#{f.name}_append", f.text) unless f.class == Nokogiri::XML::Text
       end
       tmpl.send(:dirty=, false)

data/lib/active_fedora/metadata_datastream_helper.rb CHANGED

@@ -21,20 +21,8 @@ module ActiveFedora::MetadataDatastreamHelper
     klass.send(:include, Solrizer::FieldNameMapper)
   end
-  #constructor, calls up to ActiveFedora::Datastream's constructor
-  def initialize(attrs=nil)
-    super
-    @fields={}
-  end
-  # sets the blob, which in this case is the xml version of self, then calls ActiveFedora::Datastream.save
-  def save
-    self.set_blob_for_save
-    super
-  end
-  def set_blob_for_save # :nodoc:
-    self.blob = self.to_xml
+  def serialize! # :nodoc:
+    self.content = self.to_xml  ##TODO only do this when the xml will have changed to avoid a load of the datastream content.
   end
   def to_solr(solr_doc = Hash.new) # :nodoc:
@@ -95,4 +83,4 @@ module ActiveFedora::MetadataDatastreamHelper
     return builder.to_xml
   end
-end
+end

data/lib/active_fedora/model.rb CHANGED

@@ -50,7 +50,7 @@ module ActiveFedora
       # @example this will return an instance of Book, even if the object hydra:dataset1 asserts that it is a Dataset
       #   Book.load_instance("hydra:dataset1")
       def load_instance(pid)
-        Fedora::Repository.instance.find_model(pid, self)
+        RubydoraConnection.instance.find_model(pid, self)
       end
       # Takes :all or a pid as arguments
@@ -75,7 +75,7 @@ module ActiveFedora
           hits = SolrService.instance.conn.query(q).hits
         end
         results = hits.map do |hit|
-          obj = Fedora::Repository.instance.find_model(hit[SOLR_DOCUMENT_ID], self)
+          obj = RubydoraConnection.instance.find_model(hit[SOLR_DOCUMENT_ID], self)
           #obj.inner_object.new_object = false
           #return obj
         end
@@ -208,7 +208,7 @@ module ActiveFedora
       def class_fields
         #create dummy object that is empty by passing in fake pid
-        object = self.new({:pid=>'FAKE'})
+        object = self.new()#{:pid=>'FAKE'})
         fields = object.fields
         #reset id to nothing
         fields[:id][:values] = []

data/lib/active_fedora/nokogiri_datastream.rb CHANGED

@@ -3,345 +3,348 @@ require  "om"
 require "solrizer/xml"
 #this class represents a MetadataDatastream, a special case of ActiveFedora::Datastream
-class ActiveFedora::NokogiriDatastream < ActiveFedora::Datastream
+module ActiveFedora
+  class NokogiriDatastream < Datastream
+    include MetadataDatastreamHelper
+    include OM::XML::Document
+    include Solrizer::XML::TerminologyBasedSolrizer # this adds support for calling .to_solr
-  include ActiveFedora::MetadataDatastreamHelper
-  include OM::XML::Document
-  include Solrizer::XML::TerminologyBasedSolrizer # this adds support for calling .to_solr
-  # extend(OM::XML::Container::ClassMethods)
+    # extend(OM::XML::Container::ClassMethods)
-  alias_method(:om_term_values, :term_values) unless method_defined?(:om_term_values)
-  alias_method(:om_update_values, :update_values) unless method_defined?(:om_update_values)
-  attr_accessor :internal_solr_doc
-  attr_reader :ng_xml
-  #constructor, calls up to ActiveFedora::Datastream's constructor
-  def initialize(attrs=nil)
-    super
-    @fields={}
-    self.class.from_xml(blob, self)
-  end
+    alias_method(:om_term_values, :term_values) unless method_defined?(:om_term_values)
+    alias_method(:om_update_values, :update_values) unless method_defined?(:om_update_values)
+    attr_accessor :internal_solr_doc
+    attr_reader :ng_xml
-  # Create an instance of this class based on xml content
-  # @param [String, File, Nokogiri::XML::Node] xml the xml content to build from
-  # @param [ActiveFedora::MetadataDatastream] tmpl the Datastream object that you are building @default a new instance of this class
-  # Careful! If you call this from a constructor, be sure to provide something 'ie. self' as the @tmpl. Otherwise, you will get an infinite loop!
-  def self.from_xml(xml, tmpl=self.new) # :nodoc:
-    if xml.nil?
-      tmpl.ng_xml = self.xml_template
-    elsif xml.kind_of? Nokogiri::XML::Node || xml.kind_of?(Nokogiri::XML::Document)
-      tmpl.ng_xml = xml
-    else
-      tmpl.ng_xml = Nokogiri::XML::Document.parse(xml)
-    end
-    tmpl.send(:dirty=, false)
-    return tmpl
-  end
-  def self.xml_template
-    Nokogiri::XML::Document.parse("<xml/>")
-  end
-  def ng_xml=(new_xml)
-    case new_xml
-    when Nokogiri::XML::Document, Nokogiri::XML::Element, Nokogiri::XML::Node
-      @ng_xml = new_xml
-    when String
-      @ng_xml = Nokogiri::XML::Document.parse(new_xml)
-    else
-      raise TypeError, "You passed a #{new_xml.class} into the ng_xml of the #{self.dsid} datastream. NokogiriDatastream.ng_xml= only accepts Nokogiri::XML::Document, Nokogiri::XML::Element, Nokogiri::XML::Node, or raw XML (String) as inputs."
+    def initialize(digital_object, dsid, exists_in_fedora=false)
+      super
+      self.class.from_xml(nil, self)
     end
-    self.dirty = true
-  end
-  def content=(content)
-    super
-    self.ng_xml = Nokogiri::XML::Document.parse(content)
-  end
-  def to_xml(xml = self.ng_xml)
-    ng_xml = self.ng_xml
-    if ng_xml.respond_to?(:root) && ng_xml.root.nil? && self.class.respond_to?(:root_property_ref) && !self.class.root_property_ref.nil?
-      ng_xml = self.class.generate(self.class.root_property_ref, "")
-      if xml.root.nil?
-        xml = ng_xml
+    # Create an instance of this class based on xml content
+    # @param [String, File, Nokogiri::XML::Node] xml the xml content to build from
+    # @param [ActiveFedora::MetadataDatastream] tmpl the Datastream object that you are building @default a new instance of this class
+    # Careful! If you call this from a constructor, be sure to provide something 'ie. self' as the @tmpl. Otherwise, you will get an infinite loop!
+    def self.from_xml(xml, tmpl=nil)
+      tmpl = self.new(nil, nil) if tmpl.nil?  ## This path is used only for unit testing (e.g. MarpaDCDatastream.from_xml(fixture("data.xml")) )
+      if xml.nil?
+        tmpl.ng_xml = self.xml_template
+      elsif xml.kind_of? Nokogiri::XML::Node || xml.kind_of?(Nokogiri::XML::Document)
+        tmpl.ng_xml = xml
+      else
+        tmpl.ng_xml = Nokogiri::XML::Document.parse(xml)
+      end
+      tmpl.send(:dirty=, false)
+      return tmpl
+    end
+    def self.xml_template
+      Nokogiri::XML::Document.parse("<xml/>")
+    end
+    def ng_xml=(new_xml)
+      case new_xml
+      when Nokogiri::XML::Document, Nokogiri::XML::Element, Nokogiri::XML::Node
+        @ng_xml = new_xml
+      when String
+        @ng_xml = Nokogiri::XML::Document.parse(new_xml)
+      else
+        raise TypeError, "You passed a #{new_xml.class} into the ng_xml of the #{self.dsid} datastream. NokogiriDatastream.ng_xml= only accepts Nokogiri::XML::Document, Nokogiri::XML::Element, Nokogiri::XML::Node, or raw XML (String) as inputs."
       end
     end
+    def content=(content)
+      super
+      self.ng_xml = Nokogiri::XML::Document.parse(content)
+    end
+    def to_xml(xml = self.ng_xml)
+      ng_xml = self.ng_xml
+      if ng_xml.respond_to?(:root) && ng_xml.root.nil? && self.class.respond_to?(:root_property_ref) && !self.class.root_property_ref.nil?
+        ng_xml = self.class.generate(self.class.root_property_ref, "")
+        if xml.root.nil?
+          xml = ng_xml
+        end
+      end
-    unless xml == ng_xml || ng_xml.root.nil?
-      if xml.kind_of?(Nokogiri::XML::Document)
-          xml.root.add_child(ng_xml.root)
-      elsif xml.kind_of?(Nokogiri::XML::Node)
-          xml.add_child(ng_xml.root)
-      else
-          raise "You can only pass instances of Nokogiri::XML::Node into this method.  You passed in #{xml}"
+      unless xml == ng_xml || ng_xml.root.nil?
+        if xml.kind_of?(Nokogiri::XML::Document)
+            xml.root.add_child(ng_xml.root)
+        elsif xml.kind_of?(Nokogiri::XML::Node)
+            xml.add_child(ng_xml.root)
+        else
+            raise "You can only pass instances of Nokogiri::XML::Node into this method.  You passed in #{xml}"
+        end
       end
+      return xml.to_xml {|config| config.no_declaration}
     end
-    return xml.to_xml {|config| config.no_declaration}
-  end
-  # ** Experimental **
-  #
-  # This method is called by ActiveFedora::Base.load_instance_from_solr
-  # in order to initialize a nokogiri datastreams values from a solr document.
-  # This method merely sets the internal_solr_doc to the document passed in.
-  # Then any calls to get_values get values from the solr document on demand
-  # instead of directly from the xml stored in Fedora.  This should be used
-  # for read-only purposes only, and instances where you want to improve performance by
-  # getting data from solr instead of Fedora.
-  #
-  # See ActiveFedora::Base.load_instance_from_solr and +get_values_from_solr+ for more information.
-  def from_solr(solr_doc)
-    #just initialize internal_solr_doc since any value retrieval will be done via lazy loading on this doc on-demand
-    @internal_solr_doc = solr_doc
-  end
+    # ** Experimental **
+    #
+    # This method is called by ActiveFedora::Base.load_instance_from_solr
+    # in order to initialize a nokogiri datastreams values from a solr document.
+    # This method merely sets the internal_solr_doc to the document passed in.
+    # Then any calls to get_values get values from the solr document on demand
+    # instead of directly from the xml stored in Fedora.  This should be used
+    # for read-only purposes only, and instances where you want to improve performance by
+    # getting data from solr instead of Fedora.
+    #
+    # See ActiveFedora::Base.load_instance_from_solr and +get_values_from_solr+ for more information.
+    def from_solr(solr_doc)
+      #just initialize internal_solr_doc since any value retrieval will be done via lazy loading on this doc on-demand
+      @internal_solr_doc = solr_doc
+    end
-  # ** Experimental **
-  # This method is called by +get_values+ if this datastream has been initialized by calling from_solr method via
-  # ActiveFedora::Base.load_instance_from_solr. This method retrieves values from a preinitialized @internal_solr_doc instead of xml.
-  # This makes the datastream read-only and this method is not intended to be used in any other case.
-  #
-  # Values are retrieved from the @internal_solr_doc on-demand instead of via xml preloaded into memory.
-  # A term_pointer is passed in and if it contains hierarchical indexes it will detect which solr field values need to be returned.
-  #
-  # ====Example 1 (non-hierarchical term_pointer):
-  #
-  #   term_pointer = [:image, :title_set, :title]
-  #
-  #   Returns value of "image_title_set_title_t" in @internal_solr_doc
-  #
-  # ====Example 2 (hierarchical term_pointer that contains one or more indexes):
-  #   term_pointer = [:image, {:title_set=>1}, :title]
-  #
-  #   relevant xml:
-  #         <image>
-  #           <title_set>
-  #             <title>Title 1</title>
-  #           </title_set>
-  #         </image>
-  #         <image>
-  #           <title_set>
-  #             <title>Title 2</title>
-  #           </title_set>
-  #           <title_set>
-  #             <title>Title 3</title>
-  #           </title_set>
-  #         </image>
-  #
-  #   Repeating element nodes are indexed and will be stored in solr as follows:
-  #     image_0_title_set_0_title_t = "Title 1"
-  #     image_1_title_set_0_title_t = "Title 2"
-  #     image_1_title_set_1_title_t = "Title 3"
-  #
-  #   Even though no image element index is specified, only the second image element has two title_set elements so the expected return value is
-  #     ["Title 3"]
-  #
-  #   While loading from solr the xml hierarchy is not immediately apparent so we must detect first how many image elements with a title_set element exist
-  #   and then check which of those elements have a second title element.
-  #
-  #   As this nokogiri datastream is indexed in solr, a value at each level in the tree will be stored independently and therefore
-  #   if 'image_0_title_set_0_title_t' exists in solr 'image_0_title_set_t' will also exist in solr.
-  #   So, we will build up the relevant solr names incrementally for a given term_pointer.  The last element in the
-  #   solr_name will not contain an index.
-  #
-  #   It then will do the following:
-  #     Because no index is supplied for :image it will detect which indexes exist in solr
-  #        image_0_title_set_t   (found key and add 'image_0_title_set' to base solr_name list)
-  #        image_1_title_set_t   (found key and add 'image_0_title_set' to base solr_name list)
-  #        image_2_title_set_t   (not found and stop checking indexes for image)
-  #     After iteration 1:
-  #        bases = ["image_0_title_set","image_1_title_set"]
-  #
-  #     Two image nodes were found and next sees index of 1 supplied for title_set so just uses index of 1 building off bases found in previous iteration
-  #        image_0_title_set_1_title_t (not found remove 'image_0_title_set' from base solr_name list)
-  #        image_1_title_set_1_title_t (found and replace 'image_1_title_set' with new base 'image_1_title_set_1_title')
-  #
-  #     After iteration 2:
-  #        bases = ["image_1_title_set_1_title"]
-  #     It always looks ahead one element so we check if any elements are after title.  There are not any other elements so we are done iterating.
-  #        returns @internal_solr_doc["image_1_title_set_1_title_t"]
-  # @param [Array] term_pointer Term pointer similar to an xpath ie. [:image, :title_set, :title]
-  # @return [Array] If no values are found an empty Array is returned.
-  def get_values_from_solr(*term_pointer)
-    values = []
-    solr_doc = @internal_solr_doc
-    return values if solr_doc.nil?
-    begin
-     term = self.class.terminology.retrieve_term(*OM.pointers_to_flat_array(term_pointer, false))
-     #check if hierarchical term pointer
-     if is_hierarchical_term_pointer?(*term_pointer)
-       # if we are hierarchical need to detect all possible node values that exist
-       # we do this by building up the possible solr names parent by parent and/or child by child
-       # if an index is supplied for any node in the pointer it will be used
-       # otherwise it will include all nodes and indexes that exist in solr
-       bases = []
-       #add first item in term_pointer as start of bases
-       # then iterate through possible nodes that might exist
-       term_pointer.first.kind_of?(Hash) ? bases << term_pointer.first.keys.first : bases << term_pointer.first
-       for i in 1..(term_pointer.length-1)
-         #iterate in reverse so that we can modify the bases array while iterating
-         (bases.length-1).downto(0) do |j|
-           current_last = (term_pointer[i].kind_of?(Hash) ? term_pointer[i].keys.first : term_pointer[i])
-           if (term_pointer[i-1].kind_of?(Hash))
-             #just use index supplied instead of trying possibilities
-             index = term_pointer[i-1].values.first
-             solr_name_base = OM::XML::Terminology.term_hierarchical_name({bases[j]=>index},current_last)
-             solr_name = generate_solr_symbol(solr_name_base, term.data_type)
-             bases.delete_at(j)
-             #insert the new solr name base if found
-             bases.insert(j,solr_name_base) if has_solr_name?(solr_name,solr_doc)
-           else
-             #detect how many nodes exist
-             index = 0
-             current_base = bases[j]
-             bases.delete_at(j)
-             solr_name_base = OM::XML::Terminology.term_hierarchical_name({current_base=>index},current_last)
-             solr_name = generate_solr_symbol(solr_name_base, term.data_type)
-             #check for indexes that exist until we find all nodes
-             while has_solr_name?(solr_name,solr_doc) do
-               #only reinsert if it exists
-               bases.insert(j,solr_name_base)
-               index = index + 1
+    # ** Experimental **
+    # This method is called by +get_values+ if this datastream has been initialized by calling from_solr method via
+    # ActiveFedora::Base.load_instance_from_solr. This method retrieves values from a preinitialized @internal_solr_doc instead of xml.
+    # This makes the datastream read-only and this method is not intended to be used in any other case.
+    #
+    # Values are retrieved from the @internal_solr_doc on-demand instead of via xml preloaded into memory.
+    # A term_pointer is passed in and if it contains hierarchical indexes it will detect which solr field values need to be returned.
+    #
+    # ====Example 1 (non-hierarchical term_pointer):
+    #
+    #   term_pointer = [:image, :title_set, :title]
+    #
+    #   Returns value of "image_title_set_title_t" in @internal_solr_doc
+    #
+    # ====Example 2 (hierarchical term_pointer that contains one or more indexes):
+    #   term_pointer = [:image, {:title_set=>1}, :title]
+    #
+    #   relevant xml:
+    #         <image>
+    #           <title_set>
+    #             <title>Title 1</title>
+    #           </title_set>
+    #         </image>
+    #         <image>
+    #           <title_set>
+    #             <title>Title 2</title>
+    #           </title_set>
+    #           <title_set>
+    #             <title>Title 3</title>
+    #           </title_set>
+    #         </image>
+    #
+    #   Repeating element nodes are indexed and will be stored in solr as follows:
+    #     image_0_title_set_0_title_t = "Title 1"
+    #     image_1_title_set_0_title_t = "Title 2"
+    #     image_1_title_set_1_title_t = "Title 3"
+    #
+    #   Even though no image element index is specified, only the second image element has two title_set elements so the expected return value is
+    #     ["Title 3"]
+    #
+    #   While loading from solr the xml hierarchy is not immediately apparent so we must detect first how many image elements with a title_set element exist
+    #   and then check which of those elements have a second title element.
+    #
+    #   As this nokogiri datastream is indexed in solr, a value at each level in the tree will be stored independently and therefore
+    #   if 'image_0_title_set_0_title_t' exists in solr 'image_0_title_set_t' will also exist in solr.
+    #   So, we will build up the relevant solr names incrementally for a given term_pointer.  The last element in the
+    #   solr_name will not contain an index.
+    #
+    #   It then will do the following:
+    #     Because no index is supplied for :image it will detect which indexes exist in solr
+    #        image_0_title_set_t   (found key and add 'image_0_title_set' to base solr_name list)
+    #        image_1_title_set_t   (found key and add 'image_0_title_set' to base solr_name list)
+    #        image_2_title_set_t   (not found and stop checking indexes for image)
+    #     After iteration 1:
+    #        bases = ["image_0_title_set","image_1_title_set"]
+    #
+    #     Two image nodes were found and next sees index of 1 supplied for title_set so just uses index of 1 building off bases found in previous iteration
+    #        image_0_title_set_1_title_t (not found remove 'image_0_title_set' from base solr_name list)
+    #        image_1_title_set_1_title_t (found and replace 'image_1_title_set' with new base 'image_1_title_set_1_title')
+    #
+    #     After iteration 2:
+    #        bases = ["image_1_title_set_1_title"]
+    #     It always looks ahead one element so we check if any elements are after title.  There are not any other elements so we are done iterating.
+    #        returns @internal_solr_doc["image_1_title_set_1_title_t"]
+    # @param [Array] term_pointer Term pointer similar to an xpath ie. [:image, :title_set, :title]
+    # @return [Array] If no values are found an empty Array is returned.
+    def get_values_from_solr(*term_pointer)
+      values = []
+      solr_doc = @internal_solr_doc
+      return values if solr_doc.nil?
+      begin
+       term = self.class.terminology.retrieve_term(*OM.pointers_to_flat_array(term_pointer, false))
+       #check if hierarchical term pointer
+       if is_hierarchical_term_pointer?(*term_pointer)
+         # if we are hierarchical need to detect all possible node values that exist
+         # we do this by building up the possible solr names parent by parent and/or child by child
+         # if an index is supplied for any node in the pointer it will be used
+         # otherwise it will include all nodes and indexes that exist in solr
+         bases = []
+         #add first item in term_pointer as start of bases
+         # then iterate through possible nodes that might exist
+         term_pointer.first.kind_of?(Hash) ? bases << term_pointer.first.keys.first : bases << term_pointer.first
+         for i in 1..(term_pointer.length-1)
+           #iterate in reverse so that we can modify the bases array while iterating
+           (bases.length-1).downto(0) do |j|
+             current_last = (term_pointer[i].kind_of?(Hash) ? term_pointer[i].keys.first : term_pointer[i])
+             if (term_pointer[i-1].kind_of?(Hash))
+               #just use index supplied instead of trying possibilities
+               index = term_pointer[i-1].values.first
+               solr_name_base = OM::XML::Terminology.term_hierarchical_name({bases[j]=>index},current_last)
+               solr_name = generate_solr_symbol(solr_name_base, term.data_type)
+               bases.delete_at(j)
+               #insert the new solr name base if found
+               bases.insert(j,solr_name_base) if has_solr_name?(solr_name,solr_doc)
+             else
+               #detect how many nodes exist
+               index = 0
+               current_base = bases[j]
+               bases.delete_at(j)
                solr_name_base = OM::XML::Terminology.term_hierarchical_name({current_base=>index},current_last)
                solr_name = generate_solr_symbol(solr_name_base, term.data_type)
+               #check for indexes that exist until we find all nodes
+               while has_solr_name?(solr_name,solr_doc) do
+                 #only reinsert if it exists
+                 bases.insert(j,solr_name_base)
+                 index = index + 1
+                 solr_name_base = OM::XML::Terminology.term_hierarchical_name({current_base=>index},current_last)
+                 solr_name = generate_solr_symbol(solr_name_base, term.data_type)
+               end
              end
            end
          end
-       end
-       #all existing applicable solr_names have been found and we can now grab all values and build up our value array
-       bases.each do |base|
-         field_name = generate_solr_symbol(base.to_sym, term.data_type)
-         value = (solr_doc[field_name].nil? ? solr_doc[field_name.to_s]: solr_doc[field_name])
+         #all existing applicable solr_names have been found and we can now grab all values and build up our value array
+         bases.each do |base|
+           field_name = generate_solr_symbol(base.to_sym, term.data_type)
+           value = (solr_doc[field_name].nil? ? solr_doc[field_name.to_s]: solr_doc[field_name])
+           unless value.nil?
+             value.is_a?(Array) ? values.concat(value) : values << value
+           end
+         end
+       else
+         #this is not hierarchical and we can simply look for the solr name created using the terms without any indexes
+         generic_field_name_base = OM::XML::Terminology.term_generic_name(*term_pointer)
+         generic_field_name = generate_solr_symbol(generic_field_name_base, term.data_type)
+         value = (solr_doc[generic_field_name].nil? ? solr_doc[generic_field_name.to_s]: solr_doc[generic_field_name])
          unless value.nil?
            value.is_a?(Array) ? values.concat(value) : values << value
          end
        end
-     else
-       #this is not hierarchical and we can simply look for the solr name created using the terms without any indexes
-       generic_field_name_base = OM::XML::Terminology.term_generic_name(*term_pointer)
-       generic_field_name = generate_solr_symbol(generic_field_name_base, term.data_type)
-       value = (solr_doc[generic_field_name].nil? ? solr_doc[generic_field_name.to_s]: solr_doc[generic_field_name])
-       unless value.nil?
-         value.is_a?(Array) ? values.concat(value) : values << value
-       end
-     end
-    rescue Exception => e
-      #just do nothing since term does not exist and return emtpy values
-      raise e
+      rescue Exception => e
+        #presumably the term does not exist; note the exception is re-raised (not swallowed), so callers see the error rather than empty values
+        raise e
+      end
+      values
     end
-    values
-  end
-  def generate_solr_symbol(base, data_type)
-    Solrizer::XML::TerminologyBasedSolrizer.default_field_mapper.solr_name(base.to_sym, data_type)
-  end
+    def generate_solr_symbol(base, data_type)
+      Solrizer::XML::TerminologyBasedSolrizer.default_field_mapper.solr_name(base.to_sym, data_type)
+    end
-  # ** Experimental **
-  #@return [Boolean] true if either the key for name exists in solr or if its string value exists
-  #@param [String] name Name of key to look for
-  #@param [Solr::Document] solr_doc Solr doc to query
-  def has_solr_name?(name, solr_doc=Hash.new)
-    !solr_doc[name].nil? || !solr_doc[name.to_s].nil?
-  end
+    # ** Experimental **
+    #@return [Boolean] true if solr_doc holds a non-nil value under either name itself or its string form (name.to_s)
+    #@param [String] name Name of key to look for
+    #@param [Solr::Document] solr_doc Solr doc to query
+    def has_solr_name?(name, solr_doc=Hash.new)
+      !solr_doc[name].nil? || !solr_doc[name.to_s].nil?
+    end
-  # ** Experimental **
-  #@return true if the term_pointer contains an index
-  # ====Example:
-  #     [:image, {:title_set=>1}, :title] return true
-  #     [:image, :title_set, :title]      return false
-  def is_hierarchical_term_pointer?(*term_pointer)
-    if term_pointer.length>1
-      term_pointer.each do |pointer|
-        if pointer.kind_of?(Hash)
-          return true
+    # ** Experimental **
+    #@return true if the term_pointer has more than one element and at least one of them is a Hash (i.e. carries an index)
+    # ====Example:
+    #     [:image, {:title_set=>1}, :title] return true
+    #     [:image, :title_set, :title]      return false
+    def is_hierarchical_term_pointer?(*term_pointer)
+      if term_pointer.length>1
+        term_pointer.each do |pointer|
+          if pointer.kind_of?(Hash)
+            return true
+          end
         end
       end
+      return false
     end
-    return false
-  end
-  # Update field values within the current datastream using {#update_values}, which is a wrapper for {http://rdoc.info/gems/om/1.2.4/OM/XML/TermValueOperators#update_values-instance_method OM::TermValueOperators#update_values}
-  # Ignores any fields from params that this datastream's Terminology doesn't recognize
-  #
-  # @param [Hash] params The params specifying which fields to update and their new values.  The syntax of the params Hash is the same as that expected by
-  #         term_pointers must be a valid OM Term pointers (ie. [:name]).  Strings will be ignored.
-  # @param [Hash] opts This is not currently used by the datastream-level update_indexed_attributes method
-  #
-  # Example:
-  #   @mods_ds.update_indexed_attributes( {[{":person"=>"0"}, "role"]=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"} })
-  #   => {"person_0_role"=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"}}
-  #
-  #   @mods_ds.to_xml # (the following is an approximation)
-  #   <mods>
-  #     <mods:name type="person">
-  #     <mods:role>
-  #       <mods:roleTerm>role1</mods:roleTerm>
-  #     </mods:role>
-  #     <mods:role>
-  #       <mods:roleTerm>role2</mods:roleTerm>
-  #     </mods:role>
-  #     <mods:role>
-  #       <mods:roleTerm>role3</mods:roleTerm>
-  #     </mods:role>
-  #     </mods:name>
-  #   </mods>
-  def update_indexed_attributes(params={}, opts={})
-    if self.class.terminology.nil?
-      raise "No terminology is set for this NokogiriDatastream class.  Cannot perform update_indexed_attributes"
-    end
-    # remove any fields from params that this datastream doesn't recognize
-    # make sure to make a copy of params so not to modify hash that might be passed to other methods
-    current_params = params.clone
-    current_params.delete_if do |term_pointer,new_values|
-      if term_pointer.kind_of?(String)
-        logger.warn "WARNING: #{dsid} ignoring {#{term_pointer.inspect} => #{new_values.inspect}} because #{term_pointer.inspect} is a String (only valid OM Term Pointers will be used).  Make sure your html has the correct field_selector tags in it."
-        true
-      else
-        !self.class.terminology.has_term?(*OM.destringify(term_pointer))
+    # Update field values within the current datastream using {#update_values}, which is a wrapper for {http://rdoc.info/gems/om/1.2.4/OM/XML/TermValueOperators#update_values-instance_method OM::TermValueOperators#update_values}
+    # Ignores any fields from params that this datastream's Terminology doesn't recognize
+    #
+    # @param [Hash] params The params specifying which fields to update and their new values.  The syntax of the params Hash is the same as that expected by {#update_values}.
+    #         Keys must be valid OM Term pointers (e.g. [:name]).  String keys are ignored (a warning is logged).
+    # @param [Hash] opts This is not currently used by the datastream-level update_indexed_attributes method
+    #
+    # Example:
+    #   @mods_ds.update_indexed_attributes( {[{":person"=>"0"}, "role"]=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"} })
+    #   => {"person_0_role"=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"}}
+    #
+    #   @mods_ds.to_xml # (the following is an approximation)
+    #   <mods>
+    #     <mods:name type="person">
+    #     <mods:role>
+    #       <mods:roleTerm>role1</mods:roleTerm>
+    #     </mods:role>
+    #     <mods:role>
+    #       <mods:roleTerm>role2</mods:roleTerm>
+    #     </mods:role>
+    #     <mods:role>
+    #       <mods:roleTerm>role3</mods:roleTerm>
+    #     </mods:role>
+    #     </mods:name>
+    #   </mods>
+    def update_indexed_attributes(params={}, opts={})
+      if self.class.terminology.nil?
+        raise "No terminology is set for this NokogiriDatastream class.  Cannot perform update_indexed_attributes"
+      end
+      # remove any fields from params that this datastream doesn't recognize
+      # make sure to make a copy of params so not to modify hash that might be passed to other methods
+      current_params = params.clone
+      current_params.delete_if do |term_pointer,new_values|
+        if term_pointer.kind_of?(String)
+          logger.warn "WARNING: #{dsid} ignoring {#{term_pointer.inspect} => #{new_values.inspect}} because #{term_pointer.inspect} is a String (only valid OM Term Pointers will be used).  Make sure your html has the correct field_selector tags in it."
+          true
+        else
+          !self.class.terminology.has_term?(*OM.destringify(term_pointer))
+        end
       end
-    end
-    result = {}
-    unless current_params.empty?
-      result = update_values( current_params )
+      result = {}
+      unless current_params.empty?
+        result = update_values( current_params )
+      end
+      return result
     end
-    return result
-  end
-  def get_values(field_key,default=[])
-    term_values(*field_key)
-  end
+    def get_values(field_key,default=[])
+      term_values(*field_key)
+    end
-  # Update values in the datastream's xml
-  # This wraps {http://rdoc.info/gems/om/1.2.4/OM/XML/TermValueOperators#update_values-instance_method OM::TermValueOperators#update_values} so that returns an error if we have loaded from solr since datastreams loaded that way should be read-only
-  #
-  # @example Updating multiple values with a Hash of Term pointers and values
-  #   ds.update_values( {[{":person"=>"0"}, "role", "text"]=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"}, [{:person=>1}, :family_name]=>"Andronicus", [{"person"=>"1"},:given_name]=>["Titus"],[{:person=>1},:role,:text]=>["otherrole1","otherrole2"] } )
-  #   => {"person_0_role_text"=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"}, "person_1_role_text"=>{"0"=>"otherrole1", "1"=>"otherrole2"}}
-  def update_values(params={})
-    if @internal_solr_doc
-      raise "No update performed, this object was initialized via Solr instead of Fedora and is therefore read-only.  Please utilize ActiveFedora::Base.load_instance to first load object via Fedora instead."
-    else
-      result = om_update_values(params)
-      self.dirty= true
-      return result
+    # Update values in the datastream's xml
+    # This wraps {http://rdoc.info/gems/om/1.2.4/OM/XML/TermValueOperators#update_values-instance_method OM::TermValueOperators#update_values} so that it raises an error if this datastream was loaded from solr, since datastreams loaded that way should be read-only
+    #
+    # @example Updating multiple values with a Hash of Term pointers and values
+    #   ds.update_values( {[{":person"=>"0"}, "role", "text"]=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"}, [{:person=>1}, :family_name]=>"Andronicus", [{"person"=>"1"},:given_name]=>["Titus"],[{:person=>1},:role,:text]=>["otherrole1","otherrole2"] } )
+    #   => {"person_0_role_text"=>{"0"=>"role1", "1"=>"role2", "2"=>"role3"}, "person_1_role_text"=>{"0"=>"otherrole1", "1"=>"otherrole2"}}
+    def update_values(params={})
+      if @internal_solr_doc
+        raise "No update performed, this object was initialized via Solr instead of Fedora and is therefore read-only.  Please utilize ActiveFedora::Base.load_instance to first load object via Fedora instead."
+      else
+        result = om_update_values(params)
+        self.dirty= true
+        return result
+      end
     end
-  end
-  #override OM::XML::term_values so can lazy load from solr if this datastream initialized using +from_solr+
-  def term_values(*term_pointer)
-    if @internal_solr_doc
-      #lazy load values from solr on demand
-      get_values_from_solr(*term_pointer)
-    else
-      om_term_values(*term_pointer)
+    #override OM::XML::term_values so that values can be lazy loaded from solr if this datastream was initialized using +from_solr+
+    def term_values(*term_pointer)
+      if @internal_solr_doc
+        #lazy load values from solr on demand
+        get_values_from_solr(*term_pointer)
+      else
+        om_term_values(*term_pointer)
+      end
     end
   end
 end