RubyGems - taxonifi - Versions diffs - 0.1.0 → 0.2.0 - Mend

taxonifi 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47) hide show

data/Gemfile +1 -0
data/Gemfile.lock +24 -7
data/README.rdoc +5 -6
data/Rakefile +1 -1
data/VERSION +1 -1
data/lib/assessor/row_assessor.rb +25 -18
data/lib/export/format/base.rb +96 -1
data/lib/export/format/obo_nomenclature.rb +71 -0
data/lib/export/format/prolog.rb +59 -0
data/lib/export/format/species_file.rb +303 -193
data/lib/lumper/clump.rb +112 -0
data/lib/lumper/lumper.rb +71 -45
data/lib/lumper/lumps/parent_child_name_collection.rb +79 -15
data/lib/models/author_year.rb +1 -2
data/lib/models/base.rb +56 -51
data/lib/models/collection.rb +16 -1
data/lib/models/name.rb +56 -15
data/lib/models/name_collection.rb +70 -19
data/lib/models/ref.rb +17 -0
data/lib/models/ref_collection.rb +2 -1
data/lib/models/shared_class_methods.rb +29 -0
data/lib/models/species_name.rb +14 -12
data/lib/splitter/parser.rb +1 -2
data/lib/splitter/tokens.rb +1 -1
data/lib/taxonifi.rb +12 -0
data/lib/utils/array.rb +17 -0
data/lib/utils/hash.rb +17 -0
data/taxonifi.gemspec +116 -0
data/test/file_fixtures/Fossil.csv +11 -0
data/test/file_fixtures/Lygaeoidea.csv +1 -1
data/test/file_fixtures/names.csv +1 -0
data/test/helper.rb +14 -0
data/test/test_export_prolog.rb +14 -0
data/test/test_exporter.rb +23 -0
data/test/test_lumper_clump.rb +75 -0
data/test/test_lumper_names.rb +67 -9
data/test/test_lumper_parent_child_name_collection.rb +47 -3
data/test/test_lumper_refs.rb +22 -7
data/test/test_obo_nomenclature.rb +14 -0
data/test/test_parser.rb +4 -2
data/test/test_splitter_tokens.rb +9 -0
data/test/test_taxonifi_accessor.rb +21 -15
data/test/test_taxonifi_base.rb +25 -0
data/test/test_taxonifi_name.rb +41 -4
data/test/test_taxonifi_name_collection.rb +54 -17
data/test/test_taxonifi_species_name.rb +1 -1
metadata +34 -5

data/lib/export/format/species_file.rb CHANGED Viewed

@@ -29,7 +29,7 @@ module Taxonifi::Export
       'superfamily group' =>       44,
       'subinfraordinal group' =>   45,
       'infraorder' =>              46,
-      'suborder' =>                8,
+      'suborder' =>                48,
       'order' =>                   50,
       'mirorder' =>                51,
       'superorder' =>              52,
@@ -54,288 +54,398 @@ module Taxonifi::Export
     attr_accessor :name_collection
     attr_accessor :ref_collection
+    attr_accessor :pub_collection
     attr_accessor :author_index
     attr_accessor :genus_names, :species_names, :nomenclator
     attr_accessor :authorized_user_id, :time
-    # MANIFEST order is important
-    MANIFEST = %w{tblTaxa tblRefs tblPeople tblRefAuthors tblGenusNames tblSpeciesNames tblNomenclator tblCites}
+    attr_accessor :starting_ref_id
     def initialize(options = {})
       opts = {
         :nc => Taxonifi::Model::NameCollection.new,
         :export_folder => 'species_file',
-        :authorized_user_id => nil
+        :authorized_user_id => nil,
+        :starting_ref_id => 1,                              # should be configured elsewhere... but
+        :manifest => %w{tblPubs tblRefs tblPeople tblRefAuthors tblTaxa tblGenusNames tblSpeciesNames tblNomenclator tblCites}
       }.merge!(options)
+      @manifest = opts[:manifest]
       super(opts)
       raise Taxonifi::Export::ExportError, 'NameCollection not passed to SpeciesFile export.' if ! opts[:nc].class == Taxonifi::Model::NameCollection
       raise Taxonifi::Export::ExportError, 'You must provide authorized_user_id for species_file export initialization.' if opts[:authorized_user_id].nil?
       @name_collection = opts[:nc]
+      @pub_collection = {} # title => id
       @authorized_user_id = opts[:authorized_user_id]
       @author_index = {}
-      #
+      @starting_ref_id = opts[:starting_ref_id]
       # Careful here, at present we are just generating Reference micro-citations from our names, so the indexing "just works"
       # because it's all internal.  There is a strong potential for key collisions if this pipeline is modified to
       # include references external to the initialized name_collection.  See also export_references.
       #
-      @by_author_reference_index = {}
+      # @by_author_reference_index = {}
       @genus_names = {}
       @species_names = {}
       @nomenclator = {}
       @time = Time.now.strftime("%F %T")
+      @empty_quotes = ""
     end
-    # Export only the ref_collection. Sidesteps the main name-centric exports
-    # Note that this still uses the base @name_collection object as a starting reference,
-    # it just references @name_collection.ref_collection.  So you can do:
-    #   nc = Taxonifi::Model::NameCollection.new
-    #   nc.ref_collection = Taxonifi::Model::RefCollection.new
-    #   etc.
-    def export_references(options = {})
-      opts = {
-        :starting_ref_id => 0,
-        :starting_author_id => 0
-      }
-      configure_folders
-      build_author_index
-      # order matters
-      ['tblPeople', 'tblRefs', 'tblRefAuthors', 'sqlRefs' ].each do |t|
-        write_file(t, send(t))
-      end
-    end
     # Assumes names that are the same are the same person.
     def build_author_index
       @author_index = @name_collection.ref_collection.unique_authors.inject({}){|hsh, a| hsh.merge!(a.compact_string => a)}
     end
     def export()
       super
-      @name_collection.generate_ref_collection(1)
+      # You must have
+      # how to create and link the reference IDs.
+      # Reference related approaches:
+      #
+      # @name_collection.generate_ref_collection(1)
+      # Give authors unique ids:
+      # @name_collection.ref_collection.uniquify_authors(1)
-      # Give authors unique ids
-      @name_collection.ref_collection.uniquify_authors(1)
-      build_author_index
+      if @name_collection.ref_collection
+        build_author_index
+      end
+      # raise Taxonifi::Export::ExportError, 'NameCollection has no RefCollection, you might try @name_collection.generate_ref_collection(1), or alter the manifest: hash.' if ! @name_collection.ref_collection.nil?
       # See notes in #initialize re potential key collisions!
-      @by_author_reference_index =  @name_collection.ref_collection.collection.inject({}){|hsh, r| hsh.merge!(r.author_year_index => r)}
+      # @by_author_reference_index =  @name_collection.ref_collection.collection.inject({}){|hsh, r| hsh.merge!(r.author_year_index => r)}
       @name_collection.names_at_rank('genus').inject(@genus_names){|hsh, n| hsh.merge!(n.name => nil)}
       @name_collection.names_at_rank('subgenus').inject(@genus_names){|hsh, n| hsh.merge!(n.name => nil)}
       @name_collection.names_at_rank('species').inject(@species_names){|hsh, n| hsh.merge!(n.name => nil)}
       @name_collection.names_at_rank('subspecies').inject(@species_names){|hsh, n| hsh.merge!(n.name => nil)}
-      MANIFEST.each do |f|
-        write_file(f, send(f))
+      str = [ 'BEGIN TRY', 'BEGIN TRANSACTION']
+      @manifest.each do |f|
+        str << send(f)
+      end
+      str << ['COMMIT', 'END TRY', 'BEGIN CATCH',
+        'SELECT ERROR_LINE() AS ErrorLine, ERROR_NUMBER() AS ErrorNumber, ERROR_MESSAGE() AS ErrorMessage;',
+        'ROLLBACK', 'END CATCH']
+      write_file('everything.sql', str.join("\n\n"))
+      true
+    end
+    # Deprecated!
+    # Export only the ref_collection. Sidesteps the main name-centric exports
+    # Note that this still uses the base @name_collection object as a starting reference,
+    # it just references @name_collection.ref_collection.  So you can do:
+    #   nc = Taxonifi::Model::NameCollection.new
+    #   nc.ref_collection = Taxonifi::Model::RefCollection.new
+    #   etc.
+    def export_references(options = {})
+      raise Taxonifi::Export::ExportError, 'Method deprecated, alter manifest: to achieve a similar result.'
+     #opts = {
+     #  :starting_ref_id => 0,
+     #  :starting_author_id => 0
+     #}
+     #configure_folders
+     #build_author_index
+     ## order matters
+     #['tblPeople', 'tblRefs', 'tblRefAuthors', 'sqlRefs' ].each do |t|
+     #  write_file(t, send(t))
+     #end
+    end
+    # Gets the reference for a name as referenced
+    # by .related[:link_to_ref_from_row]
+    def get_ref(name)
+      if not name.related[:link_to_ref_from_row].nil?
+        return @name_collection.ref_collection.object_from_row(name.related[:link_to_ref_from_row])
       end
+      nil
     end
     def tblTaxa
       @headers = %w{TaxonNameID TaxonNameStr RankID Name Parens AboveID RefID DataFlags AccessCode NameStatus StatusFlags OriginalGenusID LastUpdate ModifiedBy}
-      @csv_string = CSV.generate() do |csv|
-        csv << @headers
-        @name_collection.collection.each do |n|
-          ref = @by_author_reference_index[n.author_year_index]
-          cols = {
-            TaxonNameID: n.id,
-            TaxonNameStr: n.parent_ids_sf_style,        # closure -> ends with 1
-            RankID: SPECIES_FILE_RANKS[n.rank],
-            Name: n.name,
-            Parens: (n.parens ? 1 : 0),
-            AboveID: (n.related_name.nil? ? (n.parent ? n.parent.id : 0) : n.related_name.id),   # !! SF folks like to pre-populate with zeros
-            RefID: (ref ? ref.id : 0),
-            DataFlags: 0,                                # see http://software.speciesfile.org/Design/TaxaTables.aspx#Taxon, a flag populated when data is reviewed, initialize to zero
-            AccessCode: 0,
-            NameStatus: (n.related_name.nil? ? 0 : 7),                            # 0 :valid, 7: synonym)
-            StatusFlags: (n.related_name.nil? ? 0 : 262144),                      # 0 :valid, 262144: jr. synonym
-            OriginalGenusID: (!n.parens && n.parent_at_rank('genus') ? n.parent_at_rank('genus').id : 0),      # SF must be pre-configured with 0 filler (this restriction needs to go)
-            LastUpdate: @time,
-            ModifiedBy: @authorized_user_id,
-          }
-          csv <<  @headers.collect{|h| cols[h.to_sym]}
-        end
+      sql = []
+      @name_collection.collection.each do |n|
+        $DEBUG && $stderr.puts("#{n.name} is too long") if n.name.length > 30
+        ref = get_ref(n)
+        cols = {
+          TaxonNameID: n.id,
+          TaxonNameStr: n.parent_ids_sf_style,        # closure -> ends with 1
+          RankID: SPECIES_FILE_RANKS[n.rank],
+          Name: n.name,
+          Parens: (n.parens ? 1 : 0),
+          AboveID: (n.related_name.nil? ? (n.parent ? n.parent.id : 0) : n.related_name.id),   # !! SF folks like to pre-populate with zeros
+          RefID: (ref ? ref.id : 0),
+          DataFlags: 0,                                    # see http://software.speciesfile.org/Design/TaxaTables.aspx#Taxon, a flag populated when data is reviewed, initialize to zero
+          AccessCode: 0,
+          NameStatus: (n.related_name.nil? ? 0 : 7),                            # 0 :valid, 7: synonym)
+          StatusFlags: (n.related_name.nil? ? 0 : 262144),                      # 0 :valid, 262144: jr. synonym
+          OriginalGenusID: (!n.parens && n.parent_at_rank('genus') ? n.parent_at_rank('genus').id : 0),      # SF must be pre-configured with 0 filler (this restriction needs to go)
+          LastUpdate: @time,
+          ModifiedBy: @authorized_user_id,
+        }
+        sql << sql_insert_statement('tblTaxa', cols)
       end
-     @csv_string
+      sql.join("\n")
     end
     # Generate a tblRefs string.
     def tblRefs
-      @headers = %w{RefID ActualYear Title PubID  Verbatim}
-      @csv_string = CSV.generate(:col_sep => "\t") do |csv|
-        csv << @headers
-        @name_collection.ref_collection.collection.each_with_index do |r,i|
-          cols = {
-            RefID: r.id, #  i + 1,
-            Title: (r.title.nil? ? """""" : r.title),
-            PubID: 0,                                   # Careful - assumes you have a pre-generated PubID of Zero in there, PubID table is not included in CSV imports
-            ActualYear: r.year,
-            Verbatim: r.full_citation
-          }
-          csv <<  @headers.collect{|h| cols[h.to_sym]}
-        end
+      sql = []
+      @headers = %w{RefID ActualYear Title PubID Verbatim}
+      @name_collection.ref_collection.collection.each_with_index do |r,i|
+        # Assumes the 0 "null" pub id is there
+        pub_id = @pub_collection[r.publication] ? @pub_collection[r.publication] : 0
+        cols = {
+          RefID: r.id,
+          ContainingRefID: 0,
+          Title: (r.title.nil? ? @empty_quotes : r.title),
+          PubID: pub_id,
+          Series: @empty_quotes,
+          Volume: (r.volume ? r.volume : @empty_quotes),
+          Issue:  (r.number ? r.number : @empty_quotes),
+          RefPages: r.page_string, # always a string
+          ActualYear: (r.year ? r.year : @empty_quotes),
+          StatedYear: @empty_quotes,
+          AccessCode: 0,
+          Flags: 0,
+          Note: @empty_quotes,
+          LastUpdate: @time,
+          LinkID: 0,
+          ModifiedBy: @authorized_user_id,
+          CiteDataStatus: 0,
+          Verbatim: (r.full_citation ? r.full_citation : @empty_quotes)
+        }
+        sql << sql_insert_statement('tblRefs', cols)
       end
-      @csv_string
+      sql.join("\n")
     end
-    # TODO make a standard transaction wrapper
-    def sqlRefs
-      sql = [ 'BEGIN TRY', 'BEGIN TRANSACTION']
-      @headers = %w{RefID ActualYear Title PubID  Verbatim}
-      @name_collection.ref_collection.collection.each_with_index do |r,i|
+    # Generate tblPubs SQL
+    def tblPubs
+      sql = []
+      @headers = %w{PubID PrefID PubType ShortName FullName Note LastUpdate ModifiedBy Publisher PlacePublished PubRegID Status StartYear EndYear BHL}
+      # Hackish should build this elsewhere, but degrades OK
+      pubs = @name_collection.ref_collection.collection.collect{|r| r.publication}.compact.uniq
+      pubs.each_with_index do |p, i|
         cols = {
-          RefID: r.id, #  i + 1,
-          Title: (r.title.nil? ? """""" : r.title),
-          PubID: 0,                                   # Careful - assumes you have a pre-generated PubID of Zero in there, PubID table is not included in CSV imports
-          ActualYear: r.year,
-          Verbatim: r.full_citation
+          PubID: i + 1,
+          PrefID: 0,
+          PubType: 1,
+          ShortName: "unknown_#{i}", # Unique constraint
+          FullName: p,
+          Note: @empty_quotes,
+          LastUpdate: @time,
+          ModifiedBy: @authorized_user_id,
+          Publisher: @empty_quotes,
+          PlacePublished: @empty_quotes,
+          PubRegID: 0,
+          Status: 0,
+          StartYear: 0,
+          EndYear: 0,
+          BHL: 0
         }
-        sql <<  "INSERT INTO tblRefs (#{@headers.sort.join(",")}) VALUES (#{@headers.sort.collect{|h| "'#{cols[h.to_sym].to_s.gsub(/'/,"''")}'"}.join(",")});"
+        @pub_collection.merge!(p => i + 1)
+        sql << sql_insert_statement('tblPubs', cols)
       end
-      sql << ['COMMIT', 'END TRY', 'BEGIN CATCH', 'ROLLBACK', 'END CATCH']
-      sql.join("\n")
+      sql.join("\n")
     end
     # Generate tblPeople string.
     def tblPeople
       @headers = %w{PersonID FamilyName GivenNames GivenInitials Suffix Role LastUpdate ModifiedBy}
-      @csv_string = CSV.generate() do |csv|
-        csv << @headers
-        @author_index.keys.each_with_index do |k,i|
-          a = @author_index[k]
-          # a.id = i + 1
-          cols = {
-            PersonID: a.id,
-            FamilyName: a.last_name,
-            GivenName: a.first_name,
-            GivenInitials: a.initials_string,
-            Suffix: a.suffix,
-            Role: 1,                          # authors
-            LastUpdate: @time,
-            ModifiedBy: @authorized_user_id
-          }
-          csv <<  @headers.collect{|h| cols[h.to_sym]}
-        end
+      sql = []
+      @author_index.keys.each_with_index do |k,i|
+        a = @author_index[k]
+        # a.id = i + 1
+        cols = {
+          PersonID: a.id,
+          FamilyName: (a.last_name.length > 0 ? a.last_name : "Unknown"),
+          GivenNames: a.first_name || @empty_quotes,
+          GivenInitials: a.initials_string || @empty_quotes,
+          Suffix: a.suffix || @empty_quotes,
+          Role: 1,                          # authors
+          LastUpdate: @time,
+          ModifiedBy: @authorized_user_id
+        }
+        sql << sql_insert_statement('tblPeople', cols)
       end
-      @csv_string
+      sql.join("\n")
     end
     # Generate tblRefAuthors string.
     def tblRefAuthors
       @headers = %w{RefID PersonID SeqNum AuthorCount LastUpdate ModifiedBy}
-      @csv_string = CSV.generate() do |csv|
-        csv << @headers
-        @name_collection.ref_collection.collection.each do |r|
-          r.authors.each_with_index do |x, i|
-            a = @author_index[x.compact_string]
-            cols = {
-              RefID: r.id,
-              PersonID: a.id,
-              SeqNum: i + 1,
-              AuthorCount: r.authors.size,
-              LastUpdate: @time,
-              ModifiedBy: @authorized_user_id
-            }
-            csv <<  @headers.collect{|h| cols[h.to_sym]}
-          end
+      sql = []
+      @name_collection.ref_collection.collection.each do |r|
+        r.authors.each_with_index do |x, i|
+          a = @author_index[x.compact_string]
+          cols = {
+            RefID: r.id,
+            PersonID: a.id,
+            SeqNum: i + 1,
+            AuthorCount: r.authors.size,
+            LastUpdate: @time,
+            ModifiedBy: @authorized_user_id
+          }
+          sql << sql_insert_statement('tblRefAuthors', cols)
         end
       end
-      @csv_string
+      sql.join("\n")
     end
     # Generate tblCites string.
     def tblCites
       @headers = %w{TaxonNameID SeqNum RefID NomenclatorID LastUpdate ModifiedBy NewNameStatus CitePages Note TypeClarification CurrentConcept ConceptChange InfoFlags InfoFlagStatus PolynomialStatus}
-      @csv_string = CSV.generate() do |csv|
-        csv << @headers
-        @name_collection.collection.each do |n|
-          ref = @by_author_reference_index[n.author_year_index]
-          next if ref.nil?
-          cols = {
-            TaxonNameID: n.id,
-            SeqNum: 1,
-            RefID: ref.id,
-            NomenclatorID: @nomenclator[n.nomenclator_name],
-            LastUpdate: @time,
-            ModifiedBy: @authorized_user_id,
-            CitePages: """""",        # equates to "" in CSV speak
-            NewNameStatus: 0,
-            Note: """""",
-            TypeClarification: 0,     # We might derive more data from this
-            CurrentConcept: 1,        # Boolean, right?
-            ConceptChange: 0,         # Unspecified
-            InfoFlags: 0,             #
-            InfoFlagStatus: 1,        # 1 => needs review
-            PolynomialStatus: 0
-          }
-          csv <<  @headers.collect{|h| cols[h.to_sym]}
-        end
+      sql = []
+      @name_collection.collection.each do |n|
+        next if @nomenclator[n.nomenclator_name].nil? # Only create nomenclator records if they are original citations, otherwise not !! Might need updating in future imports
+        ref = get_ref(n)
+        # ref = @by_author_reference_index[n.author_year_index]
+        next if ref.nil?
+        cols = {
+          TaxonNameID:       n.id,
+          SeqNum:            1,
+          RefID:             ref.id,
+          NomenclatorID:     @nomenclator[n.nomenclator_name],
+          LastUpdate:        @time,
+          ModifiedBy:        @authorized_user_id,
+          CitePages:         @empty_quotes,        # equates to "" in CSV speak
+          NewNameStatus:     0,
+          Note:              @empty_quotes,
+          TypeClarification: 0,     # We might derive more data from this
+          CurrentConcept:    1,        # Boolean, right?
+          ConceptChange:     0,         # Unspecified
+          InfoFlags:         0,             #
+          InfoFlagStatus:    1,        # 1 => needs review
+          PolynomialStatus:  0
+        }
+        sql << sql_insert_statement('tblCites', cols)
       end
-      @csv_string
+      sql.join("\n")
     end
     def tblGenusNames
-      @csv_string = csv_for_genus_and_species_names_tables('Genus')
-      @csv_string
+      # TODO: SF tests catch unused names based on some names not being included in Nomenclator data.  We could optimize so that the workaround is removed.
+      # I.e., all the names get added here, not all the names get added to Nomenclator/Cites because of citations which are not original combinations
+      sql = sql_for_genus_and_species_names_tables('Genus')
+      sql
     end
     def tblSpeciesNames
-      @csv_string = csv_for_genus_and_species_names_tables('Species')
-      @csv_string
+      # TODO: SF tests catch unused names based on some names not being included in Nomenclator data.  We could optimize so that the workaround is removed.
+      # I.e., all the names get added here, not all the names get added to Nomenclator/Cites because of citations which are not original combinations
+      sql = sql_for_genus_and_species_names_tables('Species')
+      sql
     end
-    def csv_for_genus_and_species_names_tables(type)
+    def sql_for_genus_and_species_names_tables(type)
+      sql = []
       col = "#{type}NameID"
       @headers = [col, "Name", "LastUpdate", "ModifiedBy", "Italicize"]
-      @csv_string = CSV.generate() do |csv|
-        csv << @headers
-        var = self.send("#{type.downcase}_names")
-        var.keys.each_with_index do |n,i|
-          var[n] = i + 1
-          cols = {
-            col.to_sym => i + 1,
-            Name: n,
-            LastUpdate: @time,
-            ModifiedBy: @authorized_user_id,
-            Italicize: 1                              # always true for these data
-          }
-          csv <<  @headers.collect{|h| cols[h.to_sym]}
-        end
+      var = self.send("#{type.downcase}_names")
+      var.keys.each_with_index do |n,i|
+        var[n] = i + 1
+        cols = {
+          col.to_sym => i + 1,
+          Name: n,
+          LastUpdate: @time,
+          ModifiedBy: @authorized_user_id,
+          Italicize: 1                              # always true for these data
+        }
+        sql << sql_insert_statement("tbl#{type}Names", cols)
       end
-      @csv_string
+      sql.join("\n")
     end
-    # must be called post tblGenusNames and tblSpeciesNames
+    # Must be called post tblGenusNames and tblSpeciesNames.
+    # Some records are not used but can be cleaned by SF
     def tblNomenclator
       @headers = %w{NomenclatorID GenusNameID SubgenusNameID SpeciesNameID SubspeciesNameID LastUpdate ModifiedBy SuitableForGenus SuitableForSpecies InfrasubspeciesNameID InfrasubKind}
-      @csv_string = CSV.generate() do |csv|
-        csv << @headers
-        i = 1
-        @name_collection.collection.each do |n|
-          next if Taxonifi::RANKS.index(n.rank) < Taxonifi::RANKS.index('genus')
-          cols = {
-            NomenclatorID: i,
-            GenusNameID: @genus_names[n.parent_name_at_rank('genus')] || 0,
-            SubgenusNameID: @genus_names[n.parent_name_at_rank('subgenus')] || 0,
-            SpeciesNameID: @species_names[n.parent_name_at_rank('species')] || 0,
-            SubspeciesNameID: @species_names[n.parent_name_at_rank('subspecies')] || 0,
-            InfrasubspeciesNameID: 0,
-            InfrasubKind: 0,                          # this might be wrong
-            LastUpdate: @time,
-            ModifiedBy: @authorized_user_id,
-            SuitableForGenus: 0,                      # Set in SF
-            SuitableForSpecies: 0                     # Set in SF
-          }
-          @nomenclator.merge!(n.nomenclator_name => i)
-          i += 1
-          csv <<  @headers.collect{|h| cols[h.to_sym]}
-        end
+      sql = []
+      i = 1
+      @name_collection.collection.each do |n|
+        gid, sgid = 0,0
+        sid = @species_names[n.parent_name_at_rank('species')] || 0
+        ssid = @species_names[n.parent_name_at_rank('subspecies')] || 0
+        if n.parens == false
+          gid = @genus_names[n.parent_name_at_rank('genus')] || 0
+          sgid = @genus_names[n.parent_name_at_rank('subgenus')] || 0
+        end
+        next if Taxonifi::RANKS.index(n.rank) < Taxonifi::RANKS.index('subtribe')
+        ref = get_ref(n)
+        # debugger
+        # ref = @by_author_reference_index[n.author_year_index]
+        next if ref.nil?
+        cols = {
+          NomenclatorID: i,
+          GenusNameID: gid,
+          SubgenusNameID: sgid,
+          SpeciesNameID: sid,
+          SubspeciesNameID: ssid,
+          InfrasubspeciesNameID: 0,
+          InfrasubKind: 0,                          # this might be wrong
+          LastUpdate: @time,
+          ModifiedBy: @authorized_user_id,
+          SuitableForGenus: 0,                      # Set in SF
+          SuitableForSpecies: 0                     # Set in SF
+        }
+        @nomenclator.merge!(n.nomenclator_name => i)
+        i += 1
+        sql << sql_insert_statement('tblNomenclator', cols)
+      end
+      # TODO: DRY this up with above?!
+      @name_collection.combinations.each do |c|
+        gid, sgid = 0,0
+        sid = (c[2].nil? ? 0 : @species_names[c[2].name])
+        ssid = (c[3].nil? ? 0 : @species_names[c[3].name])
+        if c.compact.last.parens == false
+          gid = (c[0].nil? ? 0 : @genus_names[c[0].name])
+          sgid = (c[1].nil? ? 0 : @genus_names[c[1].name])
+        end
+        # ref = @by_author_reference_index[c.compact.last.author_year_index]
+        ref =  @name_collection.ref_collection.object_from_row(c.compact.last.related[:link_to_ref_from_row])
+        next if ref.nil?
+        cols = {
+          NomenclatorID: i,
+          GenusNameID: gid ,
+          SubgenusNameID: sgid ,
+          SpeciesNameID: sid ,
+          SubspeciesNameID: ssid ,
+          InfrasubspeciesNameID: 0,
+          InfrasubKind: 0,                          # this might be wrong
+          LastUpdate: @time,
+          ModifiedBy: @authorized_user_id,
+          SuitableForGenus: 0,                      # Set in SF
+          SuitableForSpecies: 0                     # Set in SF
+        }
+        # check!?
+        @nomenclator.merge!(c.compact.last.nomenclator_name => i)
+        sql << sql_insert_statement('tblNomenclator', cols)
+        i += 1
       end
-      @csv_string
+      sql.join("\n")
     end
-  end
-end
+  end # End class
+end # End module