RubyGems - dwca_hunter - Versions diffs - 0.5.5 → 0.7.0 - Mend

dwca_hunter 0.5.5 → 0.7.0

Files changed (32) hide show

checksums.yaml +4 -4
data/.byebug_history +37 -0
data/.gitignore +5 -0
data/.rubocop.yml +3 -2
data/.ruby-version +1 -1
data/Gemfile.lock +50 -77
data/LICENSE.txt +1 -1
data/README.md +1 -1
data/dwca_hunter.gemspec +7 -8
data/exe/dwcahunter +1 -3
data/lib/dwca_hunter.rb +31 -0
data/lib/dwca_hunter/resources/aos-birds.rb +143 -0
data/lib/dwca_hunter/resources/arctos.rb +93 -91
data/lib/dwca_hunter/resources/clements.rb +151 -0
data/lib/dwca_hunter/resources/freebase.rb +51 -49
data/lib/dwca_hunter/resources/how-moore-birds.rb +168 -0
data/lib/dwca_hunter/resources/ioc_word_bird.rb +200 -0
data/lib/dwca_hunter/resources/ipni.rb +3 -2
data/lib/dwca_hunter/resources/itis.rb +99 -99
data/lib/dwca_hunter/resources/mammal_divdb.rb +155 -0
data/lib/dwca_hunter/resources/mammal_species.rb +3 -3
data/lib/dwca_hunter/resources/mcz.rb +123 -0
data/lib/dwca_hunter/resources/ncbi.rb +22 -23
data/lib/dwca_hunter/resources/opentree.rb +5 -5
data/lib/dwca_hunter/resources/paleobiodb.rb +193 -0
data/lib/dwca_hunter/resources/paleodb_harvester.rb +140 -0
data/lib/dwca_hunter/resources/sherborn.rb +91 -0
data/lib/dwca_hunter/resources/wikispecies.rb +142 -127
data/lib/dwca_hunter/version.rb +1 -1
metadata +27 -34
data/ipni.csv.gz +0 -0
data/ipniWebName.csv.xz?dl=1 +0 -0

data/lib/dwca_hunter/resources/how-moore-birds.rb ADDED

@@ -0,0 +1,168 @@
+# frozen_string_literal: true
+module DwcaHunter
+  class ResourceHowardMoore < DwcaHunter::Resource
+    def initialize(opts = {})
+      @command = "how-moore-birds"
+      @title = "Howard and Moore Complete Checklist of the Birds of the World"
+      @url = "https://uofi.box.com/shared/static/m71m541dr5unc41xzg4y51d92b7wiy2k.csv"
+      @UUID = "85023fe5-bf2a-486b-bdae-3e61cefd41fd"
+      @download_path = File.join(Dir.tmpdir,
+                                 "dwca_hunter",
+                                 "how-moore-birds",
+                                 "data.csv")
+      @synonyms = []
+      @names = []
+      @vernaculars = []
+      @extensions = []
+      @synonyms_hash = {}
+      @vernaculars_hash = {}
+      super(opts)
+    end
+    def download
+      puts "Downloading cached verion of the file."
+      puts "Check https://www.howardandmoore.org/howard-and-moore-database/"
+      puts "If there is a more recent edition"
+      `curl -s -L #{@url} -o #{@download_path}`
+    end
+    def unpack; end
+    def make_dwca
+      DwcaHunter.logger_write(object_id, "Extracting data")
+      get_names
+      generate_dwca
+    end
+    private
+    def get_names
+      Dir.chdir(@download_dir)
+      collect_names
+    end
+    def collect_names
+      file = CSV.open(File.join(@download_dir, "data.csv"),
+                      headers: true)
+      file.each_with_index do |row, i|
+        kingdom = "Animalia"
+        phylum = "Chordata"
+        klass = "Aves"
+        family = row["FAMILY_NAME"].capitalize
+        genus = row["GENERA_NAME"].capitalize
+        species = row["SPECIES_NAME"]
+        species_au =
+          "#{row['species_author']} #{row['species_rec_year']}".strip
+        subspecies = row["SUB_SPECIES_NAME"]
+        subspecies_au =
+          "#{row['subspecies_author']} #{row['subspecies_rec_year']}".strip
+        code = "ICZN"
+        taxon_id = "gn_#{i + 1}"
+        name_string = species
+        name_string = if subspecies.to_s == "" ||
+                          name_string.include?(subspecies)
+                        "#{name_string} #{species_au}".strip
+                      else
+                        "#{name_string} #{subspecies} #{subspecies_au}".strip
+                      end
+        @names << { taxon_id: taxon_id,
+                    name_string: name_string,
+                    kingdom: kingdom,
+                    phylum: phylum,
+                    klass: klass,
+                    family: family,
+                    genus: genus,
+                    code: code }
+        if row["species_english_name"].to_s != ""
+          @vernaculars << {
+            taxon_id: taxon_id,
+            vern: row["species_english_name"],
+            lang: "en"
+          }
+        end
+        if row["species_english_name2"].to_s != ""
+          @vernaculars << {
+            taxon_id: taxon_id,
+            vern: row["species_english_name2"],
+            lang: "en"
+          }
+        end
+        puts "Processed %s names" % i if i % 10_000 == 0
+      end
+    end
+    def update_vernacular(taxon_id, canonical)
+      return unless @vernaculars_hash.key?(canonical)
+      @vernaculars_hash[canonical].each do |vern|
+        @vernaculars << { taxon_id: taxon_id, vern: vern }
+      end
+    end
+    def update_synonym(taxon_id, canonical)
+      return unless @synonyms_hash.key?(canonical)
+      @synonyms_hash[canonical].each do |syn|
+        @synonyms << { taxon_id: taxon_id, name_string: syn[:name_string],
+                       status: syn[:status] }
+      end
+    end
+    def generate_dwca
+      DwcaHunter.logger_write(object_id,
+                              "Creating DarwinCore Archive file")
+      @core = [["http://rs.tdwg.org/dwc/terms/taxonID",
+                "http://rs.tdwg.org/dwc/terms/scientificName",
+                "http://rs.tdwg.org/dwc/terms/kingdom",
+                "http://rs.tdwg.org/dwc/terms/phylum",
+                "http://rs.tdwg.org/dwc/terms/class",
+                "http://rs.tdwg.org/dwc/terms/family",
+                "http://rs.tdwg.org/dwc/terms/genus",
+                "http://rs.tdwg.org/dwc/terms/nomenclaturalCode"]]
+      @names.each do |n|
+        @core << [n[:taxon_id], n[:name_string],
+                  n[:kingdom], n[:phylum], n[:klass], n[:family],
+                  n[:genus], n[:code]]
+      end
+      @extensions << {
+        data: [[
+          "http://rs.tdwg.org/dwc/terms/taxonID",
+          "http://rs.tdwg.org/dwc/terms/vernacularName",
+          "http://purl.org/dc/terms/language"
+        ]],
+        file_name: "vernacular_names.txt",
+        row_type: "http://rs.gbif.org/terms/1.0/VernacularName"
+      }
+      @vernaculars.each do |v|
+        @extensions[-1][:data] << [v[:taxon_id], v[:vern], v[:lang]]
+      end
+      @eml = {
+        id: @uuid,
+        title: @title,
+        authors: [
+          {
+            last_name: "Christidis"
+          }
+        ],
+        metadata_providers: [
+          { first_name: "Dmitry",
+            last_name: "Mozzherin",
+            email: "dmozzherin@gmail.com" }
+        ],
+        abstract: "Christidis et al. 2018. The Howard and Moore Complete " \
+        "Checklist of the Birds of the World, version 4.1 " \
+        "(Downloadable checklist). " \
+        "Accessed from https://www.howardandmoore.org.",
+        url: @url
+      }
+      super
+    end
+  end
+end

data/lib/dwca_hunter/resources/ioc_word_bird.rb ADDED

@@ -0,0 +1,200 @@
+# frozen_string_literal: true
+module DwcaHunter
+  class ResourceIOCWorldBird < DwcaHunter::Resource
+    def initialize(opts = {})
+      @command = "ioc-world-bird"
+      @title = "IOC World Bird List"
+      @url = "https://uofi.box.com/shared/static/fbpuk5ghh9083nbzjdeyqtoqsvdnro01.csv"
+      @UUID = "6421ffec-38e3-40fb-a6d9-af27238a47a1"
+      @download_path = File.join(Dir.tmpdir,
+                                 "dwca_hunter",
+                                 "ioc-bird",
+                                 "data.csv")
+      @synonyms = []
+      @names = []
+      @vernaculars = []
+      @extensions = []
+      @synonyms_hash = {}
+      @vernaculars_hash = {}
+      super(opts)
+    end
+    def download
+      puts "Downloading cached and converted to csv version."
+      puts "CHECK FOR NEW VERSION at"
+      puts "https://www.worldbirdnames.org/ioc-lists/master-list-2/"
+      puts "Use libreoffice to convert to csv."
+      `curl -s -L #{@url} -o #{@download_path}`
+    end
+    def unpack; end
+    def make_dwca
+      DwcaHunter.logger_write(object_id, "Extracting data")
+      get_names
+      generate_dwca
+    end
+    private
+    def get_names
+      Dir.chdir(@download_dir)
+      collect_names
+    end
+    def collect_names
+      @names_index = {}
+      file = CSV.open(File.join(@download_dir, "data.csv"),
+                      headers: true)
+      order = ""
+      family = ""
+      genus = ""
+      species = ""
+      count = 0
+      file.each do |row|
+        order1 = row["Order"]
+        order = order1.capitalize if order1.to_s != ""
+        family1 = row["Family (Scientific)"]
+        family = family1.capitalize if family1.to_s != ""
+        genus1 = row["Genus"]
+        genus = genus1.capitalize if genus1.to_s != ""
+        species1 = row["Species (Scientific)"]
+        species = species1 if species1.to_s != ""
+        subspecies = row["Subspecies"]
+        next if species.to_s == ""
+        count += 1
+        taxon_id = "gn_#{count}"
+        name = {
+          taxon_id: taxon_id,
+          kingdom: "Animalia",
+          phylum: "Chordata",
+          klass: "Aves",
+          order: order,
+          family: family,
+          genus: genus,
+          code: "ICZN"
+        }
+        if subspecies.to_s == ""
+          auth = row["Authority"].to_s
+          auth = DwcaHunter.normalize_authors(auth) if auth != ""
+          name[:name_string] = clean(
+            "#{genus} #{species} #{auth}".
+            strip
+          )
+          @names << name
+          vernacular = row["Species (English)"]
+          if vernacular.to_s != ""
+            vernaclar = { taxon_id: taxon_id, vern: vernacular, lang: "en" }
+            @vernaculars << vernaclar
+          end
+          species = ""
+        else
+          name[:name_string] = clean(
+            "#{genus} #{species} #{subspecies} #{row['Authority']}".
+            strip
+          )
+          @names << name
+          species = ""
+          subspecies = ""
+        end
+      end
+    end
+    def clean(n)
+      n = n.gsub(/†/, "")
+      n.gsub(/\s+/, " ")
+    end
+    def generate_dwca
+      DwcaHunter.logger_write(object_id,
+                              "Creating DarwinCore Archive file")
+      @core = [["http://rs.tdwg.org/dwc/terms/taxonID",
+                "http://rs.tdwg.org/dwc/terms/scientificName",
+                "http://rs.tdwg.org/dwc/terms/kingdom",
+                "http://rs.tdwg.org/dwc/terms/phylum",
+                "http://rs.tdwg.org/dwc/terms/class",
+                "http://rs.tdwg.org/dwc/terms/order",
+                "http://rs.tdwg.org/dwc/terms/family",
+                "http://rs.tdwg.org/dwc/terms/genus",
+                "http://rs.tdwg.org/dwc/terms/nomenclaturalCode"]]
+      @names.each do |n|
+        @core << [n[:taxon_id], n[:name_string],
+                  n[:kingdom], n[:phylum], n[:klass], n[:order], n[:family],
+                  n[:genus], n[:code]]
+      end
+      @extensions << {
+        data: [[
+          "http://rs.tdwg.org/dwc/terms/taxonID",
+          "http://rs.tdwg.org/dwc/terms/vernacularName",
+          "http://purl.org/dc/terms/language"
+        ]],
+        file_name: "vernacular_names.txt",
+        row_type: "http://rs.gbif.org/terms/1.0/VernacularName"
+      }
+      @vernaculars.each do |v|
+        @extensions[-1][:data] << [v[:taxon_id], v[:vern], v[:lang]]
+      end
+      @eml = {
+        id: @uuid,
+        title: @title,
+        authors: [
+          { first_name: "Per",
+            last_name: "Alstrom" },
+          { first_name: "Mike",
+            last_name: "Blair" },
+          { first_name: "Rauri",
+            last_name: "Bowie" },
+          { first_name: "Nigel",
+            last_name: "Redman" },
+          { first_name: "Jon",
+            last_name: "Fjeldsa" },
+          { first_name: "Phil",
+            last_name: "Gregory" },
+          { first_name: "Leo",
+            last_name: "Joseph" },
+          { first_name: "Peter",
+            last_name: "Kovalik" },
+          { first_name: "Adolfo",
+            last_name: "Navarro-Siguenza" },
+          { first_name: "David",
+            last_name: "Parkin" },
+          { first_name: "Alan",
+            last_name: "Peterson" },
+          { first_name: "Douglas",
+            last_name: "Pratt" },
+          { first_name: "Pam",
+            last_name: "Rasmussen" },
+          { first_name: "Frank",
+            last_name: "Rheindt" },
+          { first_name: "Robert",
+            last_name: "Ridgely" },
+          { first_name: "Peter",
+            last_name: "Ryan" },
+          { first_name: "George",
+            last_name: "Sangster" },
+          { first_name: "Dick",
+            last_name: "Schodde" },
+          { first_name: "Minturn",
+            last_name: "Wright" }
+        ],
+        metadata_providers: [
+          { first_name: "Dmitry",
+            last_name: "Mozzherin",
+            email: "dmozzherin@gmail.com" }
+        ],
+        abstract: "The IOC World Bird List is an open access resource of " \
+                  "the international community of ornithologists.",
+        url: "https://www.worldbirdnames.org"
+      }
+      super
+    end
+  end
+end

data/lib/dwca_hunter/resources/ipni.rb CHANGED

@@ -8,7 +8,7 @@ module DwcaHunter
       @command = "ipni"
       @title = "The International Plant Names Index"
       @abbr = "IPNI"
-      @url = "https://www.dropbox.com/s/1n0sn80vkdir5nu/ipniWebName.csv.xz"
+      @url = "https://uofi.box.com/shared/static/s0x4xjonxt54pi89n543gdmttrdqd6iv.xz"
       @uuid = "6b3905ce-5025-49f3-9697-ddd5bdfb4ff0"
       @download_path = File.join(Dir.tmpdir, "dwca_hunter", "ipni",
                                  "ipni.csv.xz")
@@ -22,8 +22,9 @@ module DwcaHunter
     end
     def download
-      puts "Downloading cached verion of the file. Get daily updated one from"
+      puts "Download by hand from"
       puts "https://storage.cloud.google.com/ipni-data/ipniWebName.csv.xz"
+      puts "and copy to given url"
         `curl -s -L #{@url} -o #{@download_path}`
     end

data/lib/dwca_hunter/resources/itis.rb CHANGED

@@ -1,15 +1,16 @@
-# encoding: utf-8
+# frozen_string_literal: true
 module DwcaHunter
   class ResourceITIS < DwcaHunter::Resource
     def initialize(opts = {})
-      @command = 'itis'
-      @title = 'ITIS'
-      @url = 'https://www.itis.gov/downloads/itisMySQLTables.tar.gz'
-      @uuid =  '5d066e84-e512-4a2f-875c-0a605d3d9f35'
+      @command = "itis"
+      @title = "ITIS"
+      @url = "https://www.itis.gov/downloads/itisMySQLTables.tar.gz"
+      @uuid = "5d066e84-e512-4a2f-875c-0a605d3d9f35"
       @download_path = File.join(Dir.tmpdir,
-                                 'dwca_hunter',
-                                 'itis',
-                                 'data.tar.gz')
+                                 "dwca_hunter",
+                                 "itis",
+                                 "data.tar.gz")
       @ranks = {}
       @kingdoms = {}
       @authors = {}
@@ -19,20 +20,20 @@ module DwcaHunter
       @names = {}
       @extensions = []
       super(opts)
-      @itis_dir = File.join(@download_dir, 'itis')
+      @itis_dir = File.join(@download_dir, "itis")
     end
     def unpack
       unpack_tar
-      dir = Dir.entries(@download_dir).select {|e| e.match(/itisMySQL/)}[0]
+      dir = Dir.entries(@download_dir).select { |e| e.match(/itisMySQL/) }[0]
       FileUtils.mv(File.join(@download_dir, dir), @itis_dir)
       # Create a file with the same name as the directory we extracted.
-      FileUtils.touch(File.join(@itis_dir, 'version_' + dir))
+      FileUtils.touch(File.join(@itis_dir, "version_" + dir))
     end
     def make_dwca
-      DwcaHunter::logger_write(self.object_id, 'Extracting data')
+      DwcaHunter.logger_write(object_id, "Extracting data")
       get_ranks
       get_kingdoms
       get_authors
@@ -42,7 +43,8 @@ module DwcaHunter
       generate_dwca
     end
-  private
+    private
     def get_ranks
       # 0    kingdom_id integer not null
       # 1    rank_id smallint not null
@@ -50,15 +52,15 @@ module DwcaHunter
       # 3    dir_parent_rank_id smallint not null
       # 4    req_parent_rank_id smallint not null
       # 5    update_date date not null
-      rank_file = File.join(@itis_dir, 'taxon_unit_types')
-      f = open(rank_file, 'r:utf-8')
+      rank_file = File.join(@itis_dir, "taxon_unit_types")
+      f = open(rank_file, "r:utf-8")
       f.each do |l|
-        l.encode!('UTF-8',
-                  'ISO-8859-1',
+        l.encode!("UTF-8",
+                  "ISO-8859-1",
                   invalid: :replace,
-                  replace: '?')
-        row = l.strip.split('|')
-        @ranks[row[0].strip + '/' + row[1].strip] = row[2].strip
+                  replace: "?")
+        row = l.strip.split("|")
+        @ranks[row[0].strip + "/" + row[1].strip] = row[2].strip
       end
     end
@@ -67,9 +69,9 @@ module DwcaHunter
       # 1    kingdom_name char(10) not null
       # 2    update_date date not null
-      f = open(File.join(@itis_dir, 'kingdoms'))
+      f = open(File.join(@itis_dir, "kingdoms"))
       f.each do |l|
-        data = l.strip.split('|')
+        data = l.strip.split("|")
         @kingdoms[data[0].strip] = data[1].strip
       end
     end
@@ -80,13 +82,13 @@ module DwcaHunter
       # 2    update_date date not null
       # 3    kingdom_id smallint not null
-      f = open(File.join(@itis_dir, 'taxon_authors_lkp'))
+      f = open(File.join(@itis_dir, "taxon_authors_lkp"))
       f.each do |l|
-        l.encode!('UTF-8',
-                  'ISO-8859-1',
+        l.encode!("UTF-8",
+                  "ISO-8859-1",
                   invalid: :replace,
-                  replace: '?')
-        data = l.strip.split('|')
+                  replace: "?")
+        data = l.strip.split("|")
         @authors[data[0].strip] = data[1].strip
       end
     end
@@ -100,22 +102,22 @@ module DwcaHunter
       # 5    primary key (tsn,vernacular_name,language)
       #      constraint "itis".vernaculars_key
-      f = open(File.join(@itis_dir, 'vernaculars'))
+      f = open(File.join(@itis_dir, "vernaculars"))
       f.each_with_index do |l, i|
         if i % BATCH_SIZE == 0
-          DwcaHunter::logger_write(self.object_id,
-                                   "Extracted %s vernacular names" % i)
+          DwcaHunter.logger_write(object_id,
+                                  "Extracted %s vernacular names" % i)
         end
-        l.encode!('UTF-8',
-                  'ISO-8859-1',
+        l.encode!("UTF-8",
+                  "ISO-8859-1",
                   invalid: :replace,
-                  replace: '?')
-        data = l.split('|').map { |d| d.strip }
+                  replace: "?")
+        data = l.split("|").map(&:strip)
         name_tsn = data[0]
         string   = data[1]
         language = data[2]
-        language = 'Common name' if language == 'unspecified'
-        @vernaculars[name_tsn] = { name:string, language:language }
+        language = "Common name" if language == "unspecified"
+        @vernaculars[name_tsn] = { name: string, language: language }
       end
     end
@@ -124,17 +126,17 @@ module DwcaHunter
       # 1    tsn_accepted integer not null
       # 2    update_date date not null
-      f = open(File.join(@itis_dir, 'synonym_links'))
+      f = open(File.join(@itis_dir, "synonym_links"))
       f.each_with_index do |l, i|
         if i % BATCH_SIZE == 0
-          DwcaHunter::logger_write(self.object_id,
-                                   "Extracted %s synonyms" % i)
+          DwcaHunter.logger_write(object_id,
+                                  "Extracted %s synonyms" % i)
         end
-        l.encode!('UTF-8',
-                  'ISO-8859-1',
+        l.encode!("UTF-8",
+                  "ISO-8859-1",
                   invalid: :replace,
-                  replace: '?')
-        data = l.split('|').map { |d| d.strip }
+                  replace: "?")
+        data = l.split("|").map(&:strip)
         synonym_name_tsn = data[0]
         accepted_name_tsn = data[1]
         @synonyms[synonym_name_tsn] = accepted_name_tsn
@@ -167,19 +169,19 @@ module DwcaHunter
       # 22   update_date date not null
       # 23   uncertain_prnt_ind char(3)
-      f = open(File.join(@itis_dir, 'taxonomic_units'))
+      f = open(File.join(@itis_dir, "taxonomic_units"))
       f.each_with_index do |l, i|
         if i % BATCH_SIZE == 0
-          DwcaHunter::logger_write(self.object_id,
-                                   "Extracted %s names" % i)
+          DwcaHunter.logger_write(object_id,
+                                  "Extracted %s names" % i)
         end
-        l.encode!('UTF-8',
-                  'ISO-8859-1',
+        l.encode!("UTF-8",
+                  "ISO-8859-1",
                   invalid: :replace,
-                  replace: '?')
-        data = l.split("|").map { |d| d.strip }
-        name_tsn   = data[0]
-        x1         = data[1]
+                  replace: "?")
+        data = l.split("|").map(&:strip)
+        name_tsn = data[0]
+        x1 = data[1]
         name_part1 = data[2]
         x2         = data[3]
         name_part2 = data[4]
@@ -193,16 +195,15 @@ module DwcaHunter
         kingdom_id = data[20]
         rank_id    = data[21]
-        parent_tsn = nil if parent_tsn == ''
+        parent_tsn = nil if parent_tsn == ""
         name = [x1, name_part1, x2, name_part2,
                 sp_marker1, name_part3, sp_marker2, name_part4]
         canonical_name = name.clone
         name << @authors[author_id] if @authors[author_id]
-        name = name.join(' ').strip.gsub(/\s+/, ' ')
-        canonical_name = canonical_name.join(' ').strip.gsub(/\s+/, ' ')
-        rank = @ranks[kingdom_id + '/' + rank_id] ?
-               @ranks[kingdom_id + '/' + rank_id] :
-               ''
+        name = name.join(" ").strip.gsub(/\s+/, " ")
+        canonical_name = canonical_name.join(" ").strip.gsub(/\s+/, " ")
+        rank = @ranks[kingdom_id + "/" + rank_id] ||
+               ""
         @names[name_tsn] = { name: name,
                              canonical_name: canonical_name,
                              status: status,
@@ -212,58 +213,57 @@ module DwcaHunter
     end
     def generate_dwca
-      DwcaHunter::logger_write(self.object_id,
-                               'Creating DarwinCore Archive file')
-      @core = [['http://rs.tdwg.org/dwc/terms/taxonID',
-                'http://rs.tdwg.org/dwc/terms/parentNameUsageID',
-                'http://rs.tdwg.org/dwc/terms/acceptedNameUsageID',
-                'http://rs.tdwg.org/dwc/terms/scientificName',
-                'http://rs.tdwg.org/ontology/voc/TaxonName#nameComplete',
-                'http://rs.tdwg.org/dwc/terms/taxonomicStatus',
-                'http://rs.tdwg.org/dwc/terms/taxonRank']]
-      @extensions << { data: [['http://rs.tdwg.org/dwc/terms/taxonID',
-                               'http://rs.tdwg.org/dwc/terms/vernacularName',
-                               'http://purl.org/dc/terms/language']],
-                       file_name: 'vernacular_names.txt',
-                       row_type: 'http://rs.gbif.org/terms/1.0/VernacularName'
-                     }
-      @names.keys.each_with_index do |k, i|
+      DwcaHunter.logger_write(object_id,
+                              "Creating DarwinCore Archive file")
+      @core = [["http://rs.tdwg.org/dwc/terms/taxonID",
+                "http://rs.tdwg.org/dwc/terms/parentNameUsageID",
+                "http://rs.tdwg.org/dwc/terms/acceptedNameUsageID",
+                "http://rs.tdwg.org/dwc/terms/scientificName",
+                "http://rs.tdwg.org/ontology/voc/TaxonName#nameComplete",
+                "http://rs.tdwg.org/dwc/terms/taxonomicStatus",
+                "http://rs.tdwg.org/dwc/terms/taxonRank"]]
+      @extensions << { data: [["http://rs.tdwg.org/dwc/terms/taxonID",
+                               "http://rs.tdwg.org/dwc/terms/vernacularName",
+                               "http://purl.org/dc/terms/language"]],
+                       file_name: "vernacular_names.txt",
+                       row_type: "http://rs.gbif.org/terms/1.0/VernacularName" }
+      @names.keys.each_with_index do |k, _i|
         d = @names[k]
-        accepted_id = @synonyms[k] ? @synonyms[k] : nil
+        accepted_id = @synonyms[k] || nil
         parent_id = d[:parent_tsn].to_i == 0 ? nil : d[:parent_tsn]
         row = [k, parent_id, accepted_id, d[:name], d[:canonical_name], d[:status], d[:rank]]
         @core << row
       end
-      @vernaculars.keys.each_with_index do |k, i|
+      @vernaculars.keys.each_with_index do |k, _i|
         d = @vernaculars[k]
         @extensions[0][:data] << [k, d[:name], d[:language]]
       end
       @eml = {
-          id: @uuid,
-          title: @title,
-          authors: [
-            {email: 'itiswebmaster@itis.gov'}
-          ],
-          metadata_providers: [
-            { first_name: 'Dmitry',
-              last_name: 'Mozzherin',
-              email: 'dmozzherin@gmail.com' }
-            ],
-          abstract: 'The White House Subcommittee on Biodiversity and ' +
-                    'Ecosystem Dynamics has identified systematics as a ' +
-                    'research priority that is fundamental to ecosystem ' +
-                    'management and biodiversity conservation. This primary ' +
-                    'need identified by the Subcommittee requires ' +
-                    'improvements in the organization of, and access to, ' +
-                    'standardized nomenclature. ITIS (originally referred ' +
-                    'to as the Interagency Taxonomic Information System) ' +
-                    'was designed to fulfill these requirements. In the ' +
-                    'future, the ITIS will provide taxonomic data and a ' +
-                    'directory of taxonomic expertise that will support ' +
-                    'the system',
-          url: 'http://www.itis.gov'
+        id: @uuid,
+        title: @title,
+        authors: [
+          { email: "itiswebmaster@itis.gov" }
+        ],
+        metadata_providers: [
+          { first_name: "Dmitry",
+            last_name: "Mozzherin",
+            email: "dmozzherin@gmail.com" }
+        ],
+        abstract: "The White House Subcommittee on Biodiversity and " \
+                    "Ecosystem Dynamics has identified systematics as a " \
+                    "research priority that is fundamental to ecosystem " \
+                    "management and biodiversity conservation. This primary " \
+                    "need identified by the Subcommittee requires " \
+                    "improvements in the organization of, and access to, " \
+                    "standardized nomenclature. ITIS (originally referred " \
+                    "to as the Interagency Taxonomic Information System) " \
+                    "was designed to fulfill these requirements. In the " \
+                    "future, the ITIS will provide taxonomic data and a " \
+                    "directory of taxonomic expertise that will support " \
+                    "the system",
+        url: "http://www.itis.gov"
       }
       super
     end