RubyGems - dwc-archive - Versions diffs - 0.9.10 → 0.9.11 - Mend

dwc-archive 0.9.10 → 0.9.11

Files changed (19)

checksums.yaml +4 -4
data/.travis.yml +1 -1
data/CHANGELOG +10 -8
data/README.md +8 -1
data/lib/dwc-archive.rb +1 -1
data/lib/dwc-archive/archive.rb +1 -1
data/lib/dwc-archive/classification_normalizer.rb +11 -12
data/lib/dwc-archive/core.rb +3 -1
data/lib/dwc-archive/expander.rb +1 -0
data/lib/dwc-archive/generator.rb +13 -12
data/lib/dwc-archive/generator_eml_xml.rb +68 -45
data/lib/dwc-archive/generator_meta_xml.rb +33 -20
data/lib/dwc-archive/version.rb +1 -1
data/lib/dwc-archive/xml_reader.rb +54 -38
data/spec/files/generator_eml.xml +47 -0
data/spec/files/generator_meta.xml +19 -0
data/spec/lib/generator_spec.rb +13 -4
metadata +6 -3
data/] +0 -40

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 8e8c929203d1b652f8ba345b0c4c39cfc87a0369
-  data.tar.gz: 739a064221bf52523990bfea38749f11b4d986c0
+  metadata.gz: 5c6c5b2a4de324abded5b3adb81d6bcd9603965f
+  data.tar.gz: ac00e15f95766838ff42a9bdc3f1a682c4a8e9ff
 SHA512:
-  metadata.gz: adfd46bea84e301ceca6de355f189b884bc6a9a22eb8d98e3976f17e3407d2de7f15963ec0d6f29958de057de9d579c81d8007d72c38fc1b9f9ada9295381152
-  data.tar.gz: 2e188f828d0bbe28baf5f1d8aa7aab12ca330000bf3f5ee145501d78961f9ca5e696be1171998a433952cf84546a8d5fd61c6cf45958576a7e0800fbf4542dae
+  metadata.gz: d84f2974ed7bcbabc62d2d3b5c5b15dd8d6d2aa38836a955c12896ada2391e978ca2d420d86bf59db2ab61cc801c9c43036be13699ba7b3902d8daa4f366d45b
+  data.tar.gz: a07a91365cba60fa418b85d7b516781c9209ea607dbe5ec45da86febd14bfa104cc16e4b55619a157f5bbb487dff2fd7e318399d815a63372197a9732b3820fb

data/.travis.yml CHANGED

@@ -1,5 +1,5 @@
 rvm:
-  - 1.9.3-p448
+  - 1.9.3-p484
   - 2.0.0-p353
 before_install:
   - sudo apt-get update

data/CHANGELOG CHANGED

@@ -1,15 +1,17 @@
-0.9.7 Refactoring and tests improvements
+0.9.11 Removed VERSION duplicate
-0.9.6 Added support for GNUB DwCA files
+0.9.7  Refactoring and tests improvements
-0.9.4 Gem dependencies updated, added travis support
+0.9.6  Added support for GNUB DwCA files
-0.9.0 Migrated code to ruby 1.9.3
+0.9.4  Gem dependencies updated, added travis support
-0.8.3 Updated outdated exception rasing
+0.9.0  Migrated code to ruby 1.9.3
-0.8.2 Removed species info from linnean classification path
+0.8.3  Updated outdated exception rasing
-0.8.1 Linnean classification path is now only for species and infraspecies with canonical forms. It ends with a canonical form of the taxon
+0.8.2  Removed species info from linnean classification path
-0.8.0 Added linnean classification path to normalized data from DwCA. It consists of data associated with clades like 'kingdom', 'order' etc.
+0.8.1  Linnean classification path is now only for species and infraspecies with canonical forms. It ends with a canonical form of the taxon
+0.8.0  Added linnean classification path to normalized data from DwCA. It consists of data associated with clades like 'kingdom', 'order' etc.

data/README.md CHANGED

@@ -175,7 +175,11 @@ Note on Patches/Pull Requests
 Copyright
 ---------
-Copyright (c) 2010-2013 Marine Biological Laboratory. See LICENSE for details.
+Author -- [Dmitry Mozzherin][13]
+Contributors -- [Matt Yoder][14]
+Copyright (c) 2010-2014 [Marine Biological Laboratory][15]. See LICENSE for details.
 [1]: https://badge.fury.io/rb/dwc-archive.png
 [2]: http://badge.fury.io/rb/dwc-archive
@@ -189,3 +193,6 @@ Copyright (c) 2010-2013 Marine Biological Laboratory. See LICENSE for details.
 [10]: https://gemnasium.com/GlobalNamesArchitecture/dwc-archive
 [11]: http://bit.ly/2IxcBA
 [12]: http://redis.io/topics/quickstart
+[13]: https://github.com/dimus
+[14]: https://github.com/mjy
+[15]: http://mbl.edu

data/lib/dwc-archive.rb CHANGED

@@ -8,6 +8,7 @@ require 'ostruct'
 require 'digest'
 require 'csv'
 require 'logger'
+require 'nokogiri'
 require_relative 'dwc-archive/xml_reader'
 require_relative 'dwc-archive/ingester'
 require_relative 'dwc-archive/errors'
@@ -24,7 +25,6 @@ require_relative 'dwc-archive/version'
 class DarwinCore
-  VERSION = DarwinCore::VERSION
   DEFAULT_TMP_DIR = "/tmp"
   attr_reader :archive, :core, :metadata, :extensions,

data/lib/dwc-archive/archive.rb CHANGED

@@ -1,7 +1,7 @@
-require 'nokogiri'
 class DarwinCore
   class Archive
     attr_reader :meta, :eml
     def initialize(archive_path, tmp_dir)
       @archive_path = archive_path
       @tmp_dir = tmp_dir

data/lib/dwc-archive/classification_normalizer.rb CHANGED

@@ -72,21 +72,11 @@ class DarwinCore
     end
     def name_strings(opts = {})
-      opts = { with_hash: false }.merge(opts)
-      if !!opts[:with_hash]
-        @name_strings
-      else
-        @name_strings.keys
-      end
+      process_strings(@name_strings, opts)
     end
     def vernacular_name_strings(opts = {})
-      opts = { with_hash: false }.merge(opts)
-      if !!opts[:with_hash]
-        @vernacular_name_strings
-      else
-        @vernacular_name_strings.keys
-      end
+      process_strings(@vernacular_name_strings, opts)
     end
     def normalize(opts = {})
@@ -110,6 +100,15 @@ class DarwinCore
   private
+    def process_strings(strings, opts)
+      opts = { with_hash: false }.merge(opts)
+      if !!opts[:with_hash]
+        strings
+      else
+        strings.keys
+      end
+    end
     def get_canonical_name(a_scientific_name)
       if @with_canonical_names
         canonical_name = @parser.parse(a_scientific_name,

data/lib/dwc-archive/core.rb CHANGED

@@ -2,6 +2,7 @@ class DarwinCore
   class Core
     include DarwinCore::Ingester
     attr_reader :id
     def initialize(dwc)
       @dwc = dwc
       @archive = @dwc.archive
@@ -9,9 +10,10 @@ class DarwinCore
       root_key = @archive.meta.keys[0]
       @data = @archive.meta[root_key][:core]
       raise DarwinCore::CoreFileError.
-        new("Cannot find core in meta.xml, is meta.xml valid?") unless @data
+        new('Cannot find core in meta.xml, is meta.xml valid?') unless @data
       @id = @data[:id][:attributes]
       get_attributes(DarwinCore::CoreFileError)
     end
   end
 end

data/lib/dwc-archive/expander.rb CHANGED

@@ -1,5 +1,6 @@
 class DarwinCore
   class Expander
     def initialize(archive_path, tmp_dir)
       @archive_path = archive_path
       @tmp_dir = tmp_dir

data/lib/dwc-archive/generator.rb CHANGED

@@ -21,12 +21,7 @@ class DarwinCore
     def add_core(data, file_name, keep_headers = true)
       c = CSV.open(File.join(@path,file_name), @write)
       header = data.shift
-      fields = header.map do |f|
-        f.strip!
-        err = 'No header in core data, or header fields are not urls'
-        raise DarwinCore::GeneratorError.new(err) unless f.match(/^http:\/\//)
-        f.split('/')[-1]
-      end
+      fields = get_fields(header, 'core')
       data.unshift(fields) if keep_headers
       ignore_header_lines = keep_headers ? 1 : 0
       @meta_xml_data[:core] = { fields: header,
@@ -41,12 +36,7 @@ class DarwinCore
                       row_type = 'http://rs.tdwg.org/dwc/terms/Taxon')
       c = CSV.open(File.join(@path,file_name), @write)
       header = data.shift
-      fields = header.map do |f|
-        f.strip!
-        err = 'No header in core data, or header fields are not urls'
-        raise DarwinCore::GeneratorError.new(err) unless f.match(/^http:\/\//)
-        f.split('/')[-1]
-      end
+      fields = get_fields(header, 'extension')
       data.unshift(fields) if keep_headers
       ignore_header_lines = keep_headers ? 1 : 0
       @meta_xml_data[:extensions] << { fields: header,
@@ -81,5 +71,16 @@ class DarwinCore
       a = "cd #{@path}; tar -zcf #{@dwc_path} *"
       system(a)
     end
+    private
+    def get_fields(header, file_type)
+      header.map do |f|
+        f.strip!
+        err = "No header in %s data, or header fields are not urls" % file_type
+        raise DarwinCore::GeneratorError.new(err) unless f.match(/^http:\/\//)
+        f.split('/')[-1]
+      end
+    end
   end
 end

data/lib/dwc-archive/generator_eml_xml.rb CHANGED

@@ -22,51 +22,9 @@ class DarwinCore
             :'xmlns:res' =>        'eml://ecoinformatics.org/resource-2.1.1',
             :'xmlns:dc' =>         'http://purl.org/dc/terms/',
             :'xmlns:xsi' =>        'http://www.w3.org/2001/XMLSchema-instance',
-            :'xsi:schemaLocation' => 'eml_uri')  do
-            xml.dataset(id: @data[:id]) do
-              xml.title(@data[:title])
-              xml.license(@data[:license])
-              contacts = []
-              @data[:authors].each_with_index do |a, i|
-                creator_id = i + 1
-                contacts << creator_id
-                xml.creator(id: creator_id, scope: 'document') do
-                  xml.individualName do
-                    xml.givenName(a[:first_name])
-                    xml.surName(a[:last_name])
-                  end
-                  xml.organizationName(a[:organization]) if a[:organization]
-                  xml.positionName(a[:position]) if a[:position]
-                  xml.onlineUrl(a[:url]) if a[:url]
-                  xml.electronicMailAddress(a[:email])
-                end
-              end
-              @data[:metadata_providers].each_with_index do |a, i|
-                xml.metadataProvider do
-                  xml.individualName do
-                    xml.givenName(a[:first_name])
-                    xml.surName(a[:last_name])
-                  end
-                  xml.organizationName(a[:organization]) if a[:organization]
-                  xml.positionName(a[:position]) if a[:position]
-                  xml.onlineUrl(a[:url]) if a[:url]
-                  xml.electronicMailAddress(a[:email])
-                end
-              end if @data[:metadata_providers]
-              xml.pubDate(Time.now.to_s)
-              xml.abstract() do
-                xml.para(@data[:abstract])
-              end
-              contacts.each do |contact|
-                xml.contact { xml.references(contact) }
-              end
-            end
-            xml.additionalMetadata do
-              xml.metadata do
-                xml.citation(@data[:citation])
-                xml.resourceLogoUrl(@data[:logo_url]) if @data[:logo_url]
-              end
-            end
+            :'xsi:schemaLocation' => 'eml_uri') do
+            build_dataset(xml)
+            build_additional_metadata(xml)
             xml.parent.namespace = xml.parent.namespace_definitions.first
           end
         end
@@ -77,6 +35,71 @@ class DarwinCore
       end
       private
+      def build_dataset(xml)
+        xml.dataset(id: @data[:id]) do
+          xml.title(@data[:title])
+          xml.license(@data[:license])
+          contacts = []
+          build_authors(xml, contacts)
+          build_metadata_providers(xml)
+          xml.pubDate(Time.now.to_s)
+          build_abstract(xml)
+          build_contacts(xml, contacts)
+        end
+      end
+      def build_abstract(xml)
+        xml.abstract() do
+          xml.para(@data[:abstract])
+        end
+      end
+      def build_contacts(xml, contacts)
+        contacts.each do |contact|
+          xml.contact { xml.references(contact) }
+        end
+      end
+      def build_metadata_providers(xml)
+        @data[:metadata_providers].each_with_index do |a, i|
+          xml.metadataProvider do
+            build_person(xml, a)
+          end
+        end if @data[:metadata_providers]
+      end
+      def build_authors(xml, contacts)
+        @data[:authors].each_with_index do |a, i|
+          creator_id = i + 1
+          contacts << creator_id
+          xml.creator(id: creator_id, scope: 'document') do
+            build_person(xml, a)
+          end
+        end
+      end
+      def build_additional_metadata(xml)
+        xml.additionalMetadata do
+          xml.metadata do
+            xml.citation(@data[:citation])
+            xml.resourceLogoUrl(@data[:logo_url]) if @data[:logo_url]
+          end
+        end
+      end
+      def build_person(xml, data)
+        a = data
+        xml.individualName do
+          xml.givenName(a[:first_name])
+          xml.surName(a[:last_name])
+        end
+        xml.organizationName(a[:organization]) if a[:organization]
+        xml.positionName(a[:position]) if a[:position]
+        xml.onlineUrl(a[:url]) if a[:url]
+        xml.electronicMailAddress(a[:email])
+      end
       def timestamp
         t = Time.now.getutc.to_a[0..5].reverse
         t[0..2].join('-') + '::' + t[-3..-1].join(':')

data/lib/dwc-archive/generator_meta_xml.rb CHANGED

@@ -16,26 +16,7 @@ class DarwinCore
                    fieldsEnclosedBy: '"',
                    linesTerminatedBy: "\n",
                    rowType: 'http://rs.tdwg.org/dwc/terms/Taxon' }
-          xml.archive(xmlns: 'http://rs.tdwg.org/dwc/text/',
-            :'xmlns:xsi' => 'http://www.w3.org/2001/XMLSchema-instance',
-            :'xsi:schemaLocation' => schema_uri) do
-            xml.core(opts.merge(ignoreHeaderLines:
-                                  @data[:core][:ignoreHeaderLines])) do
-              xml.files { xml.location(@data[:core][:location]) }
-              taxon_id, fields = find_taxon_id(@data[:core][:fields])
-              xml.id_(index: taxon_id[1])
-              fields.each { |f| xml.field(term: f[0], index: f[1]) }
-            end
-            @data[:extensions].each do |e|
-              xml.extension(opts.merge(ignoreHeaderLines: e[:ignoreHeaderLines],
-                                       rowType: e[:rowType])) do
-                xml.files { xml.location(e[:location]) }
-                taxon_id, fields = find_taxon_id(e[:fields])
-                xml.coreid(index: taxon_id[1])
-                fields.each { |f| xml.field(term: f[0], index: f[1]) }
-              end
-            end
-          end
+          build_archive(xml, opts, schema_uri)
         end
         meta_xml_data = builder.to_xml
         meta_file = open(File.join(@path, 'meta.xml'), @write)
@@ -44,6 +25,38 @@ class DarwinCore
       end
       private
+      def build_archive(xml, opts, schema_uri)
+        xml.archive(xmlns: 'http://rs.tdwg.org/dwc/text/',
+          :'xmlns:xsi' => 'http://www.w3.org/2001/XMLSchema-instance',
+          :'xsi:schemaLocation' => schema_uri) do
+          build_core(xml, opts)
+          build_extensions(xml, opts)
+        end
+      end
+      def build_core(xml, opts)
+        xml.core(opts.merge(ignoreHeaderLines:
+                              @data[:core][:ignoreHeaderLines])) do
+          xml.files { xml.location(@data[:core][:location]) }
+          taxon_id, fields = find_taxon_id(@data[:core][:fields])
+          xml.id_(index: taxon_id[1])
+          fields.each { |f| xml.field(term: f[0], index: f[1]) }
+        end
+      end
+      def build_extensions(xml, opts)
+        @data[:extensions].each do |e|
+          xml.extension(opts.merge(ignoreHeaderLines: e[:ignoreHeaderLines],
+                                   rowType: e[:rowType])) do
+            xml.files { xml.location(e[:location]) }
+            taxon_id, fields = find_taxon_id(e[:fields])
+            xml.coreid(index: taxon_id[1])
+            fields.each { |f| xml.field(term: f[0], index: f[1]) }
+          end
+        end
+      end
       def find_taxon_id(data)
         fields = []
         data.each_with_index { |f, i| fields << [f.strip, i] }

data/lib/dwc-archive/version.rb CHANGED

@@ -1,3 +1,3 @@
 class DarwinCore
-  VERSION = "0.9.10"
+  VERSION = "0.9.11"
 end

data/lib/dwc-archive/xml_reader.rb CHANGED

@@ -1,64 +1,80 @@
 # USAGE: Hash.from_xml:(YOUR_XML_STRING)
-require 'nokogiri'
 # modified from
 # http://stackoverflow.com/questions/1230741/
 # convert-a-nokogiri-document-to-a-ruby-hash/1231297#1231297
 class DarwinCore
   module XmlReader
     class << self
       def from_xml(xml_io)
         result = Nokogiri::XML(xml_io)
         return { result.root.name.to_sym => xml_node_to_hash(result.root)}
       end
       private
       def xml_node_to_hash(node)
         # If we are at the root of the document, start the hash
         if node.element?
-          result_hash = {}
-          if node.attributes != {}
-            result_hash[:attributes] = {}
-            node.attributes.keys.each do |key|
-              result_hash[:attributes][node.attributes[key].
-                name.to_sym] = prepare(node.attributes[key].value)
-            end
-          end
-          if node.children.size > 0
-            node.children.each do |child|
-              result = xml_node_to_hash(child)
-              if child.name == "text"
-                unless child.next_sibling || child.previous_sibling
-                  return prepare(result)
-                end
-              elsif result_hash[child.name.to_sym]
-                if result_hash[child.name.to_sym].is_a?(Object::Array)
-                  result_hash[child.name.to_sym] << prepare(result)
-                else
-                  result_hash[child.name.to_sym] =
-                    [result_hash[child.name.to_sym]] << prepare(result)
-                end
-              else
-                result_hash[child.name.to_sym] = prepare(result)
-              end
-            end
-            return result_hash
-          else
-            return result_hash
-          end
+          prepare_node_element(node)
         else
           return prepare(node.content.to_s)
         end
       end
+      def add_attributes(node, result_hash)
+        if node.attributes != {}
+          result_hash[:attributes] = {}
+          node.attributes.keys.each do |key|
+            result_hash[:attributes][node.attributes[key].name.to_sym] =
+              prepare(node.attributes[key].value)
+          end
+        end
+      end
+      def prepare_node_element(node)
+        result_hash = {}
+        add_attributes(node, result_hash)
+        if node.children.size > 0
+          result_hash = add_children(node, result_hash)
+        end
+        result_hash
+      end
+      def add_children(node, result_hash)
+        node.children.each do |child|
+          result = xml_node_to_hash(child)
+          if child.name == "text"
+            text = handle_text(child, result)
+            return text if text
+          elsif result_hash[child.name.to_sym]
+            handle_child_node(child, result_hash, result)
+          else
+            result_hash[child.name.to_sym] = prepare(result)
+          end
+        end
+        result_hash
+      end
+      def handle_child_node(child, result_hash, result)
+        if result_hash[child.name.to_sym].is_a?(Object::Array)
+          result_hash[child.name.to_sym] << prepare(result)
+        else
+          result_hash[child.name.to_sym] =
+            [result_hash[child.name.to_sym]] << prepare(result)
+        end
+      end
+      def handle_text(child, result)
+        unless child.next_sibling || child.previous_sibling
+          prepare(result)
+        end
+      end
       def prepare(data)
-        return data if data.class != String
-        return true if data.strip == "true"
-        return false if data.strip == "false"
-        data.to_i.to_s == data ? data.to_i : data
+        (data.class == String && data.to_i.to_s == data) ? data.to_i : data
       end
     end
   end
 end

data/spec/files/generator_eml.xml ADDED

@@ -0,0 +1,47 @@
+<?xml version="1.0"?>
+<eml:eml xmlns:eml="eml://ecoinformatics.org/eml-2.1.1" xmlns:md="eml://ecoinformatics.org/methods-2.1.1" xmlns:proj="eml://ecoinformatics.org/project-2.1.1" xmlns:d="eml://ecoinformatics.org/dataset-2.1.1" xmlns:res="eml://ecoinformatics.org/resource-2.1.1" xmlns:dc="http://purl.org/dc/terms/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" packageId="1234/2013-12-30::19:45:33" system="http://globalnames.org" xml:lang="en" xsi:schemaLocation="eml_uri">
+  <dataset id="1234">
+    <title>Test Classification</title>
+    <license>http://creativecommons.org/licenses/by-sa/3.0/</license>
+    <creator id="1" scope="document">
+      <individualName>
+        <givenName>John</givenName>
+        <surName>Doe</surName>
+      </individualName>
+      <organizationName>Example</organizationName>
+      <positionName>Assistant Professor</positionName>
+      <onlineUrl>http://example.org</onlineUrl>
+      <electronicMailAddress>jdoe@example.com</electronicMailAddress>
+    </creator>
+    <creator id="2" scope="document">
+      <individualName>
+        <givenName>Jane</givenName>
+        <surName>Doe</surName>
+      </individualName>
+      <electronicMailAddress>jane@example.com</electronicMailAddress>
+    </creator>
+    <metadataProvider>
+      <individualName>
+        <givenName>Jim</givenName>
+        <surName>Doe</surName>
+      </individualName>
+      <onlineUrl>http://aggregator.example.org</onlineUrl>
+      <electronicMailAddress>jimdoe@example.com</electronicMailAddress>
+    </metadataProvider>
+    <pubDate>2013-12-30 14:45:33 -0500</pubDate>
+    <abstract>
+      <para>test classification</para>
+    </abstract>
+    <contact>
+      <references>1</references>
+    </contact>
+    <contact>
+      <references>2</references>
+    </contact>
+  </dataset>
+  <additionalMetadata>
+    <metadata>
+      <citation>Test classification: Doe John, Doe Jane, Taxnonmy, 10, 1, 2010</citation>
+    </metadata>
+  </additionalMetadata>
+</eml:eml>

data/spec/files/generator_meta.xml ADDED

@@ -0,0 +1,19 @@
+<?xml version="1.0"?>
+<archive xmlns="http://rs.tdwg.org/dwc/text/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://rs.tdwg.org/dwc/terms/xsd/archive/ http://darwincore.googlecode.com/svn/trunk/text/tdwg_dwc_text.xsd">
+  <core encoding="UTF-8" fieldsTerminatedBy="," fieldsEnclosedBy="&quot;" linesTerminatedBy="&#10;" rowType="http://rs.tdwg.org/dwc/terms/Taxon" ignoreHeaderLines="1">
+    <files>
+      <location>core.csv</location>
+    </files>
+    <id index="0"/>
+    <field term="http://rs.tdwg.org/dwc/terms/parentNameUsageID" index="1"/>
+    <field term="http://rs.tdwg.org/dwc/terms/scientificName" index="2"/>
+    <field term="http://rs.tdwg.org/dwc/terms/taxonRank" index="3"/>
+  </core>
+  <extension encoding="UTF-8" fieldsTerminatedBy="," fieldsEnclosedBy="&quot;" linesTerminatedBy="&#10;" rowType="http://rs.gbif.org/terms/1.0/VernacularName" ignoreHeaderLines="1">
+    <files>
+      <location>vern.csv</location>
+    </files>
+    <coreid index="0"/>
+    <field term="http://rs.tdwg.org/dwc/terms/vernacularName" index="1"/>
+  </extension>
+</archive>

data/spec/lib/generator_spec.rb CHANGED

@@ -50,16 +50,25 @@ describe DarwinCore::Generator do
                         'http://rs.gbif.org/terms/1.0/VernacularName')
       gen.add_meta_xml
-      meta = File.read(File.join(gen.path, 'meta.xml'))
-      expect(meta).to match %r|<location>core.csv</location>|
+      meta = File.read(File.join(gen.path, 'meta.xml')).strip
+      meta_from_file= File.read(File.expand_path(
+        '../../files/generator_meta.xml',
+        __FILE__)).strip
+      expect(meta).to eq meta_from_file
     end
   end
   describe '#add_eml_data' do
     it 'adds eml data' do
       gen.add_eml_xml(EML_DATA)
-      eml = File.read(File.join(gen.path, 'eml.xml'))
-      expect(eml).to match /jdoe@example.com/
+      eml = File.read(File.join(gen.path, 'eml.xml')).strip
+      eml.gsub!(%r|(<pubDate>).*?(</pubDate>)|, '\12013-12-30 14:45:33 -0500\2')
+      eml.gsub!(/(packageId=").*?"/, '\11234/2013-12-30::19:45:33"')
+      eml_from_file = File.read(File.expand_path(
+        '../../files/generator_eml.xml',
+        __FILE__)).strip
+      expect(eml.strip).to eq eml_from_file.strip
     end
   end

metadata CHANGED

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: dwc-archive
 version: !ruby/object:Gem::Version
-  version: 0.9.10
+  version: 0.9.11
 platform: ruby
 authors:
 - Dmitry Mozzherin
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2013-12-27 00:00:00.000000000 Z
+date: 2014-01-21 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: nokogiri
@@ -171,7 +171,6 @@ files:
 - LICENSE
 - README.md
 - Rakefile
-- ']'
 - dwc-archive.gemspec
 - features/dwca-creator.feature
 - features/dwca-reader.feature
@@ -200,6 +199,8 @@ files:
 - spec/files/empty_coreid.tar.gz
 - spec/files/file with characters(3).gz
 - spec/files/flat_list.tar.gz
+- spec/files/generator_eml.xml
+- spec/files/generator_meta.xml
 - spec/files/gnub.tar.gz
 - spec/files/invalid.tar.gz
 - spec/files/junk_dir_inside.zip
@@ -263,6 +264,8 @@ test_files:
 - spec/files/empty_coreid.tar.gz
 - spec/files/file with characters(3).gz
 - spec/files/flat_list.tar.gz
+- spec/files/generator_eml.xml
+- spec/files/generator_meta.xml
 - spec/files/gnub.tar.gz
 - spec/files/invalid.tar.gz
 - spec/files/junk_dir_inside.zip

data/] DELETED

@@ -1,40 +0,0 @@
-require_relative '../spec_helper'
-describe DarwinCore::Core do
-  subject(:dwca) { DarwinCore.new(file_path) }
-  subject(:core) { DarwinCore::Core.new(dwca) }
-  let(:file_path) { File.join(File.expand_path('../../files', __FILE__),
-                             file_name) }
-  let(:file_name) { 'data.tar.gz' }
-  describe '.new' do
-    it 'creates new core' do
-      expect(core).to be_kind_of DarwinCore::Core
-    end
-  end
-  describe '#id' do
-    it 'returns core id' do
-      expect(core.id[:index]).to eq 0
-      expect(core.id[:term]).to eq 'http://rs.tdwg.org/dwc/terms/TaxonID'
-    end
-    context 'no coreid' do
-      let(:file_name) { 'empty_coreid.tar.gz' }
-      it 'does not return coreid' do
-        expect(core.id[:index]).to eq 0
-        expect(core.id[:term]).to be_nil
-      end
-    end
-  end
-  it 'reads core file from archive' do
-    core.read
-  end
-end