RubyGems - dwc-archive - Versions diffs - 0.9.10 → 0.9.11 - Mend

dwc-archive 0.9.10 → 0.9.11

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (19) hide show

checksums.yaml +4 -4
data/.travis.yml +1 -1
data/CHANGELOG +10 -8
data/README.md +8 -1
data/lib/dwc-archive.rb +1 -1
data/lib/dwc-archive/archive.rb +1 -1
data/lib/dwc-archive/classification_normalizer.rb +11 -12
data/lib/dwc-archive/core.rb +3 -1
data/lib/dwc-archive/expander.rb +1 -0
data/lib/dwc-archive/generator.rb +13 -12
data/lib/dwc-archive/generator_eml_xml.rb +68 -45
data/lib/dwc-archive/generator_meta_xml.rb +33 -20
data/lib/dwc-archive/version.rb +1 -1
data/lib/dwc-archive/xml_reader.rb +54 -38
data/spec/files/generator_eml.xml +47 -0
data/spec/files/generator_meta.xml +19 -0
data/spec/lib/generator_spec.rb +13 -4
metadata +6 -3
data/] +0 -40

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 8e8c929203d1b652f8ba345b0c4c39cfc87a0369
-  data.tar.gz: 739a064221bf52523990bfea38749f11b4d986c0
+  metadata.gz: 5c6c5b2a4de324abded5b3adb81d6bcd9603965f
+  data.tar.gz: ac00e15f95766838ff42a9bdc3f1a682c4a8e9ff
 SHA512:
-  metadata.gz: adfd46bea84e301ceca6de355f189b884bc6a9a22eb8d98e3976f17e3407d2de7f15963ec0d6f29958de057de9d579c81d8007d72c38fc1b9f9ada9295381152
-  data.tar.gz: 2e188f828d0bbe28baf5f1d8aa7aab12ca330000bf3f5ee145501d78961f9ca5e696be1171998a433952cf84546a8d5fd61c6cf45958576a7e0800fbf4542dae
+  metadata.gz: d84f2974ed7bcbabc62d2d3b5c5b15dd8d6d2aa38836a955c12896ada2391e978ca2d420d86bf59db2ab61cc801c9c43036be13699ba7b3902d8daa4f366d45b
+  data.tar.gz: a07a91365cba60fa418b85d7b516781c9209ea607dbe5ec45da86febd14bfa104cc16e4b55619a157f5bbb487dff2fd7e318399d815a63372197a9732b3820fb

data/.travis.yml CHANGED

@@ -1,5 +1,5 @@
 rvm:
-  - 1.9.3-p448
+  - 1.9.3-p484
   - 2.0.0-p353
 before_install:
   - sudo apt-get update

data/CHANGELOG CHANGED

@@ -1,15 +1,17 @@
-0.9.7 Refactoring and tests improvements
+0.9.11 Removed VERSION duplicate
-0.9.6 Added support for GNUB DwCA files
+0.9.7  Refactoring and tests improvements
-0.9.4 Gem dependencies updated, added travis support
+0.9.6  Added support for GNUB DwCA files
-0.9.0 Migrated code to ruby 1.9.3
+0.9.4  Gem dependencies updated, added travis support
-0.8.3 Updated outdated exception rasing
+0.9.0  Migrated code to ruby 1.9.3
-0.8.2 Removed species info from linnean classification path
+0.8.3  Updated outdated exception rasing
-0.8.1 Linnean classification path is now only for species and infraspecies with canonical forms. It ends with a canonical form of the taxon
+0.8.2  Removed species info from linnean classification path
-0.8.0 Added linnean classification path to normalized data from DwCA. It consists of data associated with clades like 'kingdom', 'order' etc.
+0.8.1  Linnean classification path is now only for species and infraspecies with canonical forms. It ends with a canonical form of the taxon
+0.8.0  Added linnean classification path to normalized data from DwCA. It consists of data associated with clades like 'kingdom', 'order' etc.

data/README.md CHANGED

@@ -175,7 +175,11 @@ Note on Patches/Pull Requests
 Copyright
 ---------
-Copyright (c) 2010-2013 Marine Biological Laboratory. See LICENSE for details.
+Author -- [Dmitry Mozzherin][13]
+Contributors -- [Matt Yoder][14]
+Copyright (c) 2010-2014 [Marine Biological Laboratory][15]. See LICENSE for details.
 [1]: https://badge.fury.io/rb/dwc-archive.png
 [2]: http://badge.fury.io/rb/dwc-archive
@@ -189,3 +193,6 @@ Copyright (c) 2010-2013 Marine Biological Laboratory. See LICENSE for details.
 [10]: https://gemnasium.com/GlobalNamesArchitecture/dwc-archive
 [11]: http://bit.ly/2IxcBA
 [12]: http://redis.io/topics/quickstart
+[13]: https://github.com/dimus
+[14]: https://github.com/mjy
+[15]: http://mbl.edu

data/lib/dwc-archive.rb CHANGED

@@ -8,6 +8,7 @@ require 'ostruct'
 require 'digest'
 require 'csv'
 require 'logger'
+require 'nokogiri'
 require_relative 'dwc-archive/xml_reader'
 require_relative 'dwc-archive/ingester'
 require_relative 'dwc-archive/errors'
@@ -24,7 +25,6 @@ require_relative 'dwc-archive/version'
 class DarwinCore
-  VERSION = DarwinCore::VERSION
   DEFAULT_TMP_DIR = "/tmp"
   attr_reader :archive, :core, :metadata, :extensions,

data/lib/dwc-archive/archive.rb CHANGED

@@ -1,7 +1,7 @@
-require 'nokogiri'
 class DarwinCore
   class Archive
     attr_reader :meta, :eml
     def initialize(archive_path, tmp_dir)
       @archive_path = archive_path
       @tmp_dir = tmp_dir

data/lib/dwc-archive/classification_normalizer.rb CHANGED

@@ -72,21 +72,11 @@ class DarwinCore
     end
     def name_strings(opts = {})
-      opts = { with_hash: false }.merge(opts)
-      if !!opts[:with_hash]
-        @name_strings
-      else
-        @name_strings.keys
-      end
+      process_strings(@name_strings, opts)
     end
     def vernacular_name_strings(opts = {})
-      opts = { with_hash: false }.merge(opts)
-      if !!opts[:with_hash]
-        @vernacular_name_strings
-      else
-        @vernacular_name_strings.keys
-      end
+      process_strings(@vernacular_name_strings, opts)
     end
     def normalize(opts = {})
@@ -110,6 +100,15 @@ class DarwinCore
   private
+    def process_strings(strings, opts)
+      opts = { with_hash: false }.merge(opts)
+      if !!opts[:with_hash]
+        strings
+      else
+        strings.keys
+      end
+    end
     def get_canonical_name(a_scientific_name)
       if @with_canonical_names
         canonical_name = @parser.parse(a_scientific_name,

data/lib/dwc-archive/core.rb CHANGED

@@ -2,6 +2,7 @@ class DarwinCore
   class Core
     include DarwinCore::Ingester
     attr_reader :id
     def initialize(dwc)
       @dwc = dwc
       @archive = @dwc.archive
@@ -9,9 +10,10 @@ class DarwinCore
       root_key = @archive.meta.keys[0]
       @data = @archive.meta[root_key][:core]
       raise DarwinCore::CoreFileError.
-        new("Cannot find core in meta.xml, is meta.xml valid?") unless @data
+        new('Cannot find core in meta.xml, is meta.xml valid?') unless @data
       @id = @data[:id][:attributes]
       get_attributes(DarwinCore::CoreFileError)
     end
   end
 end

data/lib/dwc-archive/expander.rb CHANGED

@@ -1,5 +1,6 @@
 class DarwinCore
   class Expander
     def initialize(archive_path, tmp_dir)
       @archive_path = archive_path
       @tmp_dir = tmp_dir

data/lib/dwc-archive/generator.rb CHANGED

@@ -21,12 +21,7 @@ class DarwinCore
     def add_core(data, file_name, keep_headers = true)
       c = CSV.open(File.join(@path,file_name), @write)
       header = data.shift
-      fields = header.map do |f|
-        f.strip!
-        err = 'No header in core data, or header fields are not urls'
-        raise DarwinCore::GeneratorError.new(err) unless f.match(/^http:\/\//)
-        f.split('/')[-1]
-      end
+      fields = get_fields(header, 'core')
       data.unshift(fields) if keep_headers
       ignore_header_lines = keep_headers ? 1 : 0
       @meta_xml_data[:core] = { fields: header,
@@ -41,12 +36,7 @@ class DarwinCore
                       row_type = 'http://rs.tdwg.org/dwc/terms/Taxon')
       c = CSV.open(File.join(@path,file_name), @write)
       header = data.shift
-      fields = header.map do |f|
-        f.strip!
-        err = 'No header in core data, or header fields are not urls'
-        raise DarwinCore::GeneratorError.new(err) unless f.match(/^http:\/\//)
-        f.split('/')[-1]
-      end
+      fields = get_fields(header, 'extension')
       data.unshift(fields) if keep_headers
       ignore_header_lines = keep_headers ? 1 : 0
       @meta_xml_data[:extensions] << { fields: header,
@@ -81,5 +71,16 @@ class DarwinCore
       a = "cd #{@path}; tar -zcf #{@dwc_path} *"
       system(a)
     end
+    private
+    def get_fields(header, file_type)
+      header.map do |f|
+        f.strip!
+        err = "No header in %s data, or header fields are not urls" % file_type
+        raise DarwinCore::GeneratorError.new(err) unless f.match(/^http:\/\//)
+        f.split('/')[-1]
+      end
+    end
   end
 end

data/lib/dwc-archive/generator_eml_xml.rb CHANGED

@@ -22,51 +22,9 @@ class DarwinCore
             :'xmlns:res' =>        'eml://ecoinformatics.org/resource-2.1.1',
             :'xmlns:dc' =>         'http://purl.org/dc/terms/',
             :'xmlns:xsi' =>        'http://www.w3.org/2001/XMLSchema-instance',
-            :'xsi:schemaLocation' => 'eml_uri')  do
-            xml.dataset(id: @data[:id]) do
-              xml.title(@data[:title])
-              xml.license(@data[:license])
-              contacts = []
-              @data[:authors].each_with_index do |a, i|
-                creator_id = i + 1
-                contacts << creator_id
-                xml.creator(id: creator_id, scope: 'document') do
-                  xml.individualName do
-                    xml.givenName(a[:first_name])
-                    xml.surName(a[:last_name])
-                  end
-                  xml.organizationName(a[:organization]) if a[:organization]
-                  xml.positionName(a[:position]) if a[:position]
-                  xml.onlineUrl(a[:url]) if a[:url]
-                  xml.electronicMailAddress(a[:email])
-                end
-              end
-              @data[:metadata_providers].each_with_index do |a, i|
-                xml.metadataProvider do
-                  xml.individualName do
-                    xml.givenName(a[:first_name])
-                    xml.surName(a[:last_name])
-                  end
-                  xml.organizationName(a[:organization]) if a[:organization]
-                  xml.positionName(a[:position]) if a[:position]
-                  xml.onlineUrl(a[:url]) if a[:url]
-                  xml.electronicMailAddress(a[:email])
-                end
-              end if @data[:metadata_providers]
-              xml.pubDate(Time.now.to_s)
-              xml.abstract() do
-                xml.para(@data[:abstract])
-              end
-              contacts.each do |contact|
-                xml.contact { xml.references(contact) }
-              end
-            end
-            xml.additionalMetadata do
-              xml.metadata do
-                xml.citation(@data[:citation])
-                xml.resourceLogoUrl(@data[:logo_url]) if @data[:logo_url]
-              end
-            end
+            :'xsi:schemaLocation' => 'eml_uri') do
+            build_dataset(xml)
+            build_additional_metadata(xml)
             xml.parent.namespace = xml.parent.namespace_definitions.first
           end
         end
@@ -77,6 +35,71 @@ class DarwinCore
       end
       private
+      def build_dataset(xml)
+        xml.dataset(id: @data[:id]) do
+          xml.title(@data[:title])
+          xml.license(@data[:license])
+          contacts = []
+          build_authors(xml, contacts)
+          build_metadata_providers(xml)
+          xml.pubDate(Time.now.to_s)
+          build_abstract(xml)
+          build_contacts(xml, contacts)
+        end
+      end
+      def build_abstract(xml)
+        xml.abstract() do
+          xml.para(@data[:abstract])
+        end
+      end
+      def build_contacts(xml, contacts)
+        contacts.each do |contact|
+          xml.contact { xml.references(contact) }
+        end
+      end
+      def build_metadata_providers(xml)
+        @data[:metadata_providers].each_with_index do |a, i|
+          xml.metadataProvider do
+            build_person(xml, a)
+          end
+        end if @data[:metadata_providers]
+      end
+      def build_authors(xml, contacts)
+        @data[:authors].each_with_index do |a, i|
+          creator_id = i + 1
+          contacts << creator_id
+          xml.creator(id: creator_id, scope: 'document') do
+            build_person(xml, a)
+          end
+        end
+      end
+      def build_additional_metadata(xml)
+        xml.additionalMetadata do
+          xml.metadata do
+            xml.citation(@data[:citation])
+            xml.resourceLogoUrl(@data[:logo_url]) if @data[:logo_url]
+          end
+        end
+      end
+      def build_person(xml, data)
+        a = data
+        xml.individualName do
+          xml.givenName(a[:first_name])
+          xml.surName(a[:last_name])
+        end
+        xml.organizationName(a[:organization]) if a[:organization]
+        xml.positionName(a[:position]) if a[:position]
+        xml.onlineUrl(a[:url]) if a[:url]
+        xml.electronicMailAddress(a[:email])
+      end
       def timestamp
         t = Time.now.getutc.to_a[0..5].reverse
         t[0..2].join('-') + '::' + t[-3..-1].join(':')

data/lib/dwc-archive/generator_meta_xml.rb CHANGED

@@ -16,26 +16,7 @@ class DarwinCore
                    fieldsEnclosedBy: '"',
                    linesTerminatedBy: "\n",
                    rowType: 'http://rs.tdwg.org/dwc/terms/Taxon' }
-          xml.archive(xmlns: 'http://rs.tdwg.org/dwc/text/',
-            :'xmlns:xsi' => 'http://www.w3.org/2001/XMLSchema-instance',
-            :'xsi:schemaLocation' => schema_uri) do
-            xml.core(opts.merge(ignoreHeaderLines:
-                                  @data[:core][:ignoreHeaderLines])) do
-              xml.files { xml.location(@data[:core][:location]) }
-              taxon_id, fields = find_taxon_id(@data[:core][:fields])
-              xml.id_(index: taxon_id[1])
-              fields.each { |f| xml.field(term: f[0], index: f[1]) }
-            end
-            @data[:extensions].each do |e|
-              xml.extension(opts.merge(ignoreHeaderLines: e[:ignoreHeaderLines],
-                                       rowType: e[:rowType])) do
-                xml.files { xml.location(e[:location]) }
-                taxon_id, fields = find_taxon_id(e[:fields])
-                xml.coreid(index: taxon_id[1])
-                fields.each { |f| xml.field(term: f[0], index: f[1]) }
-              end
-            end
-          end
+          build_archive(xml, opts, schema_uri)
         end
         meta_xml_data = builder.to_xml
         meta_file = open(File.join(@path, 'meta.xml'), @write)
@@ -44,6 +25,38 @@ class DarwinCore
       end
       private
+      def build_archive(xml, opts, schema_uri)
+        xml.archive(xmlns: 'http://rs.tdwg.org/dwc/text/',
+          :'xmlns:xsi' => 'http://www.w3.org/2001/XMLSchema-instance',
+          :'xsi:schemaLocation' => schema_uri) do
+          build_core(xml, opts)
+          build_extensions(xml, opts)
+        end
+      end
+      def build_core(xml, opts)
+        xml.core(opts.merge(ignoreHeaderLines:
+                              @data[:core][:ignoreHeaderLines])) do
+          xml.files { xml.location(@data[:core][:location]) }
+          taxon_id, fields = find_taxon_id(@data[:core][:fields])
+          xml.id_(index: taxon_id[1])
+          fields.each { |f| xml.field(term: f[0], index: f[1]) }
+        end
+      end
+      def build_extensions(xml, opts)
+        @data[:extensions].each do |e|
+          xml.extension(opts.merge(ignoreHeaderLines: e[:ignoreHeaderLines],
+                                   rowType: e[:rowType])) do
+            xml.files { xml.location(e[:location]) }
+            taxon_id, fields = find_taxon_id(e[:fields])
+            xml.coreid(index: taxon_id[1])
+            fields.each { |f| xml.field(term: f[0], index: f[1]) }
+          end
+        end
+      end
       def find_taxon_id(data)
         fields = []
         data.each_with_index { |f, i| fields << [f.strip, i] }

data/lib/dwc-archive/version.rb CHANGED

@@ -1,3 +1,3 @@
 class DarwinCore
-  VERSION = "0.9.10"
+  VERSION = "0.9.11"
 end

data/lib/dwc-archive/xml_reader.rb CHANGED

@@ -1,64 +1,80 @@
 # USAGE: Hash.from_xml:(YOUR_XML_STRING)
-require 'nokogiri'
 # modified from
 # http://stackoverflow.com/questions/1230741/
 # convert-a-nokogiri-document-to-a-ruby-hash/1231297#1231297
 class DarwinCore
   module XmlReader
     class << self
       def from_xml(xml_io)
         result = Nokogiri::XML(xml_io)
         return { result.root.name.to_sym => xml_node_to_hash(result.root)}
       end
       private
       def xml_node_to_hash(node)
         # If we are at the root of the document, start the hash
         if node.element?
-          result_hash = {}
-          if node.attributes != {}
-            result_hash[:attributes] = {}
-            node.attributes.keys.each do |key|
-              result_hash[:attributes][node.attributes[key].
-                name.to_sym] = prepare(node.attributes[key].value)
-            end
-          end
-          if node.children.size > 0
-            node.children.each do |child|
-              result = xml_node_to_hash(child)
-              if child.name == "text"
-                unless child.next_sibling || child.previous_sibling
-                  return prepare(result)
-                end
-              elsif result_hash[child.name.to_sym]
-                if result_hash[child.name.to_sym].is_a?(Object::Array)
-                  result_hash[child.name.to_sym] << prepare(result)
-                else
-                  result_hash[child.name.to_sym] =
-                    [result_hash[child.name.to_sym]] << prepare(result)
-                end
-              else
-                result_hash[child.name.to_sym] = prepare(result)
-              end
-            end
-            return result_hash
-          else
-            return result_hash
-          end
+          prepare_node_element(node)
         else
           return prepare(node.content.to_s)
         end
       end
+      def add_attributes(node, result_hash)
+        if node.attributes != {}
+          result_hash[:attributes] = {}
+          node.attributes.keys.each do |key|
+            result_hash[:attributes][node.attributes[key].name.to_sym] =
+              prepare(node.attributes[key].value)
+          end
+        end
+      end
+      def prepare_node_element(node)
+        result_hash = {}
+        add_attributes(node, result_hash)
+        if node.children.size > 0
+          result_hash = add_children(node, result_hash)
+        end
+        result_hash
+      end
+      def add_children(node, result_hash)
+        node.children.each do |child|
+          result = xml_node_to_hash(child)
+          if child.name == "text"
+            text = handle_text(child, result)
+            return text if text
+          elsif result_hash[child.name.to_sym]
+            handle_child_node(child, result_hash, result)
+          else
+            result_hash[child.name.to_sym] = prepare(result)
+          end
+        end
+        result_hash
+      end
+      def handle_child_node(child, result_hash, result)
+        if result_hash[child.name.to_sym].is_a?(Object::Array)
+          result_hash[child.name.to_sym] << prepare(result)
+        else
+          result_hash[child.name.to_sym] =
+            [result_hash[child.name.to_sym]] << prepare(result)
+        end
+      end
+      def handle_text(child, result)
+        unless child.next_sibling || child.previous_sibling
+          prepare(result)
+        end
+      end
       def prepare(data)
-        return data if data.class != String
-        return true if data.strip == "true"
-        return false if data.strip == "false"
-        data.to_i.to_s == data ? data.to_i : data
+        (data.class == String && data.to_i.to_s == data) ? data.to_i : data
       end
     end
   end
 end

data/spec/files/generator_eml.xml ADDED

@@ -0,0 +1,47 @@
+<?xml version="1.0"?>
+<eml:eml xmlns:eml="eml://ecoinformatics.org/eml-2.1.1" xmlns:md="eml://ecoinformatics.org/methods-2.1.1" xmlns:proj="eml://ecoinformatics.org/project-2.1.1" xmlns:d="eml://ecoinformatics.org/dataset-2.1.1" xmlns:res="eml://ecoinformatics.org/resource-2.1.1" xmlns:dc="http://purl.org/dc/terms/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" packageId="1234/2013-12-30::19:45:33" system="http://globalnames.org" xml:lang="en" xsi:schemaLocation="eml_uri">
+  <dataset id="1234">
+    <title>Test Classification</title>
+    <license>http://creativecommons.org/licenses/by-sa/3.0/</license>
+    <creator id="1" scope="document">
+      <individualName>
+        <givenName>John</givenName>
+        <surName>Doe</surName>
+      </individualName>
+      <organizationName>Example</organizationName>
+      <positionName>Assistant Professor</positionName>
+      <onlineUrl>http://example.org</onlineUrl>
+      <electronicMailAddress>jdoe@example.com</electronicMailAddress>
+    </creator>
+    <creator id="2" scope="document">
+      <individualName>
+        <givenName>Jane</givenName>
+        <surName>Doe</surName>
+      </individualName>
+      <electronicMailAddress>jane@example.com</electronicMailAddress>
+    </creator>
+    <metadataProvider>
+      <individualName>
+        <givenName>Jim</givenName>
+        <surName>Doe</surName>
+      </individualName>
+      <onlineUrl>http://aggregator.example.org</onlineUrl>
+      <electronicMailAddress>jimdoe@example.com</electronicMailAddress>
+    </metadataProvider>
+    <pubDate>2013-12-30 14:45:33 -0500</pubDate>
+    <abstract>
+      <para>test classification</para>
+    </abstract>
+    <contact>
+      <references>1</references>
+    </contact>
+    <contact>
+      <references>2</references>
+    </contact>
+  </dataset>
+  <additionalMetadata>
+    <metadata>
+      <citation>Test classification: Doe John, Doe Jane, Taxnonmy, 10, 1, 2010</citation>
+    </metadata>
+  </additionalMetadata>
+</eml:eml>

data/spec/files/generator_meta.xml ADDED

@@ -0,0 +1,19 @@
+<?xml version="1.0"?>
+<archive xmlns="http://rs.tdwg.org/dwc/text/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://rs.tdwg.org/dwc/terms/xsd/archive/ http://darwincore.googlecode.com/svn/trunk/text/tdwg_dwc_text.xsd">
+  <core encoding="UTF-8" fieldsTerminatedBy="," fieldsEnclosedBy="&quot;" linesTerminatedBy="&#10;" rowType="http://rs.tdwg.org/dwc/terms/Taxon" ignoreHeaderLines="1">
+    <files>
+      <location>core.csv</location>
+    </files>
+    <id index="0"/>
+    <field term="http://rs.tdwg.org/dwc/terms/parentNameUsageID" index="1"/>
+    <field term="http://rs.tdwg.org/dwc/terms/scientificName" index="2"/>
+    <field term="http://rs.tdwg.org/dwc/terms/taxonRank" index="3"/>
+  </core>
+  <extension encoding="UTF-8" fieldsTerminatedBy="," fieldsEnclosedBy="&quot;" linesTerminatedBy="&#10;" rowType="http://rs.gbif.org/terms/1.0/VernacularName" ignoreHeaderLines="1">
+    <files>
+      <location>vern.csv</location>
+    </files>
+    <coreid index="0"/>
+    <field term="http://rs.tdwg.org/dwc/terms/vernacularName" index="1"/>
+  </extension>
+</archive>

data/spec/lib/generator_spec.rb CHANGED

@@ -50,16 +50,25 @@ describe DarwinCore::Generator do
                         'http://rs.gbif.org/terms/1.0/VernacularName')
       gen.add_meta_xml
-      meta = File.read(File.join(gen.path, 'meta.xml'))
-      expect(meta).to match %r|<location>core.csv</location>|
+      meta = File.read(File.join(gen.path, 'meta.xml')).strip
+      meta_from_file= File.read(File.expand_path(
+        '../../files/generator_meta.xml',
+        __FILE__)).strip
+      expect(meta).to eq meta_from_file
     end
   end
   describe '#add_eml_data' do
     it 'adds eml data' do
       gen.add_eml_xml(EML_DATA)
-      eml = File.read(File.join(gen.path, 'eml.xml'))
-      expect(eml).to match /jdoe@example.com/
+      eml = File.read(File.join(gen.path, 'eml.xml')).strip
+      eml.gsub!(%r|(<pubDate>).*?(</pubDate>)|, '\12013-12-30 14:45:33 -0500\2')
+      eml.gsub!(/(packageId=").*?"/, '\11234/2013-12-30::19:45:33"')
+      eml_from_file = File.read(File.expand_path(
+        '../../files/generator_eml.xml',
+        __FILE__)).strip
+      expect(eml.strip).to eq eml_from_file.strip
     end
   end

metadata CHANGED

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: dwc-archive
 version: !ruby/object:Gem::Version
-  version: 0.9.10
+  version: 0.9.11
 platform: ruby
 authors:
 - Dmitry Mozzherin
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2013-12-27 00:00:00.000000000 Z
+date: 2014-01-21 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: nokogiri
@@ -171,7 +171,6 @@ files:
 - LICENSE
 - README.md
 - Rakefile
-- ']'
 - dwc-archive.gemspec
 - features/dwca-creator.feature
 - features/dwca-reader.feature
@@ -200,6 +199,8 @@ files:
 - spec/files/empty_coreid.tar.gz
 - spec/files/file with characters(3).gz
 - spec/files/flat_list.tar.gz
+- spec/files/generator_eml.xml
+- spec/files/generator_meta.xml
 - spec/files/gnub.tar.gz
 - spec/files/invalid.tar.gz
 - spec/files/junk_dir_inside.zip
@@ -263,6 +264,8 @@ test_files:
 - spec/files/empty_coreid.tar.gz
 - spec/files/file with characters(3).gz
 - spec/files/flat_list.tar.gz
+- spec/files/generator_eml.xml
+- spec/files/generator_meta.xml
 - spec/files/gnub.tar.gz
 - spec/files/invalid.tar.gz
 - spec/files/junk_dir_inside.zip

data/] DELETED

@@ -1,40 +0,0 @@
-require_relative '../spec_helper'
-describe DarwinCore::Core do
-  subject(:dwca) { DarwinCore.new(file_path) }
-  subject(:core) { DarwinCore::Core.new(dwca) }
-  let(:file_path) { File.join(File.expand_path('../../files', __FILE__),
-                             file_name) }
-  let(:file_name) { 'data.tar.gz' }
-  describe '.new' do
-    it 'creates new core' do
-      expect(core).to be_kind_of DarwinCore::Core
-    end
-  end
-  describe '#id' do
-    it 'returns core id' do
-      expect(core.id[:index]).to eq 0
-      expect(core.id[:term]).to eq 'http://rs.tdwg.org/dwc/terms/TaxonID'
-    end
-    context 'no coreid' do
-      let(:file_name) { 'empty_coreid.tar.gz' }
-      it 'does not return coreid' do
-        expect(core.id[:index]).to eq 0
-        expect(core.id[:term]).to be_nil
-      end
-    end
-  end
-  it 'reads core file from archive' do
-    core.read
-  end
-end