dwc-archive 0.9.10 → 1.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +5 -5
- data/.gitignore +1 -0
- data/.rspec +2 -1
- data/.rubocop.yml +23 -0
- data/.ruby-version +1 -1
- data/.travis.yml +4 -7
- data/CHANGELOG +14 -8
- data/Gemfile +3 -1
- data/LICENSE +1 -1
- data/README.md +119 -107
- data/Rakefile +13 -36
- data/dwc-archive.gemspec +23 -19
- data/features/step_definitions/dwc-creator_steps.rb +5 -5
- data/features/step_definitions/dwc-reader_steps.rb +47 -28
- data/features/support/env.rb +1 -1
- data/lib/dwc_archive.rb +124 -0
- data/lib/dwc_archive/archive.rb +60 -0
- data/lib/dwc_archive/classification_normalizer.rb +382 -0
- data/lib/dwc_archive/core.rb +25 -0
- data/lib/{dwc-archive → dwc_archive}/errors.rb +10 -0
- data/lib/dwc_archive/expander.rb +88 -0
- data/lib/{dwc-archive → dwc_archive}/extension.rb +5 -3
- data/lib/dwc_archive/generator.rb +91 -0
- data/lib/dwc_archive/generator_eml_xml.rb +116 -0
- data/lib/dwc_archive/generator_meta_xml.rb +72 -0
- data/lib/dwc_archive/gnub_taxon.rb +14 -0
- data/lib/dwc_archive/ingester.rb +106 -0
- data/lib/dwc_archive/metadata.rb +57 -0
- data/lib/dwc_archive/taxon_normalized.rb +23 -0
- data/lib/dwc_archive/version.rb +6 -0
- data/lib/dwc_archive/xml_reader.rb +90 -0
- data/spec/files/{file with characters(3).gz → file with characters(3).tar.gz} +0 -0
- data/spec/files/generator_eml.xml +47 -0
- data/spec/files/generator_meta.xml +19 -0
- data/spec/lib/classification_normalizer_spec.rb +96 -105
- data/spec/lib/core_spec.rb +43 -41
- data/spec/lib/darwin_core_spec.rb +108 -138
- data/spec/lib/generator_eml_xml_spec.rb +12 -11
- data/spec/lib/generator_meta_xml_spec.rb +12 -11
- data/spec/lib/generator_spec.rb +77 -69
- data/spec/lib/gnub_taxon_spec.rb +15 -17
- data/spec/lib/metadata_spec.rb +50 -41
- data/spec/lib/taxon_normalized_spec.rb +62 -65
- data/spec/lib/xml_reader_spec.rb +9 -12
- data/spec/spec_helper.rb +54 -51
- metadata +105 -88
- data/.rvmrc +0 -1
- data/] +0 -40
- data/lib/dwc-archive.rb +0 -107
- data/lib/dwc-archive/archive.rb +0 -40
- data/lib/dwc-archive/classification_normalizer.rb +0 -428
- data/lib/dwc-archive/core.rb +0 -17
- data/lib/dwc-archive/expander.rb +0 -84
- data/lib/dwc-archive/generator.rb +0 -85
- data/lib/dwc-archive/generator_eml_xml.rb +0 -86
- data/lib/dwc-archive/generator_meta_xml.rb +0 -58
- data/lib/dwc-archive/ingester.rb +0 -101
- data/lib/dwc-archive/metadata.rb +0 -48
- data/lib/dwc-archive/version.rb +0 -3
- data/lib/dwc-archive/xml_reader.rb +0 -64
data/lib/dwc-archive/xml_reader.rb
DELETED
@@ -1,64 +0,0 @@
|
|
1
|
-
# USAGE: DarwinCore::XmlReader.from_xml(YOUR_XML_STRING_OR_IO)
|
2
|
-
require 'nokogiri'
|
3
|
-
# modified from
|
4
|
-
# http://stackoverflow.com/questions/1230741/
|
5
|
-
# convert-a-nokogiri-document-to-a-ruby-hash/1231297#1231297
|
6
|
-
class DarwinCore
  # Converts an XML document into nested Ruby hashes with symbol keys.
  #
  # Conversion rules, as implemented below:
  # * an element becomes a Hash of its child elements keyed by child name;
  # * element attributes are collected under the +:attributes+ key;
  # * child elements that share a name are gathered into an Array, in
  #   document order;
  # * an element whose only child is a text node collapses to that text
  #   (its attributes are not kept in that case);
  # * text nodes that have siblings (e.g. indentation whitespace) are skipped;
  # * leaf strings go through +prepare+, which turns "true"/"false" into
  #   booleans and canonical integer strings into Integers.
  module XmlReader
    class << self
      # Parses +xml_io+ with Nokogiri and converts the document to a Hash.
      #
      # @param xml_io [String, IO] XML source handed to +Nokogiri::XML+
      # @return [Hash] a single-entry hash: root element name (Symbol) =>
      #   converted content of the root element
      # NOTE(review): a document without a root element presumably makes
      # +root+ nil and raises NoMethodError here, as it always did - confirm.
      def from_xml(xml_io)
        root = Nokogiri::XML(xml_io).root
        { root.name.to_sym => xml_node_to_hash(root) }
      end

      private

      # Recursively converts one node.
      #
      # @param node [#element?, #attributes, #children, #content] an XML node
      # @return [Hash, String, Integer, true, false] a Hash for elements, a
      #   prepared scalar for non-element nodes and text-only elements
      def xml_node_to_hash(node)
        return prepare(node.content.to_s) unless node.element?

        result_hash = {}
        attributes = node.attributes
        unless attributes.empty?
          result_hash[:attributes] =
            attributes.each_value.each_with_object({}) do |attribute, collected|
              collected[attribute.name.to_sym] = prepare(attribute.value)
            end
        end

        node.children.each do |child|
          value = xml_node_to_hash(child)

          # Ask the node for its type rather than comparing its name with
          # "text": an element that happens to be called <text> must be
          # treated like any other element.
          if child.text?
            # A lone text child is the whole value of this element.
            return value unless child.next_sibling || child.previous_sibling

            # Text mixed with other nodes is ignored.
            next
          end

          add_child_value(result_hash, child.name.to_sym, value)
        end

        result_hash
      end

      # Stores +value+ under +key+, promoting the entry to an Array when the
      # key repeats. Presence is checked with +key?+ so that an earlier
      # +false+ value is not overwritten by the next sibling of the same name.
      def add_child_value(hash, key, value)
        if !hash.key?(key)
          hash[key] = value
        elsif hash[key].is_a?(::Array)
          hash[key] << value
        else
          hash[key] = [hash[key], value]
        end
      end

      # Casts leaf strings to richer Ruby values.
      #
      # @param data [Object] value to convert; non-String values pass through
      # @return [Object] true/false for "true"/"false" (surrounding whitespace
      #   ignored), an Integer when the string is exactly the decimal form of
      #   an integer (so "007" and " 12 " stay strings), otherwise +data+
      def prepare(data)
        return data unless data.instance_of?(String)

        stripped = data.strip
        return true if stripped == "true"
        return false if stripped == "false"

        data.to_i.to_s == data ? data.to_i : data
      end
    end
  end
end
|