assimilate 0.1.0 → 0.1.1

Sign up to get free protection for your applications and to get access to all the features.
@@ -30,8 +30,11 @@ class Assimilate::Batch
30
30
  end
31
31
  end
32
32
 
33
+ # The stripped record contains only the data values from the source (no internal values with leading underscores).
34
+ # Any nil values are ignored; these should not be stored but if they do appear in the catalog then don't want
35
+ # to include them when comparing new records vs. old.
33
36
  def stripped_record_for(key)
34
- @baseline[key] && @baseline[key].select {|k,v| k !~ /^_/}
37
+ @baseline[key] && @baseline[key].select {|k,v| k !~ /^_/ && !v.nil?}
35
38
  end
36
39
 
37
40
  def <<(record)
@@ -100,11 +103,14 @@ class Assimilate::Batch
100
103
  end
101
104
 
102
105
  def record_batch
103
- raise(Assimilate::DuplicateImportError, "duplicate batch for datestamp #{datestamp}") if @catalog.batches.find(@domainkey => @domain, 'datestamp' => @datestamp).to_a.any?
104
- raise(Assimilate::DuplicateImportError, "duplicate batch for file #{@filename}") if @catalog.batches.find(@domainkey => @domain, 'filename' => @filename).to_a.any?
106
+ # don't want leading underscore on attributes in the batches table
107
+ dkey = @domainkey.gsub(/^_/,'')
108
+
109
+ raise(Assimilate::DuplicateImportError, "duplicate batch for datestamp #{datestamp}") if @catalog.batches.find(dkey => @domain, 'datestamp' => @datestamp).to_a.any?
110
+ raise(Assimilate::DuplicateImportError, "duplicate batch for file #{@filename}") if @catalog.batches.find(dkey => @domain, 'filename' => @filename).to_a.any?
105
111
 
106
112
  @catalog.batches.insert({
107
- @domainkey => @domain,
113
+ dkey => @domain,
108
114
  'datestamp' => @datestamp,
109
115
  'filename' => @filename
110
116
  })
@@ -1,3 +1,3 @@
1
1
  module Assimilate
2
- VERSION = "0.1.0"
2
+ VERSION = "0.1.1"
3
3
  end
@@ -16,8 +16,7 @@ describe "loading extended data" do
16
16
  def import_base_data(datestamp, filename = "batch_input.csv")
17
17
  @batcher = @catalog.start_batch(domain: 'testdata', datestamp: datestamp, idfield: 'ID')
18
18
 
19
- @records = CSV.read(File.dirname(__FILE__) + "/../data/#{filename}", :headers => true)
20
- @records.each do |rec|
19
+ Assimilate.slurp(File.dirname(__FILE__) + "/../data/#{filename}") do |rec|
21
20
  @batcher << rec
22
21
  end
23
22
  @batcher.commit
@@ -31,8 +30,7 @@ describe "loading extended data" do
31
30
 
32
31
  def import_extended_data(datestamp, filename)
33
32
  @extender = @catalog.extend_data(domain: 'testdata', datastamp: datestamp, idfield: 'ID', key: 'inauguration')
34
- @records = CSV.read(File.dirname(__FILE__) + "/../data/#{filename}", :headers => true)
35
- @records.each do |rec|
33
+ Assimilate.slurp(File.dirname(__FILE__) + "/../data/#{filename}") do |rec|
36
34
  @extender << rec
37
35
  end
38
36
  @extender.commit
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: assimilate
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.0
4
+ version: 0.1.1
5
5
  prerelease:
6
6
  platform: ruby
7
7
  authors:
@@ -9,11 +9,11 @@ authors:
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
- date: 2012-05-03 00:00:00.000000000 Z
12
+ date: 2012-05-04 00:00:00.000000000 Z
13
13
  dependencies:
14
14
  - !ruby/object:Gem::Dependency
15
15
  name: mongo
16
- requirement: &2157622380 !ruby/object:Gem::Requirement
16
+ requirement: &2155898600 !ruby/object:Gem::Requirement
17
17
  none: false
18
18
  requirements:
19
19
  - - ~>
@@ -21,10 +21,10 @@ dependencies:
21
21
  version: 1.6.0
22
22
  type: :runtime
23
23
  prerelease: false
24
- version_requirements: *2157622380
24
+ version_requirements: *2155898600
25
25
  - !ruby/object:Gem::Dependency
26
26
  name: bson_ext
27
- requirement: &2157620560 !ruby/object:Gem::Requirement
27
+ requirement: &2155897820 !ruby/object:Gem::Requirement
28
28
  none: false
29
29
  requirements:
30
30
  - - ~>
@@ -32,10 +32,10 @@ dependencies:
32
32
  version: 1.6.0
33
33
  type: :runtime
34
34
  prerelease: false
35
- version_requirements: *2157620560
35
+ version_requirements: *2155897820
36
36
  - !ruby/object:Gem::Dependency
37
37
  name: activesupport
38
- requirement: &2157620020 !ruby/object:Gem::Requirement
38
+ requirement: &2155897040 !ruby/object:Gem::Requirement
39
39
  none: false
40
40
  requirements:
41
41
  - - ~>
@@ -43,10 +43,10 @@ dependencies:
43
43
  version: 3.2.0
44
44
  type: :runtime
45
45
  prerelease: false
46
- version_requirements: *2157620020
46
+ version_requirements: *2155897040
47
47
  - !ruby/object:Gem::Dependency
48
48
  name: rspec
49
- requirement: &2157619060 !ruby/object:Gem::Requirement
49
+ requirement: &2155896200 !ruby/object:Gem::Requirement
50
50
  none: false
51
51
  requirements:
52
52
  - - ~>
@@ -54,10 +54,10 @@ dependencies:
54
54
  version: 2.9.0
55
55
  type: :development
56
56
  prerelease: false
57
- version_requirements: *2157619060
57
+ version_requirements: *2155896200
58
58
  - !ruby/object:Gem::Dependency
59
59
  name: guard-rspec
60
- requirement: &2157618020 !ruby/object:Gem::Requirement
60
+ requirement: &2155895320 !ruby/object:Gem::Requirement
61
61
  none: false
62
62
  requirements:
63
63
  - - ~>
@@ -65,10 +65,10 @@ dependencies:
65
65
  version: 0.7.0
66
66
  type: :development
67
67
  prerelease: false
68
- version_requirements: *2157618020
68
+ version_requirements: *2155895320
69
69
  - !ruby/object:Gem::Dependency
70
70
  name: ruby_gntp
71
- requirement: &2157616740 !ruby/object:Gem::Requirement
71
+ requirement: &2155894100 !ruby/object:Gem::Requirement
72
72
  none: false
73
73
  requirements:
74
74
  - - ~>
@@ -76,7 +76,7 @@ dependencies:
76
76
  version: 0.3.4
77
77
  type: :development
78
78
  prerelease: false
79
- version_requirements: *2157616740
79
+ version_requirements: *2155894100
80
80
  description: Ingest updates from CSV and apply to set of hashes
81
81
  email:
82
82
  - jmay@pobox.com