text_ferry 0.0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/.gitignore +9 -0
- data/Gemfile +4 -0
- data/README.rdoc +58 -0
- data/Rakefile +23 -0
- data/lib/text_ferry/loader.rb +48 -0
- data/lib/text_ferry/version.rb +3 -0
- data/lib/text_ferry.rb +2 -0
- data/test/sample_data/routes.csv +20 -0
- data/test/test_helper.rb +4 -0
- data/test/text_ferry/loader_test.rb +47 -0
- data/text_ferry.gemspec +27 -0
- metadata +127 -0
data/.gitignore
ADDED
data/Gemfile
ADDED
data/README.rdoc
ADDED
@@ -0,0 +1,58 @@
|
|
1
|
+
= Text Ferry
|
2
|
+
Text Ferry is a super simple DSL for quickly loading CSV text files into a
|
3
|
+
database.
|
4
|
+
|
5
|
+
== Installation
|
6
|
+
gem install text_ferry
|
7
|
+
or in your Gemfile:
|
8
|
+
gem "text_ferry"
|
9
|
+
|
10
|
+
== Notes / Use
|
11
|
+
Text Ferry relies on Sequel[http://sequel.rubyforge.org/documentation.html] to
|
12
|
+
do the heavy lifting. You will need to be familiar with how to define a table
|
13
|
+
schema using Sequel. For example, to load a CSV file named "data.csv" that is
|
14
|
+
located in a folder named "/my_data":
|
15
|
+
|
16
|
+
loader = TextFerry::Loader.new("sqlite://sample.db", "/my_data")
|
17
|
+
loader.load_table(:data) do
|
18
|
+
primary_key :id
|
19
|
+
String :name
|
20
|
+
String :phone
|
21
|
+
end
|
22
|
+
|
23
|
+
This will load data from the CSV file into a database named "sample.db" using
|
24
|
+
the given column names and types. Note that if the table already exists in the
|
25
|
+
database, it will be dropped and re-created using the given schema.
|
26
|
+
|
27
|
+
== Patches / Pull Requests
|
28
|
+
* Fork the project.
|
29
|
+
* Make your feature addition or bug fix.
|
30
|
+
* Add tests for it. This is important so I don’t break it in a future version
|
31
|
+
unintentionally.
|
32
|
+
* Commit, do not mess with rakefile, version, or history (if you want to have
|
33
|
+
your own version, that is fine but bump version in a commit by itself I can
|
34
|
+
ignore when I pull).
|
35
|
+
* Send me a pull request. Bonus points for topic branches.
|
36
|
+
|
37
|
+
== License
|
38
|
+
The MIT License
|
39
|
+
|
40
|
+
Copyright © 2011 Bob Nadler, Jr.
|
41
|
+
|
42
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy of
|
43
|
+
this software and associated documentation files (the "Software"), to deal in
|
44
|
+
the Software without restriction, including without limitation the rights to
|
45
|
+
use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
|
46
|
+
of the Software, and to permit persons to whom the Software is furnished to do
|
47
|
+
so, subject to the following conditions:
|
48
|
+
|
49
|
+
The above copyright notice and this permission notice shall be included in all
|
50
|
+
copies or substantial portions of the Software.
|
51
|
+
|
52
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
53
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
54
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
55
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
56
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
57
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
58
|
+
SOFTWARE.
|
data/Rakefile
ADDED
@@ -0,0 +1,23 @@
|
|
1
|
+
require "bundler/gem_tasks"
|
2
|
+
require 'rake/testtask'
|
3
|
+
require 'rdoc/task'
|
4
|
+
|
5
|
+
EXTRA_RDOC_FILES = ['README.rdoc']
|
6
|
+
MAIN_RDOC = 'README.rdoc'
|
7
|
+
TEST_FILES = Dir["test/**/*_test.rb"]
|
8
|
+
TITLE = 'Text Ferry'
|
9
|
+
|
10
|
+
task :default => ['test']
|
11
|
+
|
12
|
+
Rake::TestTask.new do |t|
|
13
|
+
t.libs << 'test'
|
14
|
+
t.test_files = TEST_FILES
|
15
|
+
end
|
16
|
+
|
17
|
+
RDoc::Task.new do |t|
|
18
|
+
t.main = MAIN_RDOC
|
19
|
+
t.rdoc_dir = 'doc'
|
20
|
+
t.rdoc_files.include(EXTRA_RDOC_FILES, 'lib/**/*.rb')
|
21
|
+
t.options << '-q'
|
22
|
+
t.title = TITLE
|
23
|
+
end
|
@@ -0,0 +1,48 @@
|
|
1
|
+
require "csv"
|
2
|
+
require "sequel"
|
3
|
+
|
4
|
+
module TextFerry
|
5
|
+
# Loads CSV data into a database.
|
6
|
+
class Loader
|
7
|
+
# database_uri::
|
8
|
+
# A URI that points to a database. See
|
9
|
+
# http://sequel.rubyforge.org/rdoc/classes/Sequel.html#method-c-connect
|
10
|
+
# for more info.
|
11
|
+
#
|
12
|
+
# data_path::
|
13
|
+
# The full path to a folder that contains one or more CSV files.
|
14
|
+
def initialize(database_uri, data_path)
|
15
|
+
@db = Sequel.connect(database_uri)
|
16
|
+
@data_path = data_path
|
17
|
+
end
|
18
|
+
|
19
|
+
# Loads data from a CSV file into the database. Assumes that +table_name+
|
20
|
+
# corresponds to a CSV file in +data_path+. Warning: if the table already
|
21
|
+
# exists, it will be dropped!
|
22
|
+
#
|
23
|
+
# table_name::
|
24
|
+
# The name of the CSV file to load; will also be used as the table name
|
25
|
+
# in the database.
|
26
|
+
#
|
27
|
+
# schema::
|
28
|
+
# A block that specifies the schema of the CSV file / table. See
|
29
|
+
# http://sequel.rubyforge.org/rdoc/files/doc/schema_modification_rdoc.html
|
30
|
+
# for more info.
|
31
|
+
def load_table(table_name, &schema)
|
32
|
+
@db.create_table!(table_name, &schema)
|
33
|
+
load_data(table_name)
|
34
|
+
end
|
35
|
+
|
36
|
+
private
|
37
|
+
def fields_for(table_name)
|
38
|
+
@db.schema(table_name).map { |c| c[0] }
|
39
|
+
end
|
40
|
+
|
41
|
+
def load_data(table_name)
|
42
|
+
CSV.table(File.join(@data_path, "#{table_name}.csv")).each do |row|
|
43
|
+
mapping = fields_for(table_name).map { |f| [f, row[f]] }
|
44
|
+
@db[table_name].insert(Hash[mapping])
|
45
|
+
end
|
46
|
+
end
|
47
|
+
end
|
48
|
+
end
|
data/lib/text_ferry.rb
ADDED
@@ -0,0 +1,20 @@
|
|
1
|
+
route_id,agency_id,route_short_name,route_long_name,route_type,route_url,route_color
|
2
|
+
1,2,"","Princeton Shuttle",2,"",
|
3
|
+
2,2,"","Atlantic City Rail Line",2,"",
|
4
|
+
3,2,"","Montclair-Boonton Line",2,"",
|
5
|
+
4,2,"","Montclair-Boonton Line",2,"",
|
6
|
+
5,2,"","Hudson-Bergen Light Rail",0,"",
|
7
|
+
6,2,"","Main/Bergen County Line",2,"",
|
8
|
+
7,2,"","Port Jervis Line",2,"",
|
9
|
+
8,2,"","Morris & Essex Line",2,"",
|
10
|
+
9,2,"","Gladstone Branch",2,"",
|
11
|
+
10,2,"MNRG","",2,"",
|
12
|
+
11,2,"","Northeast Corridor",2,"",
|
13
|
+
12,2,"","North Jersey Coast Line",2,"",
|
14
|
+
13,2,"","North Jersey Coast Line",2,"",
|
15
|
+
14,2,"","Newark Light Rail",0,"",
|
16
|
+
15,2,"","Pascack Valley Line",2,"",
|
17
|
+
16,2,"","Princeton Shuttle",2,"",
|
18
|
+
17,2,"","Raritan Valley Line",2,"",
|
19
|
+
18,2,"","Riverline Light Rail",0,"",
|
20
|
+
19,2,"","Meadowlands Rail Line",2,"",
|
data/test/test_helper.rb
ADDED
@@ -0,0 +1,47 @@
|
|
1
|
+
require "test_helper"
|
2
|
+
require "text_ferry"
|
3
|
+
|
4
|
+
class LoadTest < Test::Unit::TestCase
|
5
|
+
DATA_PATH = File.join(File.dirname(__FILE__), "..", "sample_data")
|
6
|
+
DB_FILE = File.join(DATA_PATH, "sample.db")
|
7
|
+
DB = Sequel.sqlite(DB_FILE)
|
8
|
+
|
9
|
+
setup do
|
10
|
+
@loader = TextFerry::Loader.new("sqlite://#{DB_FILE}", DATA_PATH)
|
11
|
+
end
|
12
|
+
|
13
|
+
test "create a new loader" do
|
14
|
+
assert @loader, "expected to be able to create a new Loader"
|
15
|
+
end
|
16
|
+
|
17
|
+
context "table creation" do
|
18
|
+
test "creates table if it doesn't exist" do
|
19
|
+
load_routes
|
20
|
+
assert DB[:routes].all.length
|
21
|
+
end
|
22
|
+
|
23
|
+
test "drops table if it already exists" do
|
24
|
+
DB.drop_table(:routes) if DB[:routes]
|
25
|
+
DB.create_table :routes do
|
26
|
+
primary_key :id
|
27
|
+
end
|
28
|
+
|
29
|
+
assert_nothing_raised { load_routes }
|
30
|
+
end
|
31
|
+
end
|
32
|
+
|
33
|
+
context "table data" do
|
34
|
+
test "loads all data from csv file" do
|
35
|
+
load_routes
|
36
|
+
assert_equal 19, DB[:routes].all.length
|
37
|
+
end
|
38
|
+
end
|
39
|
+
|
40
|
+
private
|
41
|
+
def load_routes
|
42
|
+
@loader.load_table(:routes) do
|
43
|
+
primary_key :route_id
|
44
|
+
String :route_long_name
|
45
|
+
end
|
46
|
+
end
|
47
|
+
end
|
data/text_ferry.gemspec
ADDED
@@ -0,0 +1,27 @@
|
|
1
|
+
# -*- encoding: utf-8 -*-
|
2
|
+
$:.push File.expand_path("../lib", __FILE__)
|
3
|
+
require "text_ferry/version"
|
4
|
+
|
5
|
+
Gem::Specification.new do |s|
|
6
|
+
s.name = "text_ferry"
|
7
|
+
s.version = TextFerry::VERSION
|
8
|
+
s.authors = ["Bob Nadler"]
|
9
|
+
s.email = ["bnadlerjr@gmail.com"]
|
10
|
+
s.homepage = "https://github.com/bnadlerjr/text_ferry"
|
11
|
+
s.summary = %q{A DSL for loading CSV text files into a database.}
|
12
|
+
s.description = %q{A DSL for loading CSV text files into a database.}
|
13
|
+
|
14
|
+
s.rubyforge_project = "text_ferry"
|
15
|
+
|
16
|
+
s.files = `git ls-files`.split("\n")
|
17
|
+
s.test_files = `git ls-files -- {test,spec,features}/*`.split("\n")
|
18
|
+
s.executables = `git ls-files -- bin/*`.split("\n").map{ |f| File.basename(f) }
|
19
|
+
s.require_paths = ["lib"]
|
20
|
+
|
21
|
+
s.add_development_dependency "contest", "~> 0.1.3"
|
22
|
+
s.add_development_dependency "rake", "~> 0.9.2"
|
23
|
+
s.add_development_dependency "rdoc", "~> 3.11"
|
24
|
+
|
25
|
+
s.add_runtime_dependency "sequel", "~> 3.28.0"
|
26
|
+
s.add_runtime_dependency "sqlite3", "~> 1.3.4"
|
27
|
+
end
|
metadata
ADDED
@@ -0,0 +1,127 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: text_ferry
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
prerelease:
|
5
|
+
version: 0.0.1
|
6
|
+
platform: ruby
|
7
|
+
authors:
|
8
|
+
- Bob Nadler
|
9
|
+
autorequire:
|
10
|
+
bindir: bin
|
11
|
+
cert_chain: []
|
12
|
+
|
13
|
+
date: 2011-10-31 00:00:00 Z
|
14
|
+
dependencies:
|
15
|
+
- !ruby/object:Gem::Dependency
|
16
|
+
name: contest
|
17
|
+
requirement: &id001 !ruby/object:Gem::Requirement
|
18
|
+
none: false
|
19
|
+
requirements:
|
20
|
+
- - ~>
|
21
|
+
- !ruby/object:Gem::Version
|
22
|
+
version: 0.1.3
|
23
|
+
type: :development
|
24
|
+
prerelease: false
|
25
|
+
version_requirements: *id001
|
26
|
+
- !ruby/object:Gem::Dependency
|
27
|
+
name: rake
|
28
|
+
requirement: &id002 !ruby/object:Gem::Requirement
|
29
|
+
none: false
|
30
|
+
requirements:
|
31
|
+
- - ~>
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: 0.9.2
|
34
|
+
type: :development
|
35
|
+
prerelease: false
|
36
|
+
version_requirements: *id002
|
37
|
+
- !ruby/object:Gem::Dependency
|
38
|
+
name: rdoc
|
39
|
+
requirement: &id003 !ruby/object:Gem::Requirement
|
40
|
+
none: false
|
41
|
+
requirements:
|
42
|
+
- - ~>
|
43
|
+
- !ruby/object:Gem::Version
|
44
|
+
version: "3.11"
|
45
|
+
type: :development
|
46
|
+
prerelease: false
|
47
|
+
version_requirements: *id003
|
48
|
+
- !ruby/object:Gem::Dependency
|
49
|
+
name: sequel
|
50
|
+
requirement: &id004 !ruby/object:Gem::Requirement
|
51
|
+
none: false
|
52
|
+
requirements:
|
53
|
+
- - ~>
|
54
|
+
- !ruby/object:Gem::Version
|
55
|
+
version: 3.28.0
|
56
|
+
type: :runtime
|
57
|
+
prerelease: false
|
58
|
+
version_requirements: *id004
|
59
|
+
- !ruby/object:Gem::Dependency
|
60
|
+
name: sqlite3
|
61
|
+
requirement: &id005 !ruby/object:Gem::Requirement
|
62
|
+
none: false
|
63
|
+
requirements:
|
64
|
+
- - ~>
|
65
|
+
- !ruby/object:Gem::Version
|
66
|
+
version: 1.3.4
|
67
|
+
type: :runtime
|
68
|
+
prerelease: false
|
69
|
+
version_requirements: *id005
|
70
|
+
description: A DSL for loading CSV text files into a database.
|
71
|
+
email:
|
72
|
+
- bnadlerjr@gmail.com
|
73
|
+
executables: []
|
74
|
+
|
75
|
+
extensions: []
|
76
|
+
|
77
|
+
extra_rdoc_files: []
|
78
|
+
|
79
|
+
files:
|
80
|
+
- .gitignore
|
81
|
+
- Gemfile
|
82
|
+
- README.rdoc
|
83
|
+
- Rakefile
|
84
|
+
- lib/text_ferry.rb
|
85
|
+
- lib/text_ferry/loader.rb
|
86
|
+
- lib/text_ferry/version.rb
|
87
|
+
- test/sample_data/routes.csv
|
88
|
+
- test/test_helper.rb
|
89
|
+
- test/text_ferry/loader_test.rb
|
90
|
+
- text_ferry.gemspec
|
91
|
+
homepage: https://github.com/bnadlerjr/text_ferry
|
92
|
+
licenses: []
|
93
|
+
|
94
|
+
post_install_message:
|
95
|
+
rdoc_options: []
|
96
|
+
|
97
|
+
require_paths:
|
98
|
+
- lib
|
99
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
100
|
+
none: false
|
101
|
+
requirements:
|
102
|
+
- - ">="
|
103
|
+
- !ruby/object:Gem::Version
|
104
|
+
hash: 3922030537894335762
|
105
|
+
segments:
|
106
|
+
- 0
|
107
|
+
version: "0"
|
108
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
109
|
+
none: false
|
110
|
+
requirements:
|
111
|
+
- - ">="
|
112
|
+
- !ruby/object:Gem::Version
|
113
|
+
hash: 3922030537894335762
|
114
|
+
segments:
|
115
|
+
- 0
|
116
|
+
version: "0"
|
117
|
+
requirements: []
|
118
|
+
|
119
|
+
rubyforge_project: text_ferry
|
120
|
+
rubygems_version: 1.8.5
|
121
|
+
signing_key:
|
122
|
+
specification_version: 3
|
123
|
+
summary: A DSL for loading CSV text files into a database.
|
124
|
+
test_files:
|
125
|
+
- test/sample_data/routes.csv
|
126
|
+
- test/test_helper.rb
|
127
|
+
- test/text_ferry/loader_test.rb
|