hdfs-viking 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: c623269fd30fca9866de8499134312561cf37814
4
+ data.tar.gz: d52b739f42b36d00ea7d4fc8234c00e4f0b45a7a
5
+ SHA512:
6
+ metadata.gz: 0d1404561bba13db1e7228d53aa7f4e471205151010ccd929aaad3b0f2da1afce10f4cc1c69130eeb36a1fba1f2494e216cac0b29f933f14d01a9e28af69be88
7
+ data.tar.gz: 4ff4fd3b3d32945a45d004968359defb23fef630b8dd95bfc795f32a2335724bee7fd5fc37b853cba97f31799b063f977c870be8f974298115980816dfb20367
data/.gitignore ADDED
@@ -0,0 +1,18 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
18
+ Jarfile.lock
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in viking.gemspec
4
+ gemspec
data/Jarfile ADDED
@@ -0,0 +1,3 @@
1
+ repository 'https://repository.cloudera.com/artifactory/cloudera-repos'
2
+ jar 'org.apache.hadoop:hadoop-common:2.0.0-cdh4.4.0'
3
+ jar 'org.apache.hadoop:hadoop-hdfs:2.0.0-cdh4.4.0'
data/Jarfile.lock ADDED
@@ -0,0 +1,124 @@
1
+ ---
2
+ version: 0.7.5
3
+ groups:
4
+ default:
5
+ dependencies:
6
+ - asm:asm:jar:3.1
7
+ - com.google.code.findbugs:jsr305:jar:1.3.9
8
+ - com.google.guava:guava:jar:11.0.2
9
+ - com.google.protobuf:protobuf-java:jar:2.4.0a
10
+ - com.jcraft:jsch:jar:0.1.42
11
+ - com.sun.jersey:jersey-core:jar:1.8
12
+ - com.sun.jersey:jersey-json:jar:1.8
13
+ - com.sun.jersey:jersey-server:jar:1.8
14
+ - com.sun.xml.bind:jaxb-impl:jar:2.2.3-1
15
+ - com.thoughtworks.paranamer:paranamer:jar:2.3
16
+ - commons-beanutils:commons-beanutils-core:jar:1.8.0
17
+ - commons-beanutils:commons-beanutils:jar:1.7.0
18
+ - commons-cli:commons-cli:jar:1.2
19
+ - commons-codec:commons-codec:jar:1.4
20
+ - commons-collections:commons-collections:jar:3.2.1
21
+ - commons-configuration:commons-configuration:jar:1.6
22
+ - commons-daemon:commons-daemon:jar:1.0.3
23
+ - commons-digester:commons-digester:jar:1.8
24
+ - commons-el:commons-el:jar:1.0
25
+ - commons-httpclient:commons-httpclient:jar:3.1
26
+ - commons-io:commons-io:jar:2.1
27
+ - commons-lang:commons-lang:jar:2.5
28
+ - commons-logging:commons-logging:jar:1.1.1
29
+ - commons-net:commons-net:jar:3.1
30
+ - javax.activation:activation:jar:1.1
31
+ - javax.servlet.jsp:jsp-api:jar:2.1
32
+ - javax.servlet:servlet-api:jar:2.5
33
+ - javax.xml.bind:jaxb-api:jar:2.2.2
34
+ - jline:jline:jar:0.9.94
35
+ - junit:junit:jar:4.8.2
36
+ - log4j:log4j:jar:1.2.17
37
+ - net.java.dev.jets3t:jets3t:jar:0.6.1
38
+ - net.sf.kosmosfs:kfs:jar:0.3
39
+ - org.apache.avro:avro:jar:1.7.4
40
+ - org.apache.commons:commons-compress:jar:1.4.1
41
+ - org.apache.commons:commons-math:jar:2.1
42
+ - org.apache.hadoop:hadoop-annotations:jar:2.0.0-cdh4.4.0
43
+ - org.apache.hadoop:hadoop-auth:jar:2.0.0-cdh4.4.0
44
+ - org.apache.hadoop:hadoop-common:jar:2.0.0-cdh4.4.0
45
+ - org.apache.hadoop:hadoop-hdfs:jar:2.0.0-cdh4.4.0
46
+ - org.apache.zookeeper:zookeeper:jar:3.4.5-cdh4.4.0
47
+ - org.codehaus.jackson:jackson-core-asl:jar:1.8.8
48
+ - org.codehaus.jackson:jackson-jaxrs:jar:1.7.1
49
+ - org.codehaus.jackson:jackson-mapper-asl:jar:1.8.8
50
+ - org.codehaus.jackson:jackson-xc:jar:1.7.1
51
+ - org.codehaus.jettison:jettison:jar:1.1
52
+ - org.mockito:mockito-all:jar:1.8.5
53
+ - org.mortbay.jetty:jetty-util:jar:6.1.26.cloudera.2
54
+ - org.mortbay.jetty:jetty:jar:6.1.26.cloudera.2
55
+ - org.slf4j:slf4j-api:jar:1.6.1
56
+ - org.slf4j:slf4j-log4j12:jar:1.6.1
57
+ - org.tukaani:xz:jar:1.0
58
+ - org.xerial.snappy:snappy-java:jar:1.0.4.1
59
+ - stax:stax-api:jar:1.0.1
60
+ - tomcat:jasper-compiler:jar:5.5.23
61
+ - tomcat:jasper-runtime:jar:5.5.23
62
+ - xmlenc:xmlenc:jar:0.52
63
+ artifacts:
64
+ - jar:org.apache.hadoop:hadoop-common:jar:2.0.0-cdh4.4.0:
65
+ transitive:
66
+ com.jcraft:jsch:jar:0.1.42: {}
67
+ org.mortbay.jetty:jetty-util:jar:6.1.26.cloudera.2: {}
68
+ com.sun.jersey:jersey-core:jar:1.8: {}
69
+ com.sun.jersey:jersey-server:jar:1.8:
70
+ asm:asm:jar:3.1: {}
71
+ com.google.guava:guava:jar:11.0.2:
72
+ com.google.code.findbugs:jsr305:jar:1.3.9: {}
73
+ org.apache.avro:avro:jar:1.7.4:
74
+ org.apache.commons:commons-compress:jar:1.4.1:
75
+ org.tukaani:xz:jar:1.0: {}
76
+ org.xerial.snappy:snappy-java:jar:1.0.4.1: {}
77
+ com.thoughtworks.paranamer:paranamer:jar:2.3: {}
78
+ org.apache.commons:commons-math:jar:2.1: {}
79
+ javax.servlet.jsp:jsp-api:jar:2.1: {}
80
+ org.codehaus.jackson:jackson-core-asl:jar:1.8.8: {}
81
+ commons-cli:commons-cli:jar:1.2: {}
82
+ net.sf.kosmosfs:kfs:jar:0.3: {}
83
+ org.apache.hadoop:hadoop-auth:jar:2.0.0-cdh4.4.0: {}
84
+ xmlenc:xmlenc:jar:0.52: {}
85
+ org.slf4j:slf4j-log4j12:jar:1.6.1: {}
86
+ commons-el:commons-el:jar:1.0: {}
87
+ junit:junit:jar:4.8.2: {}
88
+ org.apache.hadoop:hadoop-annotations:jar:2.0.0-cdh4.4.0: {}
89
+ org.slf4j:slf4j-api:jar:1.6.1: {}
90
+ org.mortbay.jetty:jetty:jar:6.1.26.cloudera.2: {}
91
+ org.mockito:mockito-all:jar:1.8.5: {}
92
+ javax.servlet:servlet-api:jar:2.5: {}
93
+ com.sun.jersey:jersey-json:jar:1.8:
94
+ com.sun.xml.bind:jaxb-impl:jar:2.2.3-1:
95
+ javax.xml.bind:jaxb-api:jar:2.2.2:
96
+ javax.activation:activation:jar:1.1: {}
97
+ org.codehaus.jackson:jackson-jaxrs:jar:1.7.1: {}
98
+ org.codehaus.jackson:jackson-xc:jar:1.7.1: {}
99
+ org.codehaus.jettison:jettison:jar:1.1:
100
+ stax:stax-api:jar:1.0.1: {}
101
+ com.google.protobuf:protobuf-java:jar:2.4.0a: {}
102
+ commons-lang:commons-lang:jar:2.5: {}
103
+ tomcat:jasper-compiler:jar:5.5.23: {}
104
+ org.codehaus.jackson:jackson-mapper-asl:jar:1.8.8: {}
105
+ tomcat:jasper-runtime:jar:5.5.23: {}
106
+ net.java.dev.jets3t:jets3t:jar:0.6.1: {}
107
+ org.apache.zookeeper:zookeeper:jar:3.4.5-cdh4.4.0:
108
+ jline:jline:jar:0.9.94: {}
109
+ commons-io:commons-io:jar:2.1: {}
110
+ commons-httpclient:commons-httpclient:jar:3.1: {}
111
+ commons-logging:commons-logging:jar:1.1.1: {}
112
+ commons-net:commons-net:jar:3.1: {}
113
+ commons-codec:commons-codec:jar:1.4: {}
114
+ commons-configuration:commons-configuration:jar:1.6:
115
+ commons-collections:commons-collections:jar:3.2.1: {}
116
+ commons-beanutils:commons-beanutils-core:jar:1.8.0: {}
117
+ commons-digester:commons-digester:jar:1.8:
118
+ commons-beanutils:commons-beanutils:jar:1.7.0: {}
119
+ log4j:log4j:jar:1.2.17: {}
120
+ - jar:org.apache.hadoop:hadoop-hdfs:jar:2.0.0-cdh4.4.0:
121
+ transitive:
122
+ commons-daemon:commons-daemon:jar:1.0.3: {}
123
+ remote_repositories:
124
+ - https://repository.cloudera.com/artifactory/cloudera-repos
data/LICENSE.txt ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2013 Erik Selin
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,49 @@
1
+ # Viking
2
+
3
+ A familiar jRuby hdfs wrapper.
4
+
5
+ ## Goal
6
+
7
+ The goal is to provide ways that are similar to the common ruby file system
8
+ api's for interacting with hdfs. All hdfs functionallity is powered by the java
9
+ hdfs classes.
10
+
11
+ ## Status
12
+
13
+ ### Available
14
+
15
+ - `File`
16
+ - `Dir`
17
+ - `FileUtils`
18
+
19
+ ### Not available yet but on the todo
20
+
21
+ - `File#fnmatch`
22
+ - `File#fnmatch?`
23
+ - `Dir#glob`
24
+ - `FileUtils#copy`
25
+
26
+ ## Example usage
27
+
28
+ # Set up hdfs config
29
+ Viking.configure({
30
+ host: '127.0.0.1',
31
+ port: 54310
32
+ })
33
+
34
+ # If "/some/data" exists and it is a file then print its content. If it is
35
+ # a directory then rename it. If it does not exist then we create it.
36
+ path = "/some/data"
37
+ if Viking::File.exists? path
38
+ if Viking::File.file? path
39
+ Viking::File.open(path) do |file|
40
+ puts "Reading data from #{f.path}:"
41
+ puts f.read
42
+ end
43
+ else
44
+ Viking::File.rename(path, "/some/dir")
45
+ end
46
+ else
47
+ Viking::Dir.mkdir(path)
48
+ end
49
+
data/Rakefile ADDED
@@ -0,0 +1,19 @@
1
+ #!/usr/bin/env rake
2
+
3
+ require "bundler/gem_tasks"
4
+ require 'rake/testtask'
5
+
6
+ Rake::TestTask.new do |t|
7
+ t.libs << 'lib/viking'
8
+ t.test_files = FileList['test/test_*.rb']
9
+ t.verbose = true
10
+ end
11
+
12
+ task :prepare do
13
+ require 'lock_jar'
14
+ LockJar.lock
15
+ lockfile = File.expand_path( "../Jarfile.lock", __FILE__ )
16
+ LockJar.install( :lockfile => lockfile )
17
+ end
18
+
19
+ task :default => :prepare
data/lib/viking/dir.rb ADDED
@@ -0,0 +1,137 @@
1
+ module Viking
2
+ class Dir
3
+
4
+ def self.format(dirname)
5
+ dirname.to_s.sub(/^[^:]*:\/*\//, '/')
6
+ end
7
+
8
+ def self.chdir(dirname=home, &block)
9
+ if block
10
+ main_dirname = pwd
11
+ Viking.client.set_working_directory(Path.new(dirname))
12
+
13
+ result = yield dirname
14
+
15
+ Viking.client.set_working_directory(Path.new(main_dirname))
16
+ result
17
+ else
18
+ Viking.client.set_working_directory(Path.new(dirname))
19
+ 0
20
+ end
21
+ end
22
+
23
+ def self.delete(dirname)
24
+ if exist?(dirname)
25
+ Viking.client.delete(Path.new(dirname), false)
26
+ 0
27
+ else
28
+ raise Errno::ENOENT.new("No such file or directory - No such directory: #{dirname}")
29
+ end
30
+ end
31
+
32
+ def self.entries(dirname)
33
+ if exist?(dirname)
34
+ iterator = Viking.client.list_located_status(Path.new(dirname))
35
+ entries = []
36
+
37
+ while(iterator.has_next) do
38
+ entry = format(iterator.next.path)
39
+ entries << Viking::File.basename(entry)
40
+ end
41
+
42
+ entries
43
+ else
44
+ raise Errno::ENOENT.new("No such file or directory - No such directory: #{dirname}")
45
+ end
46
+ end
47
+
48
+ def self.exist?(dirname)
49
+ Viking::File.exist?(dirname) && Viking::File.directory?(dirname)
50
+ end
51
+
52
+ def self.exists?(dirname)
53
+ exist?(dirname)
54
+ end
55
+
56
+ def self.foreach(dirname)
57
+ entries(dirname).each { |entry| yield entry }
58
+ end
59
+
60
+ def self.getwd
61
+ format(Viking.client.get_working_directory)
62
+ end
63
+
64
+ def self.home
65
+ format(Viking.client.get_home_directory)
66
+ end
67
+
68
+ def self.mkdir(dirname)
69
+ Viking.client.mkdirs(Path.new(dirname))
70
+ 0
71
+ end
72
+
73
+ def self.open(dirname, &block)
74
+ dir = Viking::Dir.new(dirname)
75
+ if block
76
+ value = yield dir
77
+ dir.close
78
+ value
79
+ else
80
+ dir
81
+ end
82
+ end
83
+
84
+ def self.pwd
85
+ getwd
86
+ end
87
+
88
+ def self.rmdir(dirname)
89
+ delete(dirname)
90
+ end
91
+
92
+ def initialize(path)
93
+ @path = path
94
+ @closed = false
95
+ end
96
+
97
+ def close
98
+ check_closed
99
+ @closed = true
100
+ end
101
+
102
+ def each
103
+ check_closed
104
+ entries.each do |file_name|
105
+ yield file_name
106
+ end
107
+ end
108
+
109
+ def path
110
+ @path
111
+ end
112
+
113
+ def read
114
+ check_closed
115
+ rewind if @entries.nil?
116
+ entry = @entries[@pos]
117
+ @pos += 1 unless entry.nil?
118
+ entry
119
+ end
120
+
121
+ def rewind
122
+ check_closed
123
+ @pos = 0
124
+ @entries = entries
125
+ end
126
+
127
+ private
128
+
129
+ def check_closed
130
+ raise IOError.new("closed directory") if @closed
131
+ end
132
+
133
+ def entries
134
+ Viking::Dir.entries(path)
135
+ end
136
+ end
137
+ end
@@ -0,0 +1,224 @@
1
+ module Viking
2
+ class File
3
+
4
+ def self.absolute_path(file_name, dir_string=Viking.client.get_working_directory)
5
+ dir_string = dir_string.to_s.sub(/[^\/]*:\/*\//, '/')
6
+ IO::File.absolute_path(file_name, dir_string)
7
+ end
8
+
9
+ def self.basename(file_name, suffix = nil)
10
+ base = file_name.split("/").last
11
+ suffix.nil? ? base : base.sub(suffix, '')
12
+ end
13
+
14
+ def self.chmod(mode_int, *file_names)
15
+ permission = FsPermission.new(mode_int)
16
+ file_names.each do |file_name|
17
+ Viking.client.set_permission(Path.new(file_name), permission)
18
+ end
19
+ file_names.size
20
+ end
21
+
22
+ def self.chown(owner_name, group_name, *file_names)
23
+ file_names.each do |file_name|
24
+ Viking.client.set_owner(Path.new(file_name), owner_name, group_name)
25
+ end
26
+ file_names.size
27
+ end
28
+
29
+ def self.delete(*file_names)
30
+ file_names.each do |file_name|
31
+ path = Path.new(file_name)
32
+ if file?(file_name)
33
+ Viking.client.delete(Path.new(file_name), false)
34
+ else
35
+ raise IOError, "File::delete can only delete files. Attempted to delete directory #{file_name}."
36
+ end
37
+ end
38
+ file_names.size
39
+ end
40
+
41
+ def self.directory?(file_name)
42
+ Viking.client.is_directory(Path.new(file_name))
43
+ end
44
+
45
+ def self.exist?(file_name)
46
+ exists?(file_name)
47
+ end
48
+
49
+ def self.exists?(file_name)
50
+ Viking.client.exists(Path.new(file_name))
51
+ end
52
+
53
+ def self.file?(file_name)
54
+ Viking.client.is_file(Path.new(file_name))
55
+ end
56
+
57
+ def self.ftype(file_name)
58
+ directory?(file_name) ? 'directory' : 'file'
59
+ end
60
+
61
+ def self.move(old_name, new_name)
62
+ rename(old_name, new_name)
63
+ end
64
+
65
+ def self.open(file_name, &block)
66
+ file = Viking::File.new(file_name)
67
+ if block
68
+ value = yield file
69
+ file.close unless file.closed?
70
+ value
71
+ else
72
+ file
73
+ end
74
+ end
75
+
76
+ def self.rename(old_name, new_name)
77
+ Viking.client.rename(Path.new(old_name), Path.new(new_name))
78
+ end
79
+
80
+ def self.size(file_name)
81
+ Viking.client.get_file_status(Path.new(file_name)).get_len
82
+ end
83
+
84
+ def self.size?(file_name)
85
+ exists?(file_name) ? size(file_name) : nil
86
+ end
87
+
88
+ def self.split(file_name)
89
+ name = basename(file_name)
90
+ path = file_name.sub(/\/#{name}$/,'')
91
+ [path, name]
92
+ end
93
+
94
+ def initialize(file_name)
95
+ @path = file_name
96
+ @reading = false
97
+ @writting = false
98
+ @closed = false
99
+ end
100
+
101
+ def path
102
+ @path
103
+ end
104
+
105
+ def size
106
+ Viking.client.get_file_status(Path.new(path)).get_len
107
+ end
108
+
109
+ def close
110
+ unless closed?
111
+ reader.close if @reading
112
+ writter.close if @writting
113
+
114
+ @reading = false
115
+ @writting = false
116
+
117
+ @closed = true
118
+ end
119
+ end
120
+
121
+ def closed?
122
+ @closed
123
+ end
124
+
125
+ def each_line(sep="\n", limit=nil)
126
+ while((line = gets(sep, limit)) != nil) do
127
+ yield line
128
+ end
129
+ close
130
+ end
131
+
132
+ def each_char
133
+ while(char = getc) do
134
+ yield char
135
+ end
136
+ close
137
+ end
138
+
139
+ def eof
140
+ eof?
141
+ end
142
+
143
+ def eof?
144
+ current_byte.nil?
145
+ end
146
+
147
+ def getc
148
+ byte = current_byte
149
+ next_byte
150
+ byte
151
+ end
152
+
153
+ def gets(sep=nil, limit=nil)
154
+ sep_bytes = sep.bytes.to_a if sep
155
+ bytes = []
156
+ while(b = getc) do
157
+ bytes << b
158
+ break if sep && bytes.last(sep_bytes.size) == sep_bytes
159
+ break if limit && bytes.size == limit
160
+ end
161
+ bytes.empty? ? nil : bytes.pack("C*")
162
+ end
163
+
164
+ def putc(obj)
165
+ if obj.is_a? Numeric
166
+ writter.java_send :write, [Java::int], obj
167
+ else
168
+ byte = obj.to_s.bytes.first
169
+ writter.write(byte)
170
+ end
171
+ end
172
+
173
+ def puts(*objs)
174
+ separator = "\n"
175
+ string = objs.reduce("") do |acc, obj|
176
+ if obj.end_with?(separator)
177
+ acc << obj
178
+ else
179
+ acc << obj
180
+ acc << separator
181
+ end
182
+ end
183
+ write(string)
184
+ end
185
+
186
+ def read(limit=nil)
187
+ gets(nil, limit)
188
+ end
189
+
190
+ def write(string)
191
+ writter.write_bytes(string)
192
+ end
193
+
194
+ private
195
+
196
+ def parse_byte(b)
197
+ b == -1 ? nil : b
198
+ end
199
+
200
+ def next_byte
201
+ b = reader.read
202
+ @b = parse_byte(b)
203
+ end
204
+
205
+ def current_byte
206
+ next_byte unless @reading
207
+ @b
208
+ end
209
+
210
+ def reader
211
+ @reader ||= begin
212
+ @reading = true
213
+ Viking.client.open(Path.new(path))
214
+ end
215
+ end
216
+
217
+ def writter
218
+ @writter ||= begin
219
+ @writting = true
220
+ Viking.client.create(Path.new(path))
221
+ end
222
+ end
223
+ end
224
+ end