embulk-input-filesplit 0.1.3 → 0.1.4
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/README.md +41 -40
- data/build.gradle +64 -64
- data/classpath/embulk-input-filesplit-0.1.4.jar +0 -0
- data/lib/embulk/input/filesplit.rb +3 -3
- data/src/main/java/org/embulk/input/filesplit/LocalFileSplitInputPlugin.java +300 -187
- data/src/test/java/org/embulk/input/filesplit/EmbulkPluginTester.java +70 -70
- data/src/test/java/org/embulk/input/filesplit/LocalFileSplitInputPluginTest.java +129 -94
- data/src/test/java/org/embulk/input/filesplit/LocalFileSplitInputTest.java +78 -78
- data/src/test/java/org/embulk/input/filesplit/PartialFileInputStreamTest.java +570 -570
- data/src/test/resources/data/sub1/test1.csv +1 -0
- data/src/test/resources/data/sub1/test2.csv +3 -0
- data/src/test/resources/data/sub2/test1.csv +1 -0
- data/src/test/resources/data/sub2/test2.csv +3 -0
- data/src/test/resources/data/sub2/x.csv +1 -0
- data/src/test/resources/data/test-header.csv +5 -5
- data/src/test/resources/data/test-semicolon.csv +4 -4
- data/src/test/resources/data/test.csv +4 -4
- data/src/test/resources/yml/test-error1.yml +22 -0
- data/src/test/resources/yml/test-error2.yml +24 -0
- data/src/test/resources/yml/test-header.yml +24 -24
- data/src/test/resources/yml/test-only-header.yml +24 -24
- data/src/test/resources/yml/test-path_prefix-directory.yml +23 -0
- data/src/test/resources/yml/test-path_prefix-files.yml +23 -0
- data/src/test/resources/yml/test-tasks.yml +23 -23
- data/src/test/resources/yml/test.yml +22 -22
- metadata +15 -6
- data/classpath/embulk-input-filesplit-0.1.3.jar +0 -0
@@ -0,0 +1 @@
|
|
1
|
+
1,aaaaa,12345
|
@@ -0,0 +1 @@
|
|
1
|
+
1,aaaaa,12345
|
@@ -0,0 +1 @@
|
|
1
|
+
5,xxx,0
|
@@ -1,5 +1,5 @@
|
|
1
|
-
id,name,value
|
2
|
-
1,aaaaa,12345
|
3
|
-
2,bbb,67890
|
4
|
-
3,ccccccccc,-1
|
5
|
-
4,dd,555555
|
1
|
+
id,name,value
|
2
|
+
1,aaaaa,12345
|
3
|
+
2,bbb,67890
|
4
|
+
3,ccccccccc,-1
|
5
|
+
4,dd,555555
|
@@ -1,4 +1,4 @@
|
|
1
|
-
1;aaaaa;12345
|
2
|
-
2;bbb;67890
|
3
|
-
3;ccccccccc;-1
|
4
|
-
4;dd;555555
|
1
|
+
1;aaaaa;12345
|
2
|
+
2;bbb;67890
|
3
|
+
3;ccccccccc;-1
|
4
|
+
4;dd;555555
|
@@ -1,4 +1,4 @@
|
|
1
|
-
1,aaaaa,12345
|
2
|
-
2,bbb,67890
|
3
|
-
3,ccccccccc,-1
|
4
|
-
4,dd,555555
|
1
|
+
1,aaaaa,12345
|
2
|
+
2,bbb,67890
|
3
|
+
3,ccccccccc,-1
|
4
|
+
4,dd,555555
|
@@ -0,0 +1,22 @@
|
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
parser:
|
4
|
+
charset: UTF-8
|
5
|
+
newline: CRLF
|
6
|
+
type: csv
|
7
|
+
delimiter: ','
|
8
|
+
quote: ''
|
9
|
+
columns:
|
10
|
+
- {name: id, type: long}
|
11
|
+
- {name: name, type: string}
|
12
|
+
- {name: value, type: long}
|
13
|
+
out:
|
14
|
+
type: file
|
15
|
+
path_prefix: 'temp/result'
|
16
|
+
file_ext: .csv
|
17
|
+
formatter:
|
18
|
+
type: csv
|
19
|
+
delimiter: ';'
|
20
|
+
header_line: false
|
21
|
+
charset: UTF-8
|
22
|
+
newline: CRLF
|
@@ -0,0 +1,24 @@
|
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path: 'data/test.csv'
|
4
|
+
path_prefix: 'data/sub1'
|
5
|
+
parser:
|
6
|
+
charset: UTF-8
|
7
|
+
newline: CRLF
|
8
|
+
type: csv
|
9
|
+
delimiter: ','
|
10
|
+
quote: ''
|
11
|
+
columns:
|
12
|
+
- {name: id, type: long}
|
13
|
+
- {name: name, type: string}
|
14
|
+
- {name: value, type: long}
|
15
|
+
out:
|
16
|
+
type: file
|
17
|
+
path_prefix: 'temp/result'
|
18
|
+
file_ext: .csv
|
19
|
+
formatter:
|
20
|
+
type: csv
|
21
|
+
delimiter: ';'
|
22
|
+
header_line: false
|
23
|
+
charset: UTF-8
|
24
|
+
newline: CRLF
|
@@ -1,25 +1,25 @@
|
|
1
|
-
in:
|
2
|
-
type: filesplit
|
3
|
-
path: 'data/test-header.csv'
|
4
|
-
header_line: true
|
5
|
-
parser:
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
type: csv
|
9
|
-
header_line: true
|
10
|
-
delimiter: ','
|
11
|
-
quote: ''
|
12
|
-
columns:
|
13
|
-
- {name: id, type: long}
|
14
|
-
- {name: name, type: string}
|
15
|
-
- {name: value, type: long}
|
16
|
-
out:
|
17
|
-
type: file
|
18
|
-
path_prefix: 'temp/result'
|
19
|
-
file_ext: .csv
|
20
|
-
formatter:
|
21
|
-
type: csv
|
22
|
-
delimiter: ';'
|
23
|
-
header_line: false
|
24
|
-
charset: UTF-8
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path: 'data/test-header.csv'
|
4
|
+
header_line: true
|
5
|
+
parser:
|
6
|
+
charset: UTF-8
|
7
|
+
newline: CRLF
|
8
|
+
type: csv
|
9
|
+
header_line: true
|
10
|
+
delimiter: ','
|
11
|
+
quote: ''
|
12
|
+
columns:
|
13
|
+
- {name: id, type: long}
|
14
|
+
- {name: name, type: string}
|
15
|
+
- {name: value, type: long}
|
16
|
+
out:
|
17
|
+
type: file
|
18
|
+
path_prefix: 'temp/result'
|
19
|
+
file_ext: .csv
|
20
|
+
formatter:
|
21
|
+
type: csv
|
22
|
+
delimiter: ';'
|
23
|
+
header_line: false
|
24
|
+
charset: UTF-8
|
25
25
|
newline: CRLF
|
@@ -1,25 +1,25 @@
|
|
1
|
-
in:
|
2
|
-
type: filesplit
|
3
|
-
path: 'data/test-only-header.csv'
|
4
|
-
header_line: true
|
5
|
-
parser:
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
type: csv
|
9
|
-
header_line: true
|
10
|
-
delimiter: ','
|
11
|
-
quote: ''
|
12
|
-
columns:
|
13
|
-
- {name: id, type: long}
|
14
|
-
- {name: name, type: string}
|
15
|
-
- {name: value, type: long}
|
16
|
-
out:
|
17
|
-
type: file
|
18
|
-
path_prefix: 'temp/result'
|
19
|
-
file_ext: .csv
|
20
|
-
formatter:
|
21
|
-
type: csv
|
22
|
-
delimiter: ';'
|
23
|
-
header_line: false
|
24
|
-
charset: UTF-8
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path: 'data/test-only-header.csv'
|
4
|
+
header_line: true
|
5
|
+
parser:
|
6
|
+
charset: UTF-8
|
7
|
+
newline: CRLF
|
8
|
+
type: csv
|
9
|
+
header_line: true
|
10
|
+
delimiter: ','
|
11
|
+
quote: ''
|
12
|
+
columns:
|
13
|
+
- {name: id, type: long}
|
14
|
+
- {name: name, type: string}
|
15
|
+
- {name: value, type: long}
|
16
|
+
out:
|
17
|
+
type: file
|
18
|
+
path_prefix: 'temp/result'
|
19
|
+
file_ext: .csv
|
20
|
+
formatter:
|
21
|
+
type: csv
|
22
|
+
delimiter: ';'
|
23
|
+
header_line: false
|
24
|
+
charset: UTF-8
|
25
25
|
newline: CRLF
|
@@ -0,0 +1,23 @@
|
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path_prefix: 'data/sub1'
|
4
|
+
parser:
|
5
|
+
charset: UTF-8
|
6
|
+
newline: CRLF
|
7
|
+
type: csv
|
8
|
+
delimiter: ','
|
9
|
+
quote: ''
|
10
|
+
columns:
|
11
|
+
- {name: id, type: long}
|
12
|
+
- {name: name, type: string}
|
13
|
+
- {name: value, type: long}
|
14
|
+
out:
|
15
|
+
type: file
|
16
|
+
path_prefix: 'temp/result'
|
17
|
+
file_ext: .csv
|
18
|
+
formatter:
|
19
|
+
type: csv
|
20
|
+
delimiter: ','
|
21
|
+
header_line: false
|
22
|
+
charset: UTF-8
|
23
|
+
newline: CRLF
|
@@ -0,0 +1,23 @@
|
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path_prefix: 'data/sub2/test'
|
4
|
+
parser:
|
5
|
+
charset: UTF-8
|
6
|
+
newline: CRLF
|
7
|
+
type: csv
|
8
|
+
delimiter: ','
|
9
|
+
quote: ''
|
10
|
+
columns:
|
11
|
+
- {name: id, type: long}
|
12
|
+
- {name: name, type: string}
|
13
|
+
- {name: value, type: long}
|
14
|
+
out:
|
15
|
+
type: file
|
16
|
+
path_prefix: 'temp/result'
|
17
|
+
file_ext: .csv
|
18
|
+
formatter:
|
19
|
+
type: csv
|
20
|
+
delimiter: ','
|
21
|
+
header_line: false
|
22
|
+
charset: UTF-8
|
23
|
+
newline: CRLF
|
@@ -1,24 +1,24 @@
|
|
1
|
-
in:
|
2
|
-
type: filesplit
|
3
|
-
path: 'data/test.csv'
|
4
|
-
tasks: 3
|
5
|
-
parser:
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
type: csv
|
9
|
-
delimiter: ','
|
10
|
-
quote: ''
|
11
|
-
columns:
|
12
|
-
- {name: id, type: long}
|
13
|
-
- {name: name, type: string}
|
14
|
-
- {name: value, type: long}
|
15
|
-
out:
|
16
|
-
type: file
|
17
|
-
path_prefix: 'temp/result'
|
18
|
-
file_ext: .csv
|
19
|
-
formatter:
|
20
|
-
type: csv
|
21
|
-
delimiter: ';'
|
22
|
-
header_line: false
|
23
|
-
charset: UTF-8
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path: 'data/test.csv'
|
4
|
+
tasks: 3
|
5
|
+
parser:
|
6
|
+
charset: UTF-8
|
7
|
+
newline: CRLF
|
8
|
+
type: csv
|
9
|
+
delimiter: ','
|
10
|
+
quote: ''
|
11
|
+
columns:
|
12
|
+
- {name: id, type: long}
|
13
|
+
- {name: name, type: string}
|
14
|
+
- {name: value, type: long}
|
15
|
+
out:
|
16
|
+
type: file
|
17
|
+
path_prefix: 'temp/result'
|
18
|
+
file_ext: .csv
|
19
|
+
formatter:
|
20
|
+
type: csv
|
21
|
+
delimiter: ';'
|
22
|
+
header_line: false
|
23
|
+
charset: UTF-8
|
24
24
|
newline: CRLF
|
@@ -1,23 +1,23 @@
|
|
1
|
-
in:
|
2
|
-
type: filesplit
|
3
|
-
path: 'data/test.csv'
|
4
|
-
parser:
|
5
|
-
charset: UTF-8
|
6
|
-
newline: CRLF
|
7
|
-
type: csv
|
8
|
-
delimiter: ','
|
9
|
-
quote: ''
|
10
|
-
columns:
|
11
|
-
- {name: id, type: long}
|
12
|
-
- {name: name, type: string}
|
13
|
-
- {name: value, type: long}
|
14
|
-
out:
|
15
|
-
type: file
|
16
|
-
path_prefix: 'temp/result'
|
17
|
-
file_ext: .csv
|
18
|
-
formatter:
|
19
|
-
type: csv
|
20
|
-
delimiter: ';'
|
21
|
-
header_line: false
|
22
|
-
charset: UTF-8
|
1
|
+
in:
|
2
|
+
type: filesplit
|
3
|
+
path: 'data/test.csv'
|
4
|
+
parser:
|
5
|
+
charset: UTF-8
|
6
|
+
newline: CRLF
|
7
|
+
type: csv
|
8
|
+
delimiter: ','
|
9
|
+
quote: ''
|
10
|
+
columns:
|
11
|
+
- {name: id, type: long}
|
12
|
+
- {name: name, type: string}
|
13
|
+
- {name: value, type: long}
|
14
|
+
out:
|
15
|
+
type: file
|
16
|
+
path_prefix: 'temp/result'
|
17
|
+
file_ext: .csv
|
18
|
+
formatter:
|
19
|
+
type: csv
|
20
|
+
delimiter: ';'
|
21
|
+
header_line: false
|
22
|
+
charset: UTF-8
|
23
23
|
newline: CRLF
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: embulk-input-filesplit
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.
|
4
|
+
version: 0.1.4
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Hitoshi Tanaka
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2017-09-13 00:00:00.000000000 Z
|
12
12
|
dependencies: []
|
13
13
|
description:
|
14
14
|
email:
|
@@ -18,6 +18,7 @@ extra_rdoc_files: []
|
|
18
18
|
files:
|
19
19
|
- README.md
|
20
20
|
- build.gradle
|
21
|
+
- classpath/embulk-input-filesplit-0.1.4.jar
|
21
22
|
- lib/embulk/input/filesplit.rb
|
22
23
|
- src/main/java/org/embulk/input/filesplit/LocalFileSplitInputPlugin.java
|
23
24
|
- src/main/java/org/embulk/input/filesplit/PartialFile.java
|
@@ -27,16 +28,24 @@ files:
|
|
27
28
|
- src/test/java/org/embulk/input/filesplit/LocalFileSplitInputTest.java
|
28
29
|
- src/test/java/org/embulk/input/filesplit/PartialFileInputStreamTest.java
|
29
30
|
- src/test/resources/data/empty.csv
|
31
|
+
- src/test/resources/data/sub1/test1.csv
|
32
|
+
- src/test/resources/data/sub1/test2.csv
|
33
|
+
- src/test/resources/data/sub2/test1.csv
|
34
|
+
- src/test/resources/data/sub2/test2.csv
|
35
|
+
- src/test/resources/data/sub2/x.csv
|
30
36
|
- src/test/resources/data/test-header.csv
|
31
37
|
- src/test/resources/data/test-only-header.csv
|
32
38
|
- src/test/resources/data/test-semicolon.csv
|
33
39
|
- src/test/resources/data/test.csv
|
34
40
|
- src/test/resources/resource.txt
|
41
|
+
- src/test/resources/yml/test-error1.yml
|
42
|
+
- src/test/resources/yml/test-error2.yml
|
35
43
|
- src/test/resources/yml/test-header.yml
|
36
44
|
- src/test/resources/yml/test-only-header.yml
|
45
|
+
- src/test/resources/yml/test-path_prefix-directory.yml
|
46
|
+
- src/test/resources/yml/test-path_prefix-files.yml
|
37
47
|
- src/test/resources/yml/test-tasks.yml
|
38
48
|
- src/test/resources/yml/test.yml
|
39
|
-
- classpath/embulk-input-filesplit-0.1.3.jar
|
40
49
|
homepage: https://github.com/hito4t/embulk-input-filesplit
|
41
50
|
licenses:
|
42
51
|
- Apache 2.0
|
@@ -47,17 +56,17 @@ require_paths:
|
|
47
56
|
- lib
|
48
57
|
required_ruby_version: !ruby/object:Gem::Requirement
|
49
58
|
requirements:
|
50
|
-
- -
|
59
|
+
- - ">="
|
51
60
|
- !ruby/object:Gem::Version
|
52
61
|
version: '0'
|
53
62
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
54
63
|
requirements:
|
55
|
-
- -
|
64
|
+
- - ">="
|
56
65
|
- !ruby/object:Gem::Version
|
57
66
|
version: '0'
|
58
67
|
requirements: []
|
59
68
|
rubyforge_project:
|
60
|
-
rubygems_version: 2.
|
69
|
+
rubygems_version: 2.4.8
|
61
70
|
signing_key:
|
62
71
|
specification_version: 4
|
63
72
|
summary: Embulk plugin for splitting input file
|
Binary file
|