embulk-output-bigquery 0.4.14 → 0.6.3
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +5 -5
- data/CHANGELOG.md +28 -0
- data/README.md +74 -77
- data/embulk-output-bigquery.gemspec +10 -3
- data/lib/embulk/output/bigquery.rb +19 -49
- data/lib/embulk/output/bigquery/auth.rb +35 -0
- data/lib/embulk/output/bigquery/bigquery_client.rb +2 -11
- data/lib/embulk/output/bigquery/google_client.rb +3 -34
- data/lib/embulk/output/bigquery/value_converter_factory.rb +12 -0
- data/test/test_bigquery_client.rb +1 -5
- data/test/test_configure.rb +10 -19
- data/test/test_example.rb +0 -1
- data/test/test_helper.rb +4 -1
- data/test/test_transaction.rb +22 -62
- data/test/test_value_converter_factory.rb +42 -0
- metadata +29 -52
- data/example/config_append_direct_schema_update_options.yml +0 -31
- data/example/config_client_options.yml +0 -33
- data/example/config_csv.yml +0 -30
- data/example/config_delete_in_advance.yml +0 -29
- data/example/config_delete_in_advance_field_partitioned_table.yml +0 -33
- data/example/config_delete_in_advance_partitioned_table.yml +0 -33
- data/example/config_expose_errors.yml +0 -30
- data/example/config_gcs.yml +0 -32
- data/example/config_guess_from_embulk_schema.yml +0 -29
- data/example/config_guess_with_column_options.yml +0 -40
- data/example/config_gzip.yml +0 -1
- data/example/config_jsonl.yml +0 -1
- data/example/config_max_threads.yml +0 -34
- data/example/config_min_ouput_tasks.yml +0 -34
- data/example/config_mode_append.yml +0 -30
- data/example/config_mode_append_direct.yml +0 -30
- data/example/config_nested_record.yml +0 -1
- data/example/config_payload_column.yml +0 -20
- data/example/config_payload_column_index.yml +0 -20
- data/example/config_prevent_duplicate_insert.yml +0 -30
- data/example/config_progress_log_interval.yml +0 -31
- data/example/config_replace.yml +0 -30
- data/example/config_replace_backup.yml +0 -32
- data/example/config_replace_backup_field_partitioned_table.yml +0 -34
- data/example/config_replace_backup_partitioned_table.yml +0 -34
- data/example/config_replace_field_partitioned_table.yml +0 -33
- data/example/config_replace_partitioned_table.yml +0 -33
- data/example/config_replace_schema_update_options.yml +0 -33
- data/example/config_skip_file_generation.yml +0 -32
- data/example/config_table_strftime.yml +0 -30
- data/example/config_template_table.yml +0 -21
- data/example/config_uncompressed.yml +0 -1
- data/example/config_with_rehearsal.yml +0 -33
- data/example/example.csv +0 -17
- data/example/example.yml +0 -1
- data/example/example2_1.csv +0 -1
- data/example/example2_2.csv +0 -1
- data/example/example4_1.csv +0 -1
- data/example/example4_2.csv +0 -1
- data/example/example4_3.csv +0 -1
- data/example/example4_4.csv +0 -1
- data/example/json_key.json +0 -12
- data/example/nested_example.jsonl +0 -16
- data/example/schema.json +0 -30
- data/example/schema_expose_errors.json +0 -30
@@ -90,6 +90,10 @@ module Embulk
|
|
90
90
|
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'TIMESTAMP').create_converter }
|
91
91
|
end
|
92
92
|
|
93
|
+
def test_date
|
94
|
+
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'DATE').create_converter }
|
95
|
+
end
|
96
|
+
|
93
97
|
def test_record
|
94
98
|
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'RECORD').create_converter }
|
95
99
|
end
|
@@ -130,6 +134,10 @@ module Embulk
|
|
130
134
|
assert_equal 1408452095, converter.call(1408452095)
|
131
135
|
end
|
132
136
|
|
137
|
+
def test_date
|
138
|
+
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'DATE').create_converter }
|
139
|
+
end
|
140
|
+
|
133
141
|
def test_record
|
134
142
|
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'RECORD').create_converter }
|
135
143
|
end
|
@@ -166,6 +174,10 @@ module Embulk
|
|
166
174
|
assert_equal 1408452095.188766, converter.call(1408452095.188766)
|
167
175
|
end
|
168
176
|
|
177
|
+
def test_date
|
178
|
+
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'DATE').create_converter }
|
179
|
+
end
|
180
|
+
|
169
181
|
def test_record
|
170
182
|
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'RECORD').create_converter }
|
171
183
|
end
|
@@ -216,6 +228,14 @@ module Embulk
|
|
216
228
|
assert_equal "2016-02-26 00:00:00", converter.call("2016-02-26 00:00:00")
|
217
229
|
end
|
218
230
|
|
231
|
+
def test_date
|
232
|
+
converter = ValueConverterFactory.new(SCHEMA_TYPE, 'DATE').create_converter
|
233
|
+
assert_equal nil, converter.call(nil)
|
234
|
+
assert_equal "2016-02-26", converter.call("2016-02-26")
|
235
|
+
assert_equal "2016-02-26", converter.call("2016-02-26 00:00:00")
|
236
|
+
assert_raise { converter.call('foo') }
|
237
|
+
end
|
238
|
+
|
219
239
|
def test_record
|
220
240
|
converter = ValueConverterFactory.new(SCHEMA_TYPE, 'RECORD').create_converter
|
221
241
|
assert_equal({'foo'=>'foo'}, converter.call(%Q[{"foo":"foo"}]))
|
@@ -268,6 +288,24 @@ module Embulk
|
|
268
288
|
assert_equal expected, converter.call(Time.at(subject).utc)
|
269
289
|
end
|
270
290
|
|
291
|
+
def test_date
|
292
|
+
converter = ValueConverterFactory.new(SCHEMA_TYPE, 'DATE').create_converter
|
293
|
+
assert_equal nil, converter.call(nil)
|
294
|
+
timestamp = Time.parse("2016-02-26 00:00:00.500000 +00:00")
|
295
|
+
expected = "2016-02-26"
|
296
|
+
assert_equal expected, converter.call(timestamp)
|
297
|
+
|
298
|
+
converter = ValueConverterFactory.new(
|
299
|
+
SCHEMA_TYPE, 'DATE', timezone: 'Asia/Tokyo'
|
300
|
+
).create_converter
|
301
|
+
assert_equal nil, converter.call(nil)
|
302
|
+
timestamp = Time.parse("2016-02-25 15:00:00.500000 +00:00")
|
303
|
+
expected = "2016-02-26"
|
304
|
+
assert_equal expected, converter.call(timestamp)
|
305
|
+
|
306
|
+
assert_raise { converter.call('foo') }
|
307
|
+
end
|
308
|
+
|
271
309
|
def test_record
|
272
310
|
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'RECORD').create_converter }
|
273
311
|
end
|
@@ -298,6 +336,10 @@ module Embulk
|
|
298
336
|
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'TIMESTAMP').create_converter }
|
299
337
|
end
|
300
338
|
|
339
|
+
def test_date
|
340
|
+
assert_raise { ValueConverterFactory.new(SCHEMA_TYPE, 'DATE').create_converter }
|
341
|
+
end
|
342
|
+
|
301
343
|
def test_record
|
302
344
|
converter = ValueConverterFactory.new(SCHEMA_TYPE, 'RECORD').create_converter
|
303
345
|
assert_equal nil, converter.call(nil)
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: embulk-output-bigquery
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.
|
4
|
+
version: 0.6.3
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Satoshi Akama
|
@@ -9,22 +9,42 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date: 2019-
|
12
|
+
date: 2019-10-28 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
requirement: !ruby/object:Gem::Requirement
|
16
16
|
requirements:
|
17
|
-
- - "
|
17
|
+
- - "~>"
|
18
18
|
- !ruby/object:Gem::Version
|
19
|
-
version: '0'
|
19
|
+
version: '0.7'
|
20
|
+
- - "<"
|
21
|
+
- !ruby/object:Gem::Version
|
22
|
+
version: 0.12.0
|
23
|
+
name: signet
|
24
|
+
prerelease: false
|
25
|
+
type: :runtime
|
26
|
+
version_requirements: !ruby/object:Gem::Requirement
|
27
|
+
requirements:
|
28
|
+
- - "~>"
|
29
|
+
- !ruby/object:Gem::Version
|
30
|
+
version: '0.7'
|
31
|
+
- - "<"
|
32
|
+
- !ruby/object:Gem::Version
|
33
|
+
version: 0.12.0
|
34
|
+
- !ruby/object:Gem::Dependency
|
35
|
+
requirement: !ruby/object:Gem::Requirement
|
36
|
+
requirements:
|
37
|
+
- - "<"
|
38
|
+
- !ruby/object:Gem::Version
|
39
|
+
version: 0.33.0
|
20
40
|
name: google-api-client
|
21
41
|
prerelease: false
|
22
42
|
type: :runtime
|
23
43
|
version_requirements: !ruby/object:Gem::Requirement
|
24
44
|
requirements:
|
25
|
-
- - "
|
45
|
+
- - "<"
|
26
46
|
- !ruby/object:Gem::Version
|
27
|
-
version:
|
47
|
+
version: 0.33.0
|
28
48
|
- !ruby/object:Gem::Dependency
|
29
49
|
requirement: !ruby/object:Gem::Requirement
|
30
50
|
requirements:
|
@@ -83,52 +103,8 @@ files:
|
|
83
103
|
- README.md
|
84
104
|
- Rakefile
|
85
105
|
- embulk-output-bigquery.gemspec
|
86
|
-
- example/config_append_direct_schema_update_options.yml
|
87
|
-
- example/config_client_options.yml
|
88
|
-
- example/config_csv.yml
|
89
|
-
- example/config_delete_in_advance.yml
|
90
|
-
- example/config_delete_in_advance_field_partitioned_table.yml
|
91
|
-
- example/config_delete_in_advance_partitioned_table.yml
|
92
|
-
- example/config_expose_errors.yml
|
93
|
-
- example/config_gcs.yml
|
94
|
-
- example/config_guess_from_embulk_schema.yml
|
95
|
-
- example/config_guess_with_column_options.yml
|
96
|
-
- example/config_gzip.yml
|
97
|
-
- example/config_jsonl.yml
|
98
|
-
- example/config_max_threads.yml
|
99
|
-
- example/config_min_ouput_tasks.yml
|
100
|
-
- example/config_mode_append.yml
|
101
|
-
- example/config_mode_append_direct.yml
|
102
|
-
- example/config_nested_record.yml
|
103
|
-
- example/config_payload_column.yml
|
104
|
-
- example/config_payload_column_index.yml
|
105
|
-
- example/config_prevent_duplicate_insert.yml
|
106
|
-
- example/config_progress_log_interval.yml
|
107
|
-
- example/config_replace.yml
|
108
|
-
- example/config_replace_backup.yml
|
109
|
-
- example/config_replace_backup_field_partitioned_table.yml
|
110
|
-
- example/config_replace_backup_partitioned_table.yml
|
111
|
-
- example/config_replace_field_partitioned_table.yml
|
112
|
-
- example/config_replace_partitioned_table.yml
|
113
|
-
- example/config_replace_schema_update_options.yml
|
114
|
-
- example/config_skip_file_generation.yml
|
115
|
-
- example/config_table_strftime.yml
|
116
|
-
- example/config_template_table.yml
|
117
|
-
- example/config_uncompressed.yml
|
118
|
-
- example/config_with_rehearsal.yml
|
119
|
-
- example/example.csv
|
120
|
-
- example/example.yml
|
121
|
-
- example/example2_1.csv
|
122
|
-
- example/example2_2.csv
|
123
|
-
- example/example4_1.csv
|
124
|
-
- example/example4_2.csv
|
125
|
-
- example/example4_3.csv
|
126
|
-
- example/example4_4.csv
|
127
|
-
- example/json_key.json
|
128
|
-
- example/nested_example.jsonl
|
129
|
-
- example/schema.json
|
130
|
-
- example/schema_expose_errors.json
|
131
106
|
- lib/embulk/output/bigquery.rb
|
107
|
+
- lib/embulk/output/bigquery/auth.rb
|
132
108
|
- lib/embulk/output/bigquery/bigquery_client.rb
|
133
109
|
- lib/embulk/output/bigquery/file_writer.rb
|
134
110
|
- lib/embulk/output/bigquery/gcs_client.rb
|
@@ -162,7 +138,8 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
162
138
|
- !ruby/object:Gem::Version
|
163
139
|
version: '0'
|
164
140
|
requirements: []
|
165
|
-
|
141
|
+
rubyforge_project:
|
142
|
+
rubygems_version: 2.6.14.1
|
166
143
|
signing_key:
|
167
144
|
specification_version: 4
|
168
145
|
summary: Google BigQuery output plugin for Embulk
|
@@ -1,31 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: append_direct
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_table_name
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
compression: NONE
|
28
|
-
auto_create_dataset: true
|
29
|
-
auto_create_table: true
|
30
|
-
schema_file: example/schema.json
|
31
|
-
schema_update_options: [ALLOW_FIELD_ADDITION, ALLOW_FIELD_RELAXATION]
|
@@ -1,33 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: replace
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_table_name
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
auto_create_dataset: true
|
28
|
-
auto_create_table: true
|
29
|
-
schema_file: example/schema.json
|
30
|
-
timeout_sec: 400
|
31
|
-
open_timeout_sec: 400
|
32
|
-
retries: 2
|
33
|
-
application_name: "Embulk BigQuery plugin test"
|
data/example/config_csv.yml
DELETED
@@ -1,30 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: replace
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_table_name
|
26
|
-
source_format: CSV
|
27
|
-
compression: GZIP
|
28
|
-
auto_create_dataset: true
|
29
|
-
auto_create_table: true
|
30
|
-
schema_file: example/schema.json
|
@@ -1,29 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: delete_in_advance
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_table_name
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
auto_create_dataset: true
|
28
|
-
auto_create_table: true
|
29
|
-
schema_file: example/schema.json
|
@@ -1,33 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: delete_in_advance
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_field_partitioned_table_name
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
compression: NONE
|
28
|
-
auto_create_dataset: true
|
29
|
-
auto_create_table: true
|
30
|
-
schema_file: example/schema.json
|
31
|
-
time_partitioning:
|
32
|
-
type: 'DAY'
|
33
|
-
field: timestamp
|
@@ -1,33 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: delete_in_advance
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_partitioned_table_name$20160929
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
compression: NONE
|
28
|
-
auto_create_dataset: true
|
29
|
-
auto_create_table: true
|
30
|
-
schema_file: example/schema.json
|
31
|
-
time_partitioning:
|
32
|
-
type: 'DAY'
|
33
|
-
expiration_ms: 100
|
@@ -1,30 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: replace
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_table_name
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
compression: NONE
|
28
|
-
auto_create_dataset: true
|
29
|
-
auto_create_table: true
|
30
|
-
schema_file: example/schema_expose_errors.json
|
data/example/config_gcs.yml
DELETED
@@ -1,32 +0,0 @@
|
|
1
|
-
in:
|
2
|
-
type: file
|
3
|
-
path_prefix: example/example.csv
|
4
|
-
parser:
|
5
|
-
type: csv
|
6
|
-
charset: UTF-8
|
7
|
-
newline: CRLF
|
8
|
-
null_string: 'NULL'
|
9
|
-
skip_header_lines: 1
|
10
|
-
comment_line_marker: '#'
|
11
|
-
columns:
|
12
|
-
- {name: date, type: string}
|
13
|
-
- {name: timestamp, type: timestamp, format: "%Y-%m-%d %H:%M:%S.%N", timezone: "+09:00"}
|
14
|
-
- {name: "null", type: string}
|
15
|
-
- {name: long, type: long}
|
16
|
-
- {name: string, type: string}
|
17
|
-
- {name: double, type: double}
|
18
|
-
- {name: boolean, type: boolean}
|
19
|
-
out:
|
20
|
-
type: bigquery
|
21
|
-
mode: replace
|
22
|
-
auth_method: json_key
|
23
|
-
json_keyfile: example/your-project-000.json
|
24
|
-
dataset: your_dataset_name
|
25
|
-
table: your_table_name
|
26
|
-
source_format: NEWLINE_DELIMITED_JSON
|
27
|
-
compression: GZIP
|
28
|
-
auto_create_dataset: true
|
29
|
-
auto_create_table: true
|
30
|
-
schema_file: example/schema.json
|
31
|
-
gcs_bucket: your_bucket_name
|
32
|
-
auto_create_gcs_bucket: true
|