embulk-output-s3_parquet 0.0.2

Sign up to get free protection for your applications and to get access to all the features.
Files changed (30) hide show
  1. checksums.yaml +7 -0
  2. data/.gitignore +12 -0
  3. data/.scalafmt.conf +9 -0
  4. data/CHANGELOG.md +9 -0
  5. data/LICENSE.txt +21 -0
  6. data/README.md +122 -0
  7. data/build.gradle +101 -0
  8. data/example/config.yml +25 -0
  9. data/example/data.tsv +5 -0
  10. data/gradle/wrapper/gradle-wrapper.jar +0 -0
  11. data/gradle/wrapper/gradle-wrapper.properties +5 -0
  12. data/gradlew +172 -0
  13. data/gradlew.bat +84 -0
  14. data/lib/embulk/output/s3_parquet.rb +3 -0
  15. data/settings.gradle +1 -0
  16. data/src/main/scala/org/embulk/output/s3_parquet/S3ParquetOutputPlugin.scala +199 -0
  17. data/src/main/scala/org/embulk/output/s3_parquet/S3ParquetPageOutput.scala +65 -0
  18. data/src/main/scala/org/embulk/output/s3_parquet/aws/Aws.scala +45 -0
  19. data/src/main/scala/org/embulk/output/s3_parquet/aws/AwsClientConfiguration.scala +34 -0
  20. data/src/main/scala/org/embulk/output/s3_parquet/aws/AwsCredentials.scala +128 -0
  21. data/src/main/scala/org/embulk/output/s3_parquet/aws/AwsEndpointConfiguration.scala +49 -0
  22. data/src/main/scala/org/embulk/output/s3_parquet/aws/AwsS3Configuration.scala +56 -0
  23. data/src/main/scala/org/embulk/output/s3_parquet/aws/HttpProxy.scala +56 -0
  24. data/src/main/scala/org/embulk/output/s3_parquet/parquet/EmbulkMessageType.scala +59 -0
  25. data/src/main/scala/org/embulk/output/s3_parquet/parquet/ParquetFileWriteSupport.scala +33 -0
  26. data/src/main/scala/org/embulk/output/s3_parquet/parquet/ParquetFileWriter.scala +125 -0
  27. data/src/test/resources/org/embulk/output/s3_parquet/in1.csv +6 -0
  28. data/src/test/resources/org/embulk/output/s3_parquet/out1.tsv +5 -0
  29. data/src/test/scala/org/embulk/output/s3_parquet/TestS3ParquetOutputPlugin.scala +140 -0
  30. metadata +184 -0
metadata ADDED
@@ -0,0 +1,184 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: embulk-output-s3_parquet
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.2
5
+ platform: ruby
6
+ authors:
7
+ - Civitaspo
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2019-01-21 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ requirement: !ruby/object:Gem::Requirement
15
+ requirements:
16
+ - - "~>"
17
+ - !ruby/object:Gem::Version
18
+ version: '1.0'
19
+ name: bundler
20
+ prerelease: false
21
+ type: :development
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '1.0'
27
+ - !ruby/object:Gem::Dependency
28
+ requirement: !ruby/object:Gem::Requirement
29
+ requirements:
30
+ - - "~>"
31
+ - !ruby/object:Gem::Version
32
+ version: '12.0'
33
+ name: rake
34
+ prerelease: false
35
+ type: :development
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '12.0'
41
+ description: Dumps records to S3 Parquet.
42
+ email:
43
+ - civitaspo@gmail.com
44
+ executables: []
45
+ extensions: []
46
+ extra_rdoc_files: []
47
+ files:
48
+ - ".gitignore"
49
+ - ".scalafmt.conf"
50
+ - CHANGELOG.md
51
+ - LICENSE.txt
52
+ - README.md
53
+ - build.gradle
54
+ - classpath/accessors-smart-1.2.jar
55
+ - classpath/activation-1.1.jar
56
+ - classpath/apacheds-i18n-2.0.0-M15.jar
57
+ - classpath/apacheds-kerberos-codec-2.0.0-M15.jar
58
+ - classpath/api-asn1-api-1.0.0-M20.jar
59
+ - classpath/api-util-1.0.0-M20.jar
60
+ - classpath/asm-3.1.jar
61
+ - classpath/asm-5.0.4.jar
62
+ - classpath/avro-1.7.7.jar
63
+ - classpath/aws-java-sdk-core-1.11.479.jar
64
+ - classpath/aws-java-sdk-kms-1.11.479.jar
65
+ - classpath/aws-java-sdk-s3-1.11.479.jar
66
+ - classpath/aws-java-sdk-sts-1.11.479.jar
67
+ - classpath/commons-beanutils-1.7.0.jar
68
+ - classpath/commons-codec-1.10.jar
69
+ - classpath/commons-collections-3.2.2.jar
70
+ - classpath/commons-compress-1.4.1.jar
71
+ - classpath/commons-configuration-1.6.jar
72
+ - classpath/commons-digester-1.8.jar
73
+ - classpath/commons-io-2.4.jar
74
+ - classpath/commons-lang-2.6.jar
75
+ - classpath/commons-logging-1.2.jar
76
+ - classpath/commons-math3-3.1.1.jar
77
+ - classpath/commons-net-3.1.jar
78
+ - classpath/commons-pool-1.6.jar
79
+ - classpath/curator-client-2.7.1.jar
80
+ - classpath/curator-framework-2.7.1.jar
81
+ - classpath/curator-recipes-2.7.1.jar
82
+ - classpath/embulk-output-s3_parquet-0.0.2.jar
83
+ - classpath/gson-2.2.4.jar
84
+ - classpath/hadoop-annotations-2.9.2.jar
85
+ - classpath/hadoop-auth-2.9.2.jar
86
+ - classpath/hadoop-common-2.9.2.jar
87
+ - classpath/htrace-core4-4.1.0-incubating.jar
88
+ - classpath/httpclient-4.5.5.jar
89
+ - classpath/httpcore-4.4.9.jar
90
+ - classpath/ion-java-1.0.2.jar
91
+ - classpath/jackson-core-asl-1.9.13.jar
92
+ - classpath/jackson-databind-2.6.7.2.jar
93
+ - classpath/jackson-dataformat-cbor-2.6.7.jar
94
+ - classpath/jackson-jaxrs-1.8.3.jar
95
+ - classpath/jackson-mapper-asl-1.9.13.jar
96
+ - classpath/jackson-xc-1.8.3.jar
97
+ - classpath/java-xmlbuilder-0.4.jar
98
+ - classpath/jaxb-api-2.2.2.jar
99
+ - classpath/jaxb-impl-2.2.3-1.jar
100
+ - classpath/jcip-annotations-1.0-1.jar
101
+ - classpath/jersey-core-1.9.jar
102
+ - classpath/jersey-json-1.9.jar
103
+ - classpath/jersey-server-1.9.jar
104
+ - classpath/jets3t-0.9.0.jar
105
+ - classpath/jettison-1.1.jar
106
+ - classpath/jetty-6.1.26.jar
107
+ - classpath/jetty-sslengine-6.1.26.jar
108
+ - classpath/jetty-util-6.1.26.jar
109
+ - classpath/jline-0.9.94.jar
110
+ - classpath/jmespath-java-1.11.479.jar
111
+ - classpath/jsch-0.1.54.jar
112
+ - classpath/json-smart-2.3.jar
113
+ - classpath/jsp-api-2.1.jar
114
+ - classpath/jsr305-3.0.0.jar
115
+ - classpath/log4j-1.2.17.jar
116
+ - classpath/netty-3.7.0.Final.jar
117
+ - classpath/nimbus-jose-jwt-4.41.1.jar
118
+ - classpath/paranamer-2.3.jar
119
+ - classpath/parquet-column-1.10.0.jar
120
+ - classpath/parquet-common-1.10.0.jar
121
+ - classpath/parquet-encoding-1.10.0.jar
122
+ - classpath/parquet-format-2.4.0.jar
123
+ - classpath/parquet-hadoop-1.10.0.jar
124
+ - classpath/parquet-jackson-1.10.0.jar
125
+ - classpath/protobuf-java-2.5.0.jar
126
+ - classpath/scala-library-2.12.8.jar
127
+ - classpath/servlet-api-2.5-20081211.jar
128
+ - classpath/servlet-api-2.5.jar
129
+ - classpath/slf4j-api-1.7.25.jar
130
+ - classpath/slf4j-log4j12-1.7.25.jar
131
+ - classpath/snappy-java-1.1.7.2.jar
132
+ - classpath/stax-api-1.0-2.jar
133
+ - classpath/stax2-api-3.1.4.jar
134
+ - classpath/woodstox-core-5.0.3.jar
135
+ - classpath/xmlenc-0.52.jar
136
+ - classpath/xz-1.0.jar
137
+ - classpath/zookeeper-3.4.6.jar
138
+ - example/config.yml
139
+ - example/data.tsv
140
+ - gradle/wrapper/gradle-wrapper.jar
141
+ - gradle/wrapper/gradle-wrapper.properties
142
+ - gradlew
143
+ - gradlew.bat
144
+ - lib/embulk/output/s3_parquet.rb
145
+ - settings.gradle
146
+ - src/main/scala/org/embulk/output/s3_parquet/S3ParquetOutputPlugin.scala
147
+ - src/main/scala/org/embulk/output/s3_parquet/S3ParquetPageOutput.scala
148
+ - src/main/scala/org/embulk/output/s3_parquet/aws/Aws.scala
149
+ - src/main/scala/org/embulk/output/s3_parquet/aws/AwsClientConfiguration.scala
150
+ - src/main/scala/org/embulk/output/s3_parquet/aws/AwsCredentials.scala
151
+ - src/main/scala/org/embulk/output/s3_parquet/aws/AwsEndpointConfiguration.scala
152
+ - src/main/scala/org/embulk/output/s3_parquet/aws/AwsS3Configuration.scala
153
+ - src/main/scala/org/embulk/output/s3_parquet/aws/HttpProxy.scala
154
+ - src/main/scala/org/embulk/output/s3_parquet/parquet/EmbulkMessageType.scala
155
+ - src/main/scala/org/embulk/output/s3_parquet/parquet/ParquetFileWriteSupport.scala
156
+ - src/main/scala/org/embulk/output/s3_parquet/parquet/ParquetFileWriter.scala
157
+ - src/test/resources/org/embulk/output/s3_parquet/in1.csv
158
+ - src/test/resources/org/embulk/output/s3_parquet/out1.tsv
159
+ - src/test/scala/org/embulk/output/s3_parquet/TestS3ParquetOutputPlugin.scala
160
+ homepage: https://github.com/civitaspo/embulk-output-s3_parquet
161
+ licenses:
162
+ - MIT
163
+ metadata: {}
164
+ post_install_message:
165
+ rdoc_options: []
166
+ require_paths:
167
+ - lib
168
+ required_ruby_version: !ruby/object:Gem::Requirement
169
+ requirements:
170
+ - - ">="
171
+ - !ruby/object:Gem::Version
172
+ version: '0'
173
+ required_rubygems_version: !ruby/object:Gem::Requirement
174
+ requirements:
175
+ - - ">="
176
+ - !ruby/object:Gem::Version
177
+ version: '0'
178
+ requirements: []
179
+ rubyforge_project:
180
+ rubygems_version: 2.6.8
181
+ signing_key:
182
+ specification_version: 4
183
+ summary: S3 Parquet output plugin for Embulk
184
+ test_files: []