embulk 0.8.38-java → 0.10.27-java

Sign up to get free protection for your applications and to get access to all the features.
Files changed (603) hide show
  1. checksums.yaml +5 -5
  2. data/Gemfile +1 -1
  3. data/LICENSE +202 -0
  4. data/embulk.gemspec +34 -33
  5. data/lib/embulk.rb +5 -61
  6. data/lib/embulk/buffer.rb +1 -2
  7. data/lib/embulk/gem_version.rb +3 -0
  8. data/lib/embulk/guess/charset.rb +2 -11
  9. data/lib/embulk/java/bootstrap.rb +0 -1
  10. data/lib/embulk/java_plugin.rb +9 -1
  11. data/lib/embulk/logger.rb +2 -1
  12. data/lib/embulk/page_builder.rb +2 -2
  13. data/lib/embulk/plugin.rb +2 -2
  14. data/lib/embulk/schema.rb +3 -4
  15. data/lib/embulk/version.rb +43 -19
  16. metadata +23 -761
  17. data/.gitignore +0 -15
  18. data/.ruby-version +0 -1
  19. data/.travis.yml +0 -28
  20. data/COPYING +0 -14
  21. data/Gemfile.lock +0 -30
  22. data/README.md +0 -229
  23. data/Rakefile +0 -26
  24. data/appveyor.yml +0 -28
  25. data/bin/embulk +0 -139
  26. data/build.gradle +0 -419
  27. data/embulk-cli/build.gradle +0 -9
  28. data/embulk-cli/src/main/bat/selfrun.bat +0 -107
  29. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkArguments.java +0 -54
  30. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkCommandLine.java +0 -227
  31. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkCommandLineException.java +0 -25
  32. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkExample.java +0 -86
  33. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkMigrate.java +0 -480
  34. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkNew.java +0 -419
  35. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkRun.java +0 -786
  36. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkSelfUpdate.java +0 -235
  37. data/embulk-cli/src/main/java/org/embulk/cli/EmbulkSubcommand.java +0 -47
  38. data/embulk-cli/src/main/java/org/embulk/cli/Main.java +0 -31
  39. data/embulk-cli/src/main/java/org/embulk/cli/parse/AbstractHelpLineDefinition.java +0 -15
  40. data/embulk-cli/src/main/java/org/embulk/cli/parse/CliHelpFormatterWithHelpMessages.java +0 -141
  41. data/embulk-cli/src/main/java/org/embulk/cli/parse/CliOptionsWithHelpMessages.java +0 -45
  42. data/embulk-cli/src/main/java/org/embulk/cli/parse/EmbulkCommandLineHelpRequired.java +0 -10
  43. data/embulk-cli/src/main/java/org/embulk/cli/parse/EmbulkCommandLineParseException.java +0 -25
  44. data/embulk-cli/src/main/java/org/embulk/cli/parse/EmbulkCommandLineParser.java +0 -187
  45. data/embulk-cli/src/main/java/org/embulk/cli/parse/HelpMessageAsCliOption.java +0 -36
  46. data/embulk-cli/src/main/java/org/embulk/cli/parse/HelpMessageLineDefinition.java +0 -20
  47. data/embulk-cli/src/main/java/org/embulk/cli/parse/OptionBehavior.java +0 -39
  48. data/embulk-cli/src/main/java/org/embulk/cli/parse/OptionDefinition.java +0 -120
  49. data/embulk-cli/src/main/sh/selfrun.sh +0 -60
  50. data/embulk-cli/src/test/java/org/embulk/cli/DummyMain.java +0 -23
  51. data/embulk-cli/src/test/java/org/embulk/cli/SelfrunTest.java +0 -296
  52. data/embulk-core/build.gradle +0 -83
  53. data/embulk-core/src/main/java/org/embulk/EmbulkEmbed.java +0 -321
  54. data/embulk-core/src/main/java/org/embulk/EmbulkRunner.java +0 -531
  55. data/embulk-core/src/main/java/org/embulk/EmbulkService.java +0 -78
  56. data/embulk-core/src/main/java/org/embulk/EmbulkSetup.java +0 -49
  57. data/embulk-core/src/main/java/org/embulk/EmbulkVersion.java +0 -109
  58. data/embulk-core/src/main/java/org/embulk/command/PreviewPrinter.java +0 -87
  59. data/embulk-core/src/main/java/org/embulk/command/TablePreviewPrinter.java +0 -107
  60. data/embulk-core/src/main/java/org/embulk/command/VerticalPreviewPrinter.java +0 -47
  61. data/embulk-core/src/main/java/org/embulk/config/CommitReport.java +0 -36
  62. data/embulk-core/src/main/java/org/embulk/config/Config.java +0 -15
  63. data/embulk-core/src/main/java/org/embulk/config/ConfigDefault.java +0 -15
  64. data/embulk-core/src/main/java/org/embulk/config/ConfigDiff.java +0 -32
  65. data/embulk-core/src/main/java/org/embulk/config/ConfigException.java +0 -26
  66. data/embulk-core/src/main/java/org/embulk/config/ConfigInject.java +0 -14
  67. data/embulk-core/src/main/java/org/embulk/config/ConfigLoader.java +0 -149
  68. data/embulk-core/src/main/java/org/embulk/config/ConfigSource.java +0 -34
  69. data/embulk-core/src/main/java/org/embulk/config/DataSource.java +0 -41
  70. data/embulk-core/src/main/java/org/embulk/config/DataSourceImpl.java +0 -243
  71. data/embulk-core/src/main/java/org/embulk/config/DataSourceSerDe.java +0 -84
  72. data/embulk-core/src/main/java/org/embulk/config/GenericTypeReference.java +0 -20
  73. data/embulk-core/src/main/java/org/embulk/config/ModelManager.java +0 -123
  74. data/embulk-core/src/main/java/org/embulk/config/Task.java +0 -10
  75. data/embulk-core/src/main/java/org/embulk/config/TaskInvocationHandler.java +0 -180
  76. data/embulk-core/src/main/java/org/embulk/config/TaskReport.java +0 -32
  77. data/embulk-core/src/main/java/org/embulk/config/TaskSerDe.java +0 -349
  78. data/embulk-core/src/main/java/org/embulk/config/TaskSource.java +0 -34
  79. data/embulk-core/src/main/java/org/embulk/config/TaskValidationException.java +0 -38
  80. data/embulk-core/src/main/java/org/embulk/config/TaskValidator.java +0 -24
  81. data/embulk-core/src/main/java/org/embulk/config/UserDataException.java +0 -4
  82. data/embulk-core/src/main/java/org/embulk/config/UserDataExceptions.java +0 -17
  83. data/embulk-core/src/main/java/org/embulk/config/YamlTagResolver.java +0 -53
  84. data/embulk-core/src/main/java/org/embulk/exec/BufferFileInputPlugin.java +0 -88
  85. data/embulk-core/src/main/java/org/embulk/exec/BulkLoader.java +0 -754
  86. data/embulk-core/src/main/java/org/embulk/exec/ConfigurableGuessInputPlugin.java +0 -9
  87. data/embulk-core/src/main/java/org/embulk/exec/ExecModule.java +0 -53
  88. data/embulk-core/src/main/java/org/embulk/exec/ExecutionInterruptedException.java +0 -10
  89. data/embulk-core/src/main/java/org/embulk/exec/ExecutionResult.java +0 -33
  90. data/embulk-core/src/main/java/org/embulk/exec/ExtensionServiceLoaderModule.java +0 -43
  91. data/embulk-core/src/main/java/org/embulk/exec/ForGuess.java +0 -16
  92. data/embulk-core/src/main/java/org/embulk/exec/ForSystemConfig.java +0 -16
  93. data/embulk-core/src/main/java/org/embulk/exec/GuessExecutor.java +0 -309
  94. data/embulk-core/src/main/java/org/embulk/exec/LocalExecutorPlugin.java +0 -563
  95. data/embulk-core/src/main/java/org/embulk/exec/LoggerProvider.java +0 -68
  96. data/embulk-core/src/main/java/org/embulk/exec/NoSampleException.java +0 -10
  97. data/embulk-core/src/main/java/org/embulk/exec/PartialExecutionException.java +0 -26
  98. data/embulk-core/src/main/java/org/embulk/exec/PooledBufferAllocator.java +0 -77
  99. data/embulk-core/src/main/java/org/embulk/exec/PreviewExecutor.java +0 -222
  100. data/embulk-core/src/main/java/org/embulk/exec/PreviewResult.java +0 -27
  101. data/embulk-core/src/main/java/org/embulk/exec/PreviewedNoticeError.java +0 -17
  102. data/embulk-core/src/main/java/org/embulk/exec/ResumeState.java +0 -100
  103. data/embulk-core/src/main/java/org/embulk/exec/SamplingParserPlugin.java +0 -215
  104. data/embulk-core/src/main/java/org/embulk/exec/SetCurrentThreadName.java +0 -22
  105. data/embulk-core/src/main/java/org/embulk/exec/SkipTransactionException.java +0 -23
  106. data/embulk-core/src/main/java/org/embulk/exec/SystemConfigModule.java +0 -24
  107. data/embulk-core/src/main/java/org/embulk/exec/TempFileAllocator.java +0 -35
  108. data/embulk-core/src/main/java/org/embulk/exec/TransactionStage.java +0 -27
  109. data/embulk-core/src/main/java/org/embulk/jruby/JRubyPluginSource.java +0 -76
  110. data/embulk-core/src/main/java/org/embulk/jruby/JRubyScriptingModule.java +0 -395
  111. data/embulk-core/src/main/java/org/embulk/plugin/BuiltinPluginSourceModule.java +0 -17
  112. data/embulk-core/src/main/java/org/embulk/plugin/DefaultPluginType.java +0 -50
  113. data/embulk-core/src/main/java/org/embulk/plugin/InjectedPluginSource.java +0 -100
  114. data/embulk-core/src/main/java/org/embulk/plugin/MavenPluginType.java +0 -112
  115. data/embulk-core/src/main/java/org/embulk/plugin/PluginClassLoader.java +0 -993
  116. data/embulk-core/src/main/java/org/embulk/plugin/PluginClassLoaderFactory.java +0 -16
  117. data/embulk-core/src/main/java/org/embulk/plugin/PluginClassLoaderModule.java +0 -102
  118. data/embulk-core/src/main/java/org/embulk/plugin/PluginManager.java +0 -78
  119. data/embulk-core/src/main/java/org/embulk/plugin/PluginSource.java +0 -49
  120. data/embulk-core/src/main/java/org/embulk/plugin/PluginSourceNotMatchException.java +0 -25
  121. data/embulk-core/src/main/java/org/embulk/plugin/PluginType.java +0 -122
  122. data/embulk-core/src/main/java/org/embulk/plugin/compat/InputPluginWrapper.java +0 -102
  123. data/embulk-core/src/main/java/org/embulk/plugin/compat/PluginWrappers.java +0 -30
  124. data/embulk-core/src/main/java/org/embulk/plugin/compat/TransactionalFileInputWrapper.java +0 -96
  125. data/embulk-core/src/main/java/org/embulk/plugin/compat/TransactionalFileOutputWrapper.java +0 -102
  126. data/embulk-core/src/main/java/org/embulk/plugin/compat/TransactionalPageOutputWrapper.java +0 -95
  127. data/embulk-core/src/main/java/org/embulk/plugin/jar/InvalidJarPluginException.java +0 -14
  128. data/embulk-core/src/main/java/org/embulk/plugin/jar/JarPluginLoader.java +0 -232
  129. data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenArtifactFinder.java +0 -134
  130. data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenArtifactNotFoundException.java +0 -20
  131. data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenPluginSource.java +0 -187
  132. data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenPluginSourceModule.java +0 -22
  133. data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenRepositoryNotFoundException.java +0 -31
  134. data/embulk-core/src/main/java/org/embulk/spi/AbortTransactionResource.java +0 -36
  135. data/embulk-core/src/main/java/org/embulk/spi/Buffer.java +0 -148
  136. data/embulk-core/src/main/java/org/embulk/spi/BufferAllocator.java +0 -8
  137. data/embulk-core/src/main/java/org/embulk/spi/CloseResource.java +0 -42
  138. data/embulk-core/src/main/java/org/embulk/spi/Column.java +0 -95
  139. data/embulk-core/src/main/java/org/embulk/spi/ColumnConfig.java +0 -112
  140. data/embulk-core/src/main/java/org/embulk/spi/ColumnVisitor.java +0 -16
  141. data/embulk-core/src/main/java/org/embulk/spi/DataException.java +0 -23
  142. data/embulk-core/src/main/java/org/embulk/spi/DecoderPlugin.java +0 -16
  143. data/embulk-core/src/main/java/org/embulk/spi/EncoderPlugin.java +0 -16
  144. data/embulk-core/src/main/java/org/embulk/spi/Exec.java +0 -113
  145. data/embulk-core/src/main/java/org/embulk/spi/ExecAction.java +0 -6
  146. data/embulk-core/src/main/java/org/embulk/spi/ExecSession.java +0 -220
  147. data/embulk-core/src/main/java/org/embulk/spi/ExecutorPlugin.java +0 -19
  148. data/embulk-core/src/main/java/org/embulk/spi/Extension.java +0 -44
  149. data/embulk-core/src/main/java/org/embulk/spi/FileInput.java +0 -11
  150. data/embulk-core/src/main/java/org/embulk/spi/FileInputPlugin.java +0 -30
  151. data/embulk-core/src/main/java/org/embulk/spi/FileInputRunner.java +0 -169
  152. data/embulk-core/src/main/java/org/embulk/spi/FileOutput.java +0 -13
  153. data/embulk-core/src/main/java/org/embulk/spi/FileOutputPlugin.java +0 -28
  154. data/embulk-core/src/main/java/org/embulk/spi/FileOutputRunner.java +0 -199
  155. data/embulk-core/src/main/java/org/embulk/spi/FilterPlugin.java +0 -18
  156. data/embulk-core/src/main/java/org/embulk/spi/FormatterPlugin.java +0 -18
  157. data/embulk-core/src/main/java/org/embulk/spi/GuessPlugin.java +0 -9
  158. data/embulk-core/src/main/java/org/embulk/spi/InputPlugin.java +0 -33
  159. data/embulk-core/src/main/java/org/embulk/spi/OutputPlugin.java +0 -29
  160. data/embulk-core/src/main/java/org/embulk/spi/Page.java +0 -86
  161. data/embulk-core/src/main/java/org/embulk/spi/PageBuilder.java +0 -696
  162. data/embulk-core/src/main/java/org/embulk/spi/PageFormat.java +0 -47
  163. data/embulk-core/src/main/java/org/embulk/spi/PageOutput.java +0 -11
  164. data/embulk-core/src/main/java/org/embulk/spi/PageReader.java +0 -248
  165. data/embulk-core/src/main/java/org/embulk/spi/ParserPlugin.java +0 -17
  166. data/embulk-core/src/main/java/org/embulk/spi/ProcessState.java +0 -10
  167. data/embulk-core/src/main/java/org/embulk/spi/ProcessTask.java +0 -117
  168. data/embulk-core/src/main/java/org/embulk/spi/Schema.java +0 -139
  169. data/embulk-core/src/main/java/org/embulk/spi/SchemaConfig.java +0 -93
  170. data/embulk-core/src/main/java/org/embulk/spi/SchemaConfigException.java +0 -22
  171. data/embulk-core/src/main/java/org/embulk/spi/TaskState.java +0 -81
  172. data/embulk-core/src/main/java/org/embulk/spi/TempFileException.java +0 -19
  173. data/embulk-core/src/main/java/org/embulk/spi/TempFileSpace.java +0 -88
  174. data/embulk-core/src/main/java/org/embulk/spi/Transactional.java +0 -10
  175. data/embulk-core/src/main/java/org/embulk/spi/TransactionalFileInput.java +0 -17
  176. data/embulk-core/src/main/java/org/embulk/spi/TransactionalFileOutput.java +0 -19
  177. data/embulk-core/src/main/java/org/embulk/spi/TransactionalPageOutput.java +0 -17
  178. data/embulk-core/src/main/java/org/embulk/spi/json/JsonParseException.java +0 -17
  179. data/embulk-core/src/main/java/org/embulk/spi/json/JsonParser.java +0 -233
  180. data/embulk-core/src/main/java/org/embulk/spi/json/RubyValueApi.java +0 -100
  181. data/embulk-core/src/main/java/org/embulk/spi/time/DateTimeZoneSerDe.java +0 -55
  182. data/embulk-core/src/main/java/org/embulk/spi/time/Timestamp.java +0 -180
  183. data/embulk-core/src/main/java/org/embulk/spi/time/TimestampFormat.java +0 -127
  184. data/embulk-core/src/main/java/org/embulk/spi/time/TimestampFormatter.java +0 -125
  185. data/embulk-core/src/main/java/org/embulk/spi/time/TimestampParseException.java +0 -12
  186. data/embulk-core/src/main/java/org/embulk/spi/time/TimestampParser.java +0 -310
  187. data/embulk-core/src/main/java/org/embulk/spi/time/TimestampSerDe.java +0 -49
  188. data/embulk-core/src/main/java/org/embulk/spi/type/AbstractType.java +0 -58
  189. data/embulk-core/src/main/java/org/embulk/spi/type/BooleanType.java +0 -12
  190. data/embulk-core/src/main/java/org/embulk/spi/type/DoubleType.java +0 -12
  191. data/embulk-core/src/main/java/org/embulk/spi/type/JsonType.java +0 -14
  192. data/embulk-core/src/main/java/org/embulk/spi/type/LongType.java +0 -12
  193. data/embulk-core/src/main/java/org/embulk/spi/type/StringType.java +0 -12
  194. data/embulk-core/src/main/java/org/embulk/spi/type/TimestampType.java +0 -41
  195. data/embulk-core/src/main/java/org/embulk/spi/type/Type.java +0 -15
  196. data/embulk-core/src/main/java/org/embulk/spi/type/TypeDeserializer.java +0 -45
  197. data/embulk-core/src/main/java/org/embulk/spi/type/Types.java +0 -16
  198. data/embulk-core/src/main/java/org/embulk/spi/unit/ByteSize.java +0 -156
  199. data/embulk-core/src/main/java/org/embulk/spi/unit/LocalFile.java +0 -106
  200. data/embulk-core/src/main/java/org/embulk/spi/unit/LocalFileSerDe.java +0 -113
  201. data/embulk-core/src/main/java/org/embulk/spi/unit/ToString.java +0 -54
  202. data/embulk-core/src/main/java/org/embulk/spi/unit/ToStringMap.java +0 -34
  203. data/embulk-core/src/main/java/org/embulk/spi/util/CharsetSerDe.java +0 -55
  204. data/embulk-core/src/main/java/org/embulk/spi/util/Decoders.java +0 -81
  205. data/embulk-core/src/main/java/org/embulk/spi/util/DynamicColumnNotFoundException.java +0 -10
  206. data/embulk-core/src/main/java/org/embulk/spi/util/DynamicColumnSetter.java +0 -21
  207. data/embulk-core/src/main/java/org/embulk/spi/util/DynamicColumnSetterFactory.java +0 -134
  208. data/embulk-core/src/main/java/org/embulk/spi/util/DynamicPageBuilder.java +0 -200
  209. data/embulk-core/src/main/java/org/embulk/spi/util/Encoders.java +0 -81
  210. data/embulk-core/src/main/java/org/embulk/spi/util/Executors.java +0 -93
  211. data/embulk-core/src/main/java/org/embulk/spi/util/FileInputInputStream.java +0 -111
  212. data/embulk-core/src/main/java/org/embulk/spi/util/FileOutputOutputStream.java +0 -119
  213. data/embulk-core/src/main/java/org/embulk/spi/util/Filters.java +0 -100
  214. data/embulk-core/src/main/java/org/embulk/spi/util/InputStreamFileInput.java +0 -189
  215. data/embulk-core/src/main/java/org/embulk/spi/util/InputStreamTransactionalFileInput.java +0 -25
  216. data/embulk-core/src/main/java/org/embulk/spi/util/Inputs.java +0 -65
  217. data/embulk-core/src/main/java/org/embulk/spi/util/LineDecoder.java +0 -157
  218. data/embulk-core/src/main/java/org/embulk/spi/util/LineEncoder.java +0 -123
  219. data/embulk-core/src/main/java/org/embulk/spi/util/ListFileInput.java +0 -52
  220. data/embulk-core/src/main/java/org/embulk/spi/util/Newline.java +0 -38
  221. data/embulk-core/src/main/java/org/embulk/spi/util/OutputStreamFileOutput.java +0 -88
  222. data/embulk-core/src/main/java/org/embulk/spi/util/PagePrinter.java +0 -126
  223. data/embulk-core/src/main/java/org/embulk/spi/util/Pages.java +0 -149
  224. data/embulk-core/src/main/java/org/embulk/spi/util/ResumableInputStream.java +0 -168
  225. data/embulk-core/src/main/java/org/embulk/spi/util/RetryExecutor.java +0 -130
  226. data/embulk-core/src/main/java/org/embulk/spi/util/Timestamps.java +0 -53
  227. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/AbstractDynamicColumnSetter.java +0 -94
  228. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/BooleanColumnSetter.java +0 -71
  229. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/DefaultValueSetter.java +0 -20
  230. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/DoubleColumnSetter.java +0 -68
  231. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/JsonColumnSetter.java +0 -64
  232. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/LongColumnSetter.java +0 -78
  233. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/NullDefaultValueSetter.java +0 -39
  234. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/SkipColumnSetter.java +0 -68
  235. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/StringColumnSetter.java +0 -63
  236. data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/TimestampColumnSetter.java +0 -72
  237. data/embulk-core/src/main/resources/embulk/logback-color.xml +0 -72
  238. data/embulk-core/src/main/resources/embulk/logback-console.xml +0 -14
  239. data/embulk-core/src/main/resources/embulk/logback-file.xml +0 -23
  240. data/embulk-core/src/main/resources/embulk/parent_first_packages.properties +0 -73
  241. data/embulk-core/src/main/resources/embulk/parent_first_resources.properties +0 -29
  242. data/embulk-core/src/test/java/org/embulk/EmbulkTestRuntime.java +0 -122
  243. data/embulk-core/src/test/java/org/embulk/GuiceBinder.java +0 -72
  244. data/embulk-core/src/test/java/org/embulk/RandomManager.java +0 -53
  245. data/embulk-core/src/test/java/org/embulk/TestPluginSourceModule.java +0 -23
  246. data/embulk-core/src/test/java/org/embulk/TestUtilityModule.java +0 -17
  247. data/embulk-core/src/test/java/org/embulk/config/TestConfigLoader.java +0 -66
  248. data/embulk-core/src/test/java/org/embulk/config/TestConfigSource.java +0 -114
  249. data/embulk-core/src/test/java/org/embulk/config/TestTaskSource.java +0 -70
  250. data/embulk-core/src/test/java/org/embulk/plugin/MockPluginSource.java +0 -58
  251. data/embulk-core/src/test/java/org/embulk/plugin/TestPluginType.java +0 -83
  252. data/embulk-core/src/test/java/org/embulk/plugin/TestPluginTypeSerDe.java +0 -67
  253. data/embulk-core/src/test/java/org/embulk/plugin/jar/ExampleJarSpiV0.java +0 -9
  254. data/embulk-core/src/test/java/org/embulk/plugin/jar/JarBuilder.java +0 -101
  255. data/embulk-core/src/test/java/org/embulk/plugin/jar/TestJarPluginLoader.java +0 -60
  256. data/embulk-core/src/test/java/org/embulk/plugin/maven/TestMavenArtifactFinder.java +0 -41
  257. data/embulk-core/src/test/java/org/embulk/spi/MockFileOutput.java +0 -63
  258. data/embulk-core/src/test/java/org/embulk/spi/MockFormatterPlugin.java +0 -108
  259. data/embulk-core/src/test/java/org/embulk/spi/MockParserPlugin.java +0 -80
  260. data/embulk-core/src/test/java/org/embulk/spi/PageTestUtils.java +0 -59
  261. data/embulk-core/src/test/java/org/embulk/spi/TestBuffer.java +0 -24
  262. data/embulk-core/src/test/java/org/embulk/spi/TestFileInputInputStream.java +0 -89
  263. data/embulk-core/src/test/java/org/embulk/spi/TestFileInputRunner.java +0 -199
  264. data/embulk-core/src/test/java/org/embulk/spi/TestFileOutputRunner.java +0 -221
  265. data/embulk-core/src/test/java/org/embulk/spi/TestInputStreamFileInput.java +0 -188
  266. data/embulk-core/src/test/java/org/embulk/spi/TestPageBuilderReader.java +0 -411
  267. data/embulk-core/src/test/java/org/embulk/spi/json/TestJsonParser.java +0 -102
  268. data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestamp.java +0 -116
  269. data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestampFormatterParser.java +0 -75
  270. data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestampFormatterParserDeprecated.java +0 -67
  271. data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestampParser.java +0 -232
  272. data/embulk-core/src/test/java/org/embulk/spi/type/TestTypeSerDe.java +0 -45
  273. data/embulk-core/src/test/java/org/embulk/spi/unit/TestByteSize.java +0 -79
  274. data/embulk-core/src/test/java/org/embulk/spi/util/TestLineDecoder.java +0 -237
  275. data/embulk-core/src/test/java/org/embulk/spi/util/TestLineEncoder.java +0 -123
  276. data/embulk-core/src/test/resources/m2.test/.gitignore +0 -1
  277. data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.jar +0 -0
  278. data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.jar.sha1 +0 -1
  279. data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.pom +0 -9
  280. data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.pom.sha1 +0 -1
  281. data/embulk-docs/Makefile +0 -178
  282. data/embulk-docs/build.gradle +0 -41
  283. data/embulk-docs/make.bat +0 -243
  284. data/embulk-docs/push-gh-pages.sh +0 -49
  285. data/embulk-docs/src/_static/embulk-architecture.png +0 -0
  286. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-oneline-tr.png +0 -0
  287. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-oneline-wt.png +0 -0
  288. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-oneline.ai +0 -396
  289. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq-tr-small.png +0 -0
  290. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq-tr.png +0 -0
  291. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq-wt.png +0 -0
  292. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq.ai +0 -417
  293. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq.svg +0 -1
  294. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-symbol-tr.png +0 -0
  295. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-symbol-wt.png +0 -0
  296. data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-symbol.ai +1 -394
  297. data/embulk-docs/src/_static/embulk-logo.svg +0 -133
  298. data/embulk-docs/src/built-in.rst +0 -1017
  299. data/embulk-docs/src/conf.py +0 -260
  300. data/embulk-docs/src/customization.rst +0 -184
  301. data/embulk-docs/src/developers/index.rst +0 -45
  302. data/embulk-docs/src/index.rst +0 -102
  303. data/embulk-docs/src/logo.rst +0 -27
  304. data/embulk-docs/src/recipe.rst +0 -8
  305. data/embulk-docs/src/recipe/scheduled-csv-load-to-elasticsearch-kibana5.rst +0 -163
  306. data/embulk-docs/src/release.rst +0 -108
  307. data/embulk-docs/src/release/release-0.1.0.rst +0 -8
  308. data/embulk-docs/src/release/release-0.2.0.rst +0 -16
  309. data/embulk-docs/src/release/release-0.2.1.rst +0 -19
  310. data/embulk-docs/src/release/release-0.3.0.rst +0 -34
  311. data/embulk-docs/src/release/release-0.3.1.rst +0 -11
  312. data/embulk-docs/src/release/release-0.3.2.rst +0 -15
  313. data/embulk-docs/src/release/release-0.4.0.rst +0 -74
  314. data/embulk-docs/src/release/release-0.4.1.rst +0 -18
  315. data/embulk-docs/src/release/release-0.4.10.rst +0 -17
  316. data/embulk-docs/src/release/release-0.4.2.rst +0 -18
  317. data/embulk-docs/src/release/release-0.4.3.rst +0 -34
  318. data/embulk-docs/src/release/release-0.4.4.rst +0 -39
  319. data/embulk-docs/src/release/release-0.4.5.rst +0 -24
  320. data/embulk-docs/src/release/release-0.4.6.rst +0 -30
  321. data/embulk-docs/src/release/release-0.4.7.rst +0 -16
  322. data/embulk-docs/src/release/release-0.4.8.rst +0 -15
  323. data/embulk-docs/src/release/release-0.4.9.rst +0 -23
  324. data/embulk-docs/src/release/release-0.5.0.rst +0 -89
  325. data/embulk-docs/src/release/release-0.5.1.rst +0 -13
  326. data/embulk-docs/src/release/release-0.5.2.rst +0 -30
  327. data/embulk-docs/src/release/release-0.5.3.rst +0 -22
  328. data/embulk-docs/src/release/release-0.5.4.rst +0 -24
  329. data/embulk-docs/src/release/release-0.5.5.rst +0 -18
  330. data/embulk-docs/src/release/release-0.6.0.rst +0 -34
  331. data/embulk-docs/src/release/release-0.6.1.rst +0 -11
  332. data/embulk-docs/src/release/release-0.6.10.rst +0 -15
  333. data/embulk-docs/src/release/release-0.6.11.rst +0 -19
  334. data/embulk-docs/src/release/release-0.6.12.rst +0 -31
  335. data/embulk-docs/src/release/release-0.6.13.rst +0 -23
  336. data/embulk-docs/src/release/release-0.6.14.rst +0 -47
  337. data/embulk-docs/src/release/release-0.6.15.rst +0 -26
  338. data/embulk-docs/src/release/release-0.6.16.rst +0 -26
  339. data/embulk-docs/src/release/release-0.6.17.rst +0 -39
  340. data/embulk-docs/src/release/release-0.6.18.rst +0 -14
  341. data/embulk-docs/src/release/release-0.6.19.rst +0 -18
  342. data/embulk-docs/src/release/release-0.6.2.rst +0 -17
  343. data/embulk-docs/src/release/release-0.6.20.rst +0 -19
  344. data/embulk-docs/src/release/release-0.6.21.rst +0 -20
  345. data/embulk-docs/src/release/release-0.6.22.rst +0 -26
  346. data/embulk-docs/src/release/release-0.6.23.rst +0 -17
  347. data/embulk-docs/src/release/release-0.6.24.rst +0 -13
  348. data/embulk-docs/src/release/release-0.6.25.rst +0 -12
  349. data/embulk-docs/src/release/release-0.6.26.rst +0 -17
  350. data/embulk-docs/src/release/release-0.6.27.rst +0 -11
  351. data/embulk-docs/src/release/release-0.6.3.rst +0 -23
  352. data/embulk-docs/src/release/release-0.6.4.rst +0 -13
  353. data/embulk-docs/src/release/release-0.6.5.rst +0 -17
  354. data/embulk-docs/src/release/release-0.6.6.rst +0 -17
  355. data/embulk-docs/src/release/release-0.6.7.rst +0 -17
  356. data/embulk-docs/src/release/release-0.6.8.rst +0 -24
  357. data/embulk-docs/src/release/release-0.6.9.rst +0 -24
  358. data/embulk-docs/src/release/release-0.7.0.rst +0 -96
  359. data/embulk-docs/src/release/release-0.7.1.rst +0 -22
  360. data/embulk-docs/src/release/release-0.7.10.rst +0 -13
  361. data/embulk-docs/src/release/release-0.7.11.rst +0 -12
  362. data/embulk-docs/src/release/release-0.7.2.rst +0 -25
  363. data/embulk-docs/src/release/release-0.7.3.rst +0 -21
  364. data/embulk-docs/src/release/release-0.7.4.rst +0 -14
  365. data/embulk-docs/src/release/release-0.7.5.rst +0 -22
  366. data/embulk-docs/src/release/release-0.7.6.rst +0 -18
  367. data/embulk-docs/src/release/release-0.7.7.rst +0 -13
  368. data/embulk-docs/src/release/release-0.7.8.rst +0 -14
  369. data/embulk-docs/src/release/release-0.7.9.rst +0 -14
  370. data/embulk-docs/src/release/release-0.8.0.rst +0 -74
  371. data/embulk-docs/src/release/release-0.8.1.rst +0 -18
  372. data/embulk-docs/src/release/release-0.8.10.rst +0 -35
  373. data/embulk-docs/src/release/release-0.8.11.rst +0 -12
  374. data/embulk-docs/src/release/release-0.8.12.rst +0 -12
  375. data/embulk-docs/src/release/release-0.8.13.rst +0 -12
  376. data/embulk-docs/src/release/release-0.8.14.rst +0 -31
  377. data/embulk-docs/src/release/release-0.8.15.rst +0 -17
  378. data/embulk-docs/src/release/release-0.8.16.rst +0 -43
  379. data/embulk-docs/src/release/release-0.8.17.rst +0 -11
  380. data/embulk-docs/src/release/release-0.8.18.rst +0 -27
  381. data/embulk-docs/src/release/release-0.8.19.rst +0 -43
  382. data/embulk-docs/src/release/release-0.8.2.rst +0 -19
  383. data/embulk-docs/src/release/release-0.8.20.rst +0 -11
  384. data/embulk-docs/src/release/release-0.8.21.rst +0 -17
  385. data/embulk-docs/src/release/release-0.8.22.rst +0 -15
  386. data/embulk-docs/src/release/release-0.8.23.rst +0 -14
  387. data/embulk-docs/src/release/release-0.8.24.rst +0 -15
  388. data/embulk-docs/src/release/release-0.8.25.rst +0 -14
  389. data/embulk-docs/src/release/release-0.8.26.rst +0 -16
  390. data/embulk-docs/src/release/release-0.8.27.rst +0 -15
  391. data/embulk-docs/src/release/release-0.8.28.rst +0 -14
  392. data/embulk-docs/src/release/release-0.8.29.rst +0 -14
  393. data/embulk-docs/src/release/release-0.8.3.rst +0 -15
  394. data/embulk-docs/src/release/release-0.8.30.rst +0 -14
  395. data/embulk-docs/src/release/release-0.8.31.rst +0 -12
  396. data/embulk-docs/src/release/release-0.8.32.rst +0 -14
  397. data/embulk-docs/src/release/release-0.8.33.rst +0 -13
  398. data/embulk-docs/src/release/release-0.8.34.rst +0 -12
  399. data/embulk-docs/src/release/release-0.8.35.rst +0 -12
  400. data/embulk-docs/src/release/release-0.8.36.rst +0 -32
  401. data/embulk-docs/src/release/release-0.8.37.rst +0 -20
  402. data/embulk-docs/src/release/release-0.8.38.rst +0 -12
  403. data/embulk-docs/src/release/release-0.8.4.rst +0 -18
  404. data/embulk-docs/src/release/release-0.8.5.rst +0 -11
  405. data/embulk-docs/src/release/release-0.8.6.rst +0 -14
  406. data/embulk-docs/src/release/release-0.8.7.rst +0 -18
  407. data/embulk-docs/src/release/release-0.8.8.rst +0 -18
  408. data/embulk-docs/src/release/release-0.8.9.rst +0 -14
  409. data/embulk-jruby-strptime/build.gradle +0 -3
  410. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/RubyDateParser.java +0 -121
  411. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/StrptimeFormat.java +0 -53
  412. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/StrptimeParser.java +0 -884
  413. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/StrptimeToken.java +0 -111
  414. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/TimeZoneConverter.java +0 -466
  415. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/lexer/StrptimeLexer.flex +0 -62
  416. data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/lexer/StrptimeLexer.java +0 -577
  417. data/embulk-standards/build.gradle +0 -7
  418. data/embulk-standards/src/main/java/org/embulk/standards/Bzip2FileDecoderPlugin.java +0 -55
  419. data/embulk-standards/src/main/java/org/embulk/standards/Bzip2FileEncoderPlugin.java +0 -67
  420. data/embulk-standards/src/main/java/org/embulk/standards/ConfigInputPlugin.java +0 -170
  421. data/embulk-standards/src/main/java/org/embulk/standards/CsvFormatterPlugin.java +0 -295
  422. data/embulk-standards/src/main/java/org/embulk/standards/CsvParserPlugin.java +0 -416
  423. data/embulk-standards/src/main/java/org/embulk/standards/CsvTokenizer.java +0 -545
  424. data/embulk-standards/src/main/java/org/embulk/standards/GzipFileDecoderPlugin.java +0 -55
  425. data/embulk-standards/src/main/java/org/embulk/standards/GzipFileEncoderPlugin.java +0 -71
  426. data/embulk-standards/src/main/java/org/embulk/standards/JsonParserPlugin.java +0 -235
  427. data/embulk-standards/src/main/java/org/embulk/standards/LocalFileInputPlugin.java +0 -232
  428. data/embulk-standards/src/main/java/org/embulk/standards/LocalFileOutputPlugin.java +0 -148
  429. data/embulk-standards/src/main/java/org/embulk/standards/NullOutputPlugin.java +0 -59
  430. data/embulk-standards/src/main/java/org/embulk/standards/RemoveColumnsFilterPlugin.java +0 -268
  431. data/embulk-standards/src/main/java/org/embulk/standards/RenameFilterPlugin.java +0 -479
  432. data/embulk-standards/src/main/java/org/embulk/standards/StandardPluginExtension.java +0 -16
  433. data/embulk-standards/src/main/java/org/embulk/standards/StandardPluginModule.java +0 -60
  434. data/embulk-standards/src/main/java/org/embulk/standards/StdoutOutputPlugin.java +0 -91
  435. data/embulk-standards/src/main/resources/META-INF/services/org.embulk.spi.Extension +0 -1
  436. data/embulk-standards/src/test/java/org/embulk/standards/TestCsvFormatterPlugin.java +0 -312
  437. data/embulk-standards/src/test/java/org/embulk/standards/TestCsvParserPlugin.java +0 -75
  438. data/embulk-standards/src/test/java/org/embulk/standards/TestCsvTokenizer.java +0 -457
  439. data/embulk-standards/src/test/java/org/embulk/standards/TestJsonParserPlugin.java +0 -351
  440. data/embulk-standards/src/test/java/org/embulk/standards/TestRemoveColumnsFilterPlugin.java +0 -121
  441. data/embulk-standards/src/test/java/org/embulk/standards/TestRenameFilterPlugin.java +0 -1020
  442. data/embulk-standards/src/test/java/org/embulk/standards/guess/TestCsvAllStringsGuessPlugin.java +0 -38
  443. data/embulk-standards/src/test/java/org/embulk/standards/guess/TestCsvGuessPlugin.java +0 -248
  444. data/embulk-standards/src/test/java/org/embulk/standards/preview/TestFilePreview.java +0 -73
  445. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row.csv +0 -1
  446. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_and_header.csv +0 -2
  447. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_and_header_guessed.yml +0 -12
  448. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_and_header_seed.yml +0 -1
  449. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_guessed.yml +0 -12
  450. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_seed.yml +0 -1
  451. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows.csv +0 -1
  452. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header.csv +0 -2
  453. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_guessed.yml +0 -16
  454. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_seed.yml +0 -1
  455. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_with_trim_needed.csv +0 -2
  456. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_with_trim_needed_guessed.yml +0 -16
  457. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_with_trim_needed_seed.yml +0 -1
  458. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_guessed.yml +0 -16
  459. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_seed.yml +0 -1
  460. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_with_trim_needed.csv +0 -1
  461. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_with_trim_needed_guessed.yml +0 -16
  462. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_with_trim_needed_seed.yml +0 -1
  463. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row.csv +0 -1
  464. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_and_header.csv +0 -2
  465. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_and_header_guessed.yml +0 -12
  466. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_and_header_seed.yml +0 -1
  467. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_guessed.yml +0 -12
  468. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_seed.yml +0 -1
  469. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_int_single_column_rows.csv +0 -2
  470. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_int_single_column_rows_guessed.yml +0 -12
  471. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_int_single_column_rows_seed.yml +0 -1
  472. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows.csv +0 -2
  473. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_and_header.csv +0 -3
  474. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_and_header_guessed.yml +0 -16
  475. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_and_header_seed.yml +0 -1
  476. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_guessed.yml +0 -16
  477. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_seed.yml +0 -1
  478. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_string_single_column_rows.csv +0 -2
  479. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_string_single_column_rows_guessed.yml +0 -12
  480. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_string_single_column_rows_seed.yml +0 -1
  481. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_backslash_escape.csv +0 -5
  482. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_backslash_escape_guessed.yml +0 -17
  483. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_backslash_escape_seed.yml +0 -1
  484. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_double_single_column.csv +0 -12
  485. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_double_single_column_guessed.yml +0 -12
  486. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_double_single_column_seed.yml +0 -1
  487. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column.csv +0 -4
  488. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_guessed.yml +0 -12
  489. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_seed.yml +0 -1
  490. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_with_header.csv +0 -5
  491. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_with_header_guessed.yml +0 -12
  492. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_with_header_seed.yml +0 -1
  493. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_semicolon_delimiter.csv +0 -5
  494. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_semicolon_delimiter_guessed.yml +0 -17
  495. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_semicolon_delimiter_seed.yml +0 -1
  496. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_simple.csv +0 -5
  497. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_simple_guessed.yml +0 -17
  498. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_simple_seed.yml +0 -1
  499. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_single_quote.csv +0 -5
  500. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_single_quote_guessed.yml +0 -17
  501. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_single_quote_seed.yml +0 -1
  502. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_skip_suggest_if_empty_sample_records.csv +0 -5
  503. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_skip_suggest_if_empty_sample_records_guessed.yml +0 -2
  504. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_skip_suggest_if_empty_sample_records_seed.yml +0 -1
  505. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column.csv +0 -4
  506. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_guessed.yml +0 -12
  507. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_seed.yml +0 -1
  508. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_with_header.csv +0 -5
  509. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_with_header_guessed.yml +0 -12
  510. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_with_header_seed.yml +0 -1
  511. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_tab_delimiter.csv +0 -4
  512. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_tab_delimiter_guessed.yml +0 -16
  513. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_tab_delimiter_seed.yml +0 -1
  514. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv_all_strings/test/test_simple.csv +0 -5
  515. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv_all_strings/test/test_simple_guessed.yml +0 -17
  516. data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv_all_strings/test/test_simple_seed.yml +0 -1
  517. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes.csv +0 -5
  518. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes_exec.yml +0 -1
  519. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes_load.yml +0 -19
  520. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes_previewed.csv +0 -1
  521. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_simple.csv +0 -5
  522. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_simple_load.yml +0 -19
  523. data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_simple_previewed.csv +0 -4
  524. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep.csv +0 -5
  525. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_expected.csv +0 -4
  526. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_filter.yml +0 -2
  527. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_in.yml +0 -18
  528. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names.csv +0 -5
  529. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names.yml +0 -2
  530. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names_expected.csv +0 -4
  531. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names_in.yml +0 -17
  532. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_unmatched_filter.yml +0 -3
  533. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_without_unmatched_filter.yml +0 -2
  534. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove.csv +0 -5
  535. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_expected.csv +0 -4
  536. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_filter.yml +0 -2
  537. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_in.yml +0 -18
  538. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_with_unmatched_filter.yml +0 -3
  539. data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_without_unmatched_filter.yml +0 -2
  540. data/embulk-test/build.gradle +0 -6
  541. data/embulk-test/src/main/java/org/embulk/test/EmbulkTests.java +0 -75
  542. data/embulk-test/src/main/java/org/embulk/test/PreviewResultInputPlugin.java +0 -65
  543. data/embulk-test/src/main/java/org/embulk/test/TestingBulkLoader.java +0 -129
  544. data/embulk-test/src/main/java/org/embulk/test/TestingEmbulk.java +0 -710
  545. data/gradle/wrapper/gradle-wrapper.jar +0 -0
  546. data/gradle/wrapper/gradle-wrapper.properties +0 -5
  547. data/gradlew +0 -172
  548. data/gradlew.bat +0 -84
  549. data/lib/embulk/data/bundle/.bundle/config +0 -3
  550. data/lib/embulk/data/bundle/.ruby-version +0 -1
  551. data/lib/embulk/data/bundle/Gemfile +0 -31
  552. data/lib/embulk/data/bundle/embulk/filter/example.rb +0 -42
  553. data/lib/embulk/data/bundle/embulk/input/example.rb +0 -54
  554. data/lib/embulk/data/bundle/embulk/output/example.rb +0 -58
  555. data/lib/embulk/data/new/LICENSE.txt +0 -21
  556. data/lib/embulk/data/new/README.md.vm +0 -106
  557. data/lib/embulk/data/new/gitignore.vm +0 -17
  558. data/lib/embulk/data/new/java/build.gradle.vm +0 -96
  559. data/lib/embulk/data/new/java/config/checkstyle/checkstyle.xml +0 -128
  560. data/lib/embulk/data/new/java/config/checkstyle/default.xml +0 -108
  561. data/lib/embulk/data/new/java/decoder.java.vm +0 -86
  562. data/lib/embulk/data/new/java/encoder.java.vm +0 -88
  563. data/lib/embulk/data/new/java/file_input.java.vm +0 -145
  564. data/lib/embulk/data/new/java/file_output.java.vm +0 -95
  565. data/lib/embulk/data/new/java/filter.java.vm +0 -57
  566. data/lib/embulk/data/new/java/formatter.java.vm +0 -55
  567. data/lib/embulk/data/new/java/gradle/wrapper/gradle-wrapper.jar +0 -0
  568. data/lib/embulk/data/new/java/gradle/wrapper/gradle-wrapper.properties +0 -5
  569. data/lib/embulk/data/new/java/gradlew +0 -172
  570. data/lib/embulk/data/new/java/gradlew.bat +0 -84
  571. data/lib/embulk/data/new/java/input.java.vm +0 -89
  572. data/lib/embulk/data/new/java/output.java.vm +0 -79
  573. data/lib/embulk/data/new/java/parser.java.vm +0 -61
  574. data/lib/embulk/data/new/java/plugin_loader.rb.vm +0 -3
  575. data/lib/embulk/data/new/java/test.java.vm +0 -5
  576. data/lib/embulk/data/new/ruby/.ruby-version +0 -1
  577. data/lib/embulk/data/new/ruby/Gemfile +0 -2
  578. data/lib/embulk/data/new/ruby/Rakefile +0 -3
  579. data/lib/embulk/data/new/ruby/decoder_guess.rb.vm +0 -25
  580. data/lib/embulk/data/new/ruby/filter.rb.vm +0 -50
  581. data/lib/embulk/data/new/ruby/formatter.rb.vm +0 -49
  582. data/lib/embulk/data/new/ruby/gemspec.vm +0 -20
  583. data/lib/embulk/data/new/ruby/input.rb.vm +0 -59
  584. data/lib/embulk/data/new/ruby/output.rb.vm +0 -61
  585. data/lib/embulk/data/new/ruby/parser.rb.vm +0 -44
  586. data/lib/embulk/data/new/ruby/parser_guess.rb.vm +0 -65
  587. data/lib/embulk/data/package_data.rb +0 -59
  588. data/lib/embulk/guess/bzip2.rb +0 -23
  589. data/lib/embulk/guess/csv.rb +0 -374
  590. data/lib/embulk/guess/csv_all_strings.rb +0 -13
  591. data/lib/embulk/guess/gzip.rb +0 -18
  592. data/lib/embulk/guess/json.rb +0 -50
  593. data/lib/embulk/runner.rb +0 -53
  594. data/settings.gradle +0 -8
  595. data/test/helper.rb +0 -23
  596. data/test/monkey_strptime/mri/date/test_date_strptime.rb +0 -515
  597. data/test/monkey_strptime/run-test.rb +0 -29
  598. data/test/vanilla/guess/test_csv_all_strings.rb +0 -43
  599. data/test/vanilla/guess/test_csv_guess.rb +0 -170
  600. data/test/vanilla/guess/test_schema_guess.rb +0 -47
  601. data/test/vanilla/guess/test_time_format_guess.rb +0 -135
  602. data/test/vanilla/run-test.rb +0 -14
  603. data/test/vanilla/time/test_timestamp_parser.rb +0 -102
@@ -1,416 +0,0 @@
1
- package org.embulk.standards;
2
-
3
- import com.google.common.base.Optional;
4
- import com.google.common.collect.ImmutableSet;
5
- import com.fasterxml.jackson.annotation.JsonCreator;
6
- import com.fasterxml.jackson.annotation.JsonIgnore;
7
- import com.fasterxml.jackson.annotation.JsonValue;
8
- import org.embulk.config.Task;
9
- import org.embulk.config.Config;
10
- import org.embulk.config.ConfigDefault;
11
- import org.embulk.config.ConfigSource;
12
- import org.embulk.config.ConfigException;
13
- import org.embulk.config.TaskSource;
14
- import org.embulk.spi.time.TimestampParser;
15
- import org.embulk.spi.time.TimestampParseException;
16
- import org.embulk.spi.json.JsonParser;
17
- import org.embulk.spi.json.JsonParseException;
18
- import org.embulk.spi.Column;
19
- import org.embulk.spi.Schema;
20
- import org.embulk.spi.SchemaConfig;
21
- import org.embulk.spi.ColumnVisitor;
22
- import org.embulk.spi.PageBuilder;
23
- import org.embulk.spi.ParserPlugin;
24
- import org.embulk.spi.Exec;
25
- import org.embulk.spi.FileInput;
26
- import org.embulk.spi.PageOutput;
27
- import org.embulk.spi.DataException;
28
- import org.embulk.spi.util.LineDecoder;
29
- import org.embulk.spi.util.Timestamps;
30
- import org.slf4j.Logger;
31
-
32
- public class CsvParserPlugin
33
- implements ParserPlugin
34
- {
35
- private static final ImmutableSet<String> TRUE_STRINGS =
36
- ImmutableSet.of(
37
- "true", "True", "TRUE",
38
- "yes", "Yes", "YES",
39
- "t", "T", "y", "Y",
40
- "on", "On", "ON",
41
- "1");
42
-
43
- public interface PluginTask
44
- extends Task, LineDecoder.DecoderTask, TimestampParser.Task
45
- {
46
- @Config("columns")
47
- SchemaConfig getSchemaConfig();
48
-
49
- @Config("header_line")
50
- @ConfigDefault("null")
51
- Optional<Boolean> getHeaderLine();
52
-
53
- @Config("skip_header_lines")
54
- @ConfigDefault("0")
55
- int getSkipHeaderLines();
56
- void setSkipHeaderLines(int n);
57
-
58
- @Config("delimiter")
59
- @ConfigDefault("\",\"")
60
- String getDelimiter();
61
-
62
- @Config("quote")
63
- @ConfigDefault("\"\\\"\"")
64
- Optional<QuoteCharacter> getQuoteChar();
65
-
66
- @Config("escape")
67
- @ConfigDefault("\"\\\\\"")
68
- Optional<EscapeCharacter> getEscapeChar();
69
-
70
- // Null value handling: if the CsvParser found 'non-quoted empty string's,
71
- // it replaces them to string that users specified like "\N", "NULL".
72
- @Config("null_string")
73
- @ConfigDefault("null")
74
- Optional<String> getNullString();
75
-
76
- @Config("trim_if_not_quoted")
77
- @ConfigDefault("false")
78
- boolean getTrimIfNotQuoted();
79
-
80
- @Config("quotes_in_quoted_fields")
81
- @ConfigDefault("\"ACCEPT_ONLY_RFC4180_ESCAPED\"")
82
- QuotesInQuotedFields getQuotesInQuotedFields();
83
-
84
- @Config("max_quoted_size_limit")
85
- @ConfigDefault("131072") //128kB
86
- long getMaxQuotedSizeLimit();
87
-
88
- @Config("comment_line_marker")
89
- @ConfigDefault("null")
90
- Optional<String> getCommentLineMarker();
91
-
92
- @Config("allow_optional_columns")
93
- @ConfigDefault("false")
94
- boolean getAllowOptionalColumns();
95
-
96
- @Config("allow_extra_columns")
97
- @ConfigDefault("false")
98
- boolean getAllowExtraColumns();
99
-
100
- @Config("stop_on_invalid_record")
101
- @ConfigDefault("false")
102
- boolean getStopOnInvalidRecord();
103
- }
104
-
105
- public enum QuotesInQuotedFields
106
- {
107
- ACCEPT_ONLY_RFC4180_ESCAPED,
108
- ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS,
109
- ;
110
-
111
- @JsonCreator
112
- public static QuotesInQuotedFields ofString(final String string)
113
- {
114
- for (final QuotesInQuotedFields value : values()) {
115
- if (string.equals(value.toString())) {
116
- return value;
117
- }
118
- }
119
- throw new ConfigException("\"quotes_in_quoted_fields\" must be one of [ACCEPT_ONLY_RFC4180_ESCAPED, ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS].");
120
- }
121
- }
122
-
123
- public static class QuoteCharacter
124
- {
125
- private final char character;
126
-
127
- public QuoteCharacter(char character)
128
- {
129
- this.character = character;
130
- }
131
-
132
- public static QuoteCharacter noQuote()
133
- {
134
- return new QuoteCharacter(CsvTokenizer.NO_QUOTE);
135
- }
136
-
137
- @JsonCreator
138
- public static QuoteCharacter ofString(String str)
139
- {
140
- if (str.length() >= 2) {
141
- throw new ConfigException("\"quote\" option accepts only 1 character.");
142
- } else if (str.isEmpty()) {
143
- Exec.getLogger(CsvParserPlugin.class).warn("Setting '' (empty string) to \"quote\" option is obsoleted. Currently it becomes '\"' automatically but this behavior will be removed. Please set '\"' explicitly.");
144
- return new QuoteCharacter('"');
145
- } else {
146
- return new QuoteCharacter(str.charAt(0));
147
- }
148
- }
149
-
150
- @JsonIgnore
151
- public char getCharacter()
152
- {
153
- return character;
154
- }
155
-
156
- @JsonValue
157
- public String getOptionalString()
158
- {
159
- return new String(new char[] { character });
160
- }
161
-
162
- @Override
163
- public boolean equals(Object obj)
164
- {
165
- if (!(obj instanceof QuoteCharacter)) {
166
- return false;
167
- }
168
- QuoteCharacter o = (QuoteCharacter) obj;
169
- return character == o.character;
170
- }
171
- }
172
-
173
- public static class EscapeCharacter
174
- {
175
- private final char character;
176
-
177
- public EscapeCharacter(char character)
178
- {
179
- this.character = character;
180
- }
181
-
182
- public static EscapeCharacter noEscape()
183
- {
184
- return new EscapeCharacter(CsvTokenizer.NO_ESCAPE);
185
- }
186
-
187
- @JsonCreator
188
- public static EscapeCharacter ofString(String str)
189
- {
190
- if (str.length() >= 2) {
191
- throw new ConfigException("\"escape\" option accepts only 1 character.");
192
- } else if (str.isEmpty()) {
193
- Exec.getLogger(CsvParserPlugin.class).warn("Setting '' (empty string) to \"escape\" option is obsoleted. Currently it becomes null automatically but this behavior will be removed. Please set \"escape: null\" explicitly.");
194
- return noEscape();
195
- } else {
196
- return new EscapeCharacter(str.charAt(0));
197
- }
198
- }
199
-
200
- @JsonIgnore
201
- public char getCharacter()
202
- {
203
- return character;
204
- }
205
-
206
- @JsonValue
207
- public String getOptionalString()
208
- {
209
- return new String(new char[] { character });
210
- }
211
-
212
- @Override
213
- public boolean equals(Object obj)
214
- {
215
- if (!(obj instanceof EscapeCharacter)) {
216
- return false;
217
- }
218
- EscapeCharacter o = (EscapeCharacter) obj;
219
- return character == o.character;
220
- }
221
- }
222
-
223
- private final Logger log;
224
-
225
- public CsvParserPlugin()
226
- {
227
- log = Exec.getLogger(CsvParserPlugin.class);
228
- }
229
-
230
- @Override
231
- public void transaction(ConfigSource config, ParserPlugin.Control control)
232
- {
233
- PluginTask task = config.loadConfig(PluginTask.class);
234
-
235
- // backward compatibility
236
- if (task.getHeaderLine().isPresent()) {
237
- if (task.getSkipHeaderLines() > 0) {
238
- throw new ConfigException("'header_line' option is invalid if 'skip_header_lines' is set.");
239
- }
240
- if (task.getHeaderLine().get()) {
241
- task.setSkipHeaderLines(1);
242
- } else {
243
- task.setSkipHeaderLines(0);
244
- }
245
- }
246
-
247
- control.run(task.dump(), task.getSchemaConfig().toSchema());
248
- }
249
-
250
- @Override
251
- public void run(TaskSource taskSource, final Schema schema,
252
- FileInput input, PageOutput output)
253
- {
254
- PluginTask task = taskSource.loadTask(PluginTask.class);
255
- final TimestampParser[] timestampParsers = Timestamps.newTimestampColumnParsers(task, task.getSchemaConfig());
256
- final JsonParser jsonParser = new JsonParser();
257
- final CsvTokenizer tokenizer = new CsvTokenizer(new LineDecoder(input, task), task);
258
- final boolean allowOptionalColumns = task.getAllowOptionalColumns();
259
- final boolean allowExtraColumns = task.getAllowExtraColumns();
260
- final boolean stopOnInvalidRecord = task.getStopOnInvalidRecord();
261
- final int skipHeaderLines = task.getSkipHeaderLines();
262
-
263
- try (final PageBuilder pageBuilder = new PageBuilder(Exec.getBufferAllocator(), schema, output)) {
264
- while (tokenizer.nextFile()) {
265
- // skip the header lines for each file
266
- for (int skipHeaderLineNumber = skipHeaderLines; skipHeaderLineNumber > 0; skipHeaderLineNumber--) {
267
- if (!tokenizer.skipHeaderLine()) {
268
- break;
269
- }
270
- }
271
-
272
- if (!tokenizer.nextRecord()) {
273
- // empty file
274
- continue;
275
- }
276
-
277
- while (true) {
278
- boolean hasNextRecord;
279
-
280
- try {
281
- schema.visitColumns(new ColumnVisitor() {
282
- public void booleanColumn(Column column)
283
- {
284
- String v = nextColumn();
285
- if (v == null) {
286
- pageBuilder.setNull(column);
287
- } else {
288
- pageBuilder.setBoolean(column, TRUE_STRINGS.contains(v));
289
- }
290
- }
291
-
292
- public void longColumn(Column column)
293
- {
294
- String v = nextColumn();
295
- if (v == null) {
296
- pageBuilder.setNull(column);
297
- } else {
298
- try {
299
- pageBuilder.setLong(column, Long.parseLong(v));
300
- } catch (NumberFormatException e) {
301
- // TODO support default value
302
- throw new CsvRecordValidateException(e);
303
- }
304
- }
305
- }
306
-
307
- public void doubleColumn(Column column)
308
- {
309
- String v = nextColumn();
310
- if (v == null) {
311
- pageBuilder.setNull(column);
312
- } else {
313
- try {
314
- pageBuilder.setDouble(column, Double.parseDouble(v));
315
- } catch (NumberFormatException e) {
316
- // TODO support default value
317
- throw new CsvRecordValidateException(e);
318
- }
319
- }
320
- }
321
-
322
- public void stringColumn(Column column)
323
- {
324
- String v = nextColumn();
325
- if (v == null) {
326
- pageBuilder.setNull(column);
327
- } else {
328
- pageBuilder.setString(column, v);
329
- }
330
- }
331
-
332
- public void timestampColumn(Column column)
333
- {
334
- String v = nextColumn();
335
- if (v == null) {
336
- pageBuilder.setNull(column);
337
- } else {
338
- try {
339
- pageBuilder.setTimestamp(column, timestampParsers[column.getIndex()].parse(v));
340
- } catch (TimestampParseException e) {
341
- // TODO support default value
342
- throw new CsvRecordValidateException(e);
343
- }
344
- }
345
- }
346
-
347
- public void jsonColumn(Column column)
348
- {
349
- String v = nextColumn();
350
- if (v == null) {
351
- pageBuilder.setNull(column);
352
- } else {
353
- try {
354
- pageBuilder.setJson(column, jsonParser.parse(v));
355
- } catch (JsonParseException e) {
356
- // TODO support default value
357
- throw new CsvRecordValidateException(e);
358
- }
359
- }
360
- }
361
-
362
- private String nextColumn()
363
- {
364
- if (allowOptionalColumns && !tokenizer.hasNextColumn()) {
365
- //TODO warning
366
- return null;
367
- }
368
- return tokenizer.nextColumnOrNull();
369
- }
370
- });
371
-
372
- try {
373
- hasNextRecord = tokenizer.nextRecord();
374
- } catch (CsvTokenizer.TooManyColumnsException ex) {
375
- if (allowExtraColumns) {
376
- String tooManyColumnsLine = tokenizer.skipCurrentLine();
377
- // TODO warning
378
- hasNextRecord = tokenizer.nextRecord();
379
- } else {
380
- // this line will be skipped at the following catch section
381
- throw ex;
382
- }
383
- }
384
- pageBuilder.addRecord();
385
-
386
- } catch (CsvTokenizer.InvalidFormatException | CsvTokenizer.InvalidValueException | CsvRecordValidateException e) {
387
- String skippedLine = tokenizer.skipCurrentLine();
388
- long lineNumber = tokenizer.getCurrentLineNumber();
389
- if (stopOnInvalidRecord) {
390
- throw new DataException(String.format("Invalid record at line %d: %s", lineNumber, skippedLine), e);
391
- }
392
- log.warn(String.format("Skipped line %d (%s): %s", lineNumber, e.getMessage(), skippedLine));
393
- //exec.notice().skippedLine(skippedLine);
394
-
395
- hasNextRecord = tokenizer.nextRecord();
396
- }
397
-
398
- if (!hasNextRecord) {
399
- break;
400
- }
401
- }
402
- }
403
-
404
- pageBuilder.finish();
405
- }
406
- }
407
-
408
- static class CsvRecordValidateException
409
- extends DataException
410
- {
411
- CsvRecordValidateException(Throwable cause)
412
- {
413
- super(cause);
414
- }
415
- }
416
- }
@@ -1,545 +0,0 @@
1
- package org.embulk.standards;
2
-
3
- import com.google.common.base.Preconditions;
4
- import java.util.List;
5
- import java.util.ArrayList;
6
- import java.util.Deque;
7
- import java.util.ArrayDeque;
8
- import org.embulk.spi.DataException;
9
- import org.embulk.spi.util.LineDecoder;
10
- import org.embulk.config.ConfigException;
11
- import org.embulk.standards.CsvParserPlugin.QuotesInQuotedFields;
12
-
13
- public class CsvTokenizer
14
- {
15
- static enum RecordState
16
- {
17
- NOT_END, END,
18
- }
19
-
20
- static enum ColumnState
21
- {
22
- BEGIN, VALUE, QUOTED_VALUE, AFTER_QUOTED_VALUE, FIRST_TRIM, LAST_TRIM_OR_VALUE,
23
- }
24
-
25
- private static final char END_OF_LINE = '\0';
26
- static final char NO_QUOTE = '\0';
27
- static final char NO_ESCAPE = '\0';
28
-
29
- private final char delimiterChar;
30
- private final String delimiterFollowingString;
31
- private final char quote;
32
- private final char escape;
33
- private final String newline;
34
- private final boolean trimIfNotQuoted;
35
- private final QuotesInQuotedFields quotesInQuotedFields;
36
- private final long maxQuotedSizeLimit;
37
- private final String commentLineMarker;
38
- private final LineDecoder input;
39
- private final String nullStringOrNull;
40
-
41
- private RecordState recordState = RecordState.END; // initial state is end of a record. nextRecord() must be called first
42
- private long lineNumber = 0;
43
-
44
- private String line = null;
45
- private int linePos = 0;
46
- private boolean wasQuotedColumn = false;
47
- private List<String> quotedValueLines = new ArrayList<>();
48
- private Deque<String> unreadLines = new ArrayDeque<>();
49
-
50
- public CsvTokenizer(LineDecoder input, CsvParserPlugin.PluginTask task)
51
- {
52
- String delimiter = task.getDelimiter();
53
- if (delimiter.length() == 0) {
54
- throw new ConfigException("Empty delimiter is not allowed");
55
- } else {
56
- this.delimiterChar = delimiter.charAt(0);
57
- if (delimiter.length() > 1) {
58
- delimiterFollowingString = delimiter.substring(1);
59
- } else {
60
- delimiterFollowingString = null;
61
- }
62
- }
63
- quote = task.getQuoteChar().or(CsvParserPlugin.QuoteCharacter.noQuote()).getCharacter();
64
- escape = task.getEscapeChar().or(CsvParserPlugin.EscapeCharacter.noEscape()).getCharacter();
65
- newline = task.getNewline().getString();
66
- trimIfNotQuoted = task.getTrimIfNotQuoted();
67
- quotesInQuotedFields = task.getQuotesInQuotedFields();
68
- if (trimIfNotQuoted && quotesInQuotedFields != QuotesInQuotedFields.ACCEPT_ONLY_RFC4180_ESCAPED) {
69
- // The combination makes some syntax very ambiguous such as:
70
- // val1, \"\"val2\"\" ,val3
71
- throw new ConfigException("[quotes_in_quoted_fields != ACCEPT_ONLY_RFC4180_ESCAPED] is not allowed to specify with [trim_if_not_quoted = true]");
72
- }
73
- maxQuotedSizeLimit = task.getMaxQuotedSizeLimit();
74
- commentLineMarker = task.getCommentLineMarker().orNull();
75
- nullStringOrNull = task.getNullString().orNull();
76
- this.input = input;
77
- }
78
-
79
- public long getCurrentLineNumber()
80
- {
81
- return lineNumber;
82
- }
83
-
84
- public boolean skipHeaderLine()
85
- {
86
- boolean skipped = input.poll() != null;
87
- if (skipped) {
88
- lineNumber++;
89
- }
90
- return skipped;
91
- }
92
-
93
- // returns skipped line
94
- public String skipCurrentLine()
95
- {
96
- String skippedLine;
97
- if (quotedValueLines.isEmpty()) {
98
- skippedLine = line;
99
- } else {
100
- // recover lines of quoted value
101
- skippedLine = quotedValueLines.remove(0); // TODO optimize performance
102
- unreadLines.addAll(quotedValueLines);
103
- lineNumber -= quotedValueLines.size();
104
- if (line != null) {
105
- unreadLines.add(line);
106
- lineNumber -= 1;
107
- }
108
- quotedValueLines.clear();
109
- }
110
- recordState = RecordState.END;
111
- return skippedLine;
112
- }
113
-
114
- public boolean nextFile()
115
- {
116
- boolean next = input.nextFile();
117
- if (next) {
118
- lineNumber = 0;
119
- }
120
- return next;
121
- }
122
-
123
- // used by guess-csv
124
- public boolean nextRecord()
125
- {
126
- return nextRecord(true);
127
- }
128
-
129
- public boolean nextRecord(boolean skipEmptyLine)
130
- {
131
- // If at the end of record, read the next line and initialize the state
132
- if (recordState != RecordState.END) {
133
- throw new TooManyColumnsException("Too many columns");
134
- }
135
-
136
- boolean hasNext = nextLine(skipEmptyLine);
137
- if (hasNext) {
138
- recordState = RecordState.NOT_END;
139
- return true;
140
- } else {
141
- return false;
142
- }
143
- }
144
-
145
- private boolean nextLine(boolean skipEmptyLine)
146
- {
147
- while (true) {
148
- if (!unreadLines.isEmpty()) {
149
- line = unreadLines.removeFirst();
150
- } else {
151
- line = input.poll();
152
- if (line == null) {
153
- return false;
154
- }
155
- }
156
- linePos = 0;
157
- lineNumber++;
158
-
159
- boolean skip = skipEmptyLine && (
160
- line.isEmpty() ||
161
- (commentLineMarker != null && line.startsWith(commentLineMarker)));
162
- if (!skip) {
163
- return true;
164
- }
165
- }
166
- }
167
-
168
- public boolean hasNextColumn()
169
- {
170
- return recordState == RecordState.NOT_END;
171
- }
172
-
173
- public String nextColumn()
174
- {
175
- if (!hasNextColumn()) {
176
- throw new TooFewColumnsException("Too few columns");
177
- }
178
-
179
- // reset last state
180
- wasQuotedColumn = false;
181
- quotedValueLines.clear();
182
-
183
- // local state
184
- int valueStartPos = linePos;
185
- int valueEndPos = 0; // initialized by VALUE state and used by LAST_TRIM_OR_VALUE and
186
- StringBuilder quotedValue = null; // initial by VALUE or FIRST_TRIM state and used by QUOTED_VALUE state
187
- ColumnState columnState = ColumnState.BEGIN;
188
-
189
- while (true) {
190
- final char c = nextChar();
191
-
192
- switch (columnState) {
193
- case BEGIN:
194
- // TODO optimization: state is BEGIN only at the first character of a column.
195
- // this block can be out of the looop.
196
- if (isDelimiter(c)) {
197
- // empty value
198
- if (delimiterFollowingString == null) {
199
- return "";
200
- } else if (isDelimiterFollowingFrom(linePos)) {
201
- linePos += delimiterFollowingString.length();
202
- return "";
203
- }
204
- // not a delimiter
205
- }
206
- if (isEndOfLine(c)) {
207
- // empty value
208
- recordState = RecordState.END;
209
- return "";
210
-
211
- } else if (isSpace(c) && trimIfNotQuoted) {
212
- columnState = ColumnState.FIRST_TRIM;
213
-
214
- } else if (isQuote(c)) {
215
- valueStartPos = linePos; // == 1
216
- wasQuotedColumn = true;
217
- quotedValue = new StringBuilder();
218
- columnState = ColumnState.QUOTED_VALUE;
219
-
220
- } else {
221
- columnState = ColumnState.VALUE;
222
- }
223
- break;
224
-
225
- case FIRST_TRIM:
226
- if (isDelimiter(c)) {
227
- // empty value
228
- if (delimiterFollowingString == null) {
229
- return "";
230
- } else if (isDelimiterFollowingFrom(linePos)) {
231
- linePos += delimiterFollowingString.length();
232
- return "";
233
- }
234
- // not a delimiter
235
- }
236
- if (isEndOfLine(c)) {
237
- // empty value
238
- recordState = RecordState.END;
239
- return "";
240
-
241
- } else if (isQuote(c)) {
242
- // column has heading spaces and quoted. TODO should this be rejected?
243
- valueStartPos = linePos;
244
- wasQuotedColumn = true;
245
- quotedValue = new StringBuilder();
246
- columnState = ColumnState.QUOTED_VALUE;
247
-
248
- } else if (isSpace(c)) {
249
- // skip this character
250
-
251
- } else {
252
- valueStartPos = linePos - 1;
253
- columnState = ColumnState.VALUE;
254
- }
255
- break;
256
-
257
- case VALUE:
258
- if (isDelimiter(c)) {
259
- if (delimiterFollowingString == null) {
260
- return line.substring(valueStartPos, linePos - 1);
261
- } else if (isDelimiterFollowingFrom(linePos)) {
262
- String value = line.substring(valueStartPos, linePos - 1);
263
- linePos += delimiterFollowingString.length();
264
- return value;
265
- }
266
- // not a delimiter
267
- }
268
- if (isEndOfLine(c)) {
269
- recordState = RecordState.END;
270
- return line.substring(valueStartPos, linePos);
271
-
272
- } else if (isSpace(c) && trimIfNotQuoted) {
273
- valueEndPos = linePos - 1; // this is possibly end of value
274
- columnState = ColumnState.LAST_TRIM_OR_VALUE;
275
-
276
- // TODO not implemented yet foo""bar""baz -> [foo, bar, baz].append
277
- //} else if (isQuote(c)) {
278
- // // In RFC4180, If fields are not enclosed with double quotes, then
279
- // // double quotes may not appear inside the fields. But they are often
280
- // // included in the fields. We should care about them later.
281
-
282
- } else {
283
- // keep VALUE state
284
- }
285
- break;
286
-
287
- case LAST_TRIM_OR_VALUE:
288
- if (isDelimiter(c)) {
289
- if (delimiterFollowingString == null) {
290
- return line.substring(valueStartPos, valueEndPos);
291
- } else if (isDelimiterFollowingFrom(linePos)) {
292
- linePos += delimiterFollowingString.length();
293
- return line.substring(valueStartPos, valueEndPos);
294
- } else {
295
- // not a delimiter
296
- }
297
- }
298
- if (isEndOfLine(c)) {
299
- recordState = RecordState.END;
300
- return line.substring(valueStartPos, valueEndPos);
301
-
302
- } else if (isSpace(c)) {
303
- // keep LAST_TRIM_OR_VALUE state
304
-
305
- } else {
306
- // this spaces are not trailing spaces. go back to VALUE state
307
- columnState = ColumnState.VALUE;
308
- }
309
- break;
310
-
311
- case QUOTED_VALUE:
312
- if (isEndOfLine(c)) {
313
- // multi-line quoted value
314
- quotedValue.append(line.substring(valueStartPos, linePos));
315
- quotedValue.append(newline);
316
- quotedValueLines.add(line);
317
- if (!nextLine(false)) {
318
- throw new InvalidValueException("Unexpected end of line during parsing a quoted value");
319
- }
320
- valueStartPos = 0;
321
-
322
- } else if (isQuote(c)) {
323
- char next = peekNextChar();
324
- final char nextNext = peekNextNextChar();
325
- if (isQuote(next) &&
326
- (quotesInQuotedFields != QuotesInQuotedFields.ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS ||
327
- (!isDelimiter(nextNext) && !isEndOfLine(nextNext)))) {
328
- // Escaped by preceding it with another quote.
329
- // A quote just before a delimiter or an end of line is recognized as a functional quote,
330
- // not just as a non-escaped stray "quote character" included the field, even if
331
- // ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS is specified.
332
- quotedValue.append(line.substring(valueStartPos, linePos));
333
- valueStartPos = ++linePos;
334
- } else if (quotesInQuotedFields == QuotesInQuotedFields.ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS &&
335
- !(isDelimiter(next) || isEndOfLine(next))) {
336
- // A non-escaped stray "quote character" in the field is processed as a regular character
337
- // if ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS is specified,
338
- if ((linePos - valueStartPos) + quotedValue.length() > maxQuotedSizeLimit) {
339
- throw new QuotedSizeLimitExceededException("The size of the quoted value exceeds the limit size (" + maxQuotedSizeLimit + ")");
340
- }
341
- } else {
342
- quotedValue.append(line.substring(valueStartPos, linePos - 1));
343
- columnState = ColumnState.AFTER_QUOTED_VALUE;
344
- }
345
-
346
- } else if (isEscape(c)) { // isQuote must be checked first in case of quote == escape
347
- // In RFC 4180, CSV's escape char is '\"'. But '\\' is often used.
348
- char next = peekNextChar();
349
- if (isEndOfLine(c)) {
350
- // escape end of line. TODO assuming multi-line quoted value without newline?
351
- quotedValue.append(line.substring(valueStartPos, linePos));
352
- quotedValueLines.add(line);
353
- if (!nextLine(false)) {
354
- throw new InvalidValueException("Unexpected end of line during parsing a quoted value");
355
- }
356
- valueStartPos = 0;
357
- } else if (isQuote(next) || isEscape(next)) { // escaped quote
358
- quotedValue.append(line.substring(valueStartPos, linePos - 1));
359
- quotedValue.append(next);
360
- valueStartPos = ++linePos;
361
- }
362
-
363
- } else {
364
- if ((linePos - valueStartPos) + quotedValue.length() > maxQuotedSizeLimit) {
365
- throw new QuotedSizeLimitExceededException("The size of the quoted value exceeds the limit size ("+maxQuotedSizeLimit+")");
366
- }
367
- // keep QUOTED_VALUE state
368
- }
369
- break;
370
-
371
- case AFTER_QUOTED_VALUE:
372
- if (isDelimiter(c)) {
373
- if (delimiterFollowingString == null) {
374
- return quotedValue.toString();
375
- } else if (isDelimiterFollowingFrom(linePos)) {
376
- linePos += delimiterFollowingString.length();
377
- return quotedValue.toString();
378
- }
379
- // not a delimiter
380
- }
381
- if (isEndOfLine(c)) {
382
- recordState = RecordState.END;
383
- return quotedValue.toString();
384
-
385
- } else if (isSpace(c)) {
386
- // column has trailing spaces and quoted. TODO should this be rejected?
387
-
388
- } else {
389
- throw new InvalidValueException(String.format("Unexpected extra character '%c' after a value quoted by '%c'", c, quote));
390
- }
391
- break;
392
-
393
- default:
394
- assert false;
395
- }
396
- }
397
- }
398
-
399
- public String nextColumnOrNull()
400
- {
401
- String v = nextColumn();
402
- if (nullStringOrNull == null) {
403
- if (v.isEmpty()) {
404
- if (wasQuotedColumn) {
405
- return "";
406
- }
407
- else {
408
- return null;
409
- }
410
- }
411
- else {
412
- return v;
413
- }
414
- }
415
- else {
416
- if (v.equals(nullStringOrNull)) {
417
- return null;
418
- }
419
- else {
420
- return v;
421
- }
422
- }
423
- }
424
-
425
- public boolean wasQuotedColumn()
426
- {
427
- return wasQuotedColumn;
428
- }
429
-
430
- private char nextChar()
431
- {
432
- Preconditions.checkState(line != null, "nextColumn is called after end of file");
433
-
434
- if (linePos >= line.length()) {
435
- return END_OF_LINE;
436
- } else {
437
- return line.charAt(linePos++);
438
- }
439
- }
440
-
441
- private char peekNextChar()
442
- {
443
- Preconditions.checkState(line != null, "peekNextChar is called after end of file");
444
-
445
- if (linePos >= line.length()) {
446
- return END_OF_LINE;
447
- } else {
448
- return line.charAt(linePos);
449
- }
450
- }
451
-
452
- private char peekNextNextChar()
453
- {
454
- Preconditions.checkState(line != null, "peekNextNextChar is called after end of file");
455
-
456
- if (linePos + 1 >= line.length()) {
457
- return END_OF_LINE;
458
- } else {
459
- return line.charAt(linePos + 1);
460
- }
461
- }
462
-
463
- private boolean isSpace(char c)
464
- {
465
- return c == ' ';
466
- }
467
-
468
- private boolean isDelimiterFollowingFrom(int pos)
469
- {
470
- if (line.length() < pos + delimiterFollowingString.length()) {
471
- return false;
472
- }
473
- for (int i = 0; i < delimiterFollowingString.length(); i++) {
474
- if (delimiterFollowingString.charAt(i) != line.charAt(pos + i)) {
475
- return false;
476
- }
477
- }
478
- return true;
479
- }
480
-
481
- private boolean isDelimiter(char c)
482
- {
483
- return c == delimiterChar;
484
- }
485
-
486
- private boolean isEndOfLine(char c)
487
- {
488
- return c == END_OF_LINE;
489
- }
490
-
491
- private boolean isQuote(char c)
492
- {
493
- return quote != NO_QUOTE && c == quote;
494
- }
495
-
496
- private boolean isEscape(char c)
497
- {
498
- return escape != NO_ESCAPE && c == escape;
499
- }
500
-
501
- public static class InvalidFormatException
502
- extends DataException
503
- {
504
- public InvalidFormatException(String message)
505
- {
506
- super(message);
507
- }
508
- }
509
-
510
- public static class InvalidValueException
511
- extends DataException
512
- {
513
- public InvalidValueException(String message)
514
- {
515
- super(message);
516
- }
517
- }
518
-
519
- public static class QuotedSizeLimitExceededException
520
- extends InvalidValueException
521
- {
522
- public QuotedSizeLimitExceededException(String message)
523
- {
524
- super(message);
525
- }
526
- }
527
-
528
- public class TooManyColumnsException
529
- extends InvalidFormatException
530
- {
531
- public TooManyColumnsException(String message)
532
- {
533
- super(message);
534
- }
535
- }
536
-
537
- public class TooFewColumnsException
538
- extends InvalidFormatException
539
- {
540
- public TooFewColumnsException(String message)
541
- {
542
- super(message);
543
- }
544
- }
545
- }