embulk 0.8.38-java → 0.10.27-java
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +5 -5
- data/Gemfile +1 -1
- data/LICENSE +202 -0
- data/embulk.gemspec +34 -33
- data/lib/embulk.rb +5 -61
- data/lib/embulk/buffer.rb +1 -2
- data/lib/embulk/gem_version.rb +3 -0
- data/lib/embulk/guess/charset.rb +2 -11
- data/lib/embulk/java/bootstrap.rb +0 -1
- data/lib/embulk/java_plugin.rb +9 -1
- data/lib/embulk/logger.rb +2 -1
- data/lib/embulk/page_builder.rb +2 -2
- data/lib/embulk/plugin.rb +2 -2
- data/lib/embulk/schema.rb +3 -4
- data/lib/embulk/version.rb +43 -19
- metadata +23 -761
- data/.gitignore +0 -15
- data/.ruby-version +0 -1
- data/.travis.yml +0 -28
- data/COPYING +0 -14
- data/Gemfile.lock +0 -30
- data/README.md +0 -229
- data/Rakefile +0 -26
- data/appveyor.yml +0 -28
- data/bin/embulk +0 -139
- data/build.gradle +0 -419
- data/embulk-cli/build.gradle +0 -9
- data/embulk-cli/src/main/bat/selfrun.bat +0 -107
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkArguments.java +0 -54
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkCommandLine.java +0 -227
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkCommandLineException.java +0 -25
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkExample.java +0 -86
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkMigrate.java +0 -480
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkNew.java +0 -419
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkRun.java +0 -786
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkSelfUpdate.java +0 -235
- data/embulk-cli/src/main/java/org/embulk/cli/EmbulkSubcommand.java +0 -47
- data/embulk-cli/src/main/java/org/embulk/cli/Main.java +0 -31
- data/embulk-cli/src/main/java/org/embulk/cli/parse/AbstractHelpLineDefinition.java +0 -15
- data/embulk-cli/src/main/java/org/embulk/cli/parse/CliHelpFormatterWithHelpMessages.java +0 -141
- data/embulk-cli/src/main/java/org/embulk/cli/parse/CliOptionsWithHelpMessages.java +0 -45
- data/embulk-cli/src/main/java/org/embulk/cli/parse/EmbulkCommandLineHelpRequired.java +0 -10
- data/embulk-cli/src/main/java/org/embulk/cli/parse/EmbulkCommandLineParseException.java +0 -25
- data/embulk-cli/src/main/java/org/embulk/cli/parse/EmbulkCommandLineParser.java +0 -187
- data/embulk-cli/src/main/java/org/embulk/cli/parse/HelpMessageAsCliOption.java +0 -36
- data/embulk-cli/src/main/java/org/embulk/cli/parse/HelpMessageLineDefinition.java +0 -20
- data/embulk-cli/src/main/java/org/embulk/cli/parse/OptionBehavior.java +0 -39
- data/embulk-cli/src/main/java/org/embulk/cli/parse/OptionDefinition.java +0 -120
- data/embulk-cli/src/main/sh/selfrun.sh +0 -60
- data/embulk-cli/src/test/java/org/embulk/cli/DummyMain.java +0 -23
- data/embulk-cli/src/test/java/org/embulk/cli/SelfrunTest.java +0 -296
- data/embulk-core/build.gradle +0 -83
- data/embulk-core/src/main/java/org/embulk/EmbulkEmbed.java +0 -321
- data/embulk-core/src/main/java/org/embulk/EmbulkRunner.java +0 -531
- data/embulk-core/src/main/java/org/embulk/EmbulkService.java +0 -78
- data/embulk-core/src/main/java/org/embulk/EmbulkSetup.java +0 -49
- data/embulk-core/src/main/java/org/embulk/EmbulkVersion.java +0 -109
- data/embulk-core/src/main/java/org/embulk/command/PreviewPrinter.java +0 -87
- data/embulk-core/src/main/java/org/embulk/command/TablePreviewPrinter.java +0 -107
- data/embulk-core/src/main/java/org/embulk/command/VerticalPreviewPrinter.java +0 -47
- data/embulk-core/src/main/java/org/embulk/config/CommitReport.java +0 -36
- data/embulk-core/src/main/java/org/embulk/config/Config.java +0 -15
- data/embulk-core/src/main/java/org/embulk/config/ConfigDefault.java +0 -15
- data/embulk-core/src/main/java/org/embulk/config/ConfigDiff.java +0 -32
- data/embulk-core/src/main/java/org/embulk/config/ConfigException.java +0 -26
- data/embulk-core/src/main/java/org/embulk/config/ConfigInject.java +0 -14
- data/embulk-core/src/main/java/org/embulk/config/ConfigLoader.java +0 -149
- data/embulk-core/src/main/java/org/embulk/config/ConfigSource.java +0 -34
- data/embulk-core/src/main/java/org/embulk/config/DataSource.java +0 -41
- data/embulk-core/src/main/java/org/embulk/config/DataSourceImpl.java +0 -243
- data/embulk-core/src/main/java/org/embulk/config/DataSourceSerDe.java +0 -84
- data/embulk-core/src/main/java/org/embulk/config/GenericTypeReference.java +0 -20
- data/embulk-core/src/main/java/org/embulk/config/ModelManager.java +0 -123
- data/embulk-core/src/main/java/org/embulk/config/Task.java +0 -10
- data/embulk-core/src/main/java/org/embulk/config/TaskInvocationHandler.java +0 -180
- data/embulk-core/src/main/java/org/embulk/config/TaskReport.java +0 -32
- data/embulk-core/src/main/java/org/embulk/config/TaskSerDe.java +0 -349
- data/embulk-core/src/main/java/org/embulk/config/TaskSource.java +0 -34
- data/embulk-core/src/main/java/org/embulk/config/TaskValidationException.java +0 -38
- data/embulk-core/src/main/java/org/embulk/config/TaskValidator.java +0 -24
- data/embulk-core/src/main/java/org/embulk/config/UserDataException.java +0 -4
- data/embulk-core/src/main/java/org/embulk/config/UserDataExceptions.java +0 -17
- data/embulk-core/src/main/java/org/embulk/config/YamlTagResolver.java +0 -53
- data/embulk-core/src/main/java/org/embulk/exec/BufferFileInputPlugin.java +0 -88
- data/embulk-core/src/main/java/org/embulk/exec/BulkLoader.java +0 -754
- data/embulk-core/src/main/java/org/embulk/exec/ConfigurableGuessInputPlugin.java +0 -9
- data/embulk-core/src/main/java/org/embulk/exec/ExecModule.java +0 -53
- data/embulk-core/src/main/java/org/embulk/exec/ExecutionInterruptedException.java +0 -10
- data/embulk-core/src/main/java/org/embulk/exec/ExecutionResult.java +0 -33
- data/embulk-core/src/main/java/org/embulk/exec/ExtensionServiceLoaderModule.java +0 -43
- data/embulk-core/src/main/java/org/embulk/exec/ForGuess.java +0 -16
- data/embulk-core/src/main/java/org/embulk/exec/ForSystemConfig.java +0 -16
- data/embulk-core/src/main/java/org/embulk/exec/GuessExecutor.java +0 -309
- data/embulk-core/src/main/java/org/embulk/exec/LocalExecutorPlugin.java +0 -563
- data/embulk-core/src/main/java/org/embulk/exec/LoggerProvider.java +0 -68
- data/embulk-core/src/main/java/org/embulk/exec/NoSampleException.java +0 -10
- data/embulk-core/src/main/java/org/embulk/exec/PartialExecutionException.java +0 -26
- data/embulk-core/src/main/java/org/embulk/exec/PooledBufferAllocator.java +0 -77
- data/embulk-core/src/main/java/org/embulk/exec/PreviewExecutor.java +0 -222
- data/embulk-core/src/main/java/org/embulk/exec/PreviewResult.java +0 -27
- data/embulk-core/src/main/java/org/embulk/exec/PreviewedNoticeError.java +0 -17
- data/embulk-core/src/main/java/org/embulk/exec/ResumeState.java +0 -100
- data/embulk-core/src/main/java/org/embulk/exec/SamplingParserPlugin.java +0 -215
- data/embulk-core/src/main/java/org/embulk/exec/SetCurrentThreadName.java +0 -22
- data/embulk-core/src/main/java/org/embulk/exec/SkipTransactionException.java +0 -23
- data/embulk-core/src/main/java/org/embulk/exec/SystemConfigModule.java +0 -24
- data/embulk-core/src/main/java/org/embulk/exec/TempFileAllocator.java +0 -35
- data/embulk-core/src/main/java/org/embulk/exec/TransactionStage.java +0 -27
- data/embulk-core/src/main/java/org/embulk/jruby/JRubyPluginSource.java +0 -76
- data/embulk-core/src/main/java/org/embulk/jruby/JRubyScriptingModule.java +0 -395
- data/embulk-core/src/main/java/org/embulk/plugin/BuiltinPluginSourceModule.java +0 -17
- data/embulk-core/src/main/java/org/embulk/plugin/DefaultPluginType.java +0 -50
- data/embulk-core/src/main/java/org/embulk/plugin/InjectedPluginSource.java +0 -100
- data/embulk-core/src/main/java/org/embulk/plugin/MavenPluginType.java +0 -112
- data/embulk-core/src/main/java/org/embulk/plugin/PluginClassLoader.java +0 -993
- data/embulk-core/src/main/java/org/embulk/plugin/PluginClassLoaderFactory.java +0 -16
- data/embulk-core/src/main/java/org/embulk/plugin/PluginClassLoaderModule.java +0 -102
- data/embulk-core/src/main/java/org/embulk/plugin/PluginManager.java +0 -78
- data/embulk-core/src/main/java/org/embulk/plugin/PluginSource.java +0 -49
- data/embulk-core/src/main/java/org/embulk/plugin/PluginSourceNotMatchException.java +0 -25
- data/embulk-core/src/main/java/org/embulk/plugin/PluginType.java +0 -122
- data/embulk-core/src/main/java/org/embulk/plugin/compat/InputPluginWrapper.java +0 -102
- data/embulk-core/src/main/java/org/embulk/plugin/compat/PluginWrappers.java +0 -30
- data/embulk-core/src/main/java/org/embulk/plugin/compat/TransactionalFileInputWrapper.java +0 -96
- data/embulk-core/src/main/java/org/embulk/plugin/compat/TransactionalFileOutputWrapper.java +0 -102
- data/embulk-core/src/main/java/org/embulk/plugin/compat/TransactionalPageOutputWrapper.java +0 -95
- data/embulk-core/src/main/java/org/embulk/plugin/jar/InvalidJarPluginException.java +0 -14
- data/embulk-core/src/main/java/org/embulk/plugin/jar/JarPluginLoader.java +0 -232
- data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenArtifactFinder.java +0 -134
- data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenArtifactNotFoundException.java +0 -20
- data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenPluginSource.java +0 -187
- data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenPluginSourceModule.java +0 -22
- data/embulk-core/src/main/java/org/embulk/plugin/maven/MavenRepositoryNotFoundException.java +0 -31
- data/embulk-core/src/main/java/org/embulk/spi/AbortTransactionResource.java +0 -36
- data/embulk-core/src/main/java/org/embulk/spi/Buffer.java +0 -148
- data/embulk-core/src/main/java/org/embulk/spi/BufferAllocator.java +0 -8
- data/embulk-core/src/main/java/org/embulk/spi/CloseResource.java +0 -42
- data/embulk-core/src/main/java/org/embulk/spi/Column.java +0 -95
- data/embulk-core/src/main/java/org/embulk/spi/ColumnConfig.java +0 -112
- data/embulk-core/src/main/java/org/embulk/spi/ColumnVisitor.java +0 -16
- data/embulk-core/src/main/java/org/embulk/spi/DataException.java +0 -23
- data/embulk-core/src/main/java/org/embulk/spi/DecoderPlugin.java +0 -16
- data/embulk-core/src/main/java/org/embulk/spi/EncoderPlugin.java +0 -16
- data/embulk-core/src/main/java/org/embulk/spi/Exec.java +0 -113
- data/embulk-core/src/main/java/org/embulk/spi/ExecAction.java +0 -6
- data/embulk-core/src/main/java/org/embulk/spi/ExecSession.java +0 -220
- data/embulk-core/src/main/java/org/embulk/spi/ExecutorPlugin.java +0 -19
- data/embulk-core/src/main/java/org/embulk/spi/Extension.java +0 -44
- data/embulk-core/src/main/java/org/embulk/spi/FileInput.java +0 -11
- data/embulk-core/src/main/java/org/embulk/spi/FileInputPlugin.java +0 -30
- data/embulk-core/src/main/java/org/embulk/spi/FileInputRunner.java +0 -169
- data/embulk-core/src/main/java/org/embulk/spi/FileOutput.java +0 -13
- data/embulk-core/src/main/java/org/embulk/spi/FileOutputPlugin.java +0 -28
- data/embulk-core/src/main/java/org/embulk/spi/FileOutputRunner.java +0 -199
- data/embulk-core/src/main/java/org/embulk/spi/FilterPlugin.java +0 -18
- data/embulk-core/src/main/java/org/embulk/spi/FormatterPlugin.java +0 -18
- data/embulk-core/src/main/java/org/embulk/spi/GuessPlugin.java +0 -9
- data/embulk-core/src/main/java/org/embulk/spi/InputPlugin.java +0 -33
- data/embulk-core/src/main/java/org/embulk/spi/OutputPlugin.java +0 -29
- data/embulk-core/src/main/java/org/embulk/spi/Page.java +0 -86
- data/embulk-core/src/main/java/org/embulk/spi/PageBuilder.java +0 -696
- data/embulk-core/src/main/java/org/embulk/spi/PageFormat.java +0 -47
- data/embulk-core/src/main/java/org/embulk/spi/PageOutput.java +0 -11
- data/embulk-core/src/main/java/org/embulk/spi/PageReader.java +0 -248
- data/embulk-core/src/main/java/org/embulk/spi/ParserPlugin.java +0 -17
- data/embulk-core/src/main/java/org/embulk/spi/ProcessState.java +0 -10
- data/embulk-core/src/main/java/org/embulk/spi/ProcessTask.java +0 -117
- data/embulk-core/src/main/java/org/embulk/spi/Schema.java +0 -139
- data/embulk-core/src/main/java/org/embulk/spi/SchemaConfig.java +0 -93
- data/embulk-core/src/main/java/org/embulk/spi/SchemaConfigException.java +0 -22
- data/embulk-core/src/main/java/org/embulk/spi/TaskState.java +0 -81
- data/embulk-core/src/main/java/org/embulk/spi/TempFileException.java +0 -19
- data/embulk-core/src/main/java/org/embulk/spi/TempFileSpace.java +0 -88
- data/embulk-core/src/main/java/org/embulk/spi/Transactional.java +0 -10
- data/embulk-core/src/main/java/org/embulk/spi/TransactionalFileInput.java +0 -17
- data/embulk-core/src/main/java/org/embulk/spi/TransactionalFileOutput.java +0 -19
- data/embulk-core/src/main/java/org/embulk/spi/TransactionalPageOutput.java +0 -17
- data/embulk-core/src/main/java/org/embulk/spi/json/JsonParseException.java +0 -17
- data/embulk-core/src/main/java/org/embulk/spi/json/JsonParser.java +0 -233
- data/embulk-core/src/main/java/org/embulk/spi/json/RubyValueApi.java +0 -100
- data/embulk-core/src/main/java/org/embulk/spi/time/DateTimeZoneSerDe.java +0 -55
- data/embulk-core/src/main/java/org/embulk/spi/time/Timestamp.java +0 -180
- data/embulk-core/src/main/java/org/embulk/spi/time/TimestampFormat.java +0 -127
- data/embulk-core/src/main/java/org/embulk/spi/time/TimestampFormatter.java +0 -125
- data/embulk-core/src/main/java/org/embulk/spi/time/TimestampParseException.java +0 -12
- data/embulk-core/src/main/java/org/embulk/spi/time/TimestampParser.java +0 -310
- data/embulk-core/src/main/java/org/embulk/spi/time/TimestampSerDe.java +0 -49
- data/embulk-core/src/main/java/org/embulk/spi/type/AbstractType.java +0 -58
- data/embulk-core/src/main/java/org/embulk/spi/type/BooleanType.java +0 -12
- data/embulk-core/src/main/java/org/embulk/spi/type/DoubleType.java +0 -12
- data/embulk-core/src/main/java/org/embulk/spi/type/JsonType.java +0 -14
- data/embulk-core/src/main/java/org/embulk/spi/type/LongType.java +0 -12
- data/embulk-core/src/main/java/org/embulk/spi/type/StringType.java +0 -12
- data/embulk-core/src/main/java/org/embulk/spi/type/TimestampType.java +0 -41
- data/embulk-core/src/main/java/org/embulk/spi/type/Type.java +0 -15
- data/embulk-core/src/main/java/org/embulk/spi/type/TypeDeserializer.java +0 -45
- data/embulk-core/src/main/java/org/embulk/spi/type/Types.java +0 -16
- data/embulk-core/src/main/java/org/embulk/spi/unit/ByteSize.java +0 -156
- data/embulk-core/src/main/java/org/embulk/spi/unit/LocalFile.java +0 -106
- data/embulk-core/src/main/java/org/embulk/spi/unit/LocalFileSerDe.java +0 -113
- data/embulk-core/src/main/java/org/embulk/spi/unit/ToString.java +0 -54
- data/embulk-core/src/main/java/org/embulk/spi/unit/ToStringMap.java +0 -34
- data/embulk-core/src/main/java/org/embulk/spi/util/CharsetSerDe.java +0 -55
- data/embulk-core/src/main/java/org/embulk/spi/util/Decoders.java +0 -81
- data/embulk-core/src/main/java/org/embulk/spi/util/DynamicColumnNotFoundException.java +0 -10
- data/embulk-core/src/main/java/org/embulk/spi/util/DynamicColumnSetter.java +0 -21
- data/embulk-core/src/main/java/org/embulk/spi/util/DynamicColumnSetterFactory.java +0 -134
- data/embulk-core/src/main/java/org/embulk/spi/util/DynamicPageBuilder.java +0 -200
- data/embulk-core/src/main/java/org/embulk/spi/util/Encoders.java +0 -81
- data/embulk-core/src/main/java/org/embulk/spi/util/Executors.java +0 -93
- data/embulk-core/src/main/java/org/embulk/spi/util/FileInputInputStream.java +0 -111
- data/embulk-core/src/main/java/org/embulk/spi/util/FileOutputOutputStream.java +0 -119
- data/embulk-core/src/main/java/org/embulk/spi/util/Filters.java +0 -100
- data/embulk-core/src/main/java/org/embulk/spi/util/InputStreamFileInput.java +0 -189
- data/embulk-core/src/main/java/org/embulk/spi/util/InputStreamTransactionalFileInput.java +0 -25
- data/embulk-core/src/main/java/org/embulk/spi/util/Inputs.java +0 -65
- data/embulk-core/src/main/java/org/embulk/spi/util/LineDecoder.java +0 -157
- data/embulk-core/src/main/java/org/embulk/spi/util/LineEncoder.java +0 -123
- data/embulk-core/src/main/java/org/embulk/spi/util/ListFileInput.java +0 -52
- data/embulk-core/src/main/java/org/embulk/spi/util/Newline.java +0 -38
- data/embulk-core/src/main/java/org/embulk/spi/util/OutputStreamFileOutput.java +0 -88
- data/embulk-core/src/main/java/org/embulk/spi/util/PagePrinter.java +0 -126
- data/embulk-core/src/main/java/org/embulk/spi/util/Pages.java +0 -149
- data/embulk-core/src/main/java/org/embulk/spi/util/ResumableInputStream.java +0 -168
- data/embulk-core/src/main/java/org/embulk/spi/util/RetryExecutor.java +0 -130
- data/embulk-core/src/main/java/org/embulk/spi/util/Timestamps.java +0 -53
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/AbstractDynamicColumnSetter.java +0 -94
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/BooleanColumnSetter.java +0 -71
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/DefaultValueSetter.java +0 -20
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/DoubleColumnSetter.java +0 -68
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/JsonColumnSetter.java +0 -64
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/LongColumnSetter.java +0 -78
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/NullDefaultValueSetter.java +0 -39
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/SkipColumnSetter.java +0 -68
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/StringColumnSetter.java +0 -63
- data/embulk-core/src/main/java/org/embulk/spi/util/dynamic/TimestampColumnSetter.java +0 -72
- data/embulk-core/src/main/resources/embulk/logback-color.xml +0 -72
- data/embulk-core/src/main/resources/embulk/logback-console.xml +0 -14
- data/embulk-core/src/main/resources/embulk/logback-file.xml +0 -23
- data/embulk-core/src/main/resources/embulk/parent_first_packages.properties +0 -73
- data/embulk-core/src/main/resources/embulk/parent_first_resources.properties +0 -29
- data/embulk-core/src/test/java/org/embulk/EmbulkTestRuntime.java +0 -122
- data/embulk-core/src/test/java/org/embulk/GuiceBinder.java +0 -72
- data/embulk-core/src/test/java/org/embulk/RandomManager.java +0 -53
- data/embulk-core/src/test/java/org/embulk/TestPluginSourceModule.java +0 -23
- data/embulk-core/src/test/java/org/embulk/TestUtilityModule.java +0 -17
- data/embulk-core/src/test/java/org/embulk/config/TestConfigLoader.java +0 -66
- data/embulk-core/src/test/java/org/embulk/config/TestConfigSource.java +0 -114
- data/embulk-core/src/test/java/org/embulk/config/TestTaskSource.java +0 -70
- data/embulk-core/src/test/java/org/embulk/plugin/MockPluginSource.java +0 -58
- data/embulk-core/src/test/java/org/embulk/plugin/TestPluginType.java +0 -83
- data/embulk-core/src/test/java/org/embulk/plugin/TestPluginTypeSerDe.java +0 -67
- data/embulk-core/src/test/java/org/embulk/plugin/jar/ExampleJarSpiV0.java +0 -9
- data/embulk-core/src/test/java/org/embulk/plugin/jar/JarBuilder.java +0 -101
- data/embulk-core/src/test/java/org/embulk/plugin/jar/TestJarPluginLoader.java +0 -60
- data/embulk-core/src/test/java/org/embulk/plugin/maven/TestMavenArtifactFinder.java +0 -41
- data/embulk-core/src/test/java/org/embulk/spi/MockFileOutput.java +0 -63
- data/embulk-core/src/test/java/org/embulk/spi/MockFormatterPlugin.java +0 -108
- data/embulk-core/src/test/java/org/embulk/spi/MockParserPlugin.java +0 -80
- data/embulk-core/src/test/java/org/embulk/spi/PageTestUtils.java +0 -59
- data/embulk-core/src/test/java/org/embulk/spi/TestBuffer.java +0 -24
- data/embulk-core/src/test/java/org/embulk/spi/TestFileInputInputStream.java +0 -89
- data/embulk-core/src/test/java/org/embulk/spi/TestFileInputRunner.java +0 -199
- data/embulk-core/src/test/java/org/embulk/spi/TestFileOutputRunner.java +0 -221
- data/embulk-core/src/test/java/org/embulk/spi/TestInputStreamFileInput.java +0 -188
- data/embulk-core/src/test/java/org/embulk/spi/TestPageBuilderReader.java +0 -411
- data/embulk-core/src/test/java/org/embulk/spi/json/TestJsonParser.java +0 -102
- data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestamp.java +0 -116
- data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestampFormatterParser.java +0 -75
- data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestampFormatterParserDeprecated.java +0 -67
- data/embulk-core/src/test/java/org/embulk/spi/time/TestTimestampParser.java +0 -232
- data/embulk-core/src/test/java/org/embulk/spi/type/TestTypeSerDe.java +0 -45
- data/embulk-core/src/test/java/org/embulk/spi/unit/TestByteSize.java +0 -79
- data/embulk-core/src/test/java/org/embulk/spi/util/TestLineDecoder.java +0 -237
- data/embulk-core/src/test/java/org/embulk/spi/util/TestLineEncoder.java +0 -123
- data/embulk-core/src/test/resources/m2.test/.gitignore +0 -1
- data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.jar +0 -0
- data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.jar.sha1 +0 -1
- data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.pom +0 -9
- data/embulk-core/src/test/resources/m2.test/org/embulk/example/embulk-example-maven-artifact/0.1.2/embulk-example-maven-artifact-0.1.2.pom.sha1 +0 -1
- data/embulk-docs/Makefile +0 -178
- data/embulk-docs/build.gradle +0 -41
- data/embulk-docs/make.bat +0 -243
- data/embulk-docs/push-gh-pages.sh +0 -49
- data/embulk-docs/src/_static/embulk-architecture.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-oneline-tr.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-oneline-wt.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-oneline.ai +0 -396
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq-tr-small.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq-tr.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq-wt.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq.ai +0 -417
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-sq.svg +0 -1
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-symbol-tr.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-symbol-wt.png +0 -0
- data/embulk-docs/src/_static/embulk-logo-v2/embulk-logo-v2-symbol.ai +1 -394
- data/embulk-docs/src/_static/embulk-logo.svg +0 -133
- data/embulk-docs/src/built-in.rst +0 -1017
- data/embulk-docs/src/conf.py +0 -260
- data/embulk-docs/src/customization.rst +0 -184
- data/embulk-docs/src/developers/index.rst +0 -45
- data/embulk-docs/src/index.rst +0 -102
- data/embulk-docs/src/logo.rst +0 -27
- data/embulk-docs/src/recipe.rst +0 -8
- data/embulk-docs/src/recipe/scheduled-csv-load-to-elasticsearch-kibana5.rst +0 -163
- data/embulk-docs/src/release.rst +0 -108
- data/embulk-docs/src/release/release-0.1.0.rst +0 -8
- data/embulk-docs/src/release/release-0.2.0.rst +0 -16
- data/embulk-docs/src/release/release-0.2.1.rst +0 -19
- data/embulk-docs/src/release/release-0.3.0.rst +0 -34
- data/embulk-docs/src/release/release-0.3.1.rst +0 -11
- data/embulk-docs/src/release/release-0.3.2.rst +0 -15
- data/embulk-docs/src/release/release-0.4.0.rst +0 -74
- data/embulk-docs/src/release/release-0.4.1.rst +0 -18
- data/embulk-docs/src/release/release-0.4.10.rst +0 -17
- data/embulk-docs/src/release/release-0.4.2.rst +0 -18
- data/embulk-docs/src/release/release-0.4.3.rst +0 -34
- data/embulk-docs/src/release/release-0.4.4.rst +0 -39
- data/embulk-docs/src/release/release-0.4.5.rst +0 -24
- data/embulk-docs/src/release/release-0.4.6.rst +0 -30
- data/embulk-docs/src/release/release-0.4.7.rst +0 -16
- data/embulk-docs/src/release/release-0.4.8.rst +0 -15
- data/embulk-docs/src/release/release-0.4.9.rst +0 -23
- data/embulk-docs/src/release/release-0.5.0.rst +0 -89
- data/embulk-docs/src/release/release-0.5.1.rst +0 -13
- data/embulk-docs/src/release/release-0.5.2.rst +0 -30
- data/embulk-docs/src/release/release-0.5.3.rst +0 -22
- data/embulk-docs/src/release/release-0.5.4.rst +0 -24
- data/embulk-docs/src/release/release-0.5.5.rst +0 -18
- data/embulk-docs/src/release/release-0.6.0.rst +0 -34
- data/embulk-docs/src/release/release-0.6.1.rst +0 -11
- data/embulk-docs/src/release/release-0.6.10.rst +0 -15
- data/embulk-docs/src/release/release-0.6.11.rst +0 -19
- data/embulk-docs/src/release/release-0.6.12.rst +0 -31
- data/embulk-docs/src/release/release-0.6.13.rst +0 -23
- data/embulk-docs/src/release/release-0.6.14.rst +0 -47
- data/embulk-docs/src/release/release-0.6.15.rst +0 -26
- data/embulk-docs/src/release/release-0.6.16.rst +0 -26
- data/embulk-docs/src/release/release-0.6.17.rst +0 -39
- data/embulk-docs/src/release/release-0.6.18.rst +0 -14
- data/embulk-docs/src/release/release-0.6.19.rst +0 -18
- data/embulk-docs/src/release/release-0.6.2.rst +0 -17
- data/embulk-docs/src/release/release-0.6.20.rst +0 -19
- data/embulk-docs/src/release/release-0.6.21.rst +0 -20
- data/embulk-docs/src/release/release-0.6.22.rst +0 -26
- data/embulk-docs/src/release/release-0.6.23.rst +0 -17
- data/embulk-docs/src/release/release-0.6.24.rst +0 -13
- data/embulk-docs/src/release/release-0.6.25.rst +0 -12
- data/embulk-docs/src/release/release-0.6.26.rst +0 -17
- data/embulk-docs/src/release/release-0.6.27.rst +0 -11
- data/embulk-docs/src/release/release-0.6.3.rst +0 -23
- data/embulk-docs/src/release/release-0.6.4.rst +0 -13
- data/embulk-docs/src/release/release-0.6.5.rst +0 -17
- data/embulk-docs/src/release/release-0.6.6.rst +0 -17
- data/embulk-docs/src/release/release-0.6.7.rst +0 -17
- data/embulk-docs/src/release/release-0.6.8.rst +0 -24
- data/embulk-docs/src/release/release-0.6.9.rst +0 -24
- data/embulk-docs/src/release/release-0.7.0.rst +0 -96
- data/embulk-docs/src/release/release-0.7.1.rst +0 -22
- data/embulk-docs/src/release/release-0.7.10.rst +0 -13
- data/embulk-docs/src/release/release-0.7.11.rst +0 -12
- data/embulk-docs/src/release/release-0.7.2.rst +0 -25
- data/embulk-docs/src/release/release-0.7.3.rst +0 -21
- data/embulk-docs/src/release/release-0.7.4.rst +0 -14
- data/embulk-docs/src/release/release-0.7.5.rst +0 -22
- data/embulk-docs/src/release/release-0.7.6.rst +0 -18
- data/embulk-docs/src/release/release-0.7.7.rst +0 -13
- data/embulk-docs/src/release/release-0.7.8.rst +0 -14
- data/embulk-docs/src/release/release-0.7.9.rst +0 -14
- data/embulk-docs/src/release/release-0.8.0.rst +0 -74
- data/embulk-docs/src/release/release-0.8.1.rst +0 -18
- data/embulk-docs/src/release/release-0.8.10.rst +0 -35
- data/embulk-docs/src/release/release-0.8.11.rst +0 -12
- data/embulk-docs/src/release/release-0.8.12.rst +0 -12
- data/embulk-docs/src/release/release-0.8.13.rst +0 -12
- data/embulk-docs/src/release/release-0.8.14.rst +0 -31
- data/embulk-docs/src/release/release-0.8.15.rst +0 -17
- data/embulk-docs/src/release/release-0.8.16.rst +0 -43
- data/embulk-docs/src/release/release-0.8.17.rst +0 -11
- data/embulk-docs/src/release/release-0.8.18.rst +0 -27
- data/embulk-docs/src/release/release-0.8.19.rst +0 -43
- data/embulk-docs/src/release/release-0.8.2.rst +0 -19
- data/embulk-docs/src/release/release-0.8.20.rst +0 -11
- data/embulk-docs/src/release/release-0.8.21.rst +0 -17
- data/embulk-docs/src/release/release-0.8.22.rst +0 -15
- data/embulk-docs/src/release/release-0.8.23.rst +0 -14
- data/embulk-docs/src/release/release-0.8.24.rst +0 -15
- data/embulk-docs/src/release/release-0.8.25.rst +0 -14
- data/embulk-docs/src/release/release-0.8.26.rst +0 -16
- data/embulk-docs/src/release/release-0.8.27.rst +0 -15
- data/embulk-docs/src/release/release-0.8.28.rst +0 -14
- data/embulk-docs/src/release/release-0.8.29.rst +0 -14
- data/embulk-docs/src/release/release-0.8.3.rst +0 -15
- data/embulk-docs/src/release/release-0.8.30.rst +0 -14
- data/embulk-docs/src/release/release-0.8.31.rst +0 -12
- data/embulk-docs/src/release/release-0.8.32.rst +0 -14
- data/embulk-docs/src/release/release-0.8.33.rst +0 -13
- data/embulk-docs/src/release/release-0.8.34.rst +0 -12
- data/embulk-docs/src/release/release-0.8.35.rst +0 -12
- data/embulk-docs/src/release/release-0.8.36.rst +0 -32
- data/embulk-docs/src/release/release-0.8.37.rst +0 -20
- data/embulk-docs/src/release/release-0.8.38.rst +0 -12
- data/embulk-docs/src/release/release-0.8.4.rst +0 -18
- data/embulk-docs/src/release/release-0.8.5.rst +0 -11
- data/embulk-docs/src/release/release-0.8.6.rst +0 -14
- data/embulk-docs/src/release/release-0.8.7.rst +0 -18
- data/embulk-docs/src/release/release-0.8.8.rst +0 -18
- data/embulk-docs/src/release/release-0.8.9.rst +0 -14
- data/embulk-jruby-strptime/build.gradle +0 -3
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/RubyDateParser.java +0 -121
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/StrptimeFormat.java +0 -53
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/StrptimeParser.java +0 -884
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/StrptimeToken.java +0 -111
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/TimeZoneConverter.java +0 -466
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/lexer/StrptimeLexer.flex +0 -62
- data/embulk-jruby-strptime/src/main/java/org/embulk/spi/time/lexer/StrptimeLexer.java +0 -577
- data/embulk-standards/build.gradle +0 -7
- data/embulk-standards/src/main/java/org/embulk/standards/Bzip2FileDecoderPlugin.java +0 -55
- data/embulk-standards/src/main/java/org/embulk/standards/Bzip2FileEncoderPlugin.java +0 -67
- data/embulk-standards/src/main/java/org/embulk/standards/ConfigInputPlugin.java +0 -170
- data/embulk-standards/src/main/java/org/embulk/standards/CsvFormatterPlugin.java +0 -295
- data/embulk-standards/src/main/java/org/embulk/standards/CsvParserPlugin.java +0 -416
- data/embulk-standards/src/main/java/org/embulk/standards/CsvTokenizer.java +0 -545
- data/embulk-standards/src/main/java/org/embulk/standards/GzipFileDecoderPlugin.java +0 -55
- data/embulk-standards/src/main/java/org/embulk/standards/GzipFileEncoderPlugin.java +0 -71
- data/embulk-standards/src/main/java/org/embulk/standards/JsonParserPlugin.java +0 -235
- data/embulk-standards/src/main/java/org/embulk/standards/LocalFileInputPlugin.java +0 -232
- data/embulk-standards/src/main/java/org/embulk/standards/LocalFileOutputPlugin.java +0 -148
- data/embulk-standards/src/main/java/org/embulk/standards/NullOutputPlugin.java +0 -59
- data/embulk-standards/src/main/java/org/embulk/standards/RemoveColumnsFilterPlugin.java +0 -268
- data/embulk-standards/src/main/java/org/embulk/standards/RenameFilterPlugin.java +0 -479
- data/embulk-standards/src/main/java/org/embulk/standards/StandardPluginExtension.java +0 -16
- data/embulk-standards/src/main/java/org/embulk/standards/StandardPluginModule.java +0 -60
- data/embulk-standards/src/main/java/org/embulk/standards/StdoutOutputPlugin.java +0 -91
- data/embulk-standards/src/main/resources/META-INF/services/org.embulk.spi.Extension +0 -1
- data/embulk-standards/src/test/java/org/embulk/standards/TestCsvFormatterPlugin.java +0 -312
- data/embulk-standards/src/test/java/org/embulk/standards/TestCsvParserPlugin.java +0 -75
- data/embulk-standards/src/test/java/org/embulk/standards/TestCsvTokenizer.java +0 -457
- data/embulk-standards/src/test/java/org/embulk/standards/TestJsonParserPlugin.java +0 -351
- data/embulk-standards/src/test/java/org/embulk/standards/TestRemoveColumnsFilterPlugin.java +0 -121
- data/embulk-standards/src/test/java/org/embulk/standards/TestRenameFilterPlugin.java +0 -1020
- data/embulk-standards/src/test/java/org/embulk/standards/guess/TestCsvAllStringsGuessPlugin.java +0 -38
- data/embulk-standards/src/test/java/org/embulk/standards/guess/TestCsvGuessPlugin.java +0 -248
- data/embulk-standards/src/test/java/org/embulk/standards/preview/TestFilePreview.java +0 -73
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row.csv +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_and_header.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_and_header_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_and_header_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_int_single_column_row_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows.csv +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_with_trim_needed.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_with_trim_needed_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_and_header_with_trim_needed_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_with_trim_needed.csv +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_with_trim_needed_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_rows_with_trim_needed_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row.csv +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_and_header.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_and_header_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_and_header_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_1_string_single_column_row_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_int_single_column_rows.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_int_single_column_rows_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_int_single_column_rows_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_and_header.csv +0 -3
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_and_header_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_and_header_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_rows_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_string_single_column_rows.csv +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_string_single_column_rows_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_2_string_single_column_rows_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_backslash_escape.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_backslash_escape_guessed.yml +0 -17
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_backslash_escape_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_double_single_column.csv +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_double_single_column_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_double_single_column_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_with_header.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_with_header_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_int_single_column_with_header_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_semicolon_delimiter.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_semicolon_delimiter_guessed.yml +0 -17
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_semicolon_delimiter_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_simple.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_simple_guessed.yml +0 -17
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_simple_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_single_quote.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_single_quote_guessed.yml +0 -17
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_single_quote_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_skip_suggest_if_empty_sample_records.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_skip_suggest_if_empty_sample_records_guessed.yml +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_skip_suggest_if_empty_sample_records_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_with_header.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_with_header_guessed.yml +0 -12
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_string_single_column_with_header_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_tab_delimiter.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_tab_delimiter_guessed.yml +0 -16
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv/test/test_tab_delimiter_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv_all_strings/test/test_simple.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv_all_strings/test/test_simple_guessed.yml +0 -17
- data/embulk-standards/src/test/resources/org/embulk/standards/guess/csv_all_strings/test/test_simple_seed.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes_exec.yml +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes_load.yml +0 -19
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_sample_buffer_bytes_previewed.csv +0 -1
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_simple.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_simple_load.yml +0 -19
- data/embulk-standards/src/test/resources/org/embulk/standards/preview/file/test/test_simple_previewed.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_expected.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_filter.yml +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_in.yml +0 -18
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names.yml +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names_expected.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_duplicated_column_names_in.yml +0 -17
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_with_unmatched_filter.yml +0 -3
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_keep_without_unmatched_filter.yml +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove.csv +0 -5
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_expected.csv +0 -4
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_filter.yml +0 -2
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_in.yml +0 -18
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_with_unmatched_filter.yml +0 -3
- data/embulk-standards/src/test/resources/org/embulk/standards/remove_columns/test/test_remove_without_unmatched_filter.yml +0 -2
- data/embulk-test/build.gradle +0 -6
- data/embulk-test/src/main/java/org/embulk/test/EmbulkTests.java +0 -75
- data/embulk-test/src/main/java/org/embulk/test/PreviewResultInputPlugin.java +0 -65
- data/embulk-test/src/main/java/org/embulk/test/TestingBulkLoader.java +0 -129
- data/embulk-test/src/main/java/org/embulk/test/TestingEmbulk.java +0 -710
- data/gradle/wrapper/gradle-wrapper.jar +0 -0
- data/gradle/wrapper/gradle-wrapper.properties +0 -5
- data/gradlew +0 -172
- data/gradlew.bat +0 -84
- data/lib/embulk/data/bundle/.bundle/config +0 -3
- data/lib/embulk/data/bundle/.ruby-version +0 -1
- data/lib/embulk/data/bundle/Gemfile +0 -31
- data/lib/embulk/data/bundle/embulk/filter/example.rb +0 -42
- data/lib/embulk/data/bundle/embulk/input/example.rb +0 -54
- data/lib/embulk/data/bundle/embulk/output/example.rb +0 -58
- data/lib/embulk/data/new/LICENSE.txt +0 -21
- data/lib/embulk/data/new/README.md.vm +0 -106
- data/lib/embulk/data/new/gitignore.vm +0 -17
- data/lib/embulk/data/new/java/build.gradle.vm +0 -96
- data/lib/embulk/data/new/java/config/checkstyle/checkstyle.xml +0 -128
- data/lib/embulk/data/new/java/config/checkstyle/default.xml +0 -108
- data/lib/embulk/data/new/java/decoder.java.vm +0 -86
- data/lib/embulk/data/new/java/encoder.java.vm +0 -88
- data/lib/embulk/data/new/java/file_input.java.vm +0 -145
- data/lib/embulk/data/new/java/file_output.java.vm +0 -95
- data/lib/embulk/data/new/java/filter.java.vm +0 -57
- data/lib/embulk/data/new/java/formatter.java.vm +0 -55
- data/lib/embulk/data/new/java/gradle/wrapper/gradle-wrapper.jar +0 -0
- data/lib/embulk/data/new/java/gradle/wrapper/gradle-wrapper.properties +0 -5
- data/lib/embulk/data/new/java/gradlew +0 -172
- data/lib/embulk/data/new/java/gradlew.bat +0 -84
- data/lib/embulk/data/new/java/input.java.vm +0 -89
- data/lib/embulk/data/new/java/output.java.vm +0 -79
- data/lib/embulk/data/new/java/parser.java.vm +0 -61
- data/lib/embulk/data/new/java/plugin_loader.rb.vm +0 -3
- data/lib/embulk/data/new/java/test.java.vm +0 -5
- data/lib/embulk/data/new/ruby/.ruby-version +0 -1
- data/lib/embulk/data/new/ruby/Gemfile +0 -2
- data/lib/embulk/data/new/ruby/Rakefile +0 -3
- data/lib/embulk/data/new/ruby/decoder_guess.rb.vm +0 -25
- data/lib/embulk/data/new/ruby/filter.rb.vm +0 -50
- data/lib/embulk/data/new/ruby/formatter.rb.vm +0 -49
- data/lib/embulk/data/new/ruby/gemspec.vm +0 -20
- data/lib/embulk/data/new/ruby/input.rb.vm +0 -59
- data/lib/embulk/data/new/ruby/output.rb.vm +0 -61
- data/lib/embulk/data/new/ruby/parser.rb.vm +0 -44
- data/lib/embulk/data/new/ruby/parser_guess.rb.vm +0 -65
- data/lib/embulk/data/package_data.rb +0 -59
- data/lib/embulk/guess/bzip2.rb +0 -23
- data/lib/embulk/guess/csv.rb +0 -374
- data/lib/embulk/guess/csv_all_strings.rb +0 -13
- data/lib/embulk/guess/gzip.rb +0 -18
- data/lib/embulk/guess/json.rb +0 -50
- data/lib/embulk/runner.rb +0 -53
- data/settings.gradle +0 -8
- data/test/helper.rb +0 -23
- data/test/monkey_strptime/mri/date/test_date_strptime.rb +0 -515
- data/test/monkey_strptime/run-test.rb +0 -29
- data/test/vanilla/guess/test_csv_all_strings.rb +0 -43
- data/test/vanilla/guess/test_csv_guess.rb +0 -170
- data/test/vanilla/guess/test_schema_guess.rb +0 -47
- data/test/vanilla/guess/test_time_format_guess.rb +0 -135
- data/test/vanilla/run-test.rb +0 -14
- data/test/vanilla/time/test_timestamp_parser.rb +0 -102
@@ -1,133 +0,0 @@
|
|
1
|
-
<?xml version="1.0" encoding="utf-8"?>
|
2
|
-
<!-- Generator: Adobe Illustrator 15.0.2, SVG Export Plug-In . SVG Version: 6.00 Build 0) -->
|
3
|
-
<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN" "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
|
4
|
-
<svg version="1.1" id="Layer_1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" x="0px" y="0px"
|
5
|
-
width="466px" height="268px" viewBox="0 0 466 268" enable-background="new 0 0 466 268" xml:space="preserve">
|
6
|
-
<g>
|
7
|
-
<path fill="#EF4F39" d="M124.753,173.479c0,0,7.781,2.789,8.031,6.721c0.57,8.859,5.539,30.307-0.93,30.686
|
8
|
-
c-8.516,0.502-20.797-12.975-24.602-22.738c-5.82-14.951-4.18-19.992-4.18-19.992L124.753,173.479z"/>
|
9
|
-
<g>
|
10
|
-
<g>
|
11
|
-
<path fill="#1F1F1F" d="M38.015,225.368c1.477,4.021,3.523,7.008,6.141,8.953s5.891,2.918,9.828,2.918
|
12
|
-
c2.859,0,5.742-0.58,8.648-1.744c0.762-0.312,3.422-1.586,7.984-3.822c1.383-0.672,2.93-1.006,4.625-1.006
|
13
|
-
c2.328,0,4.297,1.051,5.906,3.152c1.34,1.699,2.012,3.398,2.012,5.096c0,3.803-2.707,7.246-8.113,10.33
|
14
|
-
c-6.488,3.713-13.844,5.57-22.07,5.57c-12.297,0-21.98-4.273-29.047-12.814c-5.094-6.17-7.645-13.592-7.645-22.268
|
15
|
-
c0-11.762,3.777-21.152,11.336-28.172c6.527-6.037,14.266-9.057,23.207-9.057c7.828,0,14.781,2.416,20.859,7.246
|
16
|
-
c5.859,4.695,9.75,11.066,11.672,19.115c0.672,2.863,1.008,5.725,1.008,8.586c0,5.277-2.93,7.916-8.789,7.916H38.015z
|
17
|
-
M64.511,211.616c-0.848-3.264-1.832-5.701-2.949-7.312c-2.414-3.531-5.812-5.299-10.195-5.299c-3.758,0-6.953,1.365-9.594,4.094
|
18
|
-
c-1.699,1.787-3.195,4.627-4.492,8.518H64.511z"/>
|
19
|
-
<path fill="#1F1F1F" d="M112.202,189.481c2.367-2.102,4.539-3.623,6.508-4.561c3.352-1.609,7.133-2.416,11.336-2.416
|
20
|
-
c5.23,0,9.812,1.117,13.75,3.354c1.742,0.984,3.598,2.797,5.566,5.434c3.355-2.727,6.215-4.693,8.586-5.902
|
21
|
-
c3.934-1.922,8.16-2.885,12.676-2.885c6.977,0,12.742,2.215,17.305,6.641c4.609,4.518,6.91,10.061,6.91,16.635v35.146
|
22
|
-
c0,3.848-0.449,6.666-1.34,8.451c-0.762,1.432-1.957,2.627-3.59,3.59c-1.633,0.961-3.344,1.443-5.129,1.443
|
23
|
-
c-1.793,0-3.5-0.469-5.133-1.41c-1.633-0.939-2.828-2.146-3.59-3.623c-0.895-1.785-1.34-4.604-1.34-8.451v-30.652
|
24
|
-
c0-2.951-0.895-5.342-2.684-7.176c-2.012-2.146-4.559-3.221-7.645-3.221c-3.133,0-5.75,1.051-7.852,3.154
|
25
|
-
c-1.875,1.832-2.816,4.246-2.816,7.242v30.652c0,3.805-0.449,6.621-1.34,8.451c-0.762,1.477-1.957,2.684-3.59,3.623
|
26
|
-
c-1.633,0.941-3.344,1.41-5.129,1.41c-1.789,0-3.5-0.469-5.133-1.41c-1.633-0.939-2.828-2.146-3.59-3.623
|
27
|
-
c-0.895-1.785-1.34-4.604-1.34-8.451v-28.641c0-4.066-0.961-7.152-2.887-9.254c-1.922-2.104-4.449-3.154-7.578-3.154
|
28
|
-
c-3.086,0-5.699,1.098-7.848,3.287c-1.789,1.879-2.68,4.248-2.68,7.109v30.652c0,3.805-0.453,6.621-1.344,8.451
|
29
|
-
c-0.762,1.477-1.957,2.684-3.59,3.623c-1.633,0.941-3.34,1.41-5.133,1.41c-1.785,0-3.496-0.469-5.129-1.41
|
30
|
-
c-1.633-0.939-2.828-2.146-3.59-3.623c-0.895-1.785-1.34-4.604-1.34-8.451v-46.414c0-3.398,0.848-6.127,2.547-8.186
|
31
|
-
c1.879-2.279,4.336-3.42,7.379-3.42c2.594,0,4.809,0.873,6.641,2.617C109.897,186.284,110.952,187.603,112.202,189.481z"/>
|
32
|
-
<path fill="#1F1F1F" d="M112.202,189.481c2.367-2.102,4.539-3.623,6.508-4.561c3.352-1.609,7.133-2.416,11.336-2.416
|
33
|
-
c5.23,0,9.812,1.117,13.75,3.354c1.742,0.984,3.598,2.797,5.566,5.434c3.355-2.727,6.215-4.693,8.586-5.902
|
34
|
-
c3.934-1.922,8.16-2.885,12.676-2.885c6.977,0,12.742,2.215,17.305,6.641c4.609,4.518,6.91,10.061,6.91,16.635v35.146
|
35
|
-
c0,3.848-0.449,6.666-1.34,8.451c-0.762,1.432-1.957,2.627-3.59,3.59c-1.633,0.961-3.344,1.443-5.129,1.443
|
36
|
-
c-1.793,0-3.5-0.469-5.133-1.41c-1.633-0.939-2.828-2.146-3.59-3.623c-0.895-1.785-1.34-4.604-1.34-8.451v-30.652
|
37
|
-
c0-2.951-0.895-5.342-2.684-7.176c-2.012-2.146-4.559-3.221-7.645-3.221c-3.133,0-5.75,1.051-7.852,3.154
|
38
|
-
c-1.875,1.832-2.816,4.246-2.816,7.242v30.652c0,3.805-0.449,6.621-1.34,8.451c-0.762,1.477-1.957,2.684-3.59,3.623
|
39
|
-
c-1.633,0.941-3.344,1.41-5.129,1.41c-1.789,0-3.5-0.469-5.133-1.41c-1.633-0.939-2.828-2.146-3.59-3.623
|
40
|
-
c-0.895-1.785-1.34-4.604-1.34-8.451v-28.641c0-4.066-0.961-7.152-2.887-9.254c-1.922-2.104-4.449-3.154-7.578-3.154
|
41
|
-
c-3.086,0-5.699,1.098-7.848,3.287c-1.789,1.879-2.68,4.248-2.68,7.109v30.652c0,3.805-0.453,6.621-1.344,8.451
|
42
|
-
c-0.762,1.477-1.957,2.684-3.59,3.623c-1.633,0.941-3.34,1.41-5.133,1.41c-1.785,0-3.496-0.469-5.129-1.41
|
43
|
-
c-1.633-0.939-2.828-2.146-3.59-3.623c-0.895-1.785-1.34-4.604-1.34-8.451v-46.414c0-3.398,0.848-6.127,2.547-8.186
|
44
|
-
c1.879-2.279,4.336-3.42,7.379-3.42c2.594,0,4.809,0.873,6.641,2.617C109.897,186.284,110.952,187.603,112.202,189.481z"/>
|
45
|
-
</g>
|
46
|
-
</g>
|
47
|
-
<g>
|
48
|
-
<path fill="#FFFFFF" d="M32.706,101.839c0,0,12.794,37.536,28.406,50.635c23.352,19.592,42.266,24.008,63.57,26.375
|
49
|
-
c27.992,3.109,68.055,0.375,76.672-3.381c19.914-8.666,36.523-27.725,41.93-43.279c5.414-15.557-82.844-32.125-82.844-32.125
|
50
|
-
l-30.766-13.865c0,0-19.617-10.143-26.719-6.76c-7.102,3.381-13.859,5.748-19.273,7.1c-5.406,1.354-13.523,0.338-22.656,2.029
|
51
|
-
C51.901,90.257,32.706,101.839,32.706,101.839z"/>
|
52
|
-
<path fill="#EF4F39" d="M32.331,101.245c0,0,0.391,10.795,3.898,14.678c4.727,5.23,3.203,11.189,13.461,25.664
|
53
|
-
c13.281,18.732,38.328,36.789,89.406,38.908c50.391,2.094,50.086-1.395,50.086-1.395s-6.891,1.152-44.25-0.252
|
54
|
-
c-23.625-0.889-56.344-5.354-75.016-20.842c-17.734-14.709-24.203-24.42-29.125-39.309c-2.094-6.34-5.797-6.422-5.992-15.996
|
55
|
-
C34.776,101.249,32.331,101.245,32.331,101.245z"/>
|
56
|
-
<g>
|
57
|
-
<path fill="#F16523" d="M195.331,176.63c0,0,5.219-1.023,11.352-4.504c8.711-4.943,14.773-11.02,15.852-11.918
|
58
|
-
c4.883-4.057,15.219-16.484,15.219-16.484c-0.414,0.613-5.562,9.764-12.305,15.977c-4.484,4.133-1.898,2.156-9.25,7.861
|
59
|
-
c-9.078,7.043-22,11.92-22,11.92"/>
|
60
|
-
<path fill="#F16523" d="M284.198,12.147c0,0-7.016,13.777-24.008,15.553c-11.57,1.211-13.188,11.16-13.188,11.16
|
61
|
-
s-4.055-10.652-14.453-12.174c-15.477-2.264-20.375-13.525-20.375-13.525c-4.391,16.23,0.68,24.346,3.383,28.404
|
62
|
-
c5.188,7.781,18.258,9.469,21.305,16.23c3.039,6.764,0.672,11.498-2.703,27.391c-3.383,15.893-19.281,12.848-32.125,11.156
|
63
|
-
c-7.117-0.934-18.672-8.105-41.508-16.402c0.242-4.438-2.695-9.434-1.016-16.23c6.086-24.6,24.094-34.361,12.938-32.715
|
64
|
-
c-8.805,1.301-50.031,32.121-56.523,36.102c-8.344-1.617-17.086-2.822-26.156-3.387c-31.359-1.947-39.305,14.033-48.945,20.627
|
65
|
-
c-17.148,11.734-8.07,17.84-8.07,17.84s28.812,1.553,40.109,3.975c9.469,2.027,32.125,8.453,33.812,11.496
|
66
|
-
c1.695,3.043,4.398,11.834,12.516,10.145c8.109-1.691,8.75-7.969,8.75-7.969c-0.344,9.131,6.805,21.156,14.242,31.639
|
67
|
-
s19.273,13.188,19.273,13.188c2.031,25.359-11.562,49.064-8.031,49.195c23.844,0.889,38.156-23.922,40.453-28.275
|
68
|
-
c4.82-9.131,3.297-19.656,3.297-19.656c42.266-8.113,49.461-34.107,53.203-45.637c6.344-19.529,3.055-59.438,3.055-59.438
|
69
|
-
s8.789-0.676,20.961-9.467C286.565,42.579,284.198,12.147,284.198,12.147z"/>
|
70
|
-
</g>
|
71
|
-
<path fill="#FFFFFF" d="M107.753,97.312c0,0-0.617-14.115,18.625-10.881s19.953,13.1,4.945,17.168
|
72
|
-
C116.323,107.669,108.065,103.565,107.753,97.312z"/>
|
73
|
-
<g>
|
74
|
-
<circle fill="#1F1F1F" cx="101.776" cy="92.2" r="4.312"/>
|
75
|
-
<path fill="#FFFFFF" d="M101.776,96.761c-2.516,0-4.562-2.046-4.562-4.561c0-2.516,2.047-4.562,4.562-4.562
|
76
|
-
s4.562,2.047,4.562,4.562C106.339,94.715,104.292,96.761,101.776,96.761z M101.776,88.138c-2.24,0-4.062,1.822-4.062,4.062
|
77
|
-
c0,2.239,1.822,4.061,4.062,4.061s4.062-1.822,4.062-4.061C105.839,89.96,104.017,88.138,101.776,88.138z"/>
|
78
|
-
<path fill="#FFFFFF" d="M104.394,90.595c0,0.512-0.414,0.928-0.93,0.928c-0.508,0-0.93-0.416-0.93-0.928
|
79
|
-
c0-0.516,0.422-0.932,0.93-0.932C103.979,89.663,104.394,90.079,104.394,90.595z"/>
|
80
|
-
</g>
|
81
|
-
<g>
|
82
|
-
<path fill="#EF4F39" d="M164.237,161.2c-1.523,0.254-4.141,0.254-9.383-1.184c-4.789-1.311-12.648-9.082-13.984-10.43
|
83
|
-
c0.438,0.631,0.875,1.254,1.312,1.875c7.438,10.482,19.273,13.188,19.273,13.188c1.969,24.617-10.773,47.672-8.297,49.121
|
84
|
-
c0.008-0.064,0.094-0.949,0.258-1.764c0.164-0.846,0.594-2.283,1.266-3.805c0.68-1.521,10.062-18.682,12.172-26.543
|
85
|
-
c2.117-7.861,1.188-21.727,1.188-21.727S165.761,160.948,164.237,161.2z"/>
|
86
|
-
<path fill="#EF4F39" d="M122.995,115.067c0,0,2.531-7.607,10.648-6.086s5.328,10.271,5.328,10.271s0.031-6.586-5.711-7.734
|
87
|
-
C128.19,110.503,122.995,115.067,122.995,115.067z"/>
|
88
|
-
<path fill="#EF4F39" d="M117.237,126.362c-5.328-0.635-5.711-8.242-9.891-11.287c-3.484-2.529-25.367-9.129-34.242-11.031
|
89
|
-
s-36.266-3.803-38.547-3.93s-2.914-3.043-3.297-3.553c-0.242-0.326,0.25-2.391,0.633-3.816c-3.898,6.225,0.859,9.432,0.859,9.432
|
90
|
-
s28.812,1.553,40.109,3.975c9.469,2.027,32.125,8.453,33.812,11.496c1.695,3.043,4.398,11.834,12.516,10.145
|
91
|
-
c8.109-1.691,8.75-7.969,8.75-7.969S122.144,126.946,117.237,126.362z"/>
|
92
|
-
<path fill="#EF4F39" d="M251.394,111.146c-1.352,7.1-6.594,22.994-16.398,32.799c-6.102,6.098-15.898,10.652-23.672,14.203
|
93
|
-
c-6.266,2.859-15.219,3.887-15.219,3.887l1.07,3.879c42.266-8.113,49.461-34.107,53.203-45.637
|
94
|
-
c2.305-7.115,3.344-16.934,3.719-26.541C253.448,98.396,252.308,106.351,251.394,111.146z"/>
|
95
|
-
</g>
|
96
|
-
</g>
|
97
|
-
<rect x="133.667" y="203.567" fill="#1F1F1F" width="20.055" height="21.766"/>
|
98
|
-
<g>
|
99
|
-
<g>
|
100
|
-
<path fill="#1F1F1F" d="M226.835,188.409c2.816-2.104,5.188-3.512,7.109-4.227c2.992-1.162,6.059-1.744,9.188-1.744
|
101
|
-
c8.32,0,15.586,3.379,21.801,10.127c6.348,6.889,9.527,15.496,9.527,25.826c0,11.402-3.555,20.658-10.668,27.77
|
102
|
-
c-5.723,5.768-12.543,8.654-20.457,8.654c-4.609,0-8.562-1.031-11.875-3.086c-1.516-0.984-3.148-2.619-4.895-4.896
|
103
|
-
c-2.059,5.051-5.23,7.578-9.527,7.578c-2.637,0-4.961-0.85-6.973-2.549c-2.238-1.967-3.355-4.697-3.355-8.182v-77.543
|
104
|
-
c0-3.799,0.449-6.594,1.344-8.383c0.758-1.477,1.953-2.684,3.59-3.623c1.629-0.939,3.34-1.408,5.129-1.408s3.5,0.469,5.133,1.408
|
105
|
-
s2.828,2.146,3.586,3.623c0.895,1.789,1.344,4.584,1.344,8.383V188.409z M240.519,201.22c-3.758,0-7.02,1.631-9.793,4.896
|
106
|
-
c-2.684,3.219-4.023,7.379-4.023,12.477c0,5.141,1.34,9.324,4.023,12.543c2.773,3.264,6.078,4.896,9.926,4.896
|
107
|
-
c4.16,0,7.488-1.746,9.996-5.23c2.457-3.49,3.688-7.535,3.688-12.143c0-4.695-1.23-8.742-3.688-12.143
|
108
|
-
C248.097,202.987,244.718,201.22,240.519,201.22z"/>
|
109
|
-
<path fill="#1F1F1F" d="M345.358,196.39v29.916c0,6.842-1.637,12.387-4.898,16.635c-2.773,3.578-6.352,6.396-10.734,8.451
|
110
|
-
c-4.918,2.324-10.148,3.488-15.695,3.488c-7.781,0-14.598-2.078-20.457-6.238c-4.559-3.221-7.645-7.064-9.258-11.537
|
111
|
-
c-1.074-3.037-1.605-6.641-1.605-10.799V196.39c0-3.801,0.445-6.617,1.336-8.451c0.762-1.477,1.949-2.684,3.559-3.623
|
112
|
-
c1.605-0.938,3.332-1.408,5.164-1.408c1.789,0,3.496,0.471,5.129,1.408c1.633,0.939,2.828,2.146,3.59,3.623
|
113
|
-
c0.895,1.789,1.34,4.607,1.34,8.451v27.434c0,2.818,0.449,4.945,1.344,6.373c2.281,3.668,5.57,5.502,9.859,5.502
|
114
|
-
c3.129,0,5.793-1.074,7.984-3.221c2.145-2.059,3.219-4.941,3.219-8.654V196.39c0-3.844,0.445-6.662,1.34-8.451
|
115
|
-
c0.762-1.477,1.957-2.684,3.59-3.623c1.633-0.938,3.344-1.408,5.133-1.408c1.785,0,3.5,0.471,5.129,1.408
|
116
|
-
c1.633,0.939,2.828,2.146,3.59,3.623C344.909,189.728,345.358,192.546,345.358,196.39z"/>
|
117
|
-
<path fill="#1F1F1F" d="M377.351,166.138v74.789c0,3.848-0.445,6.666-1.344,8.451c-0.758,1.477-1.953,2.684-3.586,3.623
|
118
|
-
c-1.633,0.941-3.344,1.41-5.133,1.41s-3.5-0.469-5.129-1.41c-1.633-0.939-2.832-2.146-3.59-3.623
|
119
|
-
c-0.895-1.785-1.344-4.604-1.344-8.451v-74.789c0-3.799,0.449-6.594,1.344-8.383c0.758-1.477,1.957-2.684,3.59-3.623
|
120
|
-
c1.629-0.939,3.34-1.408,5.129-1.408s3.5,0.469,5.133,1.408s2.828,2.146,3.586,3.623
|
121
|
-
C376.905,159.544,377.351,162.339,377.351,166.138z"/>
|
122
|
-
<path fill="#1F1F1F" d="M409.343,220.403v20.523c0,3.805-0.445,6.621-1.34,8.451c-0.762,1.477-1.957,2.684-3.586,3.623
|
123
|
-
c-1.633,0.941-3.344,1.41-5.133,1.41s-3.496-0.469-5.129-1.41c-1.633-0.939-2.828-2.146-3.594-3.623
|
124
|
-
c-0.891-1.785-1.34-4.604-1.34-8.451v-74.789c0-3.799,0.449-6.594,1.34-8.383c0.766-1.477,1.961-2.684,3.594-3.623
|
125
|
-
s3.34-1.408,5.129-1.408s3.5,0.469,5.133,1.408c1.629,0.939,2.824,2.146,3.586,3.623c0.895,1.789,1.34,4.584,1.34,8.383v40.582
|
126
|
-
l18.516-18.982c3.445-3.533,6.527-5.299,9.258-5.299c2.727,0,5.051,0.984,6.977,2.951c1.922,1.924,2.883,4.227,2.883,6.908
|
127
|
-
c0,1.969-0.738,3.936-2.215,5.904c-0.488,0.625-1.566,1.744-3.219,3.354l-12.609,12.072l17.641,21.936
|
128
|
-
c2.902,3.578,4.355,6.551,4.355,8.918c0,3.178-1.27,5.793-3.82,7.85c-1.836,1.432-3.957,2.146-6.375,2.146
|
129
|
-
c-2.41,0-4.672-0.961-6.77-2.885c-0.629-0.58-1.656-1.787-3.09-3.621L409.343,220.403z"/>
|
130
|
-
</g>
|
131
|
-
</g>
|
132
|
-
</g>
|
133
|
-
</svg>
|
@@ -1,1017 +0,0 @@
|
|
1
|
-
Configuration
|
2
|
-
==============
|
3
|
-
|
4
|
-
.. contents::
|
5
|
-
:local:
|
6
|
-
:depth: 2
|
7
|
-
|
8
|
-
Embulk configuration file format
|
9
|
-
---------------------------------
|
10
|
-
|
11
|
-
Embulk uses a YAML file to define a bulk data load. Here is an example of the file:
|
12
|
-
|
13
|
-
.. code-block:: yaml
|
14
|
-
|
15
|
-
in:
|
16
|
-
type: file
|
17
|
-
path_prefix: ./mydata/csv/
|
18
|
-
decoders:
|
19
|
-
- {type: gzip}
|
20
|
-
parser:
|
21
|
-
charset: UTF-8
|
22
|
-
newline: CRLF
|
23
|
-
type: csv
|
24
|
-
delimiter: ','
|
25
|
-
quote: '"'
|
26
|
-
escape: '"'
|
27
|
-
null_string: 'NULL'
|
28
|
-
skip_header_lines: 1
|
29
|
-
columns:
|
30
|
-
- {name: id, type: long}
|
31
|
-
- {name: account, type: long}
|
32
|
-
- {name: time, type: timestamp, format: '%Y-%m-%d %H:%M:%S'}
|
33
|
-
- {name: purchase, type: timestamp, format: '%Y%m%d'}
|
34
|
-
- {name: comment, type: string}
|
35
|
-
filters:
|
36
|
-
- type: speedometer
|
37
|
-
speed_limit: 250000
|
38
|
-
out:
|
39
|
-
type: stdout
|
40
|
-
|
41
|
-
A configuration file consists of the following sections:
|
42
|
-
|
43
|
-
* **in:** Input plugin options. An input plugin is either record-based (`MySQL <https://github.com/embulk/embulk-input-jdbc>`_, `DynamoDB <https://github.com/lulichn/embulk-input-dynamodb>`_, etc) or file-based (`S3 <https://github.com/embulk/embulk-input-s3>`_, `HTTP <https://github.com/takumakanari/embulk-input-http>`_, etc).
|
44
|
-
|
45
|
-
* **parser:** If the input is file-based, a parser plugin parses the file format (built-in csv, `json <https://github.com/takumakanari/embulk-parser-json>`_, etc).
|
46
|
-
|
47
|
-
* **decoder:** If the input is file-based, decoder plugin decodes compression or encryption (built-in gzip, bzip2, `zip <https://github.com/hata/embulk-decoder-commons-compress>`_, `tar.gz <https://github.com/hata/embulk-decoder-commons-compress>`_, etc).
|
48
|
-
|
49
|
-
* **out:** Output plugin options. An output plugin is either record-based (`Oracle <https://github.com/embulk/embulk-output-jdbc>`_, `Elasticsearch <https://github.com/muga/embulk-output-elasticsearch>`_, etc) or file-based (`Google Cloud Storage <https://github.com/hakobera/embulk-output-gcs>`_, `Command <https://github.com/embulk/embulk-output-command>`_, etc)
|
50
|
-
|
51
|
-
* **formatter:** If the output is file-based, formatter plugin formats a file format (such as built-in csv, `jsonl <https://github.com/takei-yuya/embulk-formatter-jsonl>`_)
|
52
|
-
|
53
|
-
* **encoder:** If the output is file-based, encoder plugin encodes compression or encryption (such as built-in gzip or bzip2)
|
54
|
-
|
55
|
-
* **filters:** Filter plugins options (optional).
|
56
|
-
|
57
|
-
* **exec:** Executor plugin options. An executor plugin controls parallel processing (such as built-in thread executor, `Hadoop MapReduce executor <https://github.com/embulk/embulk-executor-mapreduce>`_)
|
58
|
-
|
59
|
-
In many cases, you only need to write the **in:**, **out:** and **formatter:** sections, because the ``guess`` command guesses the **parser** and **decoder** options for you. See also the `Quick Start <https://github.com/embulk/embulk#quick-start>`_.
|
60
|
-
|
61
|
-
|
62
|
-
Using variables
|
63
|
-
~~~~~~~~~~~~~~~~
|
64
|
-
|
65
|
-
You can embed environment variables in a configuration file using the `Liquid template engine <http://liquidmarkup.org/>`_ (This is an experimental feature. Its behavior might change, or it might be removed, in future releases).
|
66
|
-
|
67
|
-
To use the template engine, the configuration file name must end with ``.yml.liquid``.
|
68
|
-
|
69
|
-
Environment variables are available through the ``env`` variable.
|
70
|
-
|
71
|
-
.. code-block:: yaml
|
72
|
-
|
73
|
-
in:
|
74
|
-
type: file
|
75
|
-
path_prefix: {{ env.path_prefix }}
|
76
|
-
decoders:
|
77
|
-
- {type: gzip}
|
78
|
-
parser:
|
79
|
-
...
|
80
|
-
out:
|
81
|
-
type: postgresql
|
82
|
-
host: {{ env.pg_host }}
|
83
|
-
port: {{ env.pg_port }}
|
84
|
-
user: {{ env.pg_user }}
|
85
|
-
password: "{{ env.pg_password }}"
|
86
|
-
database: embulk_load
|
87
|
-
mode: insert
|
88
|
-
table: {{ env.pg_table }}
|
89
|
-
|
90
|
-
|
91
|
-
Including files
|
92
|
-
~~~~~~~~~~~~~~~~
|
93
|
-
|
94
|
-
A configuration file can include another configuration file. To use this feature, the configuration file name must end with ``.yml.liquid``.
|
95
|
-
|
96
|
-
File will be searched from the relative path of the input configuration file. And file name will be ``_<name>.yml.liquid``. For example, if you add ``{% include 'subdir/inc' %}`` tag to ``myconfig/config.yml.liquid`` file, it includes ``myconfig/subdir/_inc.yml.liquid`` file.
|
97
|
-
|
98
|
-
.. code-block:: liquid
|
99
|
-
|
100
|
-
# config.yml.liquid
|
101
|
-
{% include 'in_mysql' %}
|
102
|
-
out:
|
103
|
-
type: stdout
|
104
|
-
|
105
|
-
.. code-block:: yaml
|
106
|
-
|
107
|
-
# _in_mysql.yml.liquid
|
108
|
-
in:
|
109
|
-
type: mysql
|
110
|
-
|
111
|
-
With the above two files, the actual configuration will be:
|
112
|
-
|
113
|
-
.. code-block:: yaml
|
114
|
-
|
115
|
-
# $ embulk run config.yml.liquid
|
116
|
-
in:
|
117
|
-
type: mysql
|
118
|
-
out:
|
119
|
-
type: stdout
|
120
|
-
|
121
|
-
|
122
|
-
|
123
|
-
Local file input plugin
|
124
|
-
------------------------
|
125
|
-
|
126
|
-
The ``file`` input plugin reads files from local file system.
|
127
|
-
|
128
|
-
Options
|
129
|
-
~~~~~~~~
|
130
|
-
|
131
|
-
+------------------+----------+------------------------------------------------+-----------------------+
|
132
|
-
| name | type | description | required? |
|
133
|
-
+==================+==========+================================================+=======================+
|
134
|
-
| path\_prefix | string | Path prefix of input files | required |
|
135
|
-
+------------------+----------+------------------------------------------------+-----------------------+
|
136
|
-
| parser | hash | Parser configuration (see below) | required |
|
137
|
-
+------------------+----------+------------------------------------------------+-----------------------+
|
138
|
-
| decoders | array | Decoder configuration (see below) | |
|
139
|
-
+------------------+----------+------------------------------------------------+-----------------------+
|
140
|
-
| last\_path | string | Name of last read file in previous operation | |
|
141
|
-
+------------------+----------+------------------------------------------------+-----------------------+
|
142
|
-
| follow\_symlinks | boolean | If `true`, follow symbolic link directories | ``false`` by default |
|
143
|
-
+------------------+----------+------------------------------------------------+-----------------------+
|
144
|
-
|
145
|
-
The ``path_prefix`` option is required. If you have files as follows, you may set ``path_prefix: /path/to/files/sample_``:
|
146
|
-
|
147
|
-
::
|
148
|
-
|
149
|
-
.
|
150
|
-
`-- path
|
151
|
-
`-- to
|
152
|
-
`-- files
|
153
|
-
|-- sample_01.csv -> read
|
154
|
-
|-- sample_02.csv -> read
|
155
|
-
|-- sample_03.csv -> read
|
156
|
-
|-- sample_04.csv -> read
|
157
|
-
|
158
|
-
The ``last_path`` option is used to skip files that are older than or the same as the given file in dictionary order.
|
159
|
-
For example, if you set ``last_path: /path/to/files/sample_02.csv``, Embulk reads following files:
|
160
|
-
|
161
|
-
::
|
162
|
-
|
163
|
-
.
|
164
|
-
`-- path
|
165
|
-
`-- to
|
166
|
-
`-- files
|
167
|
-
|-- sample_01.csv -> skip
|
168
|
-
|-- sample_02.csv -> skip
|
169
|
-
|-- sample_03.csv -> read
|
170
|
-
|-- sample_04.csv -> read
|
171
|
-
|
172
|
-
Example
|
173
|
-
~~~~~~~~
|
174
|
-
|
175
|
-
.. code-block:: yaml
|
176
|
-
|
177
|
-
in:
|
178
|
-
type: file
|
179
|
-
path_prefix: /path/to/files/sample_
|
180
|
-
last_path: /path/to/files/sample_02.csv
|
181
|
-
parser:
|
182
|
-
...
|
183
|
-
|
184
|
-
In most cases, you'll use ``guess`` to configure the parser and decoders. See also `Quick Start <https://github.com/embulk/embulk#quick-start>`_.
|
185
|
-
|
186
|
-
CSV parser plugin
|
187
|
-
------------------
|
188
|
-
|
189
|
-
The ``csv`` parser plugin parses CSV and TSV files.
|
190
|
-
|
191
|
-
Options
|
192
|
-
~~~~~~~~
|
193
|
-
|
194
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
195
|
-
| name | type | description | required? |
|
196
|
-
+============================+==========+================================================================================================================+============================================+
|
197
|
-
| delimiter | string | Delimiter character such as ``,`` for CSV, ``"\t"`` for TSV, ``"|"`` | ``,`` by default |
|
198
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
199
|
-
| quote | string | The character surrounding a quoted value. Setting ``null`` disables quoting. | ``"`` by default |
|
200
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
201
|
-
| escape | string | Escape character to escape a special character. Setting ``null`` disables escaping. | ``\\`` by default |
|
202
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
203
|
-
| skip\_header\_lines | integer | Skip this number of lines first. Set 1 if the file has header line. | ``0`` by default |
|
204
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
205
|
-
| null\_string | string | If a value is this string, converts it to NULL. For example, set ``\N`` for CSV files created by mysqldump | |
|
206
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
207
|
-
| trim\_if\_not\_quoted | boolean | If true, remove spaces of a value if the value is not surrounded by the quote character | ``false`` by default |
|
208
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
209
|
-
| quotes\_in\_quoted\_fields | enum | Specify how to deal with irregular unescaped quote characters in quoted fields | ``ACCEPT_ONLY_RFC4180_ESCAPED`` by default |
|
210
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
211
|
-
| comment\_line\_marker | string | Skip a line if the line begins with this string | null by default |
|
212
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
213
|
-
| allow\_optional\_columns | boolean | If true, set null to insufficient columns. Otherwise, skip the row in case of insufficient number of columns | ``false`` by default |
|
214
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
215
|
-
| allow\_extra\_columns | boolean | If true, ignore too many columns. Otherwise, skip the row in case of too many columns | ``false`` by default |
|
216
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
217
|
-
| max\_quoted\_size\_limit | integer | Maximum number of bytes of a quoted value. If a value exceeds the limit, the row will be skipped | ``131072`` by default |
|
218
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
219
|
-
| stop\_on\_invalid\_record | boolean | Stop bulk load transaction if a file includes invalid record (such as invalid timestamp) | ``false`` by default |
|
220
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
221
|
-
| default\_timezone | string | Time zone of timestamp columns if the value itself doesn't include time zone description (eg. Asia/Tokyo) | ``UTC`` by default |
|
222
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
223
|
-
| default\_date | string | Set date part if the format doesn’t include date part. | ``1970-01-01`` by default |
|
224
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
225
|
-
| newline | enum | Newline character (CRLF, LF or CR) | ``CRLF`` by default |
|
226
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
227
|
-
| charset | enum | Character encoding (eg. ISO-8859-1, UTF-8) | ``UTF-8`` by default |
|
228
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
229
|
-
| columns | hash | Columns (see below) | required |
|
230
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+--------------------------------------------+
|
231
|
-
|
232
|
-
The ``quotes_in_quoted_fields`` option specifies how to deal with irregular non-escaped stray quote characters.
|
233
|
-
|
234
|
-
+------------------------------------------------------+-----------------------------------------------------------------------------------------------------------------------------------------------------+
|
235
|
-
| name | description |
|
236
|
-
+======================================================+=====================================================================================================================================================+
|
237
|
-
| ACCEPT_ONLY_RFC4180_ESCAPED | Default. Accept only specified and RFC 4180-style escaped quote characters. |
|
238
|
-
+------------------------------------------------------+-----------------------------------------------------------------------------------------------------------------------------------------------------+
|
239
|
-
| ACCEPT_STRAY_QUOTES_ASSUMING_NO_DELIMITERS_IN_FIELDS | Accept stray quotes as-is in the field. In exchange, the behavior is undefined if delimiters are in fields. ``"a"b"`` becomes ``a"b``. ``"a""b"`` becomes ``a"b``. |
|
240
|
-
+------------------------------------------------------+-----------------------------------------------------------------------------------------------------------------------------------------------------+
|
241
|
-
|
242
|
-
The ``columns`` option declares the list of columns. This CSV parser plugin ignores the header line.
|
243
|
-
|
244
|
-
+----------+--------------------------------------------------------+
|
245
|
-
| name | description |
|
246
|
-
+==========+========================================================+
|
247
|
-
| name | Name of the column |
|
248
|
-
+----------+--------------------------------------------------------+
|
249
|
-
| type | Type of the column (see below) |
|
250
|
-
+----------+--------------------------------------------------------+
|
251
|
-
| format | Format of the timestamp if type is timestamp |
|
252
|
-
+----------+--------------------------------------------------------+
|
253
|
-
| date | Set date part if the format doesn’t include date part |
|
254
|
-
+----------+--------------------------------------------------------+
|
255
|
-
|
256
|
-
.. note::
|
257
|
-
|
258
|
-
The Timestamp format refers to `Ruby strftime format <https://docs.ruby-lang.org/en/2.4.0/Date.html#method-i-strftime>`_
|
259
|
-
|
260
|
-
List of types:
|
261
|
-
|
262
|
-
+-------------+----------------------------------------------+
|
263
|
-
| name | description |
|
264
|
-
+=============+==============================================+
|
265
|
-
| boolean | true or false |
|
266
|
-
+-------------+----------------------------------------------+
|
267
|
-
| long | 64-bit signed integers |
|
268
|
-
+-------------+----------------------------------------------+
|
269
|
-
| timestamp | Date and time with nano-seconds precision |
|
270
|
-
+-------------+----------------------------------------------+
|
271
|
-
| double | 64-bit floating point numbers |
|
272
|
-
+-------------+----------------------------------------------+
|
273
|
-
| string | Strings |
|
274
|
-
+-------------+----------------------------------------------+
|
275
|
-
|
276
|
-
The ``null_string`` option converts certain values to NULL. Values will be converted as follows:
|
277
|
-
|
278
|
-
+---------------------------------+-------------------------+--------------------------+----------------+--------------------+
|
279
|
-
| | non-quoted empty string | quoted empty string ("") | non-quoted \\N | quoted \\N ("\\N") |
|
280
|
-
+=================================+=========================+==========================+================+====================+
|
281
|
-
| ``null_string: ""`` | NULL | NULL | ``\N`` | ``\N`` |
|
282
|
-
+---------------------------------+-------------------------+--------------------------+----------------+--------------------+
|
283
|
-
| ``null_string: \N`` | (empty string) | (empty string) | NULL | NULL |
|
284
|
-
+---------------------------------+-------------------------+--------------------------+----------------+--------------------+
|
285
|
-
| ``null_string: null`` (default) | NULL | (empty string) | ``\N`` | ``\N`` |
|
286
|
-
+---------------------------------+-------------------------+--------------------------+----------------+--------------------+
|
287
|
-
|
288
|
-
You can use ``guess`` to automatically generate the column settings. See also `Quick Start <https://github.com/embulk/embulk#quick-start>`_.
|
289
|
-
|
290
|
-
Example
|
291
|
-
~~~~~~~~
|
292
|
-
|
293
|
-
.. code-block:: yaml
|
294
|
-
|
295
|
-
in:
|
296
|
-
...
|
297
|
-
parser:
|
298
|
-
type: csv
|
299
|
-
charset: UTF-8
|
300
|
-
newline: CRLF
|
301
|
-
delimiter: "\t"
|
302
|
-
quote: '"'
|
303
|
-
escape: '"'
|
304
|
-
null_string: 'NULL'
|
305
|
-
skip_header_lines: 1
|
306
|
-
comment_line_marker: '#'
|
307
|
-
columns:
|
308
|
-
- {name: id, type: long}
|
309
|
-
- {name: account, type: long}
|
310
|
-
- {name: time, type: timestamp, format: '%Y-%m-%d %H:%M:%S'}
|
311
|
-
- {name: purchase, type: timestamp, format: '%Y%m%d'}
|
312
|
-
- {name: comment, type: string}
|
313
|
-
|
314
|
-
|
315
|
-
.. note::
|
316
|
-
|
317
|
-
CSV parser supports ``format: '%s'`` to parse UNIX timestamp in seconds (e.g. 1470148959) as timestamp.
|
318
|
-
|
319
|
-
However, CSV parser itself can't parse UNIX timestamp in millisecond (e.g. 1470148959542) as timestamp. You can still parse the column as ``long`` type first, then apply `timestamp_format <https://github.com/sonots/embulk-filter-timestamp_format>`_ filter plugin to convert long to timestamp. Here is an example:
|
320
|
-
|
321
|
-
.. code-block:: yaml
|
322
|
-
|
323
|
-
in:
|
324
|
-
type: file
|
325
|
-
path_prefix: /my_csv_files
|
326
|
-
parser:
|
327
|
-
...
|
328
|
-
columns:
|
329
|
-
- {name: timestamp_in_seconds, type: timestamp, format: '%s'}
|
330
|
-
- {name: timestamp_in_millis, type: long}
|
331
|
-
filters:
|
332
|
-
- type: timestamp_format
|
333
|
-
columns:
|
334
|
-
- {name: timestamp_in_millis, from_unit: ms}
|
335
|
-
|
336
|
-
|
337
|
-
JSON parser plugin
|
338
|
-
-------------------
|
339
|
-
|
340
|
-
The ``json`` parser plugin parses a JSON file that contains a sequence of JSON objects. Example:
|
341
|
-
|
342
|
-
.. code-block:: javascript
|
343
|
-
|
344
|
-
{"time":1455829282,"ip":"93.184.216.34","name":"frsyuki"}
|
345
|
-
{"time":1455829282,"ip":"172.36.8.109", "name":"sadayuki"}
|
346
|
-
{"time":1455829284,"ip":"example.com","name":"Treasure Data"}
|
347
|
-
{"time":1455829282,"ip":"10.98.43.1","name":"MessagePack"}
|
348
|
-
|
349
|
-
The ``json`` parser plugin outputs a single column named "record" (type is json).
|
350
|
-
|
351
|
-
Options
|
352
|
-
~~~~~~~~
|
353
|
-
|
354
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+------------------------------+
|
355
|
-
| name | type | description | required? |
|
356
|
-
+============================+==========+================================================================================================================+==============================+
|
357
|
-
| stop\_on\_invalid\_record | boolean | Stop bulk load transaction if a file includes invalid record (such as invalid json) | ``false`` by default |
|
358
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+------------------------------+
|
359
|
-
| invalid\_string\_escapes | enum | Escape strategy of invalid json string such as using invalid ``\`` like ``\a``. (PASSTHROUGH, SKIP, UNESCAPE) | ``PASSTHROUGH`` by default |
|
360
|
-
+----------------------------+----------+----------------------------------------------------------------------------------------------------------------+------------------------------+
|
361
|
-
|
362
|
-
|
363
|
-
If you set invalid\_string\_escapes and an invalid JSON string (such as ``\a``) appears, the following action is taken.
|
364
|
-
|
365
|
-
+----------------------------+------------------+
|
366
|
-
| invalid\_string\_escapes | convert to |
|
367
|
-
+============================+==================+
|
368
|
-
| PASSTHROUGH *1 | ``\a`` |
|
369
|
-
+----------------------------+------------------+
|
370
|
-
| SKIP | empty string |
|
371
|
-
+----------------------------+------------------+
|
372
|
-
| UNESCAPE | ``a`` |
|
373
|
-
+----------------------------+------------------+
|
374
|
-
|
375
|
-
(\*1): Throwing an exception.
|
376
|
-
|
377
|
-
|
378
|
-
Example
|
379
|
-
~~~~~~~~
|
380
|
-
|
381
|
-
.. code-block:: yaml
|
382
|
-
|
383
|
-
in:
|
384
|
-
parser:
|
385
|
-
type: json
|
386
|
-
|
387
|
-
Gzip decoder plugin
|
388
|
-
--------------------
|
389
|
-
|
390
|
-
The ``gzip`` decoder plugin decompresses gzip files before input plugins read them.
|
391
|
-
|
392
|
-
Options
|
393
|
-
~~~~~~~~
|
394
|
-
|
395
|
-
This plugin doesn't have any options.
|
396
|
-
|
397
|
-
Example
|
398
|
-
~~~~~~~~
|
399
|
-
|
400
|
-
.. code-block:: yaml
|
401
|
-
|
402
|
-
in:
|
403
|
-
...
|
404
|
-
decoders:
|
405
|
-
- {type: gzip}
|
406
|
-
|
407
|
-
|
408
|
-
BZip2 decoder plugin
|
409
|
-
---------------------
|
410
|
-
|
411
|
-
The ``bzip2`` decoder plugin decompresses bzip2 files before input plugins read them.
|
412
|
-
|
413
|
-
Options
|
414
|
-
~~~~~~~~
|
415
|
-
|
416
|
-
This plugin doesn't have any options.
|
417
|
-
|
418
|
-
Example
|
419
|
-
~~~~~~~~
|
420
|
-
|
421
|
-
.. code-block:: yaml
|
422
|
-
|
423
|
-
in:
|
424
|
-
...
|
425
|
-
decoders:
|
426
|
-
- {type: bzip2}
|
427
|
-
|
428
|
-
|
429
|
-
File output plugin
|
430
|
-
-------------------
|
431
|
-
|
432
|
-
The ``file`` output plugin writes records to local file system.
|
433
|
-
|
434
|
-
Options
|
435
|
-
~~~~~~~~
|
436
|
-
|
437
|
-
+--------------------+----------+---------------------------------------------------+----------------------------+
|
438
|
-
| name | type | description | required? |
|
439
|
-
+====================+==========+===================================================+============================+
|
440
|
-
| path\_prefix | string | Path prefix of the output files | required |
|
441
|
-
+--------------------+----------+---------------------------------------------------+----------------------------+
|
442
|
-
| sequence\_format | string | Format of the sequence number of the output files | ``%03d.%02d.`` by default |
|
443
|
-
+--------------------+----------+---------------------------------------------------+----------------------------+
|
444
|
-
| file\_ext | string | Path suffix of the output files (e.g. ``"csv"``) | required |
|
445
|
-
+--------------------+----------+---------------------------------------------------+----------------------------+
|
446
|
-
|
447
|
-
For example, if you set ``path_prefix: /path/to/output/sample_``, ``sequence_format: "%03d.%02d."``, and ``file_ext: csv``, the names of the output files will be as follows:
|
448
|
-
|
449
|
-
::
|
450
|
-
|
451
|
-
.
|
452
|
-
`-- path
|
453
|
-
`-- to
|
454
|
-
`-- output
|
455
|
-
|-- sample_01.000.csv
|
456
|
-
|-- sample_02.000.csv
|
457
|
-
|-- sample_03.000.csv
|
458
|
-
|-- sample_04.000.csv
|
459
|
-
|
460
|
-
``sequence_format`` formats task index and sequence number in a task.
|
461
|
-
|
462
|
-
Example
|
463
|
-
~~~~~~~~
|
464
|
-
|
465
|
-
.. code-block:: yaml
|
466
|
-
|
467
|
-
out:
|
468
|
-
type: file
|
469
|
-
path_prefix: /path/to/output/sample_
|
470
|
-
file_ext: csv
|
471
|
-
formatter:
|
472
|
-
...
|
473
|
-
|
474
|
-
CSV formatter plugin
|
475
|
-
---------------------
|
476
|
-
|
477
|
-
The ``csv`` formatter plugin formats records using CSV or TSV format.
|
478
|
-
|
479
|
-
Options
|
480
|
-
~~~~~~~~
|
481
|
-
|
482
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
483
|
-
| name | type | description | required? |
|
484
|
-
+======================+=========+=======================================================================================================+===============================+
|
485
|
-
| delimiter | string | Delimiter character such as ``,`` for CSV, ``"\t"`` for TSV, ``"|"`` or any single-byte character | ``,`` by default |
|
486
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
487
|
-
| quote | string | The character surrounding a quoted value | ``"`` by default |
|
488
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
489
|
-
| quote\_policy | enum | Policy for quote (ALL, MINIMAL, NONE) (see below) | ``MINIMAL`` by default |
|
490
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
491
|
-
| escape | string | Escape character to escape quote character | same as ``quote`` by default (\*1) |
|
492
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
493
|
-
| header\_line | boolean | If true, write the header line with column name at the first line | ``true`` by default |
|
494
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
495
|
-
| null_string | string | Expression of NULL values | empty by default |
|
496
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
497
|
-
| newline | enum | Newline character (CRLF, LF or CR) | ``CRLF`` by default |
|
498
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
499
|
-
| newline\_in\_field | enum | Newline character in each field (CRLF, LF, CR) | ``LF`` by default |
|
500
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
501
|
-
| charset | enum | Character encoding (eg. ISO-8859-1, UTF-8) | ``UTF-8`` by default |
|
502
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
503
|
-
| default\_timezone | string | Time zone of timestamp columns. This can be overwritten for each column using ``column_options`` | ``UTC`` by default |
|
504
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
505
|
-
| column\_options | hash | See below | optional |
|
506
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-------------------------------+
|
507
|
-
|
508
|
-
(\*1): if quote\_policy is NONE, ``quote`` option is ignored, and default ``escape`` is ``\``.
|
509
|
-
|
510
|
-
The ``quote_policy`` option is used to determine field type to quote.
|
511
|
-
|
512
|
-
+------------+--------------------------------------------------------------------------------------------------------+
|
513
|
-
| name | description |
|
514
|
-
+============+========================================================================================================+
|
515
|
-
| ALL | Quote all fields |
|
516
|
-
+------------+--------------------------------------------------------------------------------------------------------+
|
517
|
-
| MINIMAL | Only quote those fields which contain delimiter, quote or any of the characters in lineterminator |
|
518
|
-
+------------+--------------------------------------------------------------------------------------------------------+
|
519
|
-
| NONE | Never quote fields. When the delimiter occurs in field, escape with escape char |
|
520
|
-
+------------+--------------------------------------------------------------------------------------------------------+
|
521
|
-
|
522
|
-
The ``column_options`` option is a map whose keys are name of columns, and values are configuration with following parameters:
|
523
|
-
|
524
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-----------------------------------------+
|
525
|
-
| name | type | description | required? |
|
526
|
-
+======================+=========+=======================================================================================================+=========================================+
|
527
|
-
| timezone | string | Time zone if type of this column is timestamp. If not set, ``default_timezone`` is used. | optional |
|
528
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-----------------------------------------+
|
529
|
-
| format | string | Timestamp format if type of this column is timestamp. | ``%Y-%m-%d %H:%M:%S.%6N %z`` by default |
|
530
|
-
+----------------------+---------+-------------------------------------------------------------------------------------------------------+-----------------------------------------+
|
531
|
-
|
532
|
-
.. note::
|
533
|
-
|
534
|
-
The Timestamp format refers to `Ruby strftime format <https://docs.ruby-lang.org/en/2.4.0/Date.html#method-i-strftime>`_
|
535
|
-
|
536
|
-
Example
|
537
|
-
~~~~~~~~
|
538
|
-
|
539
|
-
.. code-block:: yaml
|
540
|
-
|
541
|
-
out:
|
542
|
-
...
|
543
|
-
formatter:
|
544
|
-
type: csv
|
545
|
-
delimiter: "\t"
|
546
|
-
newline: CRLF
|
547
|
-
newline_in_field: LF
|
548
|
-
charset: UTF-8
|
549
|
-
quote_policy: MINIMAL
|
550
|
-
quote: '"'
|
551
|
-
escape: "\\"
|
552
|
-
null_string: "\\N"
|
553
|
-
default_timezone: 'UTC'
|
554
|
-
column_options:
|
555
|
-
mycol1: {format: '%Y-%m-%d %H:%M:%S'}
|
556
|
-
mycol2: {format: '%Y-%m-%d %H:%M:%S', timezone: 'America/Los_Angeles'}
|
557
|
-
|
558
|
-
Gzip encoder plugin
|
559
|
-
--------------------
|
560
|
-
|
561
|
-
The ``gzip`` encoder plugin compresses output files using gzip.
|
562
|
-
|
563
|
-
Options
|
564
|
-
~~~~~~~~
|
565
|
-
|
566
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
567
|
-
| name | type | description | required? |
|
568
|
-
+=========+==========+======================================================================+====================+
|
569
|
-
| level | integer | Compression level. From 0 (no compression) to 9 (best compression). | ``6`` by default |
|
570
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
571
|
-
|
572
|
-
Example
|
573
|
-
~~~~~~~~
|
574
|
-
|
575
|
-
.. code-block:: yaml
|
576
|
-
|
577
|
-
out:
|
578
|
-
...
|
579
|
-
encoders:
|
580
|
-
- type: gzip
|
581
|
-
level: 1
|
582
|
-
|
583
|
-
|
584
|
-
BZip2 encoder plugin
|
585
|
-
---------------------
|
586
|
-
|
587
|
-
The ``bzip2`` encoder plugin compresses output files using bzip2.
|
588
|
-
|
589
|
-
Options
|
590
|
-
~~~~~~~~
|
591
|
-
|
592
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
593
|
-
| name | type | description | required? |
|
594
|
-
+=========+==========+======================================================================+====================+
|
595
|
-
| level | integer | Compression level. From 1 to 9 (best compression). | ``9`` by default |
|
596
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
597
|
-
|
598
|
-
Example
|
599
|
-
~~~~~~~~
|
600
|
-
|
601
|
-
.. code-block:: yaml
|
602
|
-
|
603
|
-
out:
|
604
|
-
...
|
605
|
-
encoders:
|
606
|
-
- type: bzip2
|
607
|
-
level: 6
|
608
|
-
|
609
|
-
|
610
|
-
Rename filter plugin
|
611
|
-
---------------------
|
612
|
-
|
613
|
-
The ``rename`` filter plugin changes column names. This plugin has no impact on performance.
|
614
|
-
|
615
|
-
Options
|
616
|
-
~~~~~~~~
|
617
|
-
|
618
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
619
|
-
| name | type | description | required? |
|
620
|
-
+=========+==========+======================================================================+====================+
|
621
|
-
| rules | array | An array of rule-based renaming operations. (See below for rules.) | ``[]`` by default |
|
622
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
623
|
-
| columns | hash | A map whose keys are existing column names. values are new names. | ``{}`` by default |
|
624
|
-
+---------+----------+----------------------------------------------------------------------+--------------------+
|
625
|
-
|
626
|
-
Renaming rules
|
627
|
-
~~~~~~~~~~~~~~~
|
628
|
-
|
629
|
-
The ``rules`` is an array of rules as below applied top-down for all the columns.
|
630
|
-
|
631
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
632
|
-
| rule | description |
|
633
|
-
+=========================+========================================================================================+
|
634
|
-
| character\_types | Restrict characters by types. Replace restricted characters. |
|
635
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
636
|
-
| first\_character\_types | Restrict the first character by types. Prefix or replace first restricted characters. |
|
637
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
638
|
-
| lower\_to\_upper | Convert lower-case alphabets to upper-case. |
|
639
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
640
|
-
| regex\_replace | Replace with a regular expression. |
|
641
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
642
|
-
| truncate | Truncate. |
|
643
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
644
|
-
| upper\_to\_lower | Convert upper-case alphabets to lower-case |
|
645
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
646
|
-
| unique\_number\_suffix | Make column names unique in the schema. |
|
647
|
-
+-------------------------+----------------------------------------------------------------------------------------+
|
648
|
-
|
649
|
-
Renaming rule: character\_types
|
650
|
-
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
651
|
-
|
652
|
-
The rule ``character_types`` replaces restricted characters.
|
653
|
-
|
654
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+--------------------+
|
655
|
-
| option | description | required? |
|
656
|
-
+===================+============================================================================================================================================+====================+
|
657
|
-
| pass\_characters | Characters to be allowed. | ``""`` by default |
|
658
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+--------------------+
|
659
|
-
| pass\_types | Sets of characters to be allowed. The array must consist of "a-z" (lower-case alphabets), "A-Z" (upper-case alphabets), or "0-9" (digits). | ``[]`` by default |
|
660
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+--------------------+
|
661
|
-
| replace | A character that disallowed characters are replaced with. It must consist of just 1 character. | ``"_"`` by default |
|
662
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+--------------------+
|
663
|
-
|
664
|
-
Example
|
665
|
-
""""""""
|
666
|
-
|
667
|
-
.. code-block:: yaml
|
668
|
-
|
669
|
-
# This configuration replaces characters into "_" except for "_", lower-case alphabets, and digits.
|
670
|
-
filters:
|
671
|
-
...
|
672
|
-
- type: rename
|
673
|
-
rules:
|
674
|
-
- rule: character_types
|
675
|
-
pass_characters: "_"
|
676
|
-
pass_types: [ "a-z", "0-9" ]
|
677
|
-
|
678
|
-
|
679
|
-
Renaming rule: first\_character\_types
|
680
|
-
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
681
|
-
|
682
|
-
The rule ``first_character_types`` prefixes or replaces a restricted character at the beginning.
|
683
|
-
|
684
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+----------------------------------------------+
|
685
|
-
| option | description | required? |
|
686
|
-
+===================+============================================================================================================================================+==============================================+
|
687
|
-
| pass\_characters | Characters to be allowed. | ``""`` by default |
|
688
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+----------------------------------------------+
|
689
|
-
| pass\_types | Sets of characters to be allowed. The array must consist of "a-z" (lower-case alphabets), "A-Z" (upper-case alphabets), or "0-9" (digits). | ``[]`` by default |
|
690
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+----------------------------------------------+
|
691
|
-
| prefix | A character that a disallowed first character is prefixed with. | one of ``prefix`` or ``replace`` is required |
|
692
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+----------------------------------------------+
|
693
|
-
| replace | A character that a disallowed first character is replaced with. | one of ``prefix`` or ``replace`` is required |
|
694
|
-
+-------------------+--------------------------------------------------------------------------------------------------------------------------------------------+----------------------------------------------+
|
695
|
-
|
696
|
-
Example
|
697
|
-
""""""""
|
698
|
-
|
699
|
-
.. code-block:: yaml
|
700
|
-
|
701
|
-
# This configuration prefixes a column name with "_" unless the name starts from "_" or a lower-case alphabet.
|
702
|
-
filters:
|
703
|
-
...
|
704
|
-
- type: rename
|
705
|
-
rules:
|
706
|
-
- rule: first_character_types
|
707
|
-
pass_characters: "_"
|
708
|
-
pass_types: [ "a-z" ]
|
709
|
-
prefix: "_"
|
710
|
-
|
711
|
-
Renaming rule: lower\_to\_upper
|
712
|
-
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
713
|
-
|
714
|
-
The rule ``lower_to_upper`` converts lower-case alphabets to upper-case.
|
715
|
-
|
716
|
-
Example
|
717
|
-
""""""""
|
718
|
-
|
719
|
-
.. code-block:: yaml
|
720
|
-
|
721
|
-
# This configuration converts all lower-case alphabets to upper-case.
|
722
|
-
filters:
|
723
|
-
...
|
724
|
-
- type: rename
|
725
|
-
rules:
|
726
|
-
- rule: lower_to_upper
|
727
|
-
|
728
|
-
|
729
|
-
Renaming rule: regex\_replace
|
730
|
-
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
731
|
-
|
732
|
-
The rule ``regex_replace`` replaces column names based on a regular expression.
|
733
|
-
|
734
|
-
+---------+--------------------------------------------------------------------------------------------------------------------------------------+-----------+
|
735
|
-
| option | description | required? |
|
736
|
-
+=========+======================================================================================================================================+===========+
|
737
|
-
| match | A `Java-style regular expression <https://docs.oracle.com/javase/tutorial/essential/regex/>`_ to which this string is to be matched. | required |
|
738
|
-
+---------+--------------------------------------------------------------------------------------------------------------------------------------+-----------+
|
739
|
-
| replace | A string to be substituted for each match in Java-style. | required |
|
740
|
-
+---------+--------------------------------------------------------------------------------------------------------------------------------------+-----------+
|
741
|
-
|
742
|
-
Example
|
743
|
-
""""""""
|
744
|
-
|
745
|
-
.. code-block:: yaml
|
746
|
-
|
747
|
-
# This configuration renames columns matching "([0-9]+)_dollars" to "USD" followed by the captured digits.
|
748
|
-
filters:
|
749
|
-
...
|
750
|
-
- type: rename
|
751
|
-
rules:
|
752
|
-
- rule: regex_replace
|
753
|
-
match: "([0-9]+)_dollars"
|
754
|
-
replace: "USD$1"
|
755
|
-
|
756
|
-
|
757
|
-
Renaming rule: truncate
|
758
|
-
^^^^^^^^^^^^^^^^^^^^^^^^
|
759
|
-
|
760
|
-
The rule ``truncate`` truncates column names.
|
761
|
-
|
762
|
-
+------------+-----------------------------------------------------+--------------------+
|
763
|
-
| option | description | required? |
|
764
|
-
+============+=====================================================+====================+
|
765
|
-
| max_length | The length to which the column names are truncated. | ``128`` by default |
|
766
|
-
+------------+-----------------------------------------------------+--------------------+
|
767
|
-
|
768
|
-
Example
|
769
|
-
""""""""
|
770
|
-
|
771
|
-
.. code-block:: yaml
|
772
|
-
|
773
|
-
# This configuration drops all characters after the 20th character.
|
774
|
-
filters:
|
775
|
-
...
|
776
|
-
- type: rename
|
777
|
-
rules:
|
778
|
-
- rule: truncate
|
779
|
-
max_length: 20
|
780
|
-
|
781
|
-
Renaming rule: upper\_to\_lower
|
782
|
-
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
783
|
-
|
784
|
-
The rule ``upper_to_lower`` converts upper-case alphabets to lower-case.
|
785
|
-
|
786
|
-
Example
|
787
|
-
""""""""
|
788
|
-
|
789
|
-
.. code-block:: yaml
|
790
|
-
|
791
|
-
# This configuration converts all upper-case alphabets to lower-case.
|
792
|
-
filters:
|
793
|
-
...
|
794
|
-
- type: rename
|
795
|
-
rules:
|
796
|
-
- rule: upper_to_lower
|
797
|
-
|
798
|
-
Renaming rule: unique\_number\_suffix
|
799
|
-
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
800
|
-
|
801
|
-
The rule ``unique_number_suffix`` makes column names unique in the schema by suffixing numbers.
|
802
|
-
|
803
|
-
+------------+-----------------------------------------------------------------------------------------------------------------------------+--------------------+
|
804
|
-
| option | description | required? |
|
805
|
-
+============+=============================================================================================================================+====================+
|
806
|
-
| delimiter | A delimiter character inserted before a suffix number. It must be just 1 non-digit character. | ``"_"`` by default |
|
807
|
-
+------------+-----------------------------------------------------------------------------------------------------------------------------+--------------------+
|
808
|
-
| digits | An integer that specifies the number of zero-filled digits of a suffix number. The suffix number is zero-filled to the digits. | optional |
|
809
|
-
+------------+-----------------------------------------------------------------------------------------------------------------------------+--------------------+
|
810
|
-
| max_length | The length to which the column names are truncated. The column name is truncated before the suffix number. | optional |
|
811
|
-
+------------+-----------------------------------------------------------------------------------------------------------------------------+--------------------+
|
812
|
-
| offset | An integer where the suffix number starts. The first duplicative column name is suffixed by (``offset`` + 1). | ``1`` by default |
|
813
|
-
+------------+-----------------------------------------------------------------------------------------------------------------------------+--------------------+
|
814
|
-
|
815
|
-
.. hint::
|
816
|
-
The procedure to make column names unique is not very trivial. There are many feasible ways. This renaming rule works as follows:
|
817
|
-
|
818
|
-
Basic policies:
|
819
|
-
|
820
|
-
* Suffix numbers are counted per original column name.
|
821
|
-
* Column names are fixed from the first column to the last column.
|
822
|
-
|
823
|
-
Actual procedure applied from the first (leftmost) column to the last (rightmost) column:
|
824
|
-
|
825
|
-
1. Fix the column name as-is with truncating if the truncated name is not duplicated with left columns.
|
826
|
-
2. Suffix the column name otherwise.
|
827
|
-
|
828
|
-
a. Try to append the suffix number for the original column name with truncating.
|
829
|
-
b. Fix it if the suffixed name is not duplicated with left columns nor original columns.
|
830
|
-
c. Retry (a) with the suffix number increased otherwise.
|
831
|
-
|
832
|
-
Example
|
833
|
-
""""""""
|
834
|
-
|
835
|
-
.. code-block:: yaml
|
836
|
-
|
837
|
-
# This configuration suffixes numbers to duplicative column names. (Ex. ["column", "column", "column"] goes to ["column", "column_2", "column_3"].)
|
838
|
-
filters:
|
839
|
-
...
|
840
|
-
- type: rename
|
841
|
-
rules:
|
842
|
-
- rule: unique_number_suffix
|
843
|
-
|
844
|
-
Example of renaming rules
|
845
|
-
~~~~~~~~~~~~~~~~~~~~~~~~~~
|
846
|
-
|
847
|
-
.. code-block:: yaml
|
848
|
-
|
849
|
-
filters:
|
850
|
-
...
|
851
|
-
- type: rename
|
852
|
-
rules:
|
853
|
-
- rule: upper_to_lower # All upper-case are converted to lower-case.
|
854
|
-
- rule: character_types # Only lower-case, digits and "_" are allowed. (No upper-case by the rule above.)
|
855
|
-
pass_types: [ "a-z", "0-9" ]
|
856
|
-
pass_characters: "_"
|
857
|
-
- rule: unique_number_suffix # Ensure all column names are unique.
|
858
|
-
|
859
|
-
Columns: not recommended
|
860
|
-
~~~~~~~~~~~~~~~~~~~~~~~~~
|
861
|
-
|
862
|
-
``columns`` is not recommended to use anymore. Consider using ``rules`` instead.
|
863
|
-
|
864
|
-
.. code-block:: yaml
|
865
|
-
|
866
|
-
filters:
|
867
|
-
...
|
868
|
-
- type: rename
|
869
|
-
columns:
|
870
|
-
my_existing_column1: new_column1
|
871
|
-
my_existing_column2: new_column2
|
872
|
-
|
873
|
-
.. hint::
|
874
|
-
``columns`` are applied before ``rules`` if ``columns`` and ``rules`` are specified together. (It is discouraged to specify them together, though.)
|
875
|
-
|
876
|
-
|
877
|
-
Remove columns filter plugin
|
878
|
-
-----------------------------
|
879
|
-
|
880
|
-
The ``remove_columns`` filter plugin removes columns from schema.
|
881
|
-
|
882
|
-
Options
|
883
|
-
~~~~~~~~
|
884
|
-
|
885
|
-
+--------------------------+----------+------------------------------------------------------------+-----------------------+
|
886
|
-
| name | type | description | required? |
|
887
|
-
+==========================+==========+============================================================+=======================+
|
888
|
-
| remove | array | An array of names of columns that it removes from schema. | ``[]`` by default |
|
889
|
-
+--------------------------+----------+------------------------------------------------------------+-----------------------+
|
890
|
-
| keep | array | An array of names of columns that it keeps in schema. | ``[]`` by default |
|
891
|
-
+--------------------------+----------+------------------------------------------------------------+-----------------------+
|
892
|
-
| accept_unmatched_columns | boolean | If true, skip columns that aren't included in schemas. | ``false`` by default |
|
893
|
-
+--------------------------+----------+------------------------------------------------------------+-----------------------+
|
894
|
-
|
895
|
-
|
896
|
-
The ``remove`` and ``keep`` options cannot be specified together; use only one of them.
|
897
|
-
|
898
|
-
Example
|
899
|
-
~~~~~~~~
|
900
|
-
|
901
|
-
.. code-block:: yaml
|
902
|
-
|
903
|
-
# This configuration removes "_c0" and "_c1" named columns from schema.
|
904
|
-
filters:
|
905
|
-
...
|
906
|
-
- type: remove_columns
|
907
|
-
remove: ["_c0", "_c1"]
|
908
|
-
|
909
|
-
|
910
|
-
Local executor plugin
|
911
|
-
----------------------
|
912
|
-
|
913
|
-
The ``local`` executor plugin runs tasks using local threads. This is the only built-in executor plugin.
|
914
|
-
|
915
|
-
Options
|
916
|
-
~~~~~~~~
|
917
|
-
|
918
|
-
+------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
919
|
-
| name | type | description | required? |
|
920
|
-
+==================+==========+======================================================================+======================================+
|
921
|
-
| max_threads | integer | Maximum number of threads to run concurrently. | 2x of available CPU cores by default |
|
922
|
-
+------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
923
|
-
| min_output_tasks | integer | Minimum number of output tasks to enable page scattering. | 1x of available CPU cores by default |
|
924
|
-
+------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
925
|
-
|
926
|
-
|
927
|
-
The ``max_threads`` option controls maximum concurrency. Setting smaller number here is useful if too many threads make the destination or source storage overloaded. Setting larger number here is useful if CPU utilization is too low due to high latency.
|
928
|
-
|
929
|
-
The ``min_output_tasks`` option enables "page scattering". The feature is enabled if number of input tasks is less than ``min_output_tasks``. It uses multiple filter & output threads for each input task so that one input task can use multiple threads. Setting larger number here is useful if embulk doesn't use multi-threading with enough concurrency due to too few number of input tasks. Setting 1 here disables page scattering completely.
|
930
|
-
|
931
|
-
Example
|
932
|
-
~~~~~~~~
|
933
|
-
|
934
|
-
.. code-block:: yaml
|
935
|
-
|
936
|
-
exec:
|
937
|
-
max_threads: 8 # run at most 8 tasks concurrently
|
938
|
-
min_output_tasks: 1 # disable page scattering
|
939
|
-
in:
|
940
|
-
type: ...
|
941
|
-
...
|
942
|
-
out:
|
943
|
-
type: ...
|
944
|
-
...
|
945
|
-
|
946
|
-
Guess executor
|
947
|
-
---------------
|
948
|
-
|
949
|
-
The guess executor is called by ``guess`` command. It executes default guess plugins in a sequential order and suggests Embulk config by appropriate guess plugin. The default guess plugins and the order are ``gzip``, ``bzip2``, ``json`` and ``csv``.
|
950
|
-
|
951
|
-
Options
|
952
|
-
~~~~~~~~
|
953
|
-
|
954
|
-
+---------------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
955
|
-
| name | type | description | required? |
|
956
|
-
+===========================+==========+======================================================================+======================================+
|
957
|
-
| guess_plugins | array | ``guess`` command uses specified guess plugins. | ``[]`` by default |
|
958
|
-
+---------------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
959
|
-
| exclude_guess_plugins | array | ``guess`` command doesn't use specified plugins. | ``[]`` by default |
|
960
|
-
+---------------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
961
|
-
| guess_sample_buffer_bytes | int | Bytes of sample buffer that it tries to read from input source. | 32768 (32KB) by default |
|
962
|
-
+---------------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
963
|
-
|
964
|
-
The ``guess_plugins`` option includes specified guess plugin in the bottom of the list of default guess plugins.
|
965
|
-
|
966
|
-
The ``exclude_guess_plugins`` option excludes specified guess plugins from the list of default guess plugins that the guess executor uses.
|
967
|
-
|
968
|
-
The ``guess_sample_buffer_bytes`` option controls the bytes of sample buffer that GuessExecutor tries to read from specified input source.
|
969
|
-
|
970
|
-
This example shows how to use ``csv_all_strings`` guess plugin, which suggests column types within CSV files as string types. It needs to be explicitly specified by users when it's used instead of ``csv`` guess plugin because the plugin is not included in default guess plugins. We also can exclude default ``csv`` guess plugin.
|
971
|
-
|
972
|
-
Example
|
973
|
-
~~~~~~~~
|
974
|
-
|
975
|
-
.. code-block:: yaml
|
976
|
-
|
977
|
-
exec:
|
978
|
-
guess_plugins: ['csv_all_strings']
|
979
|
-
exclude_guess_plugins: ['csv']
|
980
|
-
in:
|
981
|
-
type: ...
|
982
|
-
...
|
983
|
-
out:
|
984
|
-
type: ...
|
985
|
-
...
|
986
|
-
|
987
|
-
Preview executor
|
988
|
-
----------------
|
989
|
-
|
990
|
-
The preview executor is called by ``preview`` command. It tries to read sample buffer from a specified input source and writes them to Page objects. ``preview`` outputs the Page objects to console.
|
991
|
-
|
992
|
-
Options
|
993
|
-
~~~~~~~~
|
994
|
-
|
995
|
-
+-------------------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
996
|
-
| name | type | description | required? |
|
997
|
-
+===============================+==========+======================================================================+======================================+
|
998
|
-
| preview_sample_buffer_bytes | int | Bytes of sample buffer that it tries to read from input source. | 32768 (32KB) by default |
|
999
|
-
+-------------------------------+----------+----------------------------------------------------------------------+--------------------------------------+
|
1000
|
-
|
1001
|
-
The ``preview_sample_buffer_bytes`` option controls the bytes of sample buffer that PreviewExecutor tries to read from specified input source.
|
1002
|
-
|
1003
|
-
This example shows how to change the bytes of sample buffer.
|
1004
|
-
|
1005
|
-
Example
|
1006
|
-
~~~~~~~~
|
1007
|
-
|
1008
|
-
.. code-block:: yaml
|
1009
|
-
|
1010
|
-
exec:
|
1011
|
-
preview_sample_buffer_bytes: 65536 # 64KB
|
1012
|
-
in:
|
1013
|
-
type: ...
|
1014
|
-
...
|
1015
|
-
out:
|
1016
|
-
type: ...
|
1017
|
-
...
|