embulk-filter-copy 0.0.2 → 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +6 -1
- data/README.md +5 -1
- data/build.gradle +6 -5
- data/example/config.yml +1 -0
- data/example/data.tsv +5 -5
- data/gradle/wrapper/gradle-wrapper.jar +0 -0
- data/gradle/wrapper/gradle-wrapper.properties +1 -2
- data/gradlew +13 -10
- data/src/main/java/org/embulk/filter/copy/CopyFilterPlugin.java +26 -37
- data/src/main/java/org/embulk/filter/copy/forward/{ForwardBaseTask.java → ForwardParentTask.java} +1 -1
- data/src/main/java/org/embulk/filter/copy/forward/InForwardEventReader.java +67 -62
- data/src/main/java/org/embulk/filter/copy/forward/InForwardService.java +102 -35
- data/src/main/java/org/embulk/filter/copy/forward/OutForwardEventBuilder.java +66 -54
- data/src/main/java/org/embulk/filter/copy/forward/OutForwardService.java +2 -2
- data/src/main/java/org/embulk/filter/copy/plugin/InternalForwardInputPlugin.java +11 -13
- data/src/main/java/org/embulk/filter/copy/runner/AsyncEmbulkRunnerService.java +32 -0
- data/src/main/java/org/embulk/filter/copy/runner/EmbulkRunner.java +124 -0
- data/src/main/java/org/embulk/filter/copy/spi/DataBuilder.java +41 -0
- data/src/main/java/org/embulk/filter/copy/spi/DataReader.java +41 -0
- data/src/main/java/org/embulk/filter/copy/spi/ElapsedTime.java +81 -0
- data/src/main/java/org/embulk/filter/copy/spi/PageBuilder.java +16 -0
- data/src/main/java/org/embulk/filter/copy/spi/PageReader.java +13 -0
- data/src/main/java/org/embulk/filter/copy/{util → spi}/StandardColumnVisitor.java +6 -6
- data/src/test/java/org/embulk/filter/copy/TestCopyFilterPlugin.java +0 -11
- metadata +24 -16
- data/src/main/java/org/embulk/filter/copy/executor/EmbulkExecutor.java +0 -105
- data/src/main/java/org/embulk/filter/copy/executor/LocalThreadExecutor.java +0 -96
- data/src/main/java/org/embulk/filter/copy/forward/InForwardVisitor.java +0 -63
- data/src/main/java/org/embulk/filter/copy/forward/OutForwardVisitor.java +0 -63
- data/src/main/java/org/embulk/filter/copy/util/ElapsedTime.java +0 -165
@@ -1,105 +0,0 @@
|
|
1
|
-
package org.embulk.filter.copy.executor;
|
2
|
-
|
3
|
-
import com.fasterxml.jackson.annotation.JsonCreator;
|
4
|
-
import com.fasterxml.jackson.annotation.JsonValue;
|
5
|
-
import com.google.common.base.Joiner;
|
6
|
-
import com.google.inject.Injector;
|
7
|
-
import org.embulk.EmbulkEmbed;
|
8
|
-
import org.embulk.config.Config;
|
9
|
-
import org.embulk.config.ConfigDefault;
|
10
|
-
import org.embulk.config.ConfigException;
|
11
|
-
import org.embulk.config.ConfigSource;
|
12
|
-
import org.embulk.guice.LifeCycleInjector;
|
13
|
-
import org.embulk.spi.Exec;
|
14
|
-
import org.slf4j.Logger;
|
15
|
-
|
16
|
-
import java.lang.reflect.Constructor;
|
17
|
-
import java.lang.reflect.InvocationTargetException;
|
18
|
-
import java.util.Locale;
|
19
|
-
|
20
|
-
public abstract class EmbulkExecutor
|
21
|
-
{
|
22
|
-
static final Logger logger = Exec.getLogger(EmbulkExecutor.class);
|
23
|
-
|
24
|
-
public interface ExecutorTask
|
25
|
-
extends org.embulk.config.Task
|
26
|
-
{
|
27
|
-
@Config("\"type\"")
|
28
|
-
@ConfigDefault("\"local_thread\"")
|
29
|
-
ExecutorType getType();
|
30
|
-
|
31
|
-
enum ExecutorType
|
32
|
-
{
|
33
|
-
LOCAL_THREAD;
|
34
|
-
|
35
|
-
@JsonValue
|
36
|
-
@Override
|
37
|
-
public String toString()
|
38
|
-
{
|
39
|
-
return name().toLowerCase(Locale.ENGLISH);
|
40
|
-
}
|
41
|
-
|
42
|
-
@JsonCreator
|
43
|
-
public static ExecutorType fromString(String value)
|
44
|
-
{
|
45
|
-
switch (value) {
|
46
|
-
case "local_thread":
|
47
|
-
return LOCAL_THREAD;
|
48
|
-
default:
|
49
|
-
String values = Joiner.on(", ").join(values()).toLowerCase(Locale.ENGLISH);
|
50
|
-
throw new ConfigException(String.format("Unknown executor type '%s'. Supported executor types are %s", value, values));
|
51
|
-
}
|
52
|
-
}
|
53
|
-
}
|
54
|
-
|
55
|
-
}
|
56
|
-
|
57
|
-
public interface Task
|
58
|
-
extends org.embulk.config.Task
|
59
|
-
{
|
60
|
-
@Config("executor")
|
61
|
-
@ConfigDefault("{}")
|
62
|
-
ExecutorTask getExecutorTask();
|
63
|
-
}
|
64
|
-
|
65
|
-
public static EmbulkExecutor buildExecutor(Task task)
|
66
|
-
{
|
67
|
-
switch (task.getExecutorTask().getType()) {
|
68
|
-
case LOCAL_THREAD:
|
69
|
-
return new LocalThreadExecutor(task.getExecutorTask());
|
70
|
-
default:
|
71
|
-
String values = Joiner.on(", ").join(ExecutorTask.ExecutorType.values()).toLowerCase(Locale.ENGLISH);
|
72
|
-
throw new ConfigException(String.format("Unknown executor type '%s'. Supported executor types are %s", task.getExecutorTask().getType(), values));
|
73
|
-
}
|
74
|
-
}
|
75
|
-
|
76
|
-
final ExecutorTask task;
|
77
|
-
final Injector injector;
|
78
|
-
|
79
|
-
EmbulkExecutor(ExecutorTask task)
|
80
|
-
{
|
81
|
-
this.task = task;
|
82
|
-
this.injector = Exec.getInjector();
|
83
|
-
}
|
84
|
-
|
85
|
-
public abstract void setup();
|
86
|
-
|
87
|
-
public abstract void executeAsync(ConfigSource config);
|
88
|
-
|
89
|
-
public abstract void waitUntilExecutionFinished();
|
90
|
-
|
91
|
-
public abstract void shutdown();
|
92
|
-
|
93
|
-
EmbulkEmbed newEmbulkEmbed()
|
94
|
-
{
|
95
|
-
try {
|
96
|
-
Constructor<EmbulkEmbed> constructor = EmbulkEmbed.class
|
97
|
-
.getDeclaredConstructor(ConfigSource.class, LifeCycleInjector.class);
|
98
|
-
constructor.setAccessible(true);
|
99
|
-
return constructor.newInstance(null, injector);
|
100
|
-
}
|
101
|
-
catch (InstantiationException | IllegalAccessException | NoSuchMethodException | InvocationTargetException e) {
|
102
|
-
throw new ConfigException(e);
|
103
|
-
}
|
104
|
-
}
|
105
|
-
}
|
@@ -1,96 +0,0 @@
|
|
1
|
-
package org.embulk.filter.copy.executor;
|
2
|
-
|
3
|
-
import com.google.common.util.concurrent.FutureCallback;
|
4
|
-
import com.google.common.util.concurrent.Futures;
|
5
|
-
import com.google.common.util.concurrent.ListenableFuture;
|
6
|
-
import com.google.common.util.concurrent.ListeningExecutorService;
|
7
|
-
import com.google.common.util.concurrent.MoreExecutors;
|
8
|
-
import org.embulk.config.ConfigSource;
|
9
|
-
import org.embulk.exec.ExecutionResult;
|
10
|
-
import org.embulk.filter.copy.util.ElapsedTime;
|
11
|
-
|
12
|
-
import javax.annotation.Nullable;
|
13
|
-
|
14
|
-
import java.util.concurrent.Callable;
|
15
|
-
import java.util.concurrent.Executors;
|
16
|
-
|
17
|
-
public class LocalThreadExecutor
|
18
|
-
extends EmbulkExecutor
|
19
|
-
{
|
20
|
-
private static final String THREAD_NAME = "embulk executor service";
|
21
|
-
private static final int NUM_THREADS = 1;
|
22
|
-
private final ListeningExecutorService es;
|
23
|
-
private ListenableFuture<ExecutionResult> future;
|
24
|
-
|
25
|
-
LocalThreadExecutor(ExecutorTask task)
|
26
|
-
{
|
27
|
-
super(task);
|
28
|
-
this.es = MoreExecutors.listeningDecorator(
|
29
|
-
Executors.newFixedThreadPool(
|
30
|
-
NUM_THREADS,
|
31
|
-
r -> new Thread(r, THREAD_NAME)
|
32
|
-
));
|
33
|
-
}
|
34
|
-
|
35
|
-
@Override
|
36
|
-
public void setup()
|
37
|
-
{
|
38
|
-
}
|
39
|
-
|
40
|
-
@Override
|
41
|
-
public void executeAsync(ConfigSource config)
|
42
|
-
{
|
43
|
-
logger.debug("execute with this config: {}", config);
|
44
|
-
if (future != null) {
|
45
|
-
throw new IllegalStateException("executeAsync is already called.");
|
46
|
-
}
|
47
|
-
future = es.submit(embulkRun(config));
|
48
|
-
Futures.addCallback(future, resultFutureCallback());
|
49
|
-
}
|
50
|
-
|
51
|
-
@Override
|
52
|
-
public void waitUntilExecutionFinished()
|
53
|
-
{
|
54
|
-
if (future == null) {
|
55
|
-
throw new NullPointerException();
|
56
|
-
}
|
57
|
-
ElapsedTime.debugUntil(() -> future.isDone() || future.isCancelled(),
|
58
|
-
logger, "embulk executor", 3000L);
|
59
|
-
}
|
60
|
-
|
61
|
-
@Override
|
62
|
-
public void shutdown()
|
63
|
-
{
|
64
|
-
ElapsedTime.info(
|
65
|
-
logger,
|
66
|
-
"embulk executor service shutdown",
|
67
|
-
es::shutdown);
|
68
|
-
}
|
69
|
-
|
70
|
-
private Callable<ExecutionResult> embulkRun(ConfigSource config)
|
71
|
-
{
|
72
|
-
return () -> newEmbulkEmbed().run(config);
|
73
|
-
}
|
74
|
-
|
75
|
-
private FutureCallback<ExecutionResult> resultFutureCallback()
|
76
|
-
{
|
77
|
-
return new FutureCallback<ExecutionResult>()
|
78
|
-
{
|
79
|
-
@Override
|
80
|
-
public void onSuccess(@Nullable ExecutionResult result)
|
81
|
-
{
|
82
|
-
for (Throwable throwable : result.getIgnoredExceptions()) {
|
83
|
-
logger.warn("Ignored error ", throwable);
|
84
|
-
}
|
85
|
-
logger.info("Config diff: {}", result.getConfigDiff());
|
86
|
-
logger.debug("ExecutionResult: {}", result);
|
87
|
-
}
|
88
|
-
|
89
|
-
@Override
|
90
|
-
public void onFailure(Throwable t)
|
91
|
-
{
|
92
|
-
throw new RuntimeException(t);
|
93
|
-
}
|
94
|
-
};
|
95
|
-
}
|
96
|
-
}
|
@@ -1,63 +0,0 @@
|
|
1
|
-
package org.embulk.filter.copy.forward;
|
2
|
-
|
3
|
-
import org.embulk.spi.Column;
|
4
|
-
import org.embulk.spi.ColumnVisitor;
|
5
|
-
import org.embulk.spi.PageBuilder;
|
6
|
-
|
7
|
-
public class InForwardVisitor
|
8
|
-
implements ColumnVisitor
|
9
|
-
{
|
10
|
-
private final InForwardEventReader reader;
|
11
|
-
private final PageBuilder builder;
|
12
|
-
|
13
|
-
public InForwardVisitor(InForwardEventReader reader, PageBuilder builder)
|
14
|
-
{
|
15
|
-
this.reader = reader;
|
16
|
-
this.builder = builder;
|
17
|
-
}
|
18
|
-
|
19
|
-
private void nullOr(Column column, Runnable r)
|
20
|
-
{
|
21
|
-
if (reader.isNull(column)) {
|
22
|
-
builder.setNull(column);
|
23
|
-
return;
|
24
|
-
}
|
25
|
-
r.run();
|
26
|
-
}
|
27
|
-
|
28
|
-
@Override
|
29
|
-
public void booleanColumn(Column column)
|
30
|
-
{
|
31
|
-
nullOr(column, () -> builder.setBoolean(column, reader.getBoolean(column)));
|
32
|
-
}
|
33
|
-
|
34
|
-
@Override
|
35
|
-
public void longColumn(Column column)
|
36
|
-
{
|
37
|
-
nullOr(column, () -> builder.setLong(column, reader.getLong(column)));
|
38
|
-
}
|
39
|
-
|
40
|
-
@Override
|
41
|
-
public void doubleColumn(Column column)
|
42
|
-
{
|
43
|
-
nullOr(column, () -> builder.setDouble(column, reader.getDouble(column)));
|
44
|
-
}
|
45
|
-
|
46
|
-
@Override
|
47
|
-
public void stringColumn(Column column)
|
48
|
-
{
|
49
|
-
nullOr(column, () -> builder.setString(column, reader.getString(column)));
|
50
|
-
}
|
51
|
-
|
52
|
-
@Override
|
53
|
-
public void timestampColumn(Column column)
|
54
|
-
{
|
55
|
-
nullOr(column, () -> builder.setTimestamp(column, reader.getTimestamp(column)));
|
56
|
-
}
|
57
|
-
|
58
|
-
@Override
|
59
|
-
public void jsonColumn(Column column)
|
60
|
-
{
|
61
|
-
nullOr(column, () -> builder.setJson(column, reader.getJson(column)));
|
62
|
-
}
|
63
|
-
}
|
@@ -1,63 +0,0 @@
|
|
1
|
-
package org.embulk.filter.copy.forward;
|
2
|
-
|
3
|
-
import org.embulk.spi.Column;
|
4
|
-
import org.embulk.spi.ColumnVisitor;
|
5
|
-
import org.embulk.spi.PageReader;
|
6
|
-
|
7
|
-
public class OutForwardVisitor
|
8
|
-
implements ColumnVisitor
|
9
|
-
{
|
10
|
-
private final PageReader reader;
|
11
|
-
private final OutForwardEventBuilder builder;
|
12
|
-
|
13
|
-
public OutForwardVisitor(PageReader reader, OutForwardEventBuilder builder)
|
14
|
-
{
|
15
|
-
this.reader = reader;
|
16
|
-
this.builder = builder;
|
17
|
-
}
|
18
|
-
|
19
|
-
private void nullOr(Column column, Runnable r)
|
20
|
-
{
|
21
|
-
if (reader.isNull(column)) {
|
22
|
-
builder.setNull(column);
|
23
|
-
return;
|
24
|
-
}
|
25
|
-
r.run();
|
26
|
-
}
|
27
|
-
|
28
|
-
@Override
|
29
|
-
public void booleanColumn(Column column)
|
30
|
-
{
|
31
|
-
nullOr(column, () -> builder.setBoolean(column, reader.getBoolean(column)));
|
32
|
-
}
|
33
|
-
|
34
|
-
@Override
|
35
|
-
public void longColumn(Column column)
|
36
|
-
{
|
37
|
-
nullOr(column, () -> builder.setLong(column, reader.getLong(column)));
|
38
|
-
}
|
39
|
-
|
40
|
-
@Override
|
41
|
-
public void doubleColumn(Column column)
|
42
|
-
{
|
43
|
-
nullOr(column, () -> builder.setDouble(column, reader.getDouble(column)));
|
44
|
-
}
|
45
|
-
|
46
|
-
@Override
|
47
|
-
public void stringColumn(Column column)
|
48
|
-
{
|
49
|
-
nullOr(column, () -> builder.setString(column, reader.getString(column)));
|
50
|
-
}
|
51
|
-
|
52
|
-
@Override
|
53
|
-
public void timestampColumn(Column column)
|
54
|
-
{
|
55
|
-
nullOr(column, () -> builder.setTimestamp(column, reader.getTimestamp(column)));
|
56
|
-
}
|
57
|
-
|
58
|
-
@Override
|
59
|
-
public void jsonColumn(Column column)
|
60
|
-
{
|
61
|
-
nullOr(column, () -> builder.setJson(column, reader.getJson(column)));
|
62
|
-
}
|
63
|
-
}
|
@@ -1,165 +0,0 @@
|
|
1
|
-
package org.embulk.filter.copy.util;
|
2
|
-
|
3
|
-
import org.slf4j.Logger;
|
4
|
-
|
5
|
-
import java.util.function.Supplier;
|
6
|
-
|
7
|
-
public class ElapsedTime
|
8
|
-
{
|
9
|
-
private ElapsedTime()
|
10
|
-
{
|
11
|
-
}
|
12
|
-
|
13
|
-
private final static String TEMPLATE = " ({} ms)";
|
14
|
-
private enum LogLevel {TRACE, DEBUG, INFO, WARN, ERROR}
|
15
|
-
private enum Status {START, RUNNING, FINISHED}
|
16
|
-
|
17
|
-
private static void log(Logger logger, LogLevel level, String message, long elapsed)
|
18
|
-
{
|
19
|
-
String msgWithTmpl = message + TEMPLATE;
|
20
|
-
switch (level)
|
21
|
-
{
|
22
|
-
case TRACE:
|
23
|
-
logger.trace(msgWithTmpl, elapsed);
|
24
|
-
break;
|
25
|
-
case DEBUG:
|
26
|
-
logger.debug(msgWithTmpl, elapsed);
|
27
|
-
break;
|
28
|
-
case INFO:
|
29
|
-
logger.info(msgWithTmpl, elapsed);
|
30
|
-
break;
|
31
|
-
case WARN:
|
32
|
-
logger.warn(msgWithTmpl, elapsed);
|
33
|
-
break;
|
34
|
-
case ERROR:
|
35
|
-
logger.error(msgWithTmpl, elapsed);
|
36
|
-
break;
|
37
|
-
}
|
38
|
-
}
|
39
|
-
|
40
|
-
private static <T>T run(Logger logger, LogLevel level, String message, Supplier<T> proc)
|
41
|
-
{
|
42
|
-
long start = System.currentTimeMillis();
|
43
|
-
try {
|
44
|
-
return proc.get();
|
45
|
-
}
|
46
|
-
finally {
|
47
|
-
log(logger, level, message, System.currentTimeMillis() - start);
|
48
|
-
}
|
49
|
-
}
|
50
|
-
|
51
|
-
private static void run(Logger logger, LogLevel level, String message, Runnable proc)
|
52
|
-
{
|
53
|
-
long start = System.currentTimeMillis();
|
54
|
-
try {
|
55
|
-
proc.run();
|
56
|
-
}
|
57
|
-
finally {
|
58
|
-
log(logger, level, message, System.currentTimeMillis() - start);
|
59
|
-
}
|
60
|
-
}
|
61
|
-
|
62
|
-
public static <T>T trace(Logger logger, String message, Supplier<T> proc)
|
63
|
-
{
|
64
|
-
return run(logger, LogLevel.TRACE, message, proc);
|
65
|
-
}
|
66
|
-
|
67
|
-
public static <T>T debug(Logger logger, String message, Supplier<T> proc)
|
68
|
-
{
|
69
|
-
return run(logger, LogLevel.DEBUG, message, proc);
|
70
|
-
}
|
71
|
-
|
72
|
-
public static <T>T info(Logger logger, String message, Supplier<T> proc)
|
73
|
-
{
|
74
|
-
return run(logger, LogLevel.INFO, message, proc);
|
75
|
-
}
|
76
|
-
|
77
|
-
public static <T>T warn(Logger logger, String message, Supplier<T> proc)
|
78
|
-
{
|
79
|
-
return run(logger, LogLevel.WARN, message, proc);
|
80
|
-
}
|
81
|
-
|
82
|
-
public static <T>T error(Logger logger, String message, Supplier<T> proc)
|
83
|
-
{
|
84
|
-
return run(logger, LogLevel.ERROR, message, proc);
|
85
|
-
}
|
86
|
-
|
87
|
-
public static void trace(Logger logger, String message, Runnable proc)
|
88
|
-
{
|
89
|
-
run(logger, LogLevel.TRACE, message, proc);
|
90
|
-
}
|
91
|
-
|
92
|
-
public static void debug(Logger logger, String message, Runnable proc)
|
93
|
-
{
|
94
|
-
run(logger, LogLevel.DEBUG, message, proc);
|
95
|
-
}
|
96
|
-
|
97
|
-
public static void info(Logger logger, String message, Runnable proc)
|
98
|
-
{
|
99
|
-
run(logger, LogLevel.INFO, message, proc);
|
100
|
-
}
|
101
|
-
|
102
|
-
public static void warn(Logger logger, String message, Runnable proc)
|
103
|
-
{
|
104
|
-
run(logger, LogLevel.WARN, message, proc);
|
105
|
-
}
|
106
|
-
|
107
|
-
public static void error(Logger logger, String message, Runnable proc)
|
108
|
-
{
|
109
|
-
run(logger, LogLevel.ERROR, message, proc);
|
110
|
-
}
|
111
|
-
|
112
|
-
private static void logUntil(Supplier<Boolean> condition,
|
113
|
-
Logger logger, LogLevel level, String message, long sleep)
|
114
|
-
{
|
115
|
-
long start = System.currentTimeMillis();
|
116
|
-
log(logger, level, String.format("(%s) %s", Status.START, message),
|
117
|
-
System.currentTimeMillis() - start);
|
118
|
-
while (true) {
|
119
|
-
if (condition.get()) {
|
120
|
-
log(logger, level, String.format("(%s) %s", Status.FINISHED, message),
|
121
|
-
System.currentTimeMillis() - start);
|
122
|
-
break;
|
123
|
-
}
|
124
|
-
try {
|
125
|
-
Thread.sleep(sleep);
|
126
|
-
}
|
127
|
-
catch (InterruptedException e) {
|
128
|
-
logger.warn(e.getMessage(), e);
|
129
|
-
}
|
130
|
-
|
131
|
-
log(logger, level, String.format("(%s) %s", Status.RUNNING, message),
|
132
|
-
System.currentTimeMillis() - start);
|
133
|
-
}
|
134
|
-
}
|
135
|
-
|
136
|
-
public static void traceUntil(Supplier<Boolean> condition,
|
137
|
-
Logger logger, String message, long sleep)
|
138
|
-
{
|
139
|
-
logUntil(condition, logger, LogLevel.TRACE, message, sleep);
|
140
|
-
}
|
141
|
-
|
142
|
-
public static void debugUntil(Supplier<Boolean> condition,
|
143
|
-
Logger logger, String message, long sleep)
|
144
|
-
{
|
145
|
-
logUntil(condition, logger, LogLevel.DEBUG, message, sleep);
|
146
|
-
}
|
147
|
-
|
148
|
-
public static void infoUntil(Supplier<Boolean> condition,
|
149
|
-
Logger logger, String message, long sleep)
|
150
|
-
{
|
151
|
-
logUntil(condition, logger, LogLevel.INFO, message, sleep);
|
152
|
-
}
|
153
|
-
|
154
|
-
public static void warnUntil(Supplier<Boolean> condition,
|
155
|
-
Logger logger, String message, long sleep)
|
156
|
-
{
|
157
|
-
logUntil(condition, logger, LogLevel.WARN, message, sleep);
|
158
|
-
}
|
159
|
-
|
160
|
-
public static void errorUntil(Supplier<Boolean> condition,
|
161
|
-
Logger logger, String message, long sleep)
|
162
|
-
{
|
163
|
-
logUntil(condition, logger, LogLevel.ERROR, message, sleep);
|
164
|
-
}
|
165
|
-
}
|