RubyGems - embulk - Versions diffs - 0.10.24-java → 0.10.29-java - Mend

embulk 0.10.24-java → 0.10.29-java

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (11)

checksums.yaml +4 -4
data/embulk.gemspec +2 -2
data/lib/embulk/gem_version.rb +3 -0
data/lib/embulk/logger.rb +2 -1
data/lib/embulk/version.rb +44 -1
metadata +4 -8
data/lib/embulk/guess/bzip2.rb +0 -23
data/lib/embulk/guess/csv.rb +0 -374
data/lib/embulk/guess/csv_all_strings.rb +0 -13
data/lib/embulk/guess/gzip.rb +0 -18
data/lib/embulk/guess/json.rb +0 -50

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: c7fcb1a8f1e94112700f6f4593f4038fc9861c4a
-  data.tar.gz: 8eb07cb5694b38a1937ecbd62d3c193a124a1253
+  metadata.gz: 66abd322277fe12424ea6d35c145ef4090d1be8b
+  data.tar.gz: e848487bf35166ed5111c4a86a5c3d2520239008
 SHA512:
-  metadata.gz: 9aac5551600bee7e5d0836b5f75d956cbcfc657793a062c9849129e6444505b24c38d3f9f9f2d1ce5a6c85a46e44bfa7059890c2a42b57f584ae03eb8712fc4c
-  data.tar.gz: 584c660fdcd24878c985ca63e55bc606eaad660cc7ed30e208641c08ec6ebe83573200b2f40d8bb908168abe86ea04e6ea9b07f8c87f39252465063cb473e8d4
+  metadata.gz: a7256a622d6a3c52ef7bcd2bea647eb60094b3d31803bcc055610a1175c4daeb7f15fffed39f6d12b8d135ae2e34da4e4692e3f425be901350c7bd4c0acb9c1a
+  data.tar.gz: a10d0105aea8eafbb30f7134bbc6bb38744e45671b6db53f9229d95eccbdd267f46e1b5f1015cc822ca84a8559a89e1501c480bd0bc5d056185ea03ec731019e

data/embulk.gemspec CHANGED

@@ -1,6 +1,6 @@
 Gem::Specification.new do |gem|
   gem.name = "embulk"
-  gem.version = "0.10.24"
+  gem.version = "0.10.29"
   gem.license = "Apache-2.0"
   gem.summary = "Embulk's runtime library for Ruby."
@@ -33,7 +33,7 @@ Gem::Specification.new do |gem|
       "documentation_uri" => "https://www.embulk.org/",
       "homepage_uri" => gem.homepage,
       # "mailing_list_uri"  => "",
-      "source_code_uri" => "https://github.com/embulk/embulk/tree/v0.10.24",
+      "source_code_uri" => "https://github.com/embulk/embulk/tree/v0.10.29",
       # "wiki_uri" => "",
     }
   end

data/lib/embulk/gem_version.rb ADDED

@@ -0,0 +1,3 @@
+module Embulk
+  GEM_VERSION_EMBEDDED = "0.10.29"
+end

data/lib/embulk/logger.rb CHANGED

@@ -1,5 +1,6 @@
 module Embulk
+  require 'embulk/version'  # 'embulk/version' is loaded in the very beginning.
   # this file is required before loading embulk-core.jar
   require 'logger'

data/lib/embulk/version.rb CHANGED

@@ -1,5 +1,48 @@
 module Embulk
+  CORE_VERSION = Java::org.embulk.EmbulkVersion::VERSION
   # Converts the original Java-style version string to Ruby-style.
   # E.g., "0.9.0-SNAPSHOT" (in Java) is converted to "0.9.0.snapshot" in Ruby.
-  VERSION = ::String.new(Java::org.embulk.EmbulkVersion::VERSION).tr('-', '.').downcase
+  CORE_VERSION_IN_RUBY_GEM_STYLE = ::String.new(CORE_VERSION).tr('-', '.').downcase
+  private_constant :CORE_VERSION_IN_RUBY_GEM_STYLE
+  begin
+    require 'embulk/gem_version'
+  rescue LoadError => e
+    raise LoadError, "[Internal Error] This embulk.gem is not properly built with embulk/gem_version.rb to declare its own version."
+  end
+  begin
+    GEM_VERSION = GEM_VERSION_EMBEDDED
+  rescue NameError => e
+    raise LoadError, "[Internal Error] This embulk.gem does not contain its own version defined properly."
+  end
+  if GEM_VERSION != CORE_VERSION_IN_RUBY_GEM_STYLE
+    # "embulk/logger" cannot be used because embulk/version.rb is loaded even before embulk/logger.rb.
+    STDERR.puts "*******************************************************************************************"
+    STDERR.puts "Running Embulk version (#{CORE_VERSION}) does not match the installed embulk.gem version (#{GEM_VERSION})."
+    STDERR.puts ""
+    STDERR.puts "If you use Embulk v0.9.* without Bundler:"
+    STDERR.puts "   Uninstall embulk.gem from your Gem path."
+    STDERR.puts "   An embulk.gem-equivalent should be embedded in your Embulk's core JAR of v0.9.*."
+    STDERR.puts ""
+    STDERR.puts "If you use Embulk v0.9.* with Bundler:"
+    STDERR.puts "   Try updating your Gemfile as below:"
+    STDERR.puts "     gem 'embulk', '< 0.10'"
+    STDERR.puts "   Bundler will find the embulk.gem-equivalent embedded in your Embulk's core JAR of v0.9.*."
+    STDERR.puts ""
+    STDERR.puts "If you use Embulk v0.10.*:"
+    STDERR.puts "   Be aware that v0.10.* is an unstable development series. If you are aware of that,"
+    STDERR.puts "   upgrade it to the latest v0.10.*, and use exactly the same version of embulk.gem."
+    STDERR.puts "   In case you use Bundler, your Gemfile should have 'embulk' as below:"
+    STDERR.puts "     gem 'embulk', '0.10.XX'  # Exactly the same version of your Embulk's core JAR."
+    STDERR.puts ""
+    STDERR.puts "If you use Embulk v0.8.* or earlier:"
+    STDERR.puts "   Update to the latest v0.9.*. v0.8 or earlier are deprecated."
+    STDERR.puts "*******************************************************************************************"
+    raise LoadError, "Running Embulk version (#{CORE_VERSION}) does not match the installed embulk.gem version (#{GEM_VERSION})."
+  end
+  VERSION = GEM_VERSION
 end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: embulk
 version: !ruby/object:Gem::Version
-  version: 0.10.24
+  version: 0.10.29
 platform: java
 authors:
 - Sadayuki Furuhashi
@@ -10,7 +10,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2021-01-19 00:00:00.000000000 Z
+date: 2021-04-07 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   requirement: !ruby/object:Gem::Requirement
@@ -51,12 +51,8 @@ files:
 - lib/embulk/file_output_plugin.rb
 - lib/embulk/filter_plugin.rb
 - lib/embulk/formatter_plugin.rb
-- lib/embulk/guess/bzip2.rb
+- lib/embulk/gem_version.rb
 - lib/embulk/guess/charset.rb
-- lib/embulk/guess/csv.rb
-- lib/embulk/guess/csv_all_strings.rb
-- lib/embulk/guess/gzip.rb
-- lib/embulk/guess/json.rb
 - lib/embulk/guess/newline.rb
 - lib/embulk/guess/schema_guess.rb
 - lib/embulk/guess/time_format_guess.rb
@@ -82,7 +78,7 @@ metadata:
   changelog_uri: https://github.com/embulk/embulk/releases
   documentation_uri: https://www.embulk.org/
   homepage_uri: https://www.embulk.org/
-  source_code_uri: https://github.com/embulk/embulk/tree/v0.10.24
+  source_code_uri: https://github.com/embulk/embulk/tree/v0.10.29
 post_install_message:
 rdoc_options: []
 require_paths:

data/lib/embulk/guess/bzip2.rb DELETED

@@ -1,23 +0,0 @@
-module Embulk
-  module Guess
-    class Bzip2GuessPlugin < GuessPlugin
-      Plugin.register_guess('bzip2', self)
-      # magic: BZ
-      # version: 'h' = bzip2
-      # blocksize: 1 .. 9
-      # block magic: 0x314159265359 (6 bytes)
-      block_magic = [0x31, 0x41, 0x59, 0x26, 0x53, 0x59].pack('C*')
-      BZIP2_HEADER_PATTERN = /BZh[1-9]#{Regexp.quote(block_magic)}/n
-      def guess(config, sample_buffer)
-        if sample_buffer[0,10] =~ BZIP2_HEADER_PATTERN
-          return {"decoders" => [{"type" => "bzip2"}]}
-        end
-        return {}
-      end
-    end
-  end
-end

data/lib/embulk/guess/csv.rb DELETED

@@ -1,374 +0,0 @@
-module Embulk
-  module Guess
-    require 'embulk/guess/schema_guess'
-    class CsvGuessPlugin < LineGuessPlugin
-      Plugin.register_guess('csv', self)
-      DELIMITER_CANDIDATES = [
-        ",", "\t", "|", ";"
-      ]
-      QUOTE_CANDIDATES = [
-        "\"", "'"
-      ]
-      ESCAPE_CANDIDATES = [
-        "\\", '"'
-      ]
-      NULL_STRING_CANDIDATES = [
-        "null",
-        "NULL",
-        "#N/A",
-        "\\N",  # MySQL LOAD, Hive STORED AS TEXTFILE
-      ]
-      COMMENT_LINE_MARKER_CANDIDATES = [
-        "#",
-        "//",
-      ]
-      MAX_SKIP_LINES = 10
-      NO_SKIP_DETECT_LINES = 10
-      def guess_lines(config, sample_lines)
-        return {} unless config.fetch("parser", {}).fetch("type", "csv") == "csv"
-        parser_config = config["parser"] || {}
-        if parser_config["type"] == "csv" && parser_config["delimiter"]
-          delim = parser_config["delimiter"]
-        else
-          delim = guess_delimiter(sample_lines)
-          unless delim
-            # assuming single column CSV
-            delim = DELIMITER_CANDIDATES.first
-          end
-        end
-        parser_guessed = DataSource.new.merge(parser_config).merge({"type" => "csv", "delimiter" => delim})
-        unless parser_guessed.has_key?("quote")
-          quote = guess_quote(sample_lines, delim)
-          unless quote
-            if !guess_force_no_quote(sample_lines, delim, '"')
-              # assuming CSV follows RFC for quoting
-              quote = '"'
-            else
-              # disable quoting (set null)
-            end
-          end
-          parser_guessed["quote"] = quote
-        end
-        parser_guessed["quote"] = '"' if parser_guessed["quote"] == ''  # setting '' is not allowed any more. this line converts obsoleted config syntax to explicit syntax.
-        unless parser_guessed.has_key?("escape")
-          if quote = parser_guessed["quote"]
-            escape = guess_escape(sample_lines, delim, quote)
-            unless escape
-              if quote == '"'
-                # assuming this CSV follows RFC for escaping
-                escape = '"'
-              else
-                # disable escaping (set null)
-              end
-            end
-            parser_guessed["escape"] = escape
-          else
-            # escape does nothing if quote is disabled
-          end
-        end
-        unless parser_guessed.has_key?("null_string")
-          null_string = guess_null_string(sample_lines, delim)
-          parser_guessed["null_string"] = null_string if null_string
-          # don't even set null_string to avoid confusion of null and 'null' in YAML format
-        end
-        # guessing skip_header_lines should be before guessing guess_comment_line_marker
-        # because lines supplied to CsvTokenizer already don't include skipped header lines.
-        # skipping empty lines is also disabled here because skipping header lines is done by
-        # CsvParser which doesn't skip empty lines automatically
-        sample_records = split_lines(parser_guessed, false, sample_lines, delim, {})
-        skip_header_lines = guess_skip_header_lines(sample_records)
-        sample_lines = sample_lines[skip_header_lines..-1]
-        sample_records = sample_records[skip_header_lines..-1]
-        unless parser_guessed.has_key?("comment_line_marker")
-          comment_line_marker, sample_lines =
-            guess_comment_line_marker(sample_lines, delim, parser_guessed["quote"], parser_guessed["null_string"])
-          if comment_line_marker
-            parser_guessed["comment_line_marker"] = comment_line_marker
-          end
-        end
-        sample_records = split_lines(parser_guessed, true, sample_lines, delim, {})
-        # It should fail if CSV parser cannot parse sample_lines.
-        if sample_records.nil? || sample_records.empty?
-          return {}
-        end
-        if sample_lines.size == 1
-          # The file contains only 1 line. Assume that there are no header line.
-          header_line = false
-          column_types = SchemaGuess.types_from_array_records(sample_records[0, 1])
-          unless parser_guessed.has_key?("trim_if_not_quoted")
-            sample_records_trimmed = split_lines(parser_guessed, true, sample_lines, delim, {"trim_if_not_quoted" => true})
-            column_types_trimmed = SchemaGuess.types_from_array_records(sample_records_trimmed)
-            if column_types != column_types_trimmed
-              parser_guessed["trim_if_not_quoted"] = true
-              column_types = column_types_trimmed
-            else
-              parser_guessed["trim_if_not_quoted"] = false
-            end
-          end
-        else
-          # The file contains more than 1 line. If guessed first line's column types are all strings or boolean, and the types are
-          # different from the other lines, assume that the first line is column names.
-          first_types = SchemaGuess.types_from_array_records(sample_records[0, 1])
-          other_types = SchemaGuess.types_from_array_records(sample_records[1..-1] || [])
-          unless parser_guessed.has_key?("trim_if_not_quoted")
-            sample_records_trimmed = split_lines(parser_guessed, true, sample_lines, delim, {"trim_if_not_quoted" => true})
-            other_types_trimmed = SchemaGuess.types_from_array_records(sample_records_trimmed[1..-1] || [])
-            if other_types != other_types_trimmed
-              parser_guessed["trim_if_not_quoted"] = true
-              other_types = other_types_trimmed
-            else
-              parser_guessed["trim_if_not_quoted"] = false
-            end
-          end
-          header_line = (first_types != other_types && first_types.all? {|t| ["string", "boolean"].include?(t) }) || guess_string_header_line(sample_records)
-          column_types = other_types
-        end
-        if column_types.empty?
-          # TODO here is making the guessing failed if the file doesn't contain any columns. However,
-          #      this may not be convenient for users.
-          return {}
-        end
-        if header_line
-          parser_guessed["skip_header_lines"] = skip_header_lines + 1
-        else
-          parser_guessed["skip_header_lines"] = skip_header_lines
-        end
-        parser_guessed["allow_extra_columns"] = false unless parser_guessed.has_key?("allow_extra_columns")
-        parser_guessed["allow_optional_columns"] = false unless parser_guessed.has_key?("allow_optional_columns")
-        if header_line
-          column_names = sample_records.first.map(&:strip)
-        else
-          column_names = (0..column_types.size).to_a.map {|i| "c#{i}" }
-        end
-        schema = []
-        column_names.zip(column_types).each do |name,type|
-          if name && type
-            schema << new_column(name, type)
-          end
-        end
-        parser_guessed["columns"] = schema
-        return {"parser" => parser_guessed}
-      end
-      def new_column(name, type)
-        if type.is_a?(SchemaGuess::TimestampTypeMatch)
-          {"name" => name, "type" => type, "format" => type.format}
-        else
-          {"name" => name, "type" => type}
-        end
-      end
-      private
-      def split_lines(parser_config, skip_empty_lines, sample_lines, delim, extra_config)
-        null_string = parser_config["null_string"]
-        config = parser_config.merge(extra_config).merge({"charset" => "UTF-8", "columns" => []})
-        parser_task = config.load_config(org.embulk.standards.CsvParserPlugin::PluginTask)
-        data = sample_lines.map {|line| line.force_encoding('UTF-8') }.join(parser_task.getNewline.getString.encode('UTF-8'))
-        sample = Buffer.from_ruby_string(data)
-        decoder = Java::LineDecoder.new(Java::ListFileInput.new([[sample.to_java]]), parser_task)
-        tokenizer = org.embulk.standards.CsvTokenizer.new(decoder, parser_task)
-        rows = []
-        while tokenizer.nextFile
-          while tokenizer.nextRecord(skip_empty_lines)
-            begin
-              columns = []
-              while true
-                begin
-                  column = tokenizer.nextColumn
-                  quoted = tokenizer.wasQuotedColumn
-                  if null_string && !quoted && column == null_string
-                    column = nil
-                  end
-                  columns << column
-                rescue org.embulk.standards.CsvTokenizer::TooFewColumnsException
-                  rows << columns
-                  break
-                end
-              end
-            rescue org.embulk.standards.CsvTokenizer::InvalidValueException
-              # TODO warning
-              tokenizer.skipCurrentLine
-            end
-          end
-        end
-        return rows
-      rescue
-        # TODO warning if fallback to this ad-hoc implementation
-        sample_lines.map {|line| line.split(delim) }
-      end
-      def guess_delimiter(sample_lines)
-        delim_weights = DELIMITER_CANDIDATES.map do |d|
-          counts = sample_lines.map {|line| line.count(d) }
-          total = array_sum(counts)
-          if total > 0
-            stddev = array_standard_deviation(counts)
-            stddev = 0.000000001 if stddev == 0.0
-            weight = total / stddev
-            [d, weight]
-          else
-            [nil, 0]
-          end
-        end
-        delim, weight = *delim_weights.sort_by {|d,weight| weight }.last
-        if delim != nil && weight > 1
-          return delim
-        else
-          return nil
-        end
-      end
-      def guess_quote(sample_lines, delim)
-        delim_regexp = Regexp.escape(delim)
-        quote_weights = QUOTE_CANDIDATES.map do |q|
-          weights = sample_lines.map do |line|
-            q_regexp = Regexp.escape(q)
-            count = line.count(q)
-            if count > 0
-              weight = count
-              weight += line.scan(/(?:\A|#{delim_regexp})\s*#{q_regexp}(?:(?!#{q_regexp}).)*\s*#{q_regexp}(?:$|#{delim_regexp})/).size * 20
-              weight += line.scan(/(?:\A|#{delim_regexp})\s*#{q_regexp}(?:(?!#{delim_regexp}).)*\s*#{q_regexp}(?:$|#{delim_regexp})/).size * 40
-              weight
-            else
-              nil
-            end
-          end.compact
-          weights.empty? ? 0 : array_avg(weights)
-        end
-        quote, weight = QUOTE_CANDIDATES.zip(quote_weights).sort_by {|q,w| w }.last
-        if weight >= 10.0
-          return quote
-        else
-          return nil
-        end
-      end
-      def guess_force_no_quote(sample_lines, delim, quote_candidate)
-        delim_regexp = Regexp.escape(delim)
-        q_regexp = Regexp.escape(quote_candidate)
-        sample_lines.any? do |line|
-          # quoting character appear at the middle of a non-quoted value
-          line =~ /(?:\A|#{delim_regexp})\s*[^#{q_regexp}]+#{q_regexp}/
-        end
-      end
-      def guess_escape(sample_lines, delim, quote)
-        guessed = ESCAPE_CANDIDATES.map do |str|
-          regexp = /#{Regexp.quote(str)}(?:#{Regexp.quote(delim)}|#{Regexp.quote(quote)})/
-          counts = sample_lines.map {|line| line.scan(regexp).count }
-          count = counts.inject(0) {|r,c| r + c }
-          [str, count]
-        end.select {|str,count| count > 0 }.sort_by {|str,count| -count }
-        found = guessed.first
-        return found ? found[0] : nil
-      end
-      def guess_null_string(sample_lines, delim)
-        guessed = NULL_STRING_CANDIDATES.map do |str|
-          regexp = /(?:^|#{Regexp.quote(delim)})#{Regexp.quote(str)}(?:$|#{Regexp.quote(delim)})/
-          counts = sample_lines.map {|line| line.scan(regexp).count }
-          count = counts.inject(0) {|r,c| r + c }
-          [str, count]
-        end.select {|str,count| count > 0 }.sort_by {|str,count| -count }
-        found_str, found_count = guessed.first
-        return found_str ? found_str : nil
-      end
-      def guess_skip_header_lines(sample_records)
-        counts = sample_records.map {|records| records.size }
-        (1..[MAX_SKIP_LINES, counts.length - 1].min).each do |i|
-          check_row_count = counts[i-1]
-          if counts[i, NO_SKIP_DETECT_LINES].all? {|c| c <= check_row_count }
-            return i - 1
-          end
-        end
-        return 0
-      end
-      def guess_comment_line_marker(sample_lines, delim, quote, null_string)
-        exclude = []
-        exclude << /^#{Regexp.escape(quote)}/ if quote && !quote.empty?
-        exclude << /^#{Regexp.escape(null_string)}(?:#{Regexp.escape(delim)}|$)/ if null_string
-        guessed = COMMENT_LINE_MARKER_CANDIDATES.map do |str|
-          regexp = /^#{Regexp.quote(str)}/
-          unmatch_lines = sample_lines.reject do |line|
-            exclude.all? {|ex| line !~ ex } && line =~ regexp
-          end
-          match_count = sample_lines.size - unmatch_lines.size
-          [str, match_count, unmatch_lines]
-        end.select {|str,match_count,unmatch_lines| match_count > 0 }.sort_by {|str,match_count,unmatch_lines| -match_count }
-        str, match_count, unmatch_lines = guessed.first
-        if str
-          return str, unmatch_lines
-        else
-          return nil, sample_lines
-        end
-      end
-      def guess_string_header_line(sample_records)
-        first = sample_records.first
-        first.count.times do |column_index|
-          lengths = sample_records.map {|row| row[column_index] }.compact.map {|v| v.to_s.size }
-          if lengths.size > 1
-            if array_variance(lengths[1..-1]) <= 0.2
-              avg = array_avg(lengths[1..-1])
-              if avg == 0.0 ? lengths[0] > 1 : (avg - lengths[0]).abs / avg > 0.7
-                return true
-              end
-            end
-          end
-        end
-        return false
-      end
-      def array_sum(array)
-        array.inject(0) {|r,i| r += i }
-      end
-      def array_avg(array)
-        array.inject(0.0) {|r,i| r += i } / array.size
-      end
-      def array_variance(array)
-        avg = array_avg(array)
-        array.inject(0.0) {|r,i| r += (i - avg) ** 2 } / array.size
-      end
-      def array_standard_deviation(array)
-        Math.sqrt(array_variance(array))
-      end
-    end
-  end
-end

data/lib/embulk/guess/csv_all_strings.rb DELETED

@@ -1,13 +0,0 @@
-module Embulk
-  module Guess
-    require 'embulk/guess/csv'
-    class CsvAllStringsGuessPlugin < CsvGuessPlugin
-      Plugin.register_guess("csv_all_strings", self)
-      def new_column(name, type)
-        {"name" => name, "type" => "string"}
-      end
-    end
-  end
-end

data/lib/embulk/guess/gzip.rb DELETED

@@ -1,18 +0,0 @@
-module Embulk
-  module Guess
-    class GzipGuessPlugin < GuessPlugin
-      Plugin.register_guess('gzip', self)
-      GZIP_HEADER = "\x1f\x8b".force_encoding('ASCII-8BIT').freeze
-      def guess(config, sample_buffer)
-        if sample_buffer[0,2] == GZIP_HEADER
-          return {"decoders" => [{"type" => "gzip"}]}
-        end
-        return {}
-      end
-    end
-  end
-end

data/lib/embulk/guess/json.rb DELETED

@@ -1,50 +0,0 @@
-module Embulk
-  module Guess
-    class JsonGuessPlugin < GuessPlugin
-      Plugin.register_guess('json', self)
-      java_import 'com.google.common.collect.Lists'
-      java_import 'java.io.ByteArrayInputStream'
-      java_import 'org.embulk.spi.Exec'
-      java_import 'org.embulk.spi.json.JsonParser'
-      java_import 'org.embulk.spi.json.JsonParseException'
-      java_import 'org.embulk.spi.util.FileInputInputStream'
-      java_import 'org.embulk.spi.util.InputStreamFileInput'
-      def guess(config, sample_buffer)
-        return {} unless config.fetch("parser", {}).fetch("type", "json") == "json"
-        # Use org.embulk.spi.json.JsonParser to respond to multi-line Json
-        json_parser = new_json_parser(sample_buffer)
-        one_json_parsed = false
-        begin
-          while (v = json_parser.next)
-            # "v" needs to be JSON object type (isMapValue) because:
-            # 1) Single-column CSV can be mis-guessed as JSON if JSON non-objects are accepted.
-            # 2) JsonParserPlugin accepts only the JSON object type.
-            raise JsonParseException.new("v must be JSON object type") unless v.isMapValue
-            one_json_parsed = true
-          end
-        rescue JsonParseException
-          # the exception is ignored
-        end
-        if one_json_parsed
-          return {"parser" => {"type" => "json"}} # if JsonParser can parse even one JSON data
-        else
-          return {}
-        end
-      end
-      private
-      def new_json_parser(buffer)
-        input_streams = Lists::newArrayList(ByteArrayInputStream.new(buffer.to_java_bytes))
-        iterator_provider = InputStreamFileInput::IteratorProvider.new(input_streams)
-        input = FileInputInputStream.new(InputStreamFileInput.new(Java::SPI::Exec.getBufferAllocator(), iterator_provider))
-        input.nextFile
-        JsonParser.new.open(input)
-      end
-    end
-  end
-end