RubyGems - logstash-codec-multiline - Versions diffs - 3.0.3 → 3.0.5 - Mend

logstash-codec-multiline 3.0.3 → 3.0.5

Files changed (9) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +3 -0
data/Gemfile +8 -1
data/docs/index.asciidoc +222 -0
data/lib/logstash/codecs/multiline.rb +15 -8
data/logstash-codec-multiline.gemspec +2 -2
data/spec/codecs/auto_flush_spec.rb +1 -0
data/spec/codecs/multiline_spec.rb +1 -0
metadata +3 -2

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 26c71113b37e1292bbf9459af6716c724ee0f432
-  data.tar.gz: 6d75faf254ff4be96e8f37a1818a573e357e60be
+  metadata.gz: 0b83041012aa7d4c15fe3b86d61f5b626d1b71ff
+  data.tar.gz: 33fd5598cc32b5f1ea942593def59627757abc0a
 SHA512:
-  metadata.gz: e75491ca1f12432d886c53ab7d6aa4a4d65bb4f77ce71381b063fb779a0fc3564ad860287c91ac07484241d8ddabf6217c743eef868e9776fe51b76a53725377
-  data.tar.gz: 450aed6a82000a797973c1bdb19dc031cdd7ac0acde846af8e088adc0f6df8371cc9ed73c010068b5079cb1d7ca61f178ab8b588685f0a2999727da4fd95f92c
+  metadata.gz: fe261395e4de7c05f9694647e5bf5fdfa3da3b863b3034101beafa730560ce8f6c93b3cf10a4307381ef7b29acbb0021a88fcfe41cec2e541164d41526c3c850
+  data.tar.gz: db6015c51acade7a6d185393377124c7a58948e1381372bb36e2804e99f135321f7a7881810a2aeb8f7c4587d1b502a68785278dc2e98cf725516ae1dfaa92a6

data/CHANGELOG.md CHANGED Viewed

@@ -1,3 +1,6 @@
+## 3.0.3
+  - Docs: Add note indicating that the multiline codec should not be used with input plugins that support multiple hosts
 ## 3.0.2
   - Fix log levels

data/Gemfile CHANGED Viewed

@@ -1,4 +1,11 @@
 source 'https://rubygems.org'
-# Specify your gem's dependencies in logstash-mass_effect.gemspec
 gemspec
+logstash_path = ENV["LOGSTASH_PATH"] || "../../logstash"
+use_logstash_source = ENV["LOGSTASH_SOURCE"] && ENV["LOGSTASH_SOURCE"].to_s == "1"
+if Dir.exist?(logstash_path) && use_logstash_source
+  gem 'logstash-core', :path => "#{logstash_path}/logstash-core"
+  gem 'logstash-core-plugin-api', :path => "#{logstash_path}/logstash-core-plugin-api"
+end

data/docs/index.asciidoc ADDED Viewed

@@ -0,0 +1,222 @@
+:plugin: multiline
+:type: codec
+///////////////////////////////////////////
+START - GENERATED VARIABLES, DO NOT EDIT!
+///////////////////////////////////////////
+:version: %VERSION%
+:release_date: %RELEASE_DATE%
+:changelog_url: %CHANGELOG_URL%
+:include_path: ../../../../logstash/docs/include
+///////////////////////////////////////////
+END - GENERATED VARIABLES, DO NOT EDIT!
+///////////////////////////////////////////
+[id="plugins-{type}-{plugin}"]
+=== Multiline codec plugin
+include::{include_path}/plugin_header.asciidoc[]
+==== Description
+The multiline codec will collapse multiline messages and merge them into a
+single event.
+IMPORTANT: If you are using a Logstash input plugin that supports multiple
+hosts, such as the <<plugins-inputs-beats>> input plugin, you should not use
+the multiline codec to handle multiline events. Doing so may result in the
+mixing of streams and corrupted event data. In this situation, you need to
+handle multiline events before sending the event data to Logstash.
+The original goal of this codec was to allow joining of multiline messages
+from files into a single event. For example, joining Java exception and
+stacktrace messages into a single event.
+The config looks like this:
+[source,ruby]
+    input {
+      stdin {
+        codec => multiline {
+          pattern => "pattern, a regexp"
+          negate => "true" or "false"
+          what => "previous" or "next"
+        }
+      }
+    }
+The `pattern` should match what you believe to be an indicator that the field
+is part of a multi-line event.
+The `what` must be `previous` or `next` and indicates the relation
+to the multi-line event.
+The `negate` can be `true` or `false` (defaults to `false`). If `true`, a
+message not matching the pattern will constitute a match of the multiline
+filter and the `what` will be applied. (vice-versa is also true)
+For example, Java stack traces are multiline and usually have the message
+starting at the far-left, with each subsequent line indented. Do this:
+[source,ruby]
+    input {
+      stdin {
+        codec => multiline {
+          pattern => "^\s"
+          what => "previous"
+        }
+      }
+    }
+This says that any line starting with whitespace belongs to the previous line.
+Another example is to merge lines not starting with a date up to the previous
+line.
+[source,ruby]
+    input {
+      file {
+        path => "/var/log/someapp.log"
+        codec => multiline {
+          # Grok pattern names are valid! :)
+          pattern => "^%{TIMESTAMP_ISO8601} "
+          negate => true
+          what => "previous"
+        }
+      }
+    }
+This says that any line not starting with a timestamp should be merged with the previous line.
+One more common example is C line continuations (backslash). Here's how to do that:
+[source,ruby]
+    input {
+      stdin {
+        codec => multiline {
+          pattern => "\\$"
+          what => "next"
+        }
+      }
+    }
+This says that any line ending with a backslash should be combined with the
+following line.
+[id="plugins-{type}s-{plugin}-options"]
+==== Multiline Codec Configuration Options
+[cols="<,<,<",options="header",]
+|=======================================================================
+|Setting |Input type|Required
+| <<plugins-{type}s-{plugin}-auto_flush_interval>> |<<number,number>>|No
+| <<plugins-{type}s-{plugin}-charset>> |<<string,string>>, one of `["ASCII-8BIT", "UTF-8", "US-ASCII", "Big5", "Big5-HKSCS", "Big5-UAO", "CP949", "Emacs-Mule", "EUC-JP", "EUC-KR", "EUC-TW", "GB2312", "GB18030", "GBK", "ISO-8859-1", "ISO-8859-2", "ISO-8859-3", "ISO-8859-4", "ISO-8859-5", "ISO-8859-6", "ISO-8859-7", "ISO-8859-8", "ISO-8859-9", "ISO-8859-10", "ISO-8859-11", "ISO-8859-13", "ISO-8859-14", "ISO-8859-15", "ISO-8859-16", "KOI8-R", "KOI8-U", "Shift_JIS", "UTF-16BE", "UTF-16LE", "UTF-32BE", "UTF-32LE", "Windows-31J", "Windows-1250", "Windows-1251", "Windows-1252", "IBM437", "IBM737", "IBM775", "CP850", "IBM852", "CP852", "IBM855", "CP855", "IBM857", "IBM860", "IBM861", "IBM862", "IBM863", "IBM864", "IBM865", "IBM866", "IBM869", "Windows-1258", "GB1988", "macCentEuro", "macCroatian", "macCyrillic", "macGreek", "macIceland", "macRoman", "macRomania", "macThai", "macTurkish", "macUkraine", "CP950", "CP951", "IBM037", "stateless-ISO-2022-JP", "eucJP-ms", "CP51932", "EUC-JIS-2004", "GB12345", "ISO-2022-JP", "ISO-2022-JP-2", "CP50220", "CP50221", "Windows-1256", "Windows-1253", "Windows-1255", "Windows-1254", "TIS-620", "Windows-874", "Windows-1257", "MacJapanese", "UTF-7", "UTF8-MAC", "UTF-16", "UTF-32", "UTF8-DoCoMo", "SJIS-DoCoMo", "UTF8-KDDI", "SJIS-KDDI", "ISO-2022-JP-KDDI", "stateless-ISO-2022-JP-KDDI", "UTF8-SoftBank", "SJIS-SoftBank", "BINARY", "CP437", "CP737", "CP775", "IBM850", "CP857", "CP860", "CP861", "CP862", "CP863", "CP864", "CP865", "CP866", "CP869", "CP1258", "Big5-HKSCS:2008", "ebcdic-cp-us", "eucJP", "euc-jp-ms", "EUC-JISX0213", "eucKR", "eucTW", "EUC-CN", "eucCN", "CP936", "ISO2022-JP", "ISO2022-JP2", "ISO8859-1", "ISO8859-2", "ISO8859-3", "ISO8859-4", "ISO8859-5", "ISO8859-6", "CP1256", "ISO8859-7", "CP1253", "ISO8859-8", "CP1255", "ISO8859-9", "CP1254", "ISO8859-10", "ISO8859-11", "CP874", "ISO8859-13", "CP1257", "ISO8859-14", "ISO8859-15", "ISO8859-16", "CP878", "MacJapan", "ASCII", "ANSI_X3.4-1968", "646", "CP65000", "CP65001", 
"UTF-8-MAC", "UTF-8-HFS", "UCS-2BE", "UCS-4BE", "UCS-4LE", "CP932", "csWindows31J", "SJIS", "PCK", "CP1250", "CP1251", "CP1252", "external", "locale"]`|No
+| <<plugins-{type}s-{plugin}-max_bytes>> |<<bytes,bytes>>|No
+| <<plugins-{type}s-{plugin}-max_lines>> |<<number,number>>|No
+| <<plugins-{type}s-{plugin}-multiline_tag>> |<<string,string>>|No
+| <<plugins-{type}s-{plugin}-negate>> |<<boolean,boolean>>|No
+| <<plugins-{type}s-{plugin}-pattern>> |<<string,string>>|Yes
+| <<plugins-{type}s-{plugin}-patterns_dir>> |<<array,array>>|No
+| <<plugins-{type}s-{plugin}-what>> |<<string,string>>, one of `["previous", "next"]`|Yes
+|=======================================================================
+&nbsp;
+[id="plugins-{type}s-{plugin}-auto_flush_interval"]
+===== `auto_flush_interval`
+  * Value type is <<number,number>>
+  * There is no default value for this setting.
+The accumulation of multiple lines will be converted to an event when either a
+matching new line is seen or there has been no new data appended for this many
+seconds. No default.  If unset, no auto_flush. Units: seconds
+[id="plugins-{type}s-{plugin}-charset"]
+===== `charset`
+  * Value can be any of: `ASCII-8BIT`, `UTF-8`, `US-ASCII`, `Big5`, `Big5-HKSCS`, `Big5-UAO`, `CP949`, `Emacs-Mule`, `EUC-JP`, `EUC-KR`, `EUC-TW`, `GB2312`, `GB18030`, `GBK`, `ISO-8859-1`, `ISO-8859-2`, `ISO-8859-3`, `ISO-8859-4`, `ISO-8859-5`, `ISO-8859-6`, `ISO-8859-7`, `ISO-8859-8`, `ISO-8859-9`, `ISO-8859-10`, `ISO-8859-11`, `ISO-8859-13`, `ISO-8859-14`, `ISO-8859-15`, `ISO-8859-16`, `KOI8-R`, `KOI8-U`, `Shift_JIS`, `UTF-16BE`, `UTF-16LE`, `UTF-32BE`, `UTF-32LE`, `Windows-31J`, `Windows-1250`, `Windows-1251`, `Windows-1252`, `IBM437`, `IBM737`, `IBM775`, `CP850`, `IBM852`, `CP852`, `IBM855`, `CP855`, `IBM857`, `IBM860`, `IBM861`, `IBM862`, `IBM863`, `IBM864`, `IBM865`, `IBM866`, `IBM869`, `Windows-1258`, `GB1988`, `macCentEuro`, `macCroatian`, `macCyrillic`, `macGreek`, `macIceland`, `macRoman`, `macRomania`, `macThai`, `macTurkish`, `macUkraine`, `CP950`, `CP951`, `IBM037`, `stateless-ISO-2022-JP`, `eucJP-ms`, `CP51932`, `EUC-JIS-2004`, `GB12345`, `ISO-2022-JP`, `ISO-2022-JP-2`, `CP50220`, `CP50221`, `Windows-1256`, `Windows-1253`, `Windows-1255`, `Windows-1254`, `TIS-620`, `Windows-874`, `Windows-1257`, `MacJapanese`, `UTF-7`, `UTF8-MAC`, `UTF-16`, `UTF-32`, `UTF8-DoCoMo`, `SJIS-DoCoMo`, `UTF8-KDDI`, `SJIS-KDDI`, `ISO-2022-JP-KDDI`, `stateless-ISO-2022-JP-KDDI`, `UTF8-SoftBank`, `SJIS-SoftBank`, `BINARY`, `CP437`, `CP737`, `CP775`, `IBM850`, `CP857`, `CP860`, `CP861`, `CP862`, `CP863`, `CP864`, `CP865`, `CP866`, `CP869`, `CP1258`, `Big5-HKSCS:2008`, `ebcdic-cp-us`, `eucJP`, `euc-jp-ms`, `EUC-JISX0213`, `eucKR`, `eucTW`, `EUC-CN`, `eucCN`, `CP936`, `ISO2022-JP`, `ISO2022-JP2`, `ISO8859-1`, `ISO8859-2`, `ISO8859-3`, `ISO8859-4`, `ISO8859-5`, `ISO8859-6`, `CP1256`, `ISO8859-7`, `CP1253`, `ISO8859-8`, `CP1255`, `ISO8859-9`, `CP1254`, `ISO8859-10`, `ISO8859-11`, `CP874`, `ISO8859-13`, `CP1257`, `ISO8859-14`, `ISO8859-15`, `ISO8859-16`, `CP878`, `MacJapan`, `ASCII`, `ANSI_X3.4-1968`, `646`, `CP65000`, `CP65001`, `UTF-8-MAC`, `UTF-8-HFS`, `UCS-2BE`, `UCS-4BE`, 
`UCS-4LE`, `CP932`, `csWindows31J`, `SJIS`, `PCK`, `CP1250`, `CP1251`, `CP1252`, `external`, `locale`
+  * Default value is `"UTF-8"`
+The character encoding used in this input. Examples include `UTF-8`
+and `cp1252`.
+This setting is useful if your log files are in `Latin-1` (aka `cp1252`)
+or in another character set other than `UTF-8`.
+This only affects "plain" format logs since JSON is `UTF-8` already.
+[id="plugins-{type}s-{plugin}-max_bytes"]
+===== `max_bytes`
+  * Value type is <<bytes,bytes>>
+  * Default value is `"10 MiB"`
+The accumulation of events can make logstash exit with an out of memory error
+if event boundaries are not correctly defined. This setting makes sure to flush
+multiline events after reaching a number of bytes; it is used in combination
+with max_lines.
+[id="plugins-{type}s-{plugin}-max_lines"]
+===== `max_lines`
+  * Value type is <<number,number>>
+  * Default value is `500`
+The accumulation of events can make logstash exit with an out of memory error
+if event boundaries are not correctly defined. This setting makes sure to flush
+multiline events after reaching a number of lines; it is used in combination
+with max_bytes.
+[id="plugins-{type}s-{plugin}-multiline_tag"]
+===== `multiline_tag`
+  * Value type is <<string,string>>
+  * Default value is `"multiline"`
+Tag multiline events with a given tag. This tag will only be added
+to events that actually have multiple lines in them.
+[id="plugins-{type}s-{plugin}-negate"]
+===== `negate`
+  * Value type is <<boolean,boolean>>
+  * Default value is `false`
+Negate the regexp pattern ('if not matched').
+[id="plugins-{type}s-{plugin}-pattern"]
+===== `pattern`
+  * This is a required setting.
+  * Value type is <<string,string>>
+  * There is no default value for this setting.
+The regular expression to match.
+[id="plugins-{type}s-{plugin}-patterns_dir"]
+===== `patterns_dir`
+  * Value type is <<array,array>>
+  * Default value is `[]`
+Logstash ships by default with a bunch of patterns, so you don't
+necessarily need to define this yourself unless you are adding additional
+patterns.
+Pattern files are plain text with format:
+[source,ruby]
+    NAME PATTERN
+For example:
+[source,ruby]
+    NUMBER \d+
+[id="plugins-{type}s-{plugin}-what"]
+===== `what`
+  * This is a required setting.
+  * Value can be any of: `previous`, `next`
+  * There is no default value for this setting.
+If the pattern matched, does the event belong to the next or previous event?

data/lib/logstash/codecs/multiline.rb CHANGED Viewed

@@ -7,6 +7,12 @@ require "logstash/codecs/auto_flush"
 # The multiline codec will collapse multiline messages and merge them into a
 # single event.
 #
+# IMPORTANT: If you are using a Logstash input plugin that supports multiple
+# hosts, such as the <<plugins-inputs-beats>> input plugin, you should not use
+# the multiline codec to handle multiline events. Doing so may result in the
+# mixing of streams and corrupted event data. In this situation, you need to
+# handle multiline events before sending the event data to Logstash.
+#
 # The original goal of this codec was to allow joining of multiline messages
 # from files into a single event. For example, joining Java exception and
 # stacktrace messages into a single event.
@@ -57,7 +63,7 @@ require "logstash/codecs/auto_flush"
 #           # Grok pattern names are valid! :)
 #           pattern => "^%{TIMESTAMP_ISO8601} "
 #           negate => true
-#           what => previous
+#           what => "previous"
 #         }
 #       }
 #     }
@@ -66,11 +72,12 @@ require "logstash/codecs/auto_flush"
 #
 # One more common example is C line continuations (backslash). Here's how to do that:
 # [source,ruby]
-#     filter {
-#       multiline {
-#         type => "somefiletype"
-#         pattern => "\\$"
-#         what => "next"
+#     input {
+#       stdin {
+#         codec => multiline {
+#           pattern => "\\$"
+#           what => "next"
+#         }
 #       }
 #     }
 #
@@ -128,8 +135,8 @@ module LogStash module Codecs class Multiline < LogStash::Codecs::Base
   config :max_bytes, :validate => :bytes, :default => "10 MiB"
   # The accumulation of multiple lines will be converted to an event when either a
-  # matching new line is seen or there has been no new data appended for this time
-  # auto_flush_interval. No default.  If unset, no auto_flush. Units: seconds
+  # matching new line is seen or there has been no new data appended for this many
+  # seconds. No default.  If unset, no auto_flush. Units: seconds
   config :auto_flush_interval, :validate => :number
   public

data/logstash-codec-multiline.gemspec CHANGED Viewed

@@ -1,7 +1,7 @@
 Gem::Specification.new do |s|
   s.name            = 'logstash-codec-multiline'
-  s.version         = '3.0.3'
+  s.version         = '3.0.5'
   s.licenses        = ['Apache License (2.0)']
   s.summary         = "The multiline codec will collapse multiline messages and merge them into a single event."
   s.description     = "This gem is a Logstash plugin required to be installed on top of the Logstash core pipeline using $LS_HOME/bin/logstash-plugin install gemname. This gem is not a stand-alone program"
@@ -11,7 +11,7 @@ Gem::Specification.new do |s|
   s.require_paths = ["lib"]
   # Files
-  s.files = Dir['lib/**/*','spec/**/*','vendor/**/*','*.gemspec','*.md','CONTRIBUTORS','Gemfile','LICENSE','NOTICE.TXT']
+  s.files = Dir["lib/**/*","spec/**/*","*.gemspec","*.md","CONTRIBUTORS","Gemfile","LICENSE","NOTICE.TXT", "vendor/jar-dependencies/**/*.jar", "vendor/jar-dependencies/**/*.rb", "VERSION", "docs/**/*"]
   # Tests
   s.test_files = s.files.grep(%r{^(test|spec|features)/})

data/spec/codecs/auto_flush_spec.rb CHANGED Viewed

@@ -1,4 +1,5 @@
 # encoding: utf-8
+require "logstash/devutils/rspec/spec_helper"
 require "logstash/codecs/auto_flush"
 require "logstash/codecs/multiline"
 require_relative "../supports/helpers.rb"

data/spec/codecs/multiline_spec.rb CHANGED Viewed

@@ -1,4 +1,5 @@
 # encoding: utf-8
+require "logstash/devutils/rspec/spec_helper"
 require "logstash/codecs/multiline"
 require "logstash/event"
 require "insist"

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: logstash-codec-multiline
 version: !ruby/object:Gem::Version
-  version: 3.0.3
+  version: 3.0.5
 platform: ruby
 authors:
 - Elastic
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2016-09-15 00:00:00.000000000 Z
+date: 2017-06-23 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   requirement: !ruby/object:Gem::Requirement
@@ -84,6 +84,7 @@ files:
 - LICENSE
 - NOTICE.TXT
 - README.md
+- docs/index.asciidoc
 - lib/logstash/codecs/auto_flush.rb
 - lib/logstash/codecs/identity_map_codec.rb
 - lib/logstash/codecs/multiline.rb