logstash-filter-kv 4.3.3 → 4.6.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +12 -0
- data/LICENSE +199 -10
- data/README.md +1 -1
- data/docs/index.asciidoc +31 -0
- data/lib/logstash/filters/kv.rb +59 -133
- data/logstash-filter-kv.gemspec +4 -1
- data/spec/filters/kv_spec.rb +53 -0
- metadata +45 -4
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 2127186e4a039aaadb013f982c1ed9815827b4c629979a9572a2000a961f3fb1
|
4
|
+
data.tar.gz: e79ab76e7787bb89b4aa0e901a78bc0412c3e9344ff6ac7ac23554b56f8f526b
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 237975f6ce46e4d5e5ac94742ea4b7adc323691d22a670ea37d9ff68f111523ca0f5b6dd3f81bf8c5dd60a60b6dafd11d579e5c4fcfc383c356a43b72f8e277d
|
7
|
+
data.tar.gz: bc354d05d413b8781e0baf3076521cd6257baaa49a84650b3182fd076aa91b962558d247d9a8b55ee8485427ccc74e33e0505f97ca38b784b8b3c00333ea926b
|
data/CHANGELOG.md
CHANGED
@@ -1,3 +1,15 @@
|
|
1
|
+
## 4.6.0
|
2
|
+
- Added `allow_empty_values` option [#72](https://github.com/logstash-plugins/logstash-filter-kv/pull/72)
|
3
|
+
|
4
|
+
## 4.5.0
|
5
|
+
- Feat: check that target is set in ECS mode [#96](https://github.com/logstash-plugins/logstash-filter-kv/pull/96)
|
6
|
+
|
7
|
+
## 4.4.1
|
8
|
+
- Fixed issue where a `field_split_pattern` containing a literal backslash failed to match correctly [#87](https://github.com/logstash-plugins/logstash-filter-kv/issues/87)
|
9
|
+
|
10
|
+
## 4.4.0
|
11
|
+
- Changed timeout handling using the Timeout class [#84](https://github.com/logstash-plugins/logstash-filter-kv/pull/84)
|
12
|
+
|
1
13
|
## 4.3.3
|
2
14
|
- Fixed asciidoc formatting in docs
|
3
15
|
|
data/LICENSE
CHANGED
@@ -1,13 +1,202 @@
|
|
1
|
-
Copyright (c) 2012-2018 Elasticsearch <http://www.elastic.co>
|
2
1
|
|
3
|
-
|
4
|
-
|
5
|
-
|
2
|
+
Apache License
|
3
|
+
Version 2.0, January 2004
|
4
|
+
http://www.apache.org/licenses/
|
6
5
|
|
7
|
-
|
6
|
+
TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
|
8
7
|
|
9
|
-
|
10
|
-
|
11
|
-
|
12
|
-
|
13
|
-
|
8
|
+
1. Definitions.
|
9
|
+
|
10
|
+
"License" shall mean the terms and conditions for use, reproduction,
|
11
|
+
and distribution as defined by Sections 1 through 9 of this document.
|
12
|
+
|
13
|
+
"Licensor" shall mean the copyright owner or entity authorized by
|
14
|
+
the copyright owner that is granting the License.
|
15
|
+
|
16
|
+
"Legal Entity" shall mean the union of the acting entity and all
|
17
|
+
other entities that control, are controlled by, or are under common
|
18
|
+
control with that entity. For the purposes of this definition,
|
19
|
+
"control" means (i) the power, direct or indirect, to cause the
|
20
|
+
direction or management of such entity, whether by contract or
|
21
|
+
otherwise, or (ii) ownership of fifty percent (50%) or more of the
|
22
|
+
outstanding shares, or (iii) beneficial ownership of such entity.
|
23
|
+
|
24
|
+
"You" (or "Your") shall mean an individual or Legal Entity
|
25
|
+
exercising permissions granted by this License.
|
26
|
+
|
27
|
+
"Source" form shall mean the preferred form for making modifications,
|
28
|
+
including but not limited to software source code, documentation
|
29
|
+
source, and configuration files.
|
30
|
+
|
31
|
+
"Object" form shall mean any form resulting from mechanical
|
32
|
+
transformation or translation of a Source form, including but
|
33
|
+
not limited to compiled object code, generated documentation,
|
34
|
+
and conversions to other media types.
|
35
|
+
|
36
|
+
"Work" shall mean the work of authorship, whether in Source or
|
37
|
+
Object form, made available under the License, as indicated by a
|
38
|
+
copyright notice that is included in or attached to the work
|
39
|
+
(an example is provided in the Appendix below).
|
40
|
+
|
41
|
+
"Derivative Works" shall mean any work, whether in Source or Object
|
42
|
+
form, that is based on (or derived from) the Work and for which the
|
43
|
+
editorial revisions, annotations, elaborations, or other modifications
|
44
|
+
represent, as a whole, an original work of authorship. For the purposes
|
45
|
+
of this License, Derivative Works shall not include works that remain
|
46
|
+
separable from, or merely link (or bind by name) to the interfaces of,
|
47
|
+
the Work and Derivative Works thereof.
|
48
|
+
|
49
|
+
"Contribution" shall mean any work of authorship, including
|
50
|
+
the original version of the Work and any modifications or additions
|
51
|
+
to that Work or Derivative Works thereof, that is intentionally
|
52
|
+
submitted to Licensor for inclusion in the Work by the copyright owner
|
53
|
+
or by an individual or Legal Entity authorized to submit on behalf of
|
54
|
+
the copyright owner. For the purposes of this definition, "submitted"
|
55
|
+
means any form of electronic, verbal, or written communication sent
|
56
|
+
to the Licensor or its representatives, including but not limited to
|
57
|
+
communication on electronic mailing lists, source code control systems,
|
58
|
+
and issue tracking systems that are managed by, or on behalf of, the
|
59
|
+
Licensor for the purpose of discussing and improving the Work, but
|
60
|
+
excluding communication that is conspicuously marked or otherwise
|
61
|
+
designated in writing by the copyright owner as "Not a Contribution."
|
62
|
+
|
63
|
+
"Contributor" shall mean Licensor and any individual or Legal Entity
|
64
|
+
on behalf of whom a Contribution has been received by Licensor and
|
65
|
+
subsequently incorporated within the Work.
|
66
|
+
|
67
|
+
2. Grant of Copyright License. Subject to the terms and conditions of
|
68
|
+
this License, each Contributor hereby grants to You a perpetual,
|
69
|
+
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
|
70
|
+
copyright license to reproduce, prepare Derivative Works of,
|
71
|
+
publicly display, publicly perform, sublicense, and distribute the
|
72
|
+
Work and such Derivative Works in Source or Object form.
|
73
|
+
|
74
|
+
3. Grant of Patent License. Subject to the terms and conditions of
|
75
|
+
this License, each Contributor hereby grants to You a perpetual,
|
76
|
+
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
|
77
|
+
(except as stated in this section) patent license to make, have made,
|
78
|
+
use, offer to sell, sell, import, and otherwise transfer the Work,
|
79
|
+
where such license applies only to those patent claims licensable
|
80
|
+
by such Contributor that are necessarily infringed by their
|
81
|
+
Contribution(s) alone or by combination of their Contribution(s)
|
82
|
+
with the Work to which such Contribution(s) was submitted. If You
|
83
|
+
institute patent litigation against any entity (including a
|
84
|
+
cross-claim or counterclaim in a lawsuit) alleging that the Work
|
85
|
+
or a Contribution incorporated within the Work constitutes direct
|
86
|
+
or contributory patent infringement, then any patent licenses
|
87
|
+
granted to You under this License for that Work shall terminate
|
88
|
+
as of the date such litigation is filed.
|
89
|
+
|
90
|
+
4. Redistribution. You may reproduce and distribute copies of the
|
91
|
+
Work or Derivative Works thereof in any medium, with or without
|
92
|
+
modifications, and in Source or Object form, provided that You
|
93
|
+
meet the following conditions:
|
94
|
+
|
95
|
+
(a) You must give any other recipients of the Work or
|
96
|
+
Derivative Works a copy of this License; and
|
97
|
+
|
98
|
+
(b) You must cause any modified files to carry prominent notices
|
99
|
+
stating that You changed the files; and
|
100
|
+
|
101
|
+
(c) You must retain, in the Source form of any Derivative Works
|
102
|
+
that You distribute, all copyright, patent, trademark, and
|
103
|
+
attribution notices from the Source form of the Work,
|
104
|
+
excluding those notices that do not pertain to any part of
|
105
|
+
the Derivative Works; and
|
106
|
+
|
107
|
+
(d) If the Work includes a "NOTICE" text file as part of its
|
108
|
+
distribution, then any Derivative Works that You distribute must
|
109
|
+
include a readable copy of the attribution notices contained
|
110
|
+
within such NOTICE file, excluding those notices that do not
|
111
|
+
pertain to any part of the Derivative Works, in at least one
|
112
|
+
of the following places: within a NOTICE text file distributed
|
113
|
+
as part of the Derivative Works; within the Source form or
|
114
|
+
documentation, if provided along with the Derivative Works; or,
|
115
|
+
within a display generated by the Derivative Works, if and
|
116
|
+
wherever such third-party notices normally appear. The contents
|
117
|
+
of the NOTICE file are for informational purposes only and
|
118
|
+
do not modify the License. You may add Your own attribution
|
119
|
+
notices within Derivative Works that You distribute, alongside
|
120
|
+
or as an addendum to the NOTICE text from the Work, provided
|
121
|
+
that such additional attribution notices cannot be construed
|
122
|
+
as modifying the License.
|
123
|
+
|
124
|
+
You may add Your own copyright statement to Your modifications and
|
125
|
+
may provide additional or different license terms and conditions
|
126
|
+
for use, reproduction, or distribution of Your modifications, or
|
127
|
+
for any such Derivative Works as a whole, provided Your use,
|
128
|
+
reproduction, and distribution of the Work otherwise complies with
|
129
|
+
the conditions stated in this License.
|
130
|
+
|
131
|
+
5. Submission of Contributions. Unless You explicitly state otherwise,
|
132
|
+
any Contribution intentionally submitted for inclusion in the Work
|
133
|
+
by You to the Licensor shall be under the terms and conditions of
|
134
|
+
this License, without any additional terms or conditions.
|
135
|
+
Notwithstanding the above, nothing herein shall supersede or modify
|
136
|
+
the terms of any separate license agreement you may have executed
|
137
|
+
with Licensor regarding such Contributions.
|
138
|
+
|
139
|
+
6. Trademarks. This License does not grant permission to use the trade
|
140
|
+
names, trademarks, service marks, or product names of the Licensor,
|
141
|
+
except as required for reasonable and customary use in describing the
|
142
|
+
origin of the Work and reproducing the content of the NOTICE file.
|
143
|
+
|
144
|
+
7. Disclaimer of Warranty. Unless required by applicable law or
|
145
|
+
agreed to in writing, Licensor provides the Work (and each
|
146
|
+
Contributor provides its Contributions) on an "AS IS" BASIS,
|
147
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
|
148
|
+
implied, including, without limitation, any warranties or conditions
|
149
|
+
of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
|
150
|
+
PARTICULAR PURPOSE. You are solely responsible for determining the
|
151
|
+
appropriateness of using or redistributing the Work and assume any
|
152
|
+
risks associated with Your exercise of permissions under this License.
|
153
|
+
|
154
|
+
8. Limitation of Liability. In no event and under no legal theory,
|
155
|
+
whether in tort (including negligence), contract, or otherwise,
|
156
|
+
unless required by applicable law (such as deliberate and grossly
|
157
|
+
negligent acts) or agreed to in writing, shall any Contributor be
|
158
|
+
liable to You for damages, including any direct, indirect, special,
|
159
|
+
incidental, or consequential damages of any character arising as a
|
160
|
+
result of this License or out of the use or inability to use the
|
161
|
+
Work (including but not limited to damages for loss of goodwill,
|
162
|
+
work stoppage, computer failure or malfunction, or any and all
|
163
|
+
other commercial damages or losses), even if such Contributor
|
164
|
+
has been advised of the possibility of such damages.
|
165
|
+
|
166
|
+
9. Accepting Warranty or Additional Liability. While redistributing
|
167
|
+
the Work or Derivative Works thereof, You may choose to offer,
|
168
|
+
and charge a fee for, acceptance of support, warranty, indemnity,
|
169
|
+
or other liability obligations and/or rights consistent with this
|
170
|
+
License. However, in accepting such obligations, You may act only
|
171
|
+
on Your own behalf and on Your sole responsibility, not on behalf
|
172
|
+
of any other Contributor, and only if You agree to indemnify,
|
173
|
+
defend, and hold each Contributor harmless for any liability
|
174
|
+
incurred by, or claims asserted against, such Contributor by reason
|
175
|
+
of your accepting any such warranty or additional liability.
|
176
|
+
|
177
|
+
END OF TERMS AND CONDITIONS
|
178
|
+
|
179
|
+
APPENDIX: How to apply the Apache License to your work.
|
180
|
+
|
181
|
+
To apply the Apache License to your work, attach the following
|
182
|
+
boilerplate notice, with the fields enclosed by brackets "[]"
|
183
|
+
replaced with your own identifying information. (Don't include
|
184
|
+
the brackets!) The text should be enclosed in the appropriate
|
185
|
+
comment syntax for the file format. We also recommend that a
|
186
|
+
file or class name and description of purpose be included on the
|
187
|
+
same "printed page" as the copyright notice for easier
|
188
|
+
identification within third-party archives.
|
189
|
+
|
190
|
+
Copyright 2020 Elastic and contributors
|
191
|
+
|
192
|
+
Licensed under the Apache License, Version 2.0 (the "License");
|
193
|
+
you may not use this file except in compliance with the License.
|
194
|
+
You may obtain a copy of the License at
|
195
|
+
|
196
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
197
|
+
|
198
|
+
Unless required by applicable law or agreed to in writing, software
|
199
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
200
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
201
|
+
See the License for the specific language governing permissions and
|
202
|
+
limitations under the License.
|
data/README.md
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
# Logstash Plugin
|
2
2
|
|
3
|
-
[![Travis Build Status](https://travis-ci.
|
3
|
+
[![Travis Build Status](https://travis-ci.com/logstash-plugins/logstash-filter-kv.svg)](https://travis-ci.com/logstash-plugins/logstash-filter-kv)
|
4
4
|
|
5
5
|
This is a plugin for [Logstash](https://github.com/elastic/logstash).
|
6
6
|
|
data/docs/index.asciidoc
CHANGED
@@ -44,6 +44,13 @@ in case your data is not structured using `=` signs and whitespace.
|
|
44
44
|
For example, this filter can also be used to parse query parameters like
|
45
45
|
`foo=bar&baz=fizz` by setting the `field_split` parameter to `&`.
|
46
46
|
|
47
|
+
[id="plugins-{type}s-{plugin}-ecs_metadata"]
|
48
|
+
==== Event Metadata and the Elastic Common Schema (ECS)
|
49
|
+
|
50
|
+
The plugin behaves the same regardless of ECS compatibility, except that it emits a warning when ECS is enabled and `target` isn't set.
|
51
|
+
|
52
|
+
TIP: Set the `target` option to avoid potential schema conflicts.
|
53
|
+
|
47
54
|
[id="plugins-{type}s-{plugin}-options"]
|
48
55
|
==== Kv Filter Configuration Options
|
49
56
|
|
@@ -53,7 +60,9 @@ This plugin supports the following configuration options plus the <<plugins-{typ
|
|
53
60
|
|=======================================================================
|
54
61
|
|Setting |Input type|Required
|
55
62
|
| <<plugins-{type}s-{plugin}-allow_duplicate_values>> |<<boolean,boolean>>|No
|
63
|
+
| <<plugins-{type}s-{plugin}-allow_empty_values>> |<<boolean,boolean>>|No
|
56
64
|
| <<plugins-{type}s-{plugin}-default_keys>> |<<hash,hash>>|No
|
65
|
+
| <<plugins-{type}s-{plugin}-ecs_compatibility>> | <<string,string>>|No
|
57
66
|
| <<plugins-{type}s-{plugin}-exclude_keys>> |<<array,array>>|No
|
58
67
|
| <<plugins-{type}s-{plugin}-field_split>> |<<string,string>>|No
|
59
68
|
| <<plugins-{type}s-{plugin}-field_split_pattern>> |<<string,string>>|No
|
@@ -101,6 +110,17 @@ you could use this configuration:
|
|
101
110
|
}
|
102
111
|
}
|
103
112
|
|
113
|
+
[id="plugins-{type}s-{plugin}-allow_empty_values"]
|
114
|
+
===== `allow_empty_values`
|
115
|
+
|
116
|
+
* Value type is <<boolean,boolean>>
|
117
|
+
* Default value is `false`
|
118
|
+
|
119
|
+
A boolean option for explicitly including empty values.
|
120
|
+
When set to true, empty values will be added to the event.
|
121
|
+
|
122
|
+
NOTE: Parsing empty values typically requires <<plugins-{type}s-{plugin}-whitespace,`whitespace => strict`>>.
|
123
|
+
|
104
124
|
[id="plugins-{type}s-{plugin}-default_keys"]
|
105
125
|
===== `default_keys`
|
106
126
|
|
@@ -117,6 +137,17 @@ in case these keys do not exist in the source field being parsed.
|
|
117
137
|
}
|
118
138
|
}
|
119
139
|
|
140
|
+
[id="plugins-{type}s-{plugin}-ecs_compatibility"]
|
141
|
+
===== `ecs_compatibility`
|
142
|
+
|
143
|
+
* Value type is <<string,string>>
|
144
|
+
* Supported values are:
|
145
|
+
** `disabled`: does not use ECS-compatible field names
|
146
|
+
** `v1`: Elastic Common Schema compliant behavior (warns when `target` isn't set)
|
147
|
+
|
148
|
+
Controls this plugin's compatibility with the {ecs-ref}[Elastic Common Schema (ECS)].
|
149
|
+
See <<plugins-{type}s-{plugin}-ecs_metadata>> for detailed information.
|
150
|
+
|
120
151
|
[id="plugins-{type}s-{plugin}-exclude_keys"]
|
121
152
|
===== `exclude_keys`
|
122
153
|
|
data/lib/logstash/filters/kv.rb
CHANGED
@@ -2,6 +2,10 @@
|
|
2
2
|
|
3
3
|
require "logstash/filters/base"
|
4
4
|
require "logstash/namespace"
|
5
|
+
require 'logstash/plugin_mixins/ecs_compatibility_support'
|
6
|
+
require 'logstash/plugin_mixins/ecs_compatibility_support/target_check'
|
7
|
+
require 'logstash/plugin_mixins/validator_support/field_reference_validation_adapter'
|
8
|
+
require "timeout"
|
5
9
|
|
6
10
|
# This filter helps automatically parse messages (or specific event fields)
|
7
11
|
# which are of the `foo=bar` variety.
|
@@ -29,6 +33,11 @@ require "logstash/namespace"
|
|
29
33
|
class LogStash::Filters::KV < LogStash::Filters::Base
|
30
34
|
config_name "kv"
|
31
35
|
|
36
|
+
include LogStash::PluginMixins::ECSCompatibilitySupport
|
37
|
+
include LogStash::PluginMixins::ECSCompatibilitySupport::TargetCheck
|
38
|
+
|
39
|
+
extend LogStash::PluginMixins::ValidatorSupport::FieldReferenceValidationAdapter
|
40
|
+
|
32
41
|
# Constants used for transform check
|
33
42
|
TRANSFORM_LOWERCASE_KEY = "lowercase"
|
34
43
|
TRANSFORM_UPPERCASE_KEY = "uppercase"
|
@@ -200,7 +209,7 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
200
209
|
# For example, to process the `not_the_message` field:
|
201
210
|
# [source,ruby]
|
202
211
|
# filter { kv { source => "not_the_message" } }
|
203
|
-
config :source, :validate => :
|
212
|
+
config :source, :validate => :field_reference, :default => "message"
|
204
213
|
|
205
214
|
# The name of the container to put all of the key-value pairs into.
|
206
215
|
#
|
@@ -210,7 +219,7 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
210
219
|
# For example, to place all keys into the event field kv:
|
211
220
|
# [source,ruby]
|
212
221
|
# filter { kv { target => "kv" } }
|
213
|
-
config :target, :validate => :
|
222
|
+
config :target, :validate => :field_reference
|
214
223
|
|
215
224
|
# An array specifying the parsed keys which should be added to the event.
|
216
225
|
# By default all keys will be added.
|
@@ -263,6 +272,9 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
263
272
|
# }
|
264
273
|
config :allow_duplicate_values, :validate => :boolean, :default => true
|
265
274
|
|
275
|
+
# A boolean option for keeping empty or nil values.
|
276
|
+
config :allow_empty_values, :validate => :boolean, :default => false
|
277
|
+
|
266
278
|
# A boolean specifying whether to treat square brackets, angle brackets,
|
267
279
|
# and parentheses as value "wrappers" that should be removed from the value.
|
268
280
|
# [source,ruby]
|
@@ -319,8 +331,6 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
319
331
|
|
320
332
|
# Attempt to terminate regexps after this amount of time.
|
321
333
|
# This applies per source field value if event has multiple values in the source field.
|
322
|
-
# This will never timeout early, but may take a little longer to timeout.
|
323
|
-
# Actual timeout is approximate based on a 250ms quantization.
|
324
334
|
# Set to 0 to disable timeouts
|
325
335
|
config :timeout_millis, :validate => :number, :default => 30_000
|
326
336
|
|
@@ -330,7 +340,16 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
330
340
|
# Tag to apply if kv errors
|
331
341
|
config :tag_on_failure, :validate => :string, :default => '_kv_filter_error'
|
332
342
|
|
343
|
+
|
344
|
+
EMPTY_STRING = ''.freeze
|
345
|
+
|
333
346
|
def register
|
347
|
+
# Too late to set the regexp interruptible flag, at least warn if it is not set.
|
348
|
+
require 'java'
|
349
|
+
if java.lang.System.getProperty("jruby.regexp.interruptible") != "true"
|
350
|
+
logger.warn("KV Filter registered without jruby interruptible regular expressions enabled (`-Djruby.regexp.interruptible=true`); timeouts may not be respected.")
|
351
|
+
end
|
352
|
+
|
334
353
|
if @value_split.empty?
|
335
354
|
raise LogStash::ConfigurationError, I18n.t(
|
336
355
|
"logstash.runner.configuration.invalid_plugin_register",
|
@@ -406,26 +425,17 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
406
425
|
|
407
426
|
@logger.debug? && @logger.debug("KV scan regex", :regex => @scan_re.inspect)
|
408
427
|
|
409
|
-
|
410
|
-
|
428
|
+
# divide by float to allow fractional seconds; the Timeout class timeout value is in seconds but the underlying
|
429
|
+
# executor resolution is in microseconds, so a fractional-second parameter down to microseconds is possible.
|
430
|
+
# see https://github.com/jruby/jruby/blob/9.2.7.0/core/src/main/java/org/jruby/ext/timeout/Timeout.java#L125
|
431
|
+
@timeout_seconds = @timeout_millis / 1000.0
|
411
432
|
end
|
412
433
|
|
413
434
|
def filter(event)
|
414
|
-
kv = Hash.new
|
415
435
|
value = event.get(@source)
|
416
436
|
|
417
|
-
|
418
|
-
|
419
|
-
when nil
|
420
|
-
# Nothing to do
|
421
|
-
when String
|
422
|
-
parse(value, event, kv)
|
423
|
-
when Array
|
424
|
-
value.each { |v| parse(v, event, kv) }
|
425
|
-
else
|
426
|
-
@logger.warn("kv filter has no support for this type of data", :type => value.class, :value => value)
|
427
|
-
end
|
428
|
-
end
|
437
|
+
# If timeout is 0, avoid creating a closure, although Timeout.timeout has a bypass for 0s timeouts.
|
438
|
+
kv = @timeout_seconds > 0.0 ? Timeout.timeout(@timeout_seconds, TimeoutException) { parse_value(value, event) } : parse_value(value, event)
|
429
439
|
|
430
440
|
# Add default key-values for missing keys
|
431
441
|
kv = @default_keys.merge(kv)
|
@@ -433,7 +443,9 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
433
443
|
return if kv.empty?
|
434
444
|
|
435
445
|
if @target
|
436
|
-
|
446
|
+
if event.include?(@target)
|
447
|
+
@logger.debug? && @logger.debug("Overwriting existing target field", field: @target, existing_value: event.get(@target))
|
448
|
+
end
|
437
449
|
event.set(@target, kv)
|
438
450
|
else
|
439
451
|
kv.each{|k, v| event.set(k, v)}
|
@@ -452,11 +464,27 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
452
464
|
end
|
453
465
|
|
454
466
|
def close
|
455
|
-
@timeout_enforcer.stop!
|
456
467
|
end
|
457
468
|
|
458
469
|
private
|
459
470
|
|
471
|
+
def parse_value(value, event)
|
472
|
+
kv = Hash.new
|
473
|
+
|
474
|
+
case value
|
475
|
+
when nil
|
476
|
+
# Nothing to do
|
477
|
+
when String
|
478
|
+
parse(value, event, kv)
|
479
|
+
when Array
|
480
|
+
value.each { |v| parse(v, event, kv) }
|
481
|
+
else
|
482
|
+
@logger.warn("kv filter has no support for this type of data", :type => value.class, :value => value)
|
483
|
+
end
|
484
|
+
|
485
|
+
kv
|
486
|
+
end
|
487
|
+
|
460
488
|
# @overload summarize(value)
|
461
489
|
# @param value [Array]
|
462
490
|
# @return [String]
|
@@ -474,13 +502,7 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
474
502
|
|
475
503
|
value.bytesize < 255 ? "`#{value}`" : "entry too large; first 255 chars are `#{value[0..255].dump}`"
|
476
504
|
end
|
477
|
-
|
478
|
-
def initialize_timeout_enforcer
|
479
|
-
return NULL_TIMEOUT_ENFORCER if @timeout_millis <= 0
|
480
|
-
|
481
|
-
TimeoutEnforcer.new(logger, @timeout_millis * 1_000_000)
|
482
|
-
end
|
483
|
-
|
505
|
+
|
484
506
|
def has_value_splitter?(s)
|
485
507
|
s =~ @value_split_re
|
486
508
|
end
|
@@ -513,7 +535,7 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
513
535
|
# @return [Regexp]
|
514
536
|
def unquoted_capture_until_pattern(*patterns)
|
515
537
|
pattern = patterns.size > 1 ? Regexp.union(patterns) : patterns.first
|
516
|
-
/((
|
538
|
+
/((?:(?!#{pattern})(?:\\.|.))+)/
|
517
539
|
end
|
518
540
|
|
519
541
|
# Helper function for generating *capturing* `Regexp` that will _efficiently_ match any sequence of characters
|
@@ -553,12 +575,12 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
553
575
|
exclude_keys = @exclude_keys.map{|key| event.sprintf(key)}
|
554
576
|
|
555
577
|
text.scan(@scan_re) do |key, *value_candidates|
|
556
|
-
value = value_candidates.compact.first
|
557
|
-
next if value.
|
578
|
+
value = value_candidates.compact.first || EMPTY_STRING
|
579
|
+
next if value.empty? && !@allow_empty_values
|
558
580
|
|
559
|
-
key =
|
560
|
-
key =
|
561
|
-
key =
|
581
|
+
key = key.gsub(@trim_key_re, EMPTY_STRING) if @trim_key
|
582
|
+
key = key.gsub(@remove_char_key_re, EMPTY_STRING) if @remove_char_key
|
583
|
+
key = transform(key, @transform_key) if @transform_key
|
562
584
|
|
563
585
|
# Bail out as per the values of include_keys and exclude_keys
|
564
586
|
next if not include_keys.empty? and not include_keys.include?(key)
|
@@ -567,9 +589,9 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
567
589
|
|
568
590
|
key = event.sprintf(@prefix) + key
|
569
591
|
|
570
|
-
value =
|
571
|
-
value =
|
572
|
-
value =
|
592
|
+
value = value.gsub(@trim_value_re, EMPTY_STRING) if @trim_value
|
593
|
+
value = value.gsub(@remove_char_value_re, EMPTY_STRING) if @remove_char_value
|
594
|
+
value = transform(value, @transform_value) if @transform_value
|
573
595
|
|
574
596
|
# Bail out if inserting duplicate value in key mapping when unique_values
|
575
597
|
# option is set to true.
|
@@ -596,100 +618,4 @@ class LogStash::Filters::KV < LogStash::Filters::Base
|
|
596
618
|
|
597
619
|
class TimeoutException < RuntimeError
|
598
620
|
end
|
599
|
-
|
600
|
-
class TimeoutEnforcer
|
601
|
-
def initialize(logger, timeout_nanos)
|
602
|
-
@logger = logger
|
603
|
-
@running = java.util.concurrent.atomic.AtomicBoolean.new(false)
|
604
|
-
@timeout_nanos = timeout_nanos
|
605
|
-
|
606
|
-
# Stores running matches with their start time, this is used to cancel long running matches
|
607
|
-
# Is a map of Thread => start_time
|
608
|
-
@threads_to_start_time = java.util.concurrent.ConcurrentHashMap.new
|
609
|
-
end
|
610
|
-
|
611
|
-
def execute(&block)
|
612
|
-
# If the enforcer is not running, either we failed to start it or it has
|
613
|
-
# already been stopped; in either case, we cannot reliably enforce the timeout
|
614
|
-
# so we raise a RuntimeError instead.
|
615
|
-
fail("TimeoutEnforcer not running.") unless alive?
|
616
|
-
|
617
|
-
begin
|
618
|
-
thread = java.lang.Thread.currentThread()
|
619
|
-
@threads_to_start_time.put(thread, java.lang.System.nanoTime)
|
620
|
-
|
621
|
-
yield
|
622
|
-
|
623
|
-
rescue InterruptedRegexpError, java.lang.InterruptedException => e
|
624
|
-
raise TimeoutException.new
|
625
|
-
ensure
|
626
|
-
# If the block finished, but interrupt was called after, we'll want to
|
627
|
-
# clear the interrupted status anyway
|
628
|
-
@threads_to_start_time.remove(thread)
|
629
|
-
thread.interrupted
|
630
|
-
end
|
631
|
-
end
|
632
|
-
|
633
|
-
def start!
|
634
|
-
@running.set(true)
|
635
|
-
@logger.debug("Starting timeout enforcer (#{@timeout_nanos}ns)")
|
636
|
-
@timer_thread = Thread.new do
|
637
|
-
while @running.get() || !@threads_to_start_time.is_empty
|
638
|
-
begin
|
639
|
-
cancel_timed_out!
|
640
|
-
rescue Exception => e
|
641
|
-
@logger.error("Error while attempting to check/cancel excessively long kv patterns",
|
642
|
-
:message => e.message,
|
643
|
-
:class => e.class.name,
|
644
|
-
:backtrace => e.backtrace
|
645
|
-
)
|
646
|
-
end
|
647
|
-
sleep 0.25
|
648
|
-
end
|
649
|
-
end
|
650
|
-
end
|
651
|
-
|
652
|
-
def stop!
|
653
|
-
@running.set(false)
|
654
|
-
@logger.debug("Shutting down timeout enforcer")
|
655
|
-
# Check for the thread mostly for a fast start/shutdown scenario
|
656
|
-
@timer_thread.join if @timer_thread
|
657
|
-
end
|
658
|
-
|
659
|
-
def alive?
|
660
|
-
@running.get() && @timer_thread && @timer_thread.alive?
|
661
|
-
end
|
662
|
-
|
663
|
-
private
|
664
|
-
|
665
|
-
def cancel_timed_out!
|
666
|
-
now = java.lang.System.nanoTime # save ourselves some nanotime calls
|
667
|
-
@threads_to_start_time.keySet.each do |thread|
|
668
|
-
# Use compute to lock this value
|
669
|
-
@threads_to_start_time.computeIfPresent(thread) do |thread, start_time|
|
670
|
-
if start_time < now && now - start_time > @timeout_nanos
|
671
|
-
thread.interrupt
|
672
|
-
nil # Delete the key
|
673
|
-
else
|
674
|
-
start_time # preserve the key
|
675
|
-
end
|
676
|
-
end
|
677
|
-
end
|
678
|
-
end
|
679
|
-
end
|
680
|
-
|
681
|
-
class NullTimeoutEnforcer
|
682
|
-
def execute(&block)
|
683
|
-
yield
|
684
|
-
end
|
685
|
-
|
686
|
-
def start!
|
687
|
-
# no-op
|
688
|
-
end
|
689
|
-
|
690
|
-
def stop!
|
691
|
-
# no-op
|
692
|
-
end
|
693
|
-
end
|
694
|
-
NULL_TIMEOUT_ENFORCER = NullTimeoutEnforcer.new
|
695
621
|
end
|
data/logstash-filter-kv.gemspec
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
Gem::Specification.new do |s|
|
2
2
|
|
3
3
|
s.name = 'logstash-filter-kv'
|
4
|
-
s.version = '4.
|
4
|
+
s.version = '4.6.0'
|
5
5
|
s.licenses = ['Apache License (2.0)']
|
6
6
|
s.summary = "Parses key-value pairs"
|
7
7
|
s.description = "This gem is a Logstash plugin required to be installed on top of the Logstash core pipeline using $LS_HOME/bin/logstash-plugin install gemname. This gem is not a stand-alone program"
|
@@ -21,6 +21,9 @@ Gem::Specification.new do |s|
|
|
21
21
|
|
22
22
|
# Gem dependencies
|
23
23
|
s.add_runtime_dependency "logstash-core-plugin-api", ">= 1.60", "<= 2.99"
|
24
|
+
s.add_runtime_dependency 'logstash-mixin-ecs_compatibility_support', '~> 1.3'
|
25
|
+
s.add_runtime_dependency 'logstash-mixin-validator_support', '~> 1.0'
|
24
26
|
|
25
27
|
s.add_development_dependency 'logstash-devutils'
|
28
|
+
s.add_development_dependency 'insist'
|
26
29
|
end
|
data/spec/filters/kv_spec.rb
CHANGED
@@ -1,8 +1,16 @@
|
|
1
1
|
# encoding: utf-8
|
2
2
|
|
3
3
|
require "logstash/devutils/rspec/spec_helper"
|
4
|
+
require "insist"
|
4
5
|
require "logstash/filters/kv"
|
5
6
|
|
7
|
+
# Logstash starts JRuby with a special flag to ensure that regexp's are
|
8
|
+
# executed in an interruptible fashion.
|
9
|
+
require 'java'
|
10
|
+
if java.lang.System.getProperty("jruby.regexp.interruptible") != "true"
|
11
|
+
fail("Java must be started with `-Djruby.regexp.interruptible=true`")
|
12
|
+
end
|
13
|
+
|
6
14
|
describe LogStash::Filters::KV do
|
7
15
|
|
8
16
|
describe "defaults" do
|
@@ -487,6 +495,30 @@ describe LogStash::Filters::KV do
|
|
487
495
|
end
|
488
496
|
end
|
489
497
|
|
498
|
+
describe 'field_split_pattern with literal backslashes' do
|
499
|
+
config <<-CONFIG
|
500
|
+
filter {
|
501
|
+
kv {
|
502
|
+
source => headers
|
503
|
+
field_split_pattern => "\\\\r\\\\n"
|
504
|
+
value_split_pattern => ": "
|
505
|
+
whitespace => strict
|
506
|
+
target => headerskv
|
507
|
+
}
|
508
|
+
}
|
509
|
+
CONFIG
|
510
|
+
|
511
|
+
sample({"headers"=>"Host: foo.com\\r\\nUser-Agent: Qwerty/1.2.3 (www.qwerty.org)\\r\\nContent-Type: text/xml; charset=utf-8\\r\\nAccept: */*\\r\\nAccept-Encoding: gzip, deflate\\r\\nContent-Length: 123\\r\\nX-UUID: 0:15713435944943992\\r\\n\\r\\n"}) do
|
512
|
+
insist { subject.get("[headerskv][Host]") } == "foo.com"
|
513
|
+
insist { subject.get("[headerskv][User-Agent]") } == "Qwerty/1.2.3 (www.qwerty.org)"
|
514
|
+
insist { subject.get("[headerskv][Content-Type]") } == "text/xml; charset=utf-8"
|
515
|
+
insist { subject.get("[headerskv][Accept]") } == "*/*"
|
516
|
+
insist { subject.get("[headerskv][Accept-Encoding]") } == "gzip, deflate"
|
517
|
+
insist { subject.get("[headerskv][Content-Length]") } == "123"
|
518
|
+
insist { subject.get("[headerskv][X-UUID]") } == "0:15713435944943992"
|
519
|
+
end
|
520
|
+
end
|
521
|
+
|
490
522
|
|
491
523
|
describe "test data from specific sub source and target" do
|
492
524
|
config <<-CONFIG
|
@@ -689,6 +721,27 @@ describe LogStash::Filters::KV do
|
|
689
721
|
end
|
690
722
|
end
|
691
723
|
|
724
|
+
describe "Allowing empty values" do
|
725
|
+
config <<-CONFIG
|
726
|
+
filter {
|
727
|
+
kv {
|
728
|
+
field_split => " "
|
729
|
+
source => "source"
|
730
|
+
allow_empty_values => true
|
731
|
+
whitespace => strict
|
732
|
+
}
|
733
|
+
}
|
734
|
+
CONFIG
|
735
|
+
|
736
|
+
sample("source" => "present=one empty= emptyquoted='' present=two emptybracketed=[] endofinput=") do
|
737
|
+
insist { subject.get('[present]') } == ['one','two']
|
738
|
+
insist { subject.get('[empty]') } == ''
|
739
|
+
insist { subject.get('[emptyquoted]') } == ''
|
740
|
+
insist { subject.get('[emptybracketed]') } == ''
|
741
|
+
insist { subject.get('[endofinput]') } == ''
|
742
|
+
end
|
743
|
+
end
|
744
|
+
|
692
745
|
describe "Allow duplicate key/value pairs by default" do
|
693
746
|
config <<-CONFIG
|
694
747
|
filter {
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: logstash-filter-kv
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 4.3.3
|
4
|
+
version: 4.6.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Elastic
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2022-01-31 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
requirement: !ruby/object:Gem::Requirement
|
@@ -30,6 +30,34 @@ dependencies:
|
|
30
30
|
- - "<="
|
31
31
|
- !ruby/object:Gem::Version
|
32
32
|
version: '2.99'
|
33
|
+
- !ruby/object:Gem::Dependency
|
34
|
+
requirement: !ruby/object:Gem::Requirement
|
35
|
+
requirements:
|
36
|
+
- - "~>"
|
37
|
+
- !ruby/object:Gem::Version
|
38
|
+
version: '1.3'
|
39
|
+
name: logstash-mixin-ecs_compatibility_support
|
40
|
+
prerelease: false
|
41
|
+
type: :runtime
|
42
|
+
version_requirements: !ruby/object:Gem::Requirement
|
43
|
+
requirements:
|
44
|
+
- - "~>"
|
45
|
+
- !ruby/object:Gem::Version
|
46
|
+
version: '1.3'
|
47
|
+
- !ruby/object:Gem::Dependency
|
48
|
+
requirement: !ruby/object:Gem::Requirement
|
49
|
+
requirements:
|
50
|
+
- - "~>"
|
51
|
+
- !ruby/object:Gem::Version
|
52
|
+
version: '1.0'
|
53
|
+
name: logstash-mixin-validator_support
|
54
|
+
prerelease: false
|
55
|
+
type: :runtime
|
56
|
+
version_requirements: !ruby/object:Gem::Requirement
|
57
|
+
requirements:
|
58
|
+
- - "~>"
|
59
|
+
- !ruby/object:Gem::Version
|
60
|
+
version: '1.0'
|
33
61
|
- !ruby/object:Gem::Dependency
|
34
62
|
requirement: !ruby/object:Gem::Requirement
|
35
63
|
requirements:
|
@@ -44,6 +72,20 @@ dependencies:
|
|
44
72
|
- - ">="
|
45
73
|
- !ruby/object:Gem::Version
|
46
74
|
version: '0'
|
75
|
+
- !ruby/object:Gem::Dependency
|
76
|
+
requirement: !ruby/object:Gem::Requirement
|
77
|
+
requirements:
|
78
|
+
- - ">="
|
79
|
+
- !ruby/object:Gem::Version
|
80
|
+
version: '0'
|
81
|
+
name: insist
|
82
|
+
prerelease: false
|
83
|
+
type: :development
|
84
|
+
version_requirements: !ruby/object:Gem::Requirement
|
85
|
+
requirements:
|
86
|
+
- - ">="
|
87
|
+
- !ruby/object:Gem::Version
|
88
|
+
version: '0'
|
47
89
|
description: This gem is a Logstash plugin required to be installed on top of the
|
48
90
|
Logstash core pipeline using $LS_HOME/bin/logstash-plugin install gemname. This
|
49
91
|
gem is not a stand-alone program
|
@@ -83,8 +125,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
83
125
|
- !ruby/object:Gem::Version
|
84
126
|
version: '0'
|
85
127
|
requirements: []
|
86
|
-
|
87
|
-
rubygems_version: 2.6.13
|
128
|
+
rubygems_version: 3.1.6
|
88
129
|
signing_key:
|
89
130
|
specification_version: 4
|
90
131
|
summary: Parses key-value pairs
|