elasticgraph-opensearch 0.18.0.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA256:
3
+ metadata.gz: af83310eb66d78a17317a02ba1c62e052dead3d24a3ea7882d3593eb650a88a2
4
+ data.tar.gz: f80f785ba656811a3f1464b70621cd35bbaf5dcd77172f58c3b6b5e59ca6b5b3
5
+ SHA512:
6
+ metadata.gz: 4d0c0bd2a60b02c9dce6ac6da9ef5a60a7441631491a877749b7f7780eef899972bc7b0698f277a3a804ad9e234ec589cc4402533a99d3f2633142cf6805ed0d
7
+ data.tar.gz: 554632704faac8a60529f59a87718af041b3f890ce833c660f5ad169e5173cce6f92995bf4fb629651ed274c2423733f5bae1286417af23498358a2b4ff848c7
data/LICENSE.txt ADDED
@@ -0,0 +1,21 @@
1
+ The MIT License (MIT)
2
+
3
+ Copyright (c) 2024 Block, Inc.
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in
13
+ all copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,3 @@
1
+ # ElasticGraph::OpenSearch
2
+
3
+ Wraps the official OpenSearch client for use by ElasticGraph.
data/elasticgraph-opensearch.gemspec ADDED
@@ -0,0 +1,20 @@
1
+ # Copyright 2024 Block, Inc.
2
+ #
3
+ # Use of this source code is governed by an MIT-style
4
+ # license that can be found in the LICENSE file or at
5
+ # https://opensource.org/licenses/MIT.
6
+ #
7
+ # frozen_string_literal: true
8
+
9
+ require_relative "../gemspec_helper"
10
+
11
# Gem definition for `elasticgraph-opensearch`, registered under the `:datastore_adapter` category.
# The block receives the gem specification being built and the version requirement to use for
# sibling ElasticGraph gems (NOTE(review): block argument semantics come from
# `ElasticGraphGemspecHelper` in `../gemspec_helper` -- confirm there).
ElasticGraphGemspecHelper.define_elasticgraph_gem(gemspec_file: __FILE__, category: :datastore_adapter) do |gem, elasticgraph_version|
  gem.summary = "Wraps the OpenSearch client for use by ElasticGraph."

  # Runtime dependencies.
  gem.add_dependency "elasticgraph-support", elasticgraph_version
  gem.add_dependency "faraday", "~> 2.10"
  gem.add_dependency "faraday-retry", "~> 2.2"
  gem.add_dependency "opensearch-ruby", "~> 3.1"

  # Development-only dependencies.
  gem.add_development_dependency "httpx", ">= 1.2.6", "< 2.0"
end
data/lib/elastic_graph/opensearch/client.rb ADDED
@@ -0,0 +1,218 @@
1
+ # Copyright 2024 Block, Inc.
2
+ #
3
+ # Use of this source code is governed by an MIT-style
4
+ # license that can be found in the LICENSE file or at
5
+ # https://opensource.org/licenses/MIT.
6
+ #
7
+ # frozen_string_literal: true
8
+
9
+ require "elastic_graph/constants"
10
+ require "elastic_graph/error"
11
+ require "elastic_graph/support/faraday_middleware/msearch_using_get_instead_of_post"
12
+ require "elastic_graph/support/faraday_middleware/support_timeouts"
13
+ require "elastic_graph/support/hash_util"
14
+ require "faraday"
15
+ require "faraday/retry"
16
+ require "opensearch"
17
+
18
module ElasticGraph
  module OpenSearch
    # Wraps the official OpenSearch Ruby client (`::OpenSearch::Client`), exposing the cluster, script,
    # index template, index, and document operations defined below.
    #
    # Every operation runs through `transform_errors`, which re-raises the client's `BadRequest` error as
    # `BadDatastoreRequest`. Other client errors propagate unchanged unless a method rescues them itself.
    class Client
      # @dynamic cluster_name
      attr_reader :cluster_name

      # Builds the underlying `::OpenSearch::Client` and eagerly resolves its Faraday middleware stack.
      #
      # @param cluster_name value exposed through `cluster_name`
      # @param url forwarded to `::OpenSearch::Client.new` as `url:`
      # @param faraday_adapter forwarded to `::OpenSearch::Client.new` as `adapter:`
      # @param retry_on_failure forwarded to `::OpenSearch::Client.new` and also used as `max` for the Faraday retry middleware
      # @param logger used as both the `logger` and the `tracer` of the underlying client
      # @yield [faraday] optional; receives the Faraday connection after the default middleware has been configured
      def initialize(cluster_name, url:, faraday_adapter: nil, retry_on_failure: 3, logger: nil)
        @cluster_name = cluster_name

        @raw_client = ::OpenSearch::Client.new(
          adapter: faraday_adapter,
          url: url,
          retry_on_failure: retry_on_failure,
          # We use `logger` for both the tracer and logger to log everything we can. While the trace and log output do overlap, one is
          # not a strict superset of the other (for example, warnings go to `logger`, while full request bodies go to `tracer`).
          logger: logger,
          tracer: logger
        ) do |faraday|
          faraday.use Support::FaradayMiddleware::MSearchUsingGetInsteadOfPost
          faraday.use Support::FaradayMiddleware::SupportTimeouts

          # Note: this overrides the default retry exceptions, which includes `Faraday::TimeoutError`.
          # That's important because we do NOT want a retry on timeout -- a timeout indicates a slow,
          # expensive query, and is transformed to a `RequestExceededDeadlineError` by `SupportTimeouts`,
          # anyway.
          #
          # In addition, it's worth noting that the retry middleware ONLY retries known idempotent HTTP
          # methods (e.g. get/put/delete/head/options). POST requests will not be retried. We could
          # configure it to make it retry POSTs but we'd need to do an analysis of all ElasticGraph requests to
          # make sure all POST requests are truly idempotent, and at least for now, it's sufficient to skip
          # any POST requests we make.
          faraday.request :retry,
            exceptions: [::Faraday::ConnectionFailed, ::Faraday::RetriableResponse],
            max: retry_on_failure,
            retry_statuses: [500, 502, 503] # Internal Server Error, Bad Gateway, Service Unavailable

          yield faraday if block_given?
        end

        # Here we call `app` on each Faraday connection as a way to force it to resolve
        # all configured middlewares and adapters. If it cannot load a required dependency
        # (e.g. `httpx`), it'll fail fast with a clear error.
        #
        # Without this, we would instead get an error when the client was used to make
        # a request for the first time, which isn't as ideal.
        @raw_client.transport.transport.connections.each { |c| c.connection.app }
      end

      # Cluster APIs

      # Returns the result of the client's `cluster.health` call.
      def get_cluster_health
        transform_errors { |c| c.cluster.health }
      end

      # Returns the result of the client's `nodes.stats` call, restricted to the `os` metric.
      def get_node_os_stats
        transform_errors { |c| c.nodes.stats(metric: "os") }
      end

      # Returns the cluster settings, requested with `flat_settings: true`.
      def get_flat_cluster_settings
        transform_errors { |c| c.cluster.get_settings(flat_settings: true) }
      end

      # We only support persistent settings here because the Elasticsearch docs recommend against using transient settings:
      # https://www.elastic.co/guide/en/elasticsearch/reference/8.13/cluster-update-settings.html
      #
      # > We no longer recommend using transient cluster settings. Use persistent cluster settings instead. If a cluster becomes unstable,
      # > transient settings can clear unexpectedly, resulting in a potentially undesired cluster configuration.
      #
      # The OpenSearch documentation doesn't specifically mention this, but the same principle applies.
      def put_persistent_cluster_settings(settings)
        transform_errors { |c| c.cluster.put_settings(body: {persistent: settings}) }
      end

      # Script APIs

      # Gets the script with the given ID. Returns `nil` if the script does not exist.
      def get_script(id:)
        transform_errors { |c| c.get_script(id: id) }
      rescue ::OpenSearch::Transport::Transport::Errors::NotFound
        nil
      end

      # Stores the script `body` under `id` for the given `context`.
      def put_script(id:, body:, context:)
        transform_errors { |c| c.put_script(id: id, body: body, context: context) }
      end

      # Deletes the script with the given ID. Returns `nil` when the script does not exist.
      def delete_script(id:)
        transform_errors { |c| c.delete_script(id: id) }
      rescue ::OpenSearch::Transport::Transport::Errors::NotFound
        # it's ok if it's already not there.
        nil
      end

      # Index Template APIs

      # Gets the index template with the given name, with its settings in flattened form.
      #
      # Returns `{}` when the datastore reports the template as not found, or when none of the returned
      # templates has exactly the requested name. Only the requested template is inspected, so unrelated
      # templates in the response cannot cause a failure, and a template that defines no `template` or
      # `settings` section is returned unchanged rather than raising a `KeyError`.
      def get_index_template(index_template_name)
        transform_errors do |client|
          matching_entry = client.indices.get_index_template(name: index_template_name)
            .fetch("index_templates")
            .find { |entry| entry.fetch("name") == index_template_name }

          matching_entry ? with_flattened_settings(matching_entry.fetch("index_template")) : {}
        end
      rescue ::OpenSearch::Transport::Transport::Errors::NotFound
        {}
      end

      # Creates or updates the index template `name` using `body`.
      def put_index_template(name:, body:)
        transform_errors { |c| c.indices.put_index_template(name: name, body: body) }
      end

      # Deletes the named index template. A 404 response is ignored (`ignore: [404]`).
      def delete_index_template(index_template_name)
        transform_errors { |c| c.indices.delete_index_template(name: [index_template_name], ignore: [404]) }
      end

      # Index APIs

      # Gets the named index (requested with flattened settings). Returns `{}` when the response has no
      # entry for `index_name`; `ignore_unavailable: true` is passed on the request.
      def get_index(index_name)
        transform_errors do |client|
          client.indices.get(
            index: index_name,
            ignore_unavailable: true,
            flat_settings: true
          )[index_name] || {}
        end
      end

      # Returns the names of the indices matching `index_expression`, using the `cat.indices` API.
      def list_indices_matching(index_expression)
        transform_errors do |client|
          client
            .cat
            .indices(index: index_expression, format: "json", h: ["index"])
            .map { |index_hash| index_hash.fetch("index") }
        end
      end

      # Creates the index `index` using `body`.
      def create_index(index:, body:)
        transform_errors { |c| c.indices.create(index: index, body: body) }
      end

      # Updates the mapping of `index` using `body`.
      def put_index_mapping(index:, body:)
        transform_errors { |c| c.indices.put_mapping(index: index, body: body) }
      end

      # Updates the settings of `index` using `body`.
      def put_index_settings(index:, body:)
        transform_errors { |c| c.indices.put_settings(index: index, body: body) }
      end

      # Deletes the given indices, tolerating names or wildcards that match nothing.
      def delete_indices(*index_names)
        # `allow_no_indices: true` is needed when we attempt to delete a non-existing index to avoid errors. For rollover indices,
        # when we delete the actual indices, we will always perform a wildcard deletion, and `allow_no_indices: true` is needed.
        #
        # Note that the Elasticsearch API documentation[^1] says that `allow_no_indices` defaults to `true` but an Elasticsearch Ruby
        # client code comment[^2] says it defaults to `false`. Regardless, we don't want to rely on the default behavior that could change.
        #
        # [^1]: https://www.elastic.co/guide/en/elasticsearch/reference/8.12/indices-delete-index.html#delete-index-api-query-params
        # [^2]: https://github.com/elastic/elasticsearch-ruby/blob/8.12/elasticsearch-api/lib/elasticsearch/api/actions/indices/delete.rb#L31
        transform_errors do |client|
          client.indices.delete(index: index_names, ignore_unavailable: true, allow_no_indices: true)
        end
      end

      # Document APIs

      # Performs a multi-search with the given `body`, forwarding `headers` to the client.
      def msearch(body:, headers: nil)
        transform_errors { |c| c.msearch(body: body, headers: headers) }
      end

      # Performs a bulk request with the given `body`. The response is filtered using
      # `DATASTORE_BULK_FILTER_PATH`, and `refresh` is forwarded to the client.
      def bulk(body:, refresh: false)
        transform_errors { |c| c.bulk(body: body, filter_path: DATASTORE_BULK_FILTER_PATH, refresh: refresh) }
      end

      # Synchronously deletes all documents in the cluster. Intended for tests to give ourselves a clean slate.
      # Supports an `index` argument so the caller can limit the deletion to a specific "scope" (e.g. a set of indices with a common prefix).
      #
      # Overrides `scroll` to `10s` to avoid getting a "Trying to create too many scroll contexts" error, as discussed here:
      # https://discuss.elastic.co/t/too-many-scroll-contexts-with-update-by-query-and-or-delete-by-query/282325/1
      def delete_all_documents(index: "_all")
        transform_errors { |c| c.delete_by_query(index: index, body: {query: {match_all: _ = {}}}, refresh: true, scroll: "10s") }
      end

      private

      # Yields the raw OpenSearch client and returns the block's result. A `BadRequest` error from the
      # client is re-raised as `BadDatastoreRequest` carrying the same message.
      def transform_errors
        yield @raw_client
      rescue ::OpenSearch::Transport::Transport::Errors::BadRequest => ex
        raise BadDatastoreRequest, ex.message
      end

      # OpenSearch ignores `flat_settings` on the `/_index_template` API (but _only_ returns flattened settings from the index
      # API). Here we flatten the settings to align with the flattened form ElasticGraph expects and uses everywhere.
      #
      # Returns a copy of `index_template` with flattened `template.settings`, or `index_template` itself
      # when it has no `template` section or the section has no `settings`.
      def with_flattened_settings(index_template)
        template = index_template["template"]
        settings = template && template["settings"]
        return index_template unless settings

        index_template.merge({
          "template" => template.merge({
            "settings" => Support::HashUtil.flatten_and_stringify_keys(settings)
          })
        })
      end
    end
  end
end
metadata ADDED
@@ -0,0 +1,290 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: elasticgraph-opensearch
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.18.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Myron Marston
8
+ autorequire:
9
+ bindir: exe
10
+ cert_chain: []
11
+ date: 2024-08-27 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: rubocop-factory_bot
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '2.26'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '2.26'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rubocop-rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '0.6'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '0.6'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rubocop-rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '3.0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: '3.0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: standard
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - "~>"
60
+ - !ruby/object:Gem::Version
61
+ version: 1.39.0
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - "~>"
67
+ - !ruby/object:Gem::Version
68
+ version: 1.39.0
69
+ - !ruby/object:Gem::Dependency
70
+ name: steep
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - "~>"
74
+ - !ruby/object:Gem::Version
75
+ version: '1.7'
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - "~>"
81
+ - !ruby/object:Gem::Version
82
+ version: '1.7'
83
+ - !ruby/object:Gem::Dependency
84
+ name: coderay
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - "~>"
88
+ - !ruby/object:Gem::Version
89
+ version: '1.1'
90
+ type: :development
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - "~>"
95
+ - !ruby/object:Gem::Version
96
+ version: '1.1'
97
+ - !ruby/object:Gem::Dependency
98
+ name: flatware-rspec
99
+ requirement: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - ">="
102
+ - !ruby/object:Gem::Version
103
+ version: 2.3.2
104
+ - - "<"
105
+ - !ruby/object:Gem::Version
106
+ version: '3.0'
107
+ type: :development
108
+ prerelease: false
109
+ version_requirements: !ruby/object:Gem::Requirement
110
+ requirements:
111
+ - - ">="
112
+ - !ruby/object:Gem::Version
113
+ version: 2.3.2
114
+ - - "<"
115
+ - !ruby/object:Gem::Version
116
+ version: '3.0'
117
+ - !ruby/object:Gem::Dependency
118
+ name: rspec
119
+ requirement: !ruby/object:Gem::Requirement
120
+ requirements:
121
+ - - "~>"
122
+ - !ruby/object:Gem::Version
123
+ version: '3.13'
124
+ type: :development
125
+ prerelease: false
126
+ version_requirements: !ruby/object:Gem::Requirement
127
+ requirements:
128
+ - - "~>"
129
+ - !ruby/object:Gem::Version
130
+ version: '3.13'
131
+ - !ruby/object:Gem::Dependency
132
+ name: super_diff
133
+ requirement: !ruby/object:Gem::Requirement
134
+ requirements:
135
+ - - ">="
136
+ - !ruby/object:Gem::Version
137
+ version: 0.12.1
138
+ type: :development
139
+ prerelease: false
140
+ version_requirements: !ruby/object:Gem::Requirement
141
+ requirements:
142
+ - - ">="
143
+ - !ruby/object:Gem::Version
144
+ version: 0.12.1
145
+ - !ruby/object:Gem::Dependency
146
+ name: simplecov
147
+ requirement: !ruby/object:Gem::Requirement
148
+ requirements:
149
+ - - "~>"
150
+ - !ruby/object:Gem::Version
151
+ version: '0.22'
152
+ type: :development
153
+ prerelease: false
154
+ version_requirements: !ruby/object:Gem::Requirement
155
+ requirements:
156
+ - - "~>"
157
+ - !ruby/object:Gem::Version
158
+ version: '0.22'
159
+ - !ruby/object:Gem::Dependency
160
+ name: simplecov-console
161
+ requirement: !ruby/object:Gem::Requirement
162
+ requirements:
163
+ - - ">="
164
+ - !ruby/object:Gem::Version
165
+ version: 0.9.1
166
+ - - "<"
167
+ - !ruby/object:Gem::Version
168
+ version: '1.0'
169
+ type: :development
170
+ prerelease: false
171
+ version_requirements: !ruby/object:Gem::Requirement
172
+ requirements:
173
+ - - ">="
174
+ - !ruby/object:Gem::Version
175
+ version: 0.9.1
176
+ - - "<"
177
+ - !ruby/object:Gem::Version
178
+ version: '1.0'
179
+ - !ruby/object:Gem::Dependency
180
+ name: elasticgraph-support
181
+ requirement: !ruby/object:Gem::Requirement
182
+ requirements:
183
+ - - '='
184
+ - !ruby/object:Gem::Version
185
+ version: 0.18.0.0
186
+ type: :runtime
187
+ prerelease: false
188
+ version_requirements: !ruby/object:Gem::Requirement
189
+ requirements:
190
+ - - '='
191
+ - !ruby/object:Gem::Version
192
+ version: 0.18.0.0
193
+ - !ruby/object:Gem::Dependency
194
+ name: faraday
195
+ requirement: !ruby/object:Gem::Requirement
196
+ requirements:
197
+ - - "~>"
198
+ - !ruby/object:Gem::Version
199
+ version: '2.10'
200
+ type: :runtime
201
+ prerelease: false
202
+ version_requirements: !ruby/object:Gem::Requirement
203
+ requirements:
204
+ - - "~>"
205
+ - !ruby/object:Gem::Version
206
+ version: '2.10'
207
+ - !ruby/object:Gem::Dependency
208
+ name: faraday-retry
209
+ requirement: !ruby/object:Gem::Requirement
210
+ requirements:
211
+ - - "~>"
212
+ - !ruby/object:Gem::Version
213
+ version: '2.2'
214
+ type: :runtime
215
+ prerelease: false
216
+ version_requirements: !ruby/object:Gem::Requirement
217
+ requirements:
218
+ - - "~>"
219
+ - !ruby/object:Gem::Version
220
+ version: '2.2'
221
+ - !ruby/object:Gem::Dependency
222
+ name: opensearch-ruby
223
+ requirement: !ruby/object:Gem::Requirement
224
+ requirements:
225
+ - - "~>"
226
+ - !ruby/object:Gem::Version
227
+ version: '3.1'
228
+ type: :runtime
229
+ prerelease: false
230
+ version_requirements: !ruby/object:Gem::Requirement
231
+ requirements:
232
+ - - "~>"
233
+ - !ruby/object:Gem::Version
234
+ version: '3.1'
235
+ - !ruby/object:Gem::Dependency
236
+ name: httpx
237
+ requirement: !ruby/object:Gem::Requirement
238
+ requirements:
239
+ - - ">="
240
+ - !ruby/object:Gem::Version
241
+ version: 1.2.6
242
+ - - "<"
243
+ - !ruby/object:Gem::Version
244
+ version: '2.0'
245
+ type: :development
246
+ prerelease: false
247
+ version_requirements: !ruby/object:Gem::Requirement
248
+ requirements:
249
+ - - ">="
250
+ - !ruby/object:Gem::Version
251
+ version: 1.2.6
252
+ - - "<"
253
+ - !ruby/object:Gem::Version
254
+ version: '2.0'
255
+ description:
256
+ email:
257
+ - myron@squareup.com
258
+ executables: []
259
+ extensions: []
260
+ extra_rdoc_files: []
261
+ files:
262
+ - LICENSE.txt
263
+ - README.md
264
+ - elasticgraph-opensearch.gemspec
265
+ - lib/elastic_graph/opensearch/client.rb
266
+ homepage:
267
+ licenses:
268
+ - MIT
269
+ metadata:
270
+ gem_category: datastore_adapter
271
+ post_install_message:
272
+ rdoc_options: []
273
+ require_paths:
274
+ - lib
275
+ required_ruby_version: !ruby/object:Gem::Requirement
276
+ requirements:
277
+ - - "~>"
278
+ - !ruby/object:Gem::Version
279
+ version: '3.2'
280
+ required_rubygems_version: !ruby/object:Gem::Requirement
281
+ requirements:
282
+ - - ">="
283
+ - !ruby/object:Gem::Version
284
+ version: '0'
285
+ requirements: []
286
+ rubygems_version: 3.5.9
287
+ signing_key:
288
+ specification_version: 4
289
+ summary: Wraps the OpenSearch client for use by ElasticGraph.
290
+ test_files: []