elasticgraph-opensearch 0.18.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA256:
3
+ metadata.gz: af83310eb66d78a17317a02ba1c62e052dead3d24a3ea7882d3593eb650a88a2
4
+ data.tar.gz: f80f785ba656811a3f1464b70621cd35bbaf5dcd77172f58c3b6b5e59ca6b5b3
5
+ SHA512:
6
+ metadata.gz: 4d0c0bd2a60b02c9dce6ac6da9ef5a60a7441631491a877749b7f7780eef899972bc7b0698f277a3a804ad9e234ec589cc4402533a99d3f2633142cf6805ed0d
7
+ data.tar.gz: 554632704faac8a60529f59a87718af041b3f890ce833c660f5ad169e5173cce6f92995bf4fb629651ed274c2423733f5bae1286417af23498358a2b4ff848c7
data/LICENSE.txt ADDED
@@ -0,0 +1,21 @@
1
+ The MIT License (MIT)
2
+
3
+ Copyright (c) 2024 Block, Inc.
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in
13
+ all copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,3 @@
1
+ # ElasticGraph::OpenSearch
2
+
3
+ Wraps the official OpenSearch client for use by ElasticGraph.
@@ -0,0 +1,20 @@
1
+ # Copyright 2024 Block, Inc.
2
+ #
3
+ # Use of this source code is governed by an MIT-style
4
+ # license that can be found in the LICENSE file or at
5
+ # https://opensource.org/licenses/MIT.
6
+ #
7
+ # frozen_string_literal: true
8
+
9
+ require_relative "../gemspec_helper"
10
+
11
+ ElasticGraphGemspecHelper.define_elasticgraph_gem(gemspec_file: __FILE__, category: :datastore_adapter) do |spec, eg_version|
12
+ spec.summary = "Wraps the OpenSearch client for use by ElasticGraph."
13
+
14
+ spec.add_dependency "elasticgraph-support", eg_version
15
+ spec.add_dependency "faraday", "~> 2.10"
16
+ spec.add_dependency "faraday-retry", "~> 2.2"
17
+ spec.add_dependency "opensearch-ruby", "~> 3.1"
18
+
19
+ spec.add_development_dependency "httpx", ">= 1.2.6", "< 2.0"
20
+ end
@@ -0,0 +1,218 @@
1
+ # Copyright 2024 Block, Inc.
2
+ #
3
+ # Use of this source code is governed by an MIT-style
4
+ # license that can be found in the LICENSE file or at
5
+ # https://opensource.org/licenses/MIT.
6
+ #
7
+ # frozen_string_literal: true
8
+
9
+ require "elastic_graph/constants"
10
+ require "elastic_graph/error"
11
+ require "elastic_graph/support/faraday_middleware/msearch_using_get_instead_of_post"
12
+ require "elastic_graph/support/faraday_middleware/support_timeouts"
13
+ require "elastic_graph/support/hash_util"
14
+ require "faraday"
15
+ require "faraday/retry"
16
+ require "opensearch"
17
+
18
+ module ElasticGraph
19
+ module OpenSearch
20
+ class Client
21
+ # @dynamic cluster_name
22
+ attr_reader :cluster_name
23
+
24
+ def initialize(cluster_name, url:, faraday_adapter: nil, retry_on_failure: 3, logger: nil)
25
+ @cluster_name = cluster_name
26
+
27
+ @raw_client = ::OpenSearch::Client.new(
28
+ adapter: faraday_adapter,
29
+ url: url,
30
+ retry_on_failure: retry_on_failure,
31
+ # We use `logger` for both the tracer and logger to log everything we can. While the trace and log output do overlap, one is
32
+ # not a strict superset of the other (for example, warnings go to `logger`, while full request bodies go to `tracer`).
33
+ logger: logger,
34
+ tracer: logger
35
+ ) do |faraday|
36
+ faraday.use Support::FaradayMiddleware::MSearchUsingGetInsteadOfPost
37
+ faraday.use Support::FaradayMiddleware::SupportTimeouts
38
+
39
+ # Note: this overrides the default retry exceptions, which include `Faraday::TimeoutError`.
40
+ # That's important because we do NOT want a retry on timeout -- a timeout indicates a slow,
41
+ # expensive query, and is transformed to a `RequestExceededDeadlineError` by `SupportTimeouts`,
42
+ # anyway.
43
+ #
44
+ # In addition, it's worth noting that the retry middleware ONLY retries known idempotent HTTP
45
+ # methods (e.g. get/put/delete/head/options). POST requests will not be retried. We could
46
+ # configure it to make it retry POSTs but we'd need to do an analysis of all ElasticGraph requests to
47
+ # make sure all POST requests are truly idempotent, and at least for now, it's sufficient to skip
48
+ # any POST requests we make.
49
+ faraday.request :retry,
50
+ exceptions: [::Faraday::ConnectionFailed, ::Faraday::RetriableResponse],
51
+ max: retry_on_failure,
52
+ retry_statuses: [500, 502, 503] # Internal Server Error, Bad Gateway, Service Unavailable
53
+
54
+ yield faraday if block_given?
55
+ end
56
+
57
+ # Here we call `app` on each Faraday connection as a way to force it to resolve
58
+ # all configured middlewares and adapters. If it cannot load a required dependency
59
+ # (e.g. `httpx`), it'll fail fast with a clear error.
60
+ #
61
+ # Without this, we would instead get an error when the client was used to make
62
+ # a request for the first time, which is less ideal.
63
+ @raw_client.transport.transport.connections.each { |c| c.connection.app }
64
+ end
65
+
66
+ # Cluster APIs
67
+
68
+ def get_cluster_health
69
+ transform_errors { |c| c.cluster.health }
70
+ end
71
+
72
+ def get_node_os_stats
73
+ transform_errors { |c| c.nodes.stats(metric: "os") }
74
+ end
75
+
76
+ def get_flat_cluster_settings
77
+ transform_errors { |c| c.cluster.get_settings(flat_settings: true) }
78
+ end
79
+
80
+ # We only support persistent settings here because the Elasticsearch docs recommend against using transient settings:
81
+ # https://www.elastic.co/guide/en/elasticsearch/reference/8.13/cluster-update-settings.html
82
+ #
83
+ # > We no longer recommend using transient cluster settings. Use persistent cluster settings instead. If a cluster becomes unstable,
84
+ # > transient settings can clear unexpectedly, resulting in a potentially undesired cluster configuration.
85
+ #
86
+ # The OpenSearch documentation doesn't specifically mention this, but the same principle applies.
87
+ def put_persistent_cluster_settings(settings)
88
+ transform_errors { |c| c.cluster.put_settings(body: {persistent: settings}) }
89
+ end
90
+
91
+ # Script APIs
92
+
93
+ # Gets the script with the given ID. Returns `nil` if the script does not exist.
94
+ def get_script(id:)
95
+ transform_errors { |c| c.get_script(id: id) }
96
+ rescue ::OpenSearch::Transport::Transport::Errors::NotFound
97
+ nil
98
+ end
99
+
100
+ def put_script(id:, body:, context:)
101
+ transform_errors { |c| c.put_script(id: id, body: body, context: context) }
102
+ end
103
+
104
+ def delete_script(id:)
105
+ transform_errors { |c| c.delete_script(id: id) }
106
+ rescue ::OpenSearch::Transport::Transport::Errors::NotFound
107
+ # It's OK if the script does not exist; there is nothing to delete.
108
+ end
109
+
110
+ # Index Template APIs
111
+
112
+ def get_index_template(index_template_name)
113
+ transform_errors do |client|
114
+ client.indices.get_index_template(name: index_template_name)
115
+ .fetch("index_templates").to_h do |entry|
116
+ index_template = entry.fetch("index_template")
117
+
118
+ # OpenSearch ignores `flat_settings` on the `/_index_template` API (but _only_ returns flattened settings from the index
119
+ # API). Here we flatten the settings to align with the flattened form ElasticGraph expects and uses everywhere.
120
+ flattened_settings = Support::HashUtil.flatten_and_stringify_keys(index_template.fetch("template").fetch("settings"))
121
+
122
+ index_template = index_template.merge({
123
+ "template" => index_template.fetch("template").merge({
124
+ "settings" => flattened_settings
125
+ })
126
+ })
127
+
128
+ [entry.fetch("name"), index_template]
129
+ end.dig(index_template_name) || {}
130
+ end
131
+ rescue ::OpenSearch::Transport::Transport::Errors::NotFound
132
+ {}
133
+ end
134
+
135
+ def put_index_template(name:, body:)
136
+ transform_errors { |c| c.indices.put_index_template(name: name, body: body) }
137
+ end
138
+
139
+ def delete_index_template(index_template_name)
140
+ transform_errors { |c| c.indices.delete_index_template(name: [index_template_name], ignore: [404]) }
141
+ end
142
+
143
+ # Index APIs
144
+
145
+ def get_index(index_name)
146
+ transform_errors do |client|
147
+ client.indices.get(
148
+ index: index_name,
149
+ ignore_unavailable: true,
150
+ flat_settings: true
151
+ )[index_name] || {}
152
+ end
153
+ end
154
+
155
+ def list_indices_matching(index_expression)
156
+ transform_errors do |client|
157
+ client
158
+ .cat
159
+ .indices(index: index_expression, format: "json", h: ["index"])
160
+ .map { |index_hash| index_hash.fetch("index") }
161
+ end
162
+ end
163
+
164
+ def create_index(index:, body:)
165
+ transform_errors { |c| c.indices.create(index: index, body: body) }
166
+ end
167
+
168
+ def put_index_mapping(index:, body:)
169
+ transform_errors { |c| c.indices.put_mapping(index: index, body: body) }
170
+ end
171
+
172
+ def put_index_settings(index:, body:)
173
+ transform_errors { |c| c.indices.put_settings(index: index, body: body) }
174
+ end
175
+
176
+ def delete_indices(*index_names)
177
+ # `allow_no_indices: true` is needed when we attempt to delete a non-existing index to avoid errors. For rollover indices,
178
+ # when we delete the actual indices, we will always perform a wildcard deletion, and `allow_no_indices: true` is needed.
179
+ #
180
+ # Note that the Elasticsearch API documentation[^1] says that `allow_no_indices` defaults to `true` but an Elasticsearch Ruby
181
+ # client code comment[^2] says it defaults to `false`. Regardless, we don't want to rely on the default behavior that could change.
182
+ #
183
+ # [^1]: https://www.elastic.co/guide/en/elasticsearch/reference/8.12/indices-delete-index.html#delete-index-api-query-params
184
+ # [^2]: https://github.com/elastic/elasticsearch-ruby/blob/8.12/elasticsearch-api/lib/elasticsearch/api/actions/indices/delete.rb#L31
185
+ transform_errors do |client|
186
+ client.indices.delete(index: index_names, ignore_unavailable: true, allow_no_indices: true)
187
+ end
188
+ end
189
+
190
+ # Document APIs
191
+
192
+ def msearch(body:, headers: nil)
193
+ transform_errors { |c| c.msearch(body: body, headers: headers) }
194
+ end
195
+
196
+ def bulk(body:, refresh: false)
197
+ transform_errors { |c| c.bulk(body: body, filter_path: DATASTORE_BULK_FILTER_PATH, refresh: refresh) }
198
+ end
199
+
200
+ # Synchronously deletes all documents in the cluster. Intended for tests to give ourselves a clean slate.
201
+ # Supports an `index` argument so the caller can limit the deletion to a specific "scope" (e.g. a set of indices with a common prefix).
202
+ #
203
+ # Overrides `scroll` to `10s` to avoid getting a "Trying to create too many scroll contexts" error, as discussed here:
204
+ # https://discuss.elastic.co/t/too-many-scroll-contexts-with-update-by-query-and-or-delete-by-query/282325/1
205
+ def delete_all_documents(index: "_all")
206
+ transform_errors { |c| c.delete_by_query(index: index, body: {query: {match_all: _ = {}}}, refresh: true, scroll: "10s") }
207
+ end
208
+
209
+ private
210
+
211
+ def transform_errors
212
+ yield @raw_client
213
+ rescue ::OpenSearch::Transport::Transport::Errors::BadRequest => ex
214
+ raise BadDatastoreRequest, ex.message
215
+ end
216
+ end
217
+ end
218
+ end
metadata ADDED
@@ -0,0 +1,290 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: elasticgraph-opensearch
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.18.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Myron Marston
8
+ autorequire:
9
+ bindir: exe
10
+ cert_chain: []
11
+ date: 2024-08-27 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: rubocop-factory_bot
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '2.26'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '2.26'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rubocop-rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '0.6'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '0.6'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rubocop-rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '3.0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: '3.0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: standard
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - "~>"
60
+ - !ruby/object:Gem::Version
61
+ version: 1.39.0
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - "~>"
67
+ - !ruby/object:Gem::Version
68
+ version: 1.39.0
69
+ - !ruby/object:Gem::Dependency
70
+ name: steep
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - "~>"
74
+ - !ruby/object:Gem::Version
75
+ version: '1.7'
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - "~>"
81
+ - !ruby/object:Gem::Version
82
+ version: '1.7'
83
+ - !ruby/object:Gem::Dependency
84
+ name: coderay
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - "~>"
88
+ - !ruby/object:Gem::Version
89
+ version: '1.1'
90
+ type: :development
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - "~>"
95
+ - !ruby/object:Gem::Version
96
+ version: '1.1'
97
+ - !ruby/object:Gem::Dependency
98
+ name: flatware-rspec
99
+ requirement: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - ">="
102
+ - !ruby/object:Gem::Version
103
+ version: 2.3.2
104
+ - - "<"
105
+ - !ruby/object:Gem::Version
106
+ version: '3.0'
107
+ type: :development
108
+ prerelease: false
109
+ version_requirements: !ruby/object:Gem::Requirement
110
+ requirements:
111
+ - - ">="
112
+ - !ruby/object:Gem::Version
113
+ version: 2.3.2
114
+ - - "<"
115
+ - !ruby/object:Gem::Version
116
+ version: '3.0'
117
+ - !ruby/object:Gem::Dependency
118
+ name: rspec
119
+ requirement: !ruby/object:Gem::Requirement
120
+ requirements:
121
+ - - "~>"
122
+ - !ruby/object:Gem::Version
123
+ version: '3.13'
124
+ type: :development
125
+ prerelease: false
126
+ version_requirements: !ruby/object:Gem::Requirement
127
+ requirements:
128
+ - - "~>"
129
+ - !ruby/object:Gem::Version
130
+ version: '3.13'
131
+ - !ruby/object:Gem::Dependency
132
+ name: super_diff
133
+ requirement: !ruby/object:Gem::Requirement
134
+ requirements:
135
+ - - ">="
136
+ - !ruby/object:Gem::Version
137
+ version: 0.12.1
138
+ type: :development
139
+ prerelease: false
140
+ version_requirements: !ruby/object:Gem::Requirement
141
+ requirements:
142
+ - - ">="
143
+ - !ruby/object:Gem::Version
144
+ version: 0.12.1
145
+ - !ruby/object:Gem::Dependency
146
+ name: simplecov
147
+ requirement: !ruby/object:Gem::Requirement
148
+ requirements:
149
+ - - "~>"
150
+ - !ruby/object:Gem::Version
151
+ version: '0.22'
152
+ type: :development
153
+ prerelease: false
154
+ version_requirements: !ruby/object:Gem::Requirement
155
+ requirements:
156
+ - - "~>"
157
+ - !ruby/object:Gem::Version
158
+ version: '0.22'
159
+ - !ruby/object:Gem::Dependency
160
+ name: simplecov-console
161
+ requirement: !ruby/object:Gem::Requirement
162
+ requirements:
163
+ - - ">="
164
+ - !ruby/object:Gem::Version
165
+ version: 0.9.1
166
+ - - "<"
167
+ - !ruby/object:Gem::Version
168
+ version: '1.0'
169
+ type: :development
170
+ prerelease: false
171
+ version_requirements: !ruby/object:Gem::Requirement
172
+ requirements:
173
+ - - ">="
174
+ - !ruby/object:Gem::Version
175
+ version: 0.9.1
176
+ - - "<"
177
+ - !ruby/object:Gem::Version
178
+ version: '1.0'
179
+ - !ruby/object:Gem::Dependency
180
+ name: elasticgraph-support
181
+ requirement: !ruby/object:Gem::Requirement
182
+ requirements:
183
+ - - '='
184
+ - !ruby/object:Gem::Version
185
+ version: 0.18.0.0
186
+ type: :runtime
187
+ prerelease: false
188
+ version_requirements: !ruby/object:Gem::Requirement
189
+ requirements:
190
+ - - '='
191
+ - !ruby/object:Gem::Version
192
+ version: 0.18.0.0
193
+ - !ruby/object:Gem::Dependency
194
+ name: faraday
195
+ requirement: !ruby/object:Gem::Requirement
196
+ requirements:
197
+ - - "~>"
198
+ - !ruby/object:Gem::Version
199
+ version: '2.10'
200
+ type: :runtime
201
+ prerelease: false
202
+ version_requirements: !ruby/object:Gem::Requirement
203
+ requirements:
204
+ - - "~>"
205
+ - !ruby/object:Gem::Version
206
+ version: '2.10'
207
+ - !ruby/object:Gem::Dependency
208
+ name: faraday-retry
209
+ requirement: !ruby/object:Gem::Requirement
210
+ requirements:
211
+ - - "~>"
212
+ - !ruby/object:Gem::Version
213
+ version: '2.2'
214
+ type: :runtime
215
+ prerelease: false
216
+ version_requirements: !ruby/object:Gem::Requirement
217
+ requirements:
218
+ - - "~>"
219
+ - !ruby/object:Gem::Version
220
+ version: '2.2'
221
+ - !ruby/object:Gem::Dependency
222
+ name: opensearch-ruby
223
+ requirement: !ruby/object:Gem::Requirement
224
+ requirements:
225
+ - - "~>"
226
+ - !ruby/object:Gem::Version
227
+ version: '3.1'
228
+ type: :runtime
229
+ prerelease: false
230
+ version_requirements: !ruby/object:Gem::Requirement
231
+ requirements:
232
+ - - "~>"
233
+ - !ruby/object:Gem::Version
234
+ version: '3.1'
235
+ - !ruby/object:Gem::Dependency
236
+ name: httpx
237
+ requirement: !ruby/object:Gem::Requirement
238
+ requirements:
239
+ - - ">="
240
+ - !ruby/object:Gem::Version
241
+ version: 1.2.6
242
+ - - "<"
243
+ - !ruby/object:Gem::Version
244
+ version: '2.0'
245
+ type: :development
246
+ prerelease: false
247
+ version_requirements: !ruby/object:Gem::Requirement
248
+ requirements:
249
+ - - ">="
250
+ - !ruby/object:Gem::Version
251
+ version: 1.2.6
252
+ - - "<"
253
+ - !ruby/object:Gem::Version
254
+ version: '2.0'
255
+ description:
256
+ email:
257
+ - myron@squareup.com
258
+ executables: []
259
+ extensions: []
260
+ extra_rdoc_files: []
261
+ files:
262
+ - LICENSE.txt
263
+ - README.md
264
+ - elasticgraph-opensearch.gemspec
265
+ - lib/elastic_graph/opensearch/client.rb
266
+ homepage:
267
+ licenses:
268
+ - MIT
269
+ metadata:
270
+ gem_category: datastore_adapter
271
+ post_install_message:
272
+ rdoc_options: []
273
+ require_paths:
274
+ - lib
275
+ required_ruby_version: !ruby/object:Gem::Requirement
276
+ requirements:
277
+ - - "~>"
278
+ - !ruby/object:Gem::Version
279
+ version: '3.2'
280
+ required_rubygems_version: !ruby/object:Gem::Requirement
281
+ requirements:
282
+ - - ">="
283
+ - !ruby/object:Gem::Version
284
+ version: '0'
285
+ requirements: []
286
+ rubygems_version: 3.5.9
287
+ signing_key:
288
+ specification_version: 4
289
+ summary: Wraps the OpenSearch client for use by ElasticGraph.
290
+ test_files: []