elasticsearch 9.1.3__py3-none-any.whl → 9.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (60)
  1. elasticsearch/_async/client/__init__.py +91 -24
  2. elasticsearch/_async/client/async_search.py +7 -0
  3. elasticsearch/_async/client/autoscaling.py +7 -0
  4. elasticsearch/_async/client/cat.py +8 -1
  5. elasticsearch/_async/client/cluster.py +7 -7
  6. elasticsearch/_async/client/eql.py +7 -0
  7. elasticsearch/_async/client/esql.py +26 -3
  8. elasticsearch/_async/client/indices.py +153 -7
  9. elasticsearch/_async/client/inference.py +315 -42
  10. elasticsearch/_async/client/ingest.py +8 -0
  11. elasticsearch/_async/client/license.py +4 -2
  12. elasticsearch/_async/client/ml.py +2 -2
  13. elasticsearch/_async/client/nodes.py +2 -4
  14. elasticsearch/_async/client/project.py +68 -0
  15. elasticsearch/_async/client/security.py +39 -0
  16. elasticsearch/_async/client/shutdown.py +6 -0
  17. elasticsearch/_async/client/simulate.py +8 -0
  18. elasticsearch/_async/client/snapshot.py +20 -10
  19. elasticsearch/_async/client/sql.py +7 -0
  20. elasticsearch/_async/client/streams.py +2 -3
  21. elasticsearch/_async/helpers.py +28 -15
  22. elasticsearch/_sync/client/__init__.py +91 -24
  23. elasticsearch/_sync/client/async_search.py +7 -0
  24. elasticsearch/_sync/client/autoscaling.py +7 -0
  25. elasticsearch/_sync/client/cat.py +8 -1
  26. elasticsearch/_sync/client/cluster.py +7 -7
  27. elasticsearch/_sync/client/eql.py +7 -0
  28. elasticsearch/_sync/client/esql.py +26 -3
  29. elasticsearch/_sync/client/indices.py +153 -7
  30. elasticsearch/_sync/client/inference.py +315 -42
  31. elasticsearch/_sync/client/ingest.py +8 -0
  32. elasticsearch/_sync/client/license.py +4 -2
  33. elasticsearch/_sync/client/ml.py +2 -2
  34. elasticsearch/_sync/client/nodes.py +2 -4
  35. elasticsearch/_sync/client/project.py +68 -0
  36. elasticsearch/_sync/client/security.py +39 -0
  37. elasticsearch/_sync/client/shutdown.py +6 -0
  38. elasticsearch/_sync/client/simulate.py +8 -0
  39. elasticsearch/_sync/client/snapshot.py +20 -10
  40. elasticsearch/_sync/client/sql.py +7 -0
  41. elasticsearch/_sync/client/streams.py +2 -3
  42. elasticsearch/_version.py +2 -2
  43. elasticsearch/client.py +2 -0
  44. elasticsearch/compat.py +2 -15
  45. elasticsearch/dsl/_async/document.py +2 -1
  46. elasticsearch/dsl/_sync/document.py +2 -1
  47. elasticsearch/dsl/document_base.py +38 -13
  48. elasticsearch/dsl/field.py +8 -0
  49. elasticsearch/dsl/pydantic.py +152 -0
  50. elasticsearch/dsl/query.py +5 -1
  51. elasticsearch/dsl/search_base.py +5 -1
  52. elasticsearch/dsl/types.py +37 -9
  53. elasticsearch/esql/esql.py +331 -41
  54. elasticsearch/esql/functions.py +88 -0
  55. elasticsearch/helpers/actions.py +1 -1
  56. {elasticsearch-9.1.3.dist-info → elasticsearch-9.2.1.dist-info}/METADATA +26 -4
  57. {elasticsearch-9.1.3.dist-info → elasticsearch-9.2.1.dist-info}/RECORD +60 -57
  58. {elasticsearch-9.1.3.dist-info → elasticsearch-9.2.1.dist-info}/WHEEL +0 -0
  59. {elasticsearch-9.1.3.dist-info → elasticsearch-9.2.1.dist-info}/licenses/LICENSE +0 -0
  60. {elasticsearch-9.1.3.dist-info → elasticsearch-9.2.1.dist-info}/licenses/NOTICE +0 -0
@@ -104,8 +104,10 @@ class LicenseClient(NamespacedClient):
104
104
  license types. If `false`, this parameter returns platinum for both platinum
105
105
  and enterprise license types. This behavior is maintained for backwards compatibility.
106
106
  This parameter is deprecated and will always be set to true in 8.x.
107
- :param local: Specifies whether to retrieve local information. The default value
108
- is `false`, which means the information is retrieved from the master node.
107
+ :param local: Specifies whether to retrieve local information. From 9.2 onwards
108
+ the default value is `true`, which means the information is retrieved from
109
+ the responding node. In earlier versions the default is `false`, which means
110
+ the information is retrieved from the elected master node.
109
111
  """
110
112
  __path_parts: t.Dict[str, str] = {}
111
113
  __path = "/_license"
@@ -2397,7 +2397,7 @@ class MlClient(NamespacedClient):
2397
2397
  exclude_interim: t.Optional[bool] = None,
2398
2398
  filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
2399
2399
  human: t.Optional[bool] = None,
2400
- overall_score: t.Optional[t.Union[float, str]] = None,
2400
+ overall_score: t.Optional[float] = None,
2401
2401
  pretty: t.Optional[bool] = None,
2402
2402
  start: t.Optional[t.Union[str, t.Any]] = None,
2403
2403
  top_n: t.Optional[int] = None,
@@ -5755,7 +5755,7 @@ class MlClient(NamespacedClient):
5755
5755
  <p>Validate an anomaly detection job.</p>
5756
5756
 
5757
5757
 
5758
- `<https://www.elastic.co/guide/en/machine-learning/9.1/ml-jobs.html>`_
5758
+ `<https://www.elastic.co/guide/en/machine-learning/9.2/ml-jobs.html>`_
5759
5759
 
5760
5760
  :param analysis_config:
5761
5761
  :param analysis_limits:
@@ -368,9 +368,7 @@ class NodesClient(NamespacedClient):
368
368
  human: t.Optional[bool] = None,
369
369
  include_segment_file_sizes: t.Optional[bool] = None,
370
370
  include_unloaded_segments: t.Optional[bool] = None,
371
- level: t.Optional[
372
- t.Union[str, t.Literal["cluster", "indices", "shards"]]
373
- ] = None,
371
+ level: t.Optional[t.Union[str, t.Literal["indices", "node", "shards"]]] = None,
374
372
  pretty: t.Optional[bool] = None,
375
373
  timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
376
374
  types: t.Optional[t.Sequence[str]] = None,
@@ -387,7 +385,7 @@ class NodesClient(NamespacedClient):
387
385
 
388
386
  :param node_id: Comma-separated list of node IDs or names used to limit returned
389
387
  information.
390
- :param metric:
388
+ :param metric: Limits the information returned to the specific metrics.
391
389
  :param index_metric: Limit the information returned for indices metric to the
392
390
  specific index metrics. It can be used only if indices (or all) metric is
393
391
  specified.
@@ -0,0 +1,68 @@
1
+ # Licensed to Elasticsearch B.V. under one or more contributor
2
+ # license agreements. See the NOTICE file distributed with
3
+ # this work for additional information regarding copyright
4
+ # ownership. Elasticsearch B.V. licenses this file to you under
5
+ # the Apache License, Version 2.0 (the "License"); you may
6
+ # not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing,
12
+ # software distributed under the License is distributed on an
13
+ # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
+ # KIND, either express or implied. See the License for the
15
+ # specific language governing permissions and limitations
16
+ # under the License.
17
+
18
+ import typing as t
19
+
20
+ from elastic_transport import ObjectApiResponse
21
+
22
+ from ._base import NamespacedClient
23
+ from .utils import (
24
+ Stability,
25
+ _availability_warning,
26
+ _rewrite_parameters,
27
+ )
28
+
29
+
30
+ class ProjectClient(NamespacedClient):
31
+
32
+ @_rewrite_parameters()
33
+ @_availability_warning(Stability.EXPERIMENTAL)
34
+ def tags(
35
+ self,
36
+ *,
37
+ error_trace: t.Optional[bool] = None,
38
+ filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
39
+ human: t.Optional[bool] = None,
40
+ pretty: t.Optional[bool] = None,
41
+ ) -> ObjectApiResponse[t.Any]:
42
+ """
43
+ .. raw:: html
44
+
45
+ <p>Get tags.</p>
46
+ <p>Get the tags that are defined for the project.</p>
47
+
48
+ """
49
+ __path_parts: t.Dict[str, str] = {}
50
+ __path = "/_project/tags"
51
+ __query: t.Dict[str, t.Any] = {}
52
+ if error_trace is not None:
53
+ __query["error_trace"] = error_trace
54
+ if filter_path is not None:
55
+ __query["filter_path"] = filter_path
56
+ if human is not None:
57
+ __query["human"] = human
58
+ if pretty is not None:
59
+ __query["pretty"] = pretty
60
+ __headers = {"accept": "application/json"}
61
+ return self.perform_request( # type: ignore[return-value]
62
+ "GET",
63
+ __path,
64
+ params=__query,
65
+ headers=__headers,
66
+ endpoint_id="project.tags",
67
+ path_parts=__path_parts,
68
+ )
@@ -2052,6 +2052,45 @@ class SecurityClient(NamespacedClient):
2052
2052
  path_parts=__path_parts,
2053
2053
  )
2054
2054
 
2055
+ @_rewrite_parameters()
2056
+ def get_stats(
2057
+ self,
2058
+ *,
2059
+ error_trace: t.Optional[bool] = None,
2060
+ filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
2061
+ human: t.Optional[bool] = None,
2062
+ pretty: t.Optional[bool] = None,
2063
+ ) -> ObjectApiResponse[t.Any]:
2064
+ """
2065
+ .. raw:: html
2066
+
2067
+ <p>Get security stats.</p>
2068
+ <p>Gather security usage statistics from all node(s) within the cluster.</p>
2069
+
2070
+
2071
+ `<https://www.elastic.co/docs/api/doc/elasticsearch/operation/operation-security-get-stats>`_
2072
+ """
2073
+ __path_parts: t.Dict[str, str] = {}
2074
+ __path = "/_security/stats"
2075
+ __query: t.Dict[str, t.Any] = {}
2076
+ if error_trace is not None:
2077
+ __query["error_trace"] = error_trace
2078
+ if filter_path is not None:
2079
+ __query["filter_path"] = filter_path
2080
+ if human is not None:
2081
+ __query["human"] = human
2082
+ if pretty is not None:
2083
+ __query["pretty"] = pretty
2084
+ __headers = {"accept": "application/json"}
2085
+ return self.perform_request( # type: ignore[return-value]
2086
+ "GET",
2087
+ __path,
2088
+ params=__query,
2089
+ headers=__headers,
2090
+ endpoint_id="security.get_stats",
2091
+ path_parts=__path_parts,
2092
+ )
2093
+
2055
2094
  @_rewrite_parameters(
2056
2095
  body_fields=(
2057
2096
  "grant_type",
@@ -22,6 +22,9 @@ from elastic_transport import ObjectApiResponse
22
22
  from ._base import NamespacedClient
23
23
  from .utils import (
24
24
  SKIP_IN_PATH,
25
+ Stability,
26
+ Visibility,
27
+ _availability_warning,
25
28
  _quote,
26
29
  _rewrite_parameters,
27
30
  )
@@ -30,6 +33,7 @@ from .utils import (
30
33
  class ShutdownClient(NamespacedClient):
31
34
 
32
35
  @_rewrite_parameters()
36
+ @_availability_warning(Stability.STABLE, Visibility.PRIVATE)
33
37
  def delete_node(
34
38
  self,
35
39
  *,
@@ -90,6 +94,7 @@ class ShutdownClient(NamespacedClient):
90
94
  )
91
95
 
92
96
  @_rewrite_parameters()
97
+ @_availability_warning(Stability.STABLE, Visibility.PRIVATE)
93
98
  def get_node(
94
99
  self,
95
100
  *,
@@ -149,6 +154,7 @@ class ShutdownClient(NamespacedClient):
149
154
  @_rewrite_parameters(
150
155
  body_fields=("reason", "type", "allocation_delay", "target_node_name"),
151
156
  )
157
+ @_availability_warning(Stability.STABLE, Visibility.PRIVATE)
152
158
  def put_node(
153
159
  self,
154
160
  *,
@@ -56,6 +56,7 @@ class SimulateClient(NamespacedClient):
56
56
  t.Mapping[str, t.Mapping[str, t.Any]]
57
57
  ] = None,
58
58
  mapping_addition: t.Optional[t.Mapping[str, t.Any]] = None,
59
+ merge_type: t.Optional[t.Union[str, t.Literal["index", "template"]]] = None,
59
60
  pipeline: t.Optional[str] = None,
60
61
  pipeline_substitutions: t.Optional[
61
62
  t.Mapping[str, t.Mapping[str, t.Any]]
@@ -93,6 +94,11 @@ class SimulateClient(NamespacedClient):
93
94
  :param index_template_substitutions: A map of index template names to substitute
94
95
  index template definition objects.
95
96
  :param mapping_addition:
97
+ :param merge_type: The mapping merge type if mapping overrides are being provided
98
+ in mapping_addition. The allowed values are one of index or template. The
99
+ index option merges mappings the way they would be merged into an existing
100
+ index. The template option merges mappings the way they would be merged into
101
+ a template.
96
102
  :param pipeline: The pipeline to use as the default pipeline. This value can
97
103
  be used to override the default pipeline of the index.
98
104
  :param pipeline_substitutions: Pipelines to test. If you don’t specify the `pipeline`
@@ -116,6 +122,8 @@ class SimulateClient(NamespacedClient):
116
122
  __query["filter_path"] = filter_path
117
123
  if human is not None:
118
124
  __query["human"] = human
125
+ if merge_type is not None:
126
+ __query["merge_type"] = merge_type
119
127
  if pipeline is not None:
120
128
  __query["pipeline"] = pipeline
121
129
  if pretty is not None:
@@ -872,35 +872,40 @@ class SnapshotClient(NamespacedClient):
872
872
 
873
873
  :param name: The name of the repository.
874
874
  :param blob_count: The total number of blobs to write to the repository during
875
- the test. For realistic experiments, you should set it to at least `2000`.
875
+ the test. For realistic experiments, set this parameter to at least `2000`.
876
876
  :param concurrency: The number of operations to run concurrently during the test.
877
+ For realistic experiments, leave this parameter unset.
877
878
  :param detailed: Indicates whether to return detailed results, including timing
878
879
  information for every operation performed during the analysis. If false,
879
880
  it returns only a summary of the analysis.
880
881
  :param early_read_node_count: The number of nodes on which to perform an early
881
882
  read operation while writing each blob. Early read operations are only rarely
882
- performed.
883
+ performed. For realistic experiments, leave this parameter unset.
883
884
  :param max_blob_size: The maximum size of a blob to be written during the test.
884
- For realistic experiments, you should set it to at least `2gb`.
885
+ For realistic experiments, set this parameter to at least `2gb`.
885
886
  :param max_total_data_size: An upper limit on the total size of all the blobs
886
- written during the test. For realistic experiments, you should set it to
887
+ written during the test. For realistic experiments, set this parameter to
887
888
  at least `1tb`.
888
889
  :param rare_action_probability: The probability of performing a rare action such
889
- as an early read, an overwrite, or an aborted write on each blob.
890
+ as an early read, an overwrite, or an aborted write on each blob. For realistic
891
+ experiments, leave this parameter unset.
890
892
  :param rarely_abort_writes: Indicates whether to rarely cancel writes before
891
- they complete.
893
+ they complete. For realistic experiments, leave this parameter unset.
892
894
  :param read_node_count: The number of nodes on which to read a blob after writing.
895
+ For realistic experiments, leave this parameter unset.
893
896
  :param register_operation_count: The minimum number of linearizable register
894
- operations to perform in total. For realistic experiments, you should set
895
- it to at least `100`.
897
+ operations to perform in total. For realistic experiments, set this parameter
898
+ to at least `100`.
896
899
  :param seed: The seed for the pseudo-random number generator used to generate
897
900
  the list of operations performed during the test. To repeat the same set
898
901
  of operations in multiple experiments, use the same seed in each experiment.
899
902
  Note that the operations are performed concurrently so might not always happen
900
- in the same order on each run.
903
+ in the same order on each run. For realistic experiments, leave this parameter
904
+ unset.
901
905
  :param timeout: The period of time to wait for the test to complete. If no response
902
906
  is received before the timeout expires, the test is cancelled and returns
903
- an error.
907
+ an error. For realistic experiments, set this parameter sufficiently long
908
+ to allow the test to complete.
904
909
  """
905
910
  if name in SKIP_IN_PATH:
906
911
  raise ValueError("Empty value passed for parameter 'name'")
@@ -1266,6 +1271,11 @@ class SnapshotClient(NamespacedClient):
1266
1271
  <p>If you omit the <code>&lt;snapshot&gt;</code> request path parameter, the request retrieves information only for currently running snapshots.
1267
1272
  This usage is preferred.
1268
1273
  If needed, you can specify <code>&lt;repository&gt;</code> and <code>&lt;snapshot&gt;</code> to retrieve information for specific snapshots, even if they're not currently running.</p>
1274
+ <p>Note that the stats will not be available for any shard snapshots in an ongoing snapshot completed by a node that (even momentarily) left the cluster.
1275
+ Loading the stats from the repository is an expensive operation (see the WARNING below).
1276
+ Therefore the stats values for such shards will be -1 even though the &quot;stage&quot; value will be &quot;DONE&quot;, in order to minimize latency.
1277
+ A &quot;description&quot; field will be present for a shard snapshot completed by a departed node explaining why the shard snapshot's stats results are invalid.
1278
+ Consequently, the total stats for the index will be less than expected due to the missing values from these shards.</p>
1269
1279
  <p>WARNING: Using the API to return the status of any snapshots other than currently running snapshots can be expensive.
1270
1280
  The API requires a read from the repository for each shard in each snapshot.
1271
1281
  For example, if you have 100 snapshots with 1,000 shards each, an API request that includes all snapshots will require 100,000 reads (100 snapshots x 1,000 shards).</p>
@@ -285,6 +285,7 @@ class SqlClient(NamespacedClient):
285
285
  page_timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
286
286
  params: t.Optional[t.Sequence[t.Any]] = None,
287
287
  pretty: t.Optional[bool] = None,
288
+ project_routing: t.Optional[str] = None,
288
289
  query: t.Optional[str] = None,
289
290
  request_timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
290
291
  runtime_mappings: t.Optional[t.Mapping[str, t.Mapping[str, t.Any]]] = None,
@@ -332,6 +333,10 @@ class SqlClient(NamespacedClient):
332
333
  is no longer available. Subsequent scroll requests prolong the lifetime of
333
334
  the scroll cursor by the duration of `page_timeout` in the scroll request.
334
335
  :param params: The values for parameters in the query.
336
+ :param project_routing: Specifies a subset of projects to target for the search
337
+ using project metadata tags in a subset of Lucene query syntax. Allowed Lucene
338
+ queries: the _alias tag and a single value (possibly wildcarded). Examples:
339
+ _alias:my-project _alias:_origin _alias:*pr* Supported in serverless only.
335
340
  :param query: The SQL query to run.
336
341
  :param request_timeout: The timeout before the request fails.
337
342
  :param runtime_mappings: One or more runtime fields for the search request. These
@@ -357,6 +362,8 @@ class SqlClient(NamespacedClient):
357
362
  __query["human"] = human
358
363
  if pretty is not None:
359
364
  __query["pretty"] = pretty
365
+ if project_routing is not None:
366
+ __query["project_routing"] = project_routing
360
367
  if not __body:
361
368
  if allow_partial_search_results is not None:
362
369
  __body["allow_partial_search_results"] = allow_partial_search_results
@@ -15,6 +15,7 @@
15
15
  # specific language governing permissions and limitations
16
16
  # under the License.
17
17
 
18
+
18
19
  import typing as t
19
20
 
20
21
  from elastic_transport import ObjectApiResponse, TextApiResponse
@@ -144,9 +145,7 @@ class StreamsClient(NamespacedClient):
144
145
  error_trace: t.Optional[bool] = None,
145
146
  filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
146
147
  human: t.Optional[bool] = None,
147
- master_timeout: t.Optional[
148
- t.Union[str, t.Literal["d", "h", "m", "micros", "ms", "nanos", "s"]]
149
- ] = None,
148
+ master_timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
150
149
  pretty: t.Optional[bool] = None,
151
150
  ) -> ObjectApiResponse[t.Any]:
152
151
  """
elasticsearch/_version.py CHANGED
@@ -15,5 +15,5 @@
15
15
  # specific language governing permissions and limitations
16
16
  # under the License.
17
17
 
18
- __versionstr__ = "9.1.3"
19
- __es_specification_commit__ = "69144c05ec6727c4ee39aec454f7ad6a57d240fc"
18
+ __versionstr__ = "9.2.1"
19
+ __es_specification_commit__ = "4ab58cf013706c9104d18daafae4361cf7351a55"
elasticsearch/client.py CHANGED
@@ -47,6 +47,7 @@ from ._sync.client.migration import MigrationClient as MigrationClient # noqa:
47
47
  from ._sync.client.ml import MlClient as MlClient # noqa: F401
48
48
  from ._sync.client.monitoring import MonitoringClient as MonitoringClient # noqa: F401
49
49
  from ._sync.client.nodes import NodesClient as NodesClient # noqa: F401
50
+ from ._sync.client.project import ProjectClient as ProjectClient # noqa: F401
50
51
  from ._sync.client.query_rules import QueryRulesClient as QueryRulesClient # noqa: F401
51
52
  from ._sync.client.rollup import RollupClient as RollupClient # noqa: F401
52
53
  from ._sync.client.search_application import ( # noqa: F401
@@ -106,6 +107,7 @@ __all__ = [
106
107
  "MlClient",
107
108
  "MonitoringClient",
108
109
  "NodesClient",
110
+ "ProjectClient",
109
111
  "RollupClient",
110
112
  "SearchApplicationClient",
111
113
  "SearchableSnapshotsClient",
elasticsearch/compat.py CHANGED
@@ -15,14 +15,13 @@
15
15
  # specific language governing permissions and limitations
16
16
  # under the License.
17
17
 
18
- import asyncio
19
18
  import inspect
20
19
  import os
21
20
  import sys
22
- from contextlib import asynccontextmanager, contextmanager
21
+ from contextlib import contextmanager
23
22
  from pathlib import Path
24
23
  from threading import Thread
25
- from typing import Any, AsyncIterator, Callable, Coroutine, Iterator, Tuple, Type, Union
24
+ from typing import Any, Callable, Iterator, Tuple, Type, Union
26
25
 
27
26
  string_types: Tuple[Type[str], Type[bytes]] = (str, bytes)
28
27
 
@@ -105,22 +104,10 @@ def safe_thread(
105
104
  raise captured_exception
106
105
 
107
106
 
108
- @asynccontextmanager
109
- async def safe_task(coro: Coroutine[Any, Any, Any]) -> AsyncIterator[asyncio.Task[Any]]:
110
- """Run a background task within a context manager block.
111
-
112
- The task is awaited when the block ends.
113
- """
114
- task = asyncio.create_task(coro)
115
- yield task
116
- await task
117
-
118
-
119
107
  __all__ = [
120
108
  "string_types",
121
109
  "to_str",
122
110
  "to_bytes",
123
111
  "warn_stacklevel",
124
112
  "safe_thread",
125
- "safe_task",
126
113
  ]
@@ -125,9 +125,10 @@ class AsyncDocument(DocumentBase, metaclass=AsyncIndexMeta):
125
125
  Create an :class:`~elasticsearch.dsl.Search` instance that will search
126
126
  over this ``Document``.
127
127
  """
128
- return AsyncSearch(
128
+ s = AsyncSearch[Self](
129
129
  using=cls._get_using(using), index=cls._default_index(index), doc_type=[cls]
130
130
  )
131
+ return s.source(exclude_vectors=False)
131
132
 
132
133
  @classmethod
133
134
  async def get(
@@ -119,9 +119,10 @@ class Document(DocumentBase, metaclass=IndexMeta):
119
119
  Create an :class:`~elasticsearch.dsl.Search` instance that will search
120
120
  over this ``Document``.
121
121
  """
122
- return Search(
122
+ s = Search[Self](
123
123
  using=cls._get_using(using), index=cls._default_index(index), doc_type=[cls]
124
124
  )
125
+ return s.source(exclude_vectors=False)
125
126
 
126
127
  @classmethod
127
128
  def get(
@@ -34,6 +34,8 @@ from typing import (
34
34
  overload,
35
35
  )
36
36
 
37
+ from typing_extensions import _AnnotatedAlias
38
+
37
39
  try:
38
40
  import annotationlib
39
41
  except ImportError:
@@ -358,6 +360,10 @@ class DocumentOptions:
358
360
  # the field has a type annotation, so next we try to figure out
359
361
  # what field type we can use
360
362
  type_ = annotations[name]
363
+ type_metadata = []
364
+ if isinstance(type_, _AnnotatedAlias):
365
+ type_metadata = type_.__metadata__
366
+ type_ = type_.__origin__
361
367
  skip = False
362
368
  required = True
363
369
  multi = False
@@ -404,6 +410,12 @@ class DocumentOptions:
404
410
  # use best field type for the type hint provided
405
411
  field, field_kwargs = self.type_annotation_map[type_] # type: ignore[assignment]
406
412
 
413
+ # if this field does not have a right-hand value, we look in the metadata
414
+ # of the annotation to see if we find it there
415
+ for md in type_metadata:
416
+ if isinstance(md, (_FieldMetadataDict, Field)):
417
+ attrs[name] = md
418
+
407
419
  if field:
408
420
  field_kwargs = {
409
421
  "multi": multi,
@@ -416,17 +428,20 @@ class DocumentOptions:
416
428
  # this field has a right-side value, which can be field
417
429
  # instance on its own or wrapped with mapped_field()
418
430
  attr_value = attrs[name]
419
- if isinstance(attr_value, dict):
431
+ if isinstance(attr_value, _FieldMetadataDict):
420
432
  # the mapped_field() wrapper function was used so we need
421
433
  # to look for the field instance and also record any
422
434
  # dataclass-style defaults
435
+ if attr_value.get("exclude"):
436
+ # skip this field
437
+ continue
423
438
  attr_value = attrs[name].get("_field")
424
439
  default_value = attrs[name].get("default") or attrs[name].get(
425
440
  "default_factory"
426
441
  )
427
442
  if default_value:
428
443
  field_defaults[name] = default_value
429
- if attr_value:
444
+ if isinstance(attr_value, Field):
430
445
  value = attr_value
431
446
  if required is not None:
432
447
  value._required = required
@@ -505,12 +520,19 @@ class Mapped(Generic[_FieldType]):
505
520
  M = Mapped
506
521
 
507
522
 
523
+ class _FieldMetadataDict(dict[str, Any]):
524
+ """This class is used to identify metadata returned by the `mapped_field()` function."""
525
+
526
+ pass
527
+
528
+
508
529
  def mapped_field(
509
530
  field: Optional[Field] = None,
510
531
  *,
511
532
  init: bool = True,
512
533
  default: Any = None,
513
534
  default_factory: Optional[Callable[[], Any]] = None,
535
+ exclude: bool = False,
514
536
  **kwargs: Any,
515
537
  ) -> Any:
516
538
  """Construct a field using dataclass behaviors
@@ -520,22 +542,25 @@ def mapped_field(
520
542
  options.
521
543
 
522
544
  :param field: The instance of ``Field`` to use for this field. If not provided,
523
- an instance that is appropriate for the type given to the field is used.
545
+ an instance that is appropriate for the type given to the field is used.
524
546
  :param init: a value of ``True`` adds this field to the constructor, and a
525
- value of ``False`` omits it from it. The default is ``True``.
547
+ value of ``False`` omits it from it. The default is ``True``.
526
548
  :param default: a default value to use for this field when one is not provided
527
- explicitly.
549
+ explicitly.
528
550
  :param default_factory: a callable that returns a default value for the field,
529
- when one isn't provided explicitly. Only one of ``factory`` and
530
- ``default_factory`` can be used.
551
+ when one isn't provided explicitly. Only one of ``factory`` and
552
+ ``default_factory`` can be used.
553
+ :param exclude: Set to ``True`` to exclude this field from the Elasticsearch
554
+ index.
531
555
  """
532
- return {
533
- "_field": field,
534
- "init": init,
535
- "default": default,
536
- "default_factory": default_factory,
556
+ return _FieldMetadataDict(
557
+ _field=field,
558
+ init=init,
559
+ default=default,
560
+ default_factory=default_factory,
561
+ exclude=exclude,
537
562
  **kwargs,
538
- }
563
+ )
539
564
 
540
565
 
541
566
  @dataclass_transform(field_specifiers=(mapped_field,))
@@ -3866,6 +3866,9 @@ class SemanticText(Field):
3866
3866
  by using the Update mapping API. Use the Create inference API to
3867
3867
  create the endpoint. If not specified, the inference endpoint
3868
3868
  defined by inference_id will be used at both index and query time.
3869
+ :arg index_options: Settings for index_options that override any
3870
+ defaults used by semantic_text, for example specific quantization
3871
+ settings.
3869
3872
  :arg chunking_settings: Settings for chunking text into smaller
3870
3873
  passages. If specified, these will override the chunking settings
3871
3874
  sent in the inference endpoint associated with inference_id. If
@@ -3885,6 +3888,9 @@ class SemanticText(Field):
3885
3888
  meta: Union[Mapping[str, str], "DefaultType"] = DEFAULT,
3886
3889
  inference_id: Union[str, "DefaultType"] = DEFAULT,
3887
3890
  search_inference_id: Union[str, "DefaultType"] = DEFAULT,
3891
+ index_options: Union[
3892
+ "types.SemanticTextIndexOptions", Dict[str, Any], "DefaultType"
3893
+ ] = DEFAULT,
3888
3894
  chunking_settings: Union[
3889
3895
  "types.ChunkingSettings", Dict[str, Any], "DefaultType"
3890
3896
  ] = DEFAULT,
@@ -3897,6 +3903,8 @@ class SemanticText(Field):
3897
3903
  kwargs["inference_id"] = inference_id
3898
3904
  if search_inference_id is not DEFAULT:
3899
3905
  kwargs["search_inference_id"] = search_inference_id
3906
+ if index_options is not DEFAULT:
3907
+ kwargs["index_options"] = index_options
3900
3908
  if chunking_settings is not DEFAULT:
3901
3909
  kwargs["chunking_settings"] = chunking_settings
3902
3910
  if fields is not DEFAULT: