unstructured-ingest 1.0.16__py3-none-any.whl → 1.0.17__py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

@@ -1 +1 @@
1
- __version__ = "1.0.16" # pragma: no cover
1
+ __version__ = "1.0.17" # pragma: no cover
@@ -25,8 +25,9 @@ class AzureOpenAIEmbeddingConfig(OpenAIEmbeddingConfig):
25
25
  def get_client(self) -> "AzureOpenAI":
26
26
  from openai import AzureOpenAI
27
27
 
28
+ api_key = self.api_key.get_secret_value() if self.api_key else None
28
29
  return AzureOpenAI(
29
- api_key=self.api_key.get_secret_value(),
30
+ api_key=api_key,
30
31
  api_version=self.api_version,
31
32
  azure_endpoint=self.azure_endpoint,
32
33
  )
@@ -35,8 +36,9 @@ class AzureOpenAIEmbeddingConfig(OpenAIEmbeddingConfig):
35
36
  def get_async_client(self) -> "AsyncAzureOpenAI":
36
37
  from openai import AsyncAzureOpenAI
37
38
 
39
+ api_key = self.api_key.get_secret_value() if self.api_key else None
38
40
  return AsyncAzureOpenAI(
39
- api_key=self.api_key.get_secret_value(),
41
+ api_key=api_key,
40
42
  api_version=self.api_version,
41
43
  azure_endpoint=self.azure_endpoint,
42
44
  )
@@ -1,5 +1,5 @@
1
1
  from dataclasses import dataclass
2
- from typing import TYPE_CHECKING
2
+ from typing import TYPE_CHECKING, Optional
3
3
 
4
4
  from pydantic import Field, SecretStr
5
5
 
@@ -24,7 +24,7 @@ if TYPE_CHECKING:
24
24
 
25
25
 
26
26
  class OctoAiEmbeddingConfig(EmbeddingConfig):
27
- api_key: SecretStr
27
+ api_key: Optional[SecretStr] = Field(description="API key for OctoAI", default=None)
28
28
  embedder_model_name: str = Field(
29
29
  default="thenlper/gte-large", alias="model_name", description="octoai model name"
30
30
  )
@@ -77,7 +77,8 @@ class OctoAiEmbeddingConfig(EmbeddingConfig):
77
77
  """Creates an OpenAI python client to embed elements. Uses the OpenAI SDK."""
78
78
  from openai import OpenAI
79
79
 
80
- return OpenAI(api_key=self.api_key.get_secret_value(), base_url=self.base_url)
80
+ api_key = self.api_key.get_secret_value() if self.api_key else None
81
+ return OpenAI(api_key=api_key, base_url=self.base_url)
81
82
 
82
83
  @requires_dependencies(
83
84
  ["openai", "tiktoken"],
@@ -87,7 +88,8 @@ class OctoAiEmbeddingConfig(EmbeddingConfig):
87
88
  """Creates an OpenAI python client to embed elements. Uses the OpenAI SDK."""
88
89
  from openai import AsyncOpenAI
89
90
 
90
- return AsyncOpenAI(api_key=self.api_key.get_secret_value(), base_url=self.base_url)
91
+ api_key = self.api_key.get_secret_value() if self.api_key else None
92
+ return AsyncOpenAI(api_key=api_key, base_url=self.base_url)
91
93
 
92
94
 
93
95
  @dataclass
@@ -24,7 +24,7 @@ if TYPE_CHECKING:
24
24
 
25
25
 
26
26
  class OpenAIEmbeddingConfig(EmbeddingConfig):
27
- api_key: SecretStr = Field(description="API key for OpenAI")
27
+ api_key: Optional[SecretStr] = Field(description="API key for OpenAI", default=None)
28
28
  embedder_model_name: str = Field(
29
29
  default="text-embedding-ada-002", alias="model_name", description="OpenAI model name"
30
30
  )
@@ -88,13 +88,15 @@ class OpenAIEmbeddingConfig(EmbeddingConfig):
88
88
  def get_client(self) -> "OpenAI":
89
89
  from openai import OpenAI
90
90
 
91
- return OpenAI(api_key=self.api_key.get_secret_value(), base_url=self.base_url)
91
+ api_key = self.api_key.get_secret_value() if self.api_key else None
92
+ return OpenAI(api_key=api_key, base_url=self.base_url)
92
93
 
93
94
  @requires_dependencies(["openai"], extras="openai")
94
95
  def get_async_client(self) -> "AsyncOpenAI":
95
96
  from openai import AsyncOpenAI
96
97
 
97
- return AsyncOpenAI(api_key=self.api_key.get_secret_value(), base_url=self.base_url)
98
+ api_key = self.api_key.get_secret_value() if self.api_key else None
99
+ return AsyncOpenAI(api_key=api_key, base_url=self.base_url)
98
100
 
99
101
 
100
102
  @dataclass
@@ -1,5 +1,5 @@
1
1
  from dataclasses import dataclass
2
- from typing import TYPE_CHECKING, Any
2
+ from typing import TYPE_CHECKING, Any, Optional
3
3
 
4
4
  from pydantic import Field, SecretStr
5
5
 
@@ -20,7 +20,7 @@ if TYPE_CHECKING:
20
20
 
21
21
 
22
22
  class TogetherAIEmbeddingConfig(EmbeddingConfig):
23
- api_key: SecretStr = Field(description="API key for Together AI")
23
+ api_key: Optional[SecretStr] = Field(description="API key for Together AI", default=None)
24
24
  embedder_model_name: str = Field(
25
25
  default="togethercomputer/m2-bert-80M-8k-retrieval",
26
26
  alias="model_name",
@@ -58,13 +58,15 @@ class TogetherAIEmbeddingConfig(EmbeddingConfig):
58
58
  def get_client(self) -> "Together":
59
59
  from together import Together
60
60
 
61
- return Together(api_key=self.api_key.get_secret_value())
61
+ api_key = self.api_key.get_secret_value() if self.api_key else None
62
+ return Together(api_key=api_key)
62
63
 
63
64
  @requires_dependencies(["together"], extras="togetherai")
64
65
  def get_async_client(self) -> "AsyncTogether":
65
66
  from together import AsyncTogether
66
67
 
67
- return AsyncTogether(api_key=self.api_key.get_secret_value())
68
+ api_key = self.api_key.get_secret_value() if self.api_key else None
69
+ return AsyncTogether(api_key=api_key)
68
70
 
69
71
 
70
72
  @dataclass
@@ -26,7 +26,7 @@ class VoyageAIEmbeddingConfig(EmbeddingConfig):
26
26
  le=128,
27
27
  description="Batch size for embedding requests. VoyageAI has a limit of 128.",
28
28
  )
29
- api_key: SecretStr = Field(description="API key for VoyageAI")
29
+ api_key: Optional[SecretStr] = Field(description="API key for VoyageAI", default=None)
30
30
  embedder_model_name: str = Field(
31
31
  default="voyage-3", alias="model_name", description="VoyageAI model name"
32
32
  )
@@ -65,8 +65,9 @@ class VoyageAIEmbeddingConfig(EmbeddingConfig):
65
65
  """Creates a VoyageAI python client to embed elements."""
66
66
  from voyageai import Client as VoyageAIClient
67
67
 
68
+ api_key = self.api_key.get_secret_value() if self.api_key else None
68
69
  client = VoyageAIClient(
69
- api_key=self.api_key.get_secret_value(),
70
+ api_key=api_key,
70
71
  max_retries=self.max_retries,
71
72
  timeout=self.timeout_in_seconds,
72
73
  )
@@ -80,8 +81,9 @@ class VoyageAIEmbeddingConfig(EmbeddingConfig):
80
81
  """Creates a VoyageAI python client to embed elements."""
81
82
  from voyageai import AsyncClient as AsyncVoyageAIClient
82
83
 
84
+ api_key = self.api_key.get_secret_value() if self.api_key else None
83
85
  client = AsyncVoyageAIClient(
84
- api_key=self.api_key.get_secret_value(),
86
+ api_key=api_key,
85
87
  max_retries=self.max_retries,
86
88
  timeout=self.timeout_in_seconds,
87
89
  )
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: unstructured_ingest
3
- Version: 1.0.16
3
+ Version: 1.0.17
4
4
  Summary: Local ETL data pipeline to get data RAG ready
5
5
  Author-email: Unstructured Technologies <devops@unstructuredai.io>
6
6
  License-Expression: Apache-2.0
@@ -73,7 +73,7 @@ Provides-Extra: duckdb
73
73
  Requires-Dist: duckdb; extra == 'duckdb'
74
74
  Requires-Dist: pandas; extra == 'duckdb'
75
75
  Provides-Extra: elasticsearch
76
- Requires-Dist: elasticsearch[async]; extra == 'elasticsearch'
76
+ Requires-Dist: elasticsearch[async]<9.0.0; extra == 'elasticsearch'
77
77
  Provides-Extra: epub
78
78
  Requires-Dist: unstructured[epub]; extra == 'epub'
79
79
  Provides-Extra: gcs
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=NfSrbEsbtpdSSGDsN8yPzjM7DstYUTj04Lqn9H8oysI,43
2
+ unstructured_ingest/__version__.py,sha256=HJycVzTiDHeRdW4JUDAnGRPwiviRO2FPCxl56CUWKGY,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/errors_v2.py,sha256=9RuRCi7lbDxCguDz07y5RiHoQiFIOWwOD7xqzJ2B3Yw,436
5
5
  unstructured_ingest/logger.py,sha256=7e_7UeK6hVOd5BQ6i9NzRUAPCS_DF839Y8TjUDywraY,1428
@@ -22,16 +22,16 @@ unstructured_ingest/data_types/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5
22
22
  unstructured_ingest/data_types/entities.py,sha256=ECc6EkZ5_ZUvK7uaALYOynfFmofIrHYIJZfb67hUIxA,371
23
23
  unstructured_ingest/data_types/file_data.py,sha256=J0RQa7YXhhxiLVzhPbF5Hl2nzSpxLFK9vrP6RTBWlSg,3833
24
24
  unstructured_ingest/embed/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
25
- unstructured_ingest/embed/azure_openai.py,sha256=fk9yTG-Xr1TSu4n4l8O3DQo9-oceVL9fX_8rehwXsNM,1798
25
+ unstructured_ingest/embed/azure_openai.py,sha256=nHEkvWH7mETrJB-C9qlci6bEpSEPiW9peG82EUDQ954,1902
26
26
  unstructured_ingest/embed/bedrock.py,sha256=dzfCsatB0i8hUp1YnXmoImoxgvUdZ4srKI6eSvn-lYM,9132
27
27
  unstructured_ingest/embed/huggingface.py,sha256=6Gx9L3xa3cv9fX4AMuLsePJQF4T_jwkKjovfqF5X1NM,2435
28
28
  unstructured_ingest/embed/interfaces.py,sha256=Y3PLhgWnMDmtpugE37hlAiBIbC8izrFFXXkrPVby-HY,5137
29
29
  unstructured_ingest/embed/mixedbreadai.py,sha256=pmpGQ0E-bfkkg4rvPvsFxL6Oc7H5f0mJGguHtfL7oLc,4592
30
- unstructured_ingest/embed/octoai.py,sha256=3_xcD0jWfcMzn8OoOgHaIo8SWjeErrZH2DQ4Q9UVwOA,4498
31
- unstructured_ingest/embed/openai.py,sha256=TMEOPVfm_OSs4tb3Ymd6q5J49R_-YKvO4TOqCHb3bwk,4647
32
- unstructured_ingest/embed/togetherai.py,sha256=EehrzTRx4sd_P6AG9JkHAGwTG-o93GMaV5ufmJaxKWs,3629
30
+ unstructured_ingest/embed/octoai.py,sha256=imuH_vLlmDd3GgAgiA0AaXB1fGjaI9lPpCCBG5HbpU8,4678
31
+ unstructured_ingest/embed/openai.py,sha256=yYqpSZcD8kUZOT36oj39hN8sCFpPKShTHVyV4dI3Bbg,4775
32
+ unstructured_ingest/embed/togetherai.py,sha256=19Le-SdMLp2U1qy5mTk_kO90b-AbOG_-a7Fslp1caJA,3767
33
33
  unstructured_ingest/embed/vertexai.py,sha256=jA3Y-AysVVaYwqkVd_OgRKF0JdHLAgZlRgfgddcZV2o,3763
34
- unstructured_ingest/embed/voyageai.py,sha256=EOrYzaoXOZ6C4fNkMlCgb8KA8rdfgVXN3USMFpnn0Bs,4698
34
+ unstructured_ingest/embed/voyageai.py,sha256=-aKSxZm6G5NcKlloA6je70HmT30WSgcnZWCGEoz9PPo,4826
35
35
  unstructured_ingest/interfaces/__init__.py,sha256=QIkWqjsq9INTa89gPuXlMlQL4s3y5TqLmPkuVuTyXcs,795
36
36
  unstructured_ingest/interfaces/connector.py,sha256=qUFFJ3qgDMenTCZMtVRjq1DIwsVak6pxNjQOH2eVkMw,1623
37
37
  unstructured_ingest/interfaces/downloader.py,sha256=xX0ZzsFRSzZb7SAeoeQph8sIbVq13DRw-3MYkdADrY0,2918
@@ -231,8 +231,8 @@ unstructured_ingest/utils/ndjson.py,sha256=nz8VUOPEgAFdhaDOpuveknvCU4x82fVwqE01q
231
231
  unstructured_ingest/utils/pydantic_models.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3rJn1PHTI_G_A_EHY,1720
232
232
  unstructured_ingest/utils/string_and_date_utils.py,sha256=oXOI6rxXq-8ncbk7EoJK0WCcTXWj75EzKl8pfQMID3U,2522
233
233
  unstructured_ingest/utils/table.py,sha256=WZechczgVFvlodUWFcsnCGvBNh1xRm6hr0VbJTPxKAc,3669
234
- unstructured_ingest-1.0.16.dist-info/METADATA,sha256=VKRwEluZjChUvNhdtBQrtuFdgfTzVusL_BGbr-fUprM,8688
235
- unstructured_ingest-1.0.16.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
236
- unstructured_ingest-1.0.16.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
237
- unstructured_ingest-1.0.16.dist-info/licenses/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
238
- unstructured_ingest-1.0.16.dist-info/RECORD,,
234
+ unstructured_ingest-1.0.17.dist-info/METADATA,sha256=XvwbN72yhaJKn5uYKyWePqbH5ZmptqS9I0RP___NbXQ,8694
235
+ unstructured_ingest-1.0.17.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
236
+ unstructured_ingest-1.0.17.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
237
+ unstructured_ingest-1.0.17.dist-info/licenses/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
238
+ unstructured_ingest-1.0.17.dist-info/RECORD,,