unstructured-ingest 1.2.19__py3-none-any.whl → 1.2.21__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of unstructured-ingest might be problematic. Click here for more details.
- unstructured_ingest/__version__.py +1 -1
- unstructured_ingest/processes/connectors/databricks/volumes.py +5 -1
- unstructured_ingest/processes/connectors/weaviate/weaviate.py +4 -1
- {unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/METADATA +2 -2
- {unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/RECORD +8 -8
- {unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/WHEEL +0 -0
- {unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/entry_points.txt +0 -0
- {unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/licenses/LICENSE.md +0 -0
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.19" # pragma: no cover
|
|
1
|
+
__version__ = "1.2.21" # pragma: no cover
|
|
@@ -1,3 +1,4 @@
|
|
|
1
|
+
import io
|
|
1
2
|
import os
|
|
2
3
|
from abc import ABC
|
|
3
4
|
from dataclasses import dataclass
|
|
@@ -220,9 +221,12 @@ class DatabricksVolumesUploader(Uploader, ABC):
|
|
|
220
221
|
output_path = self.get_output_path(file_data=file_data)
|
|
221
222
|
with open(path, "rb") as elements_file:
|
|
222
223
|
try:
|
|
224
|
+
# Read file bytes and wrap in BytesIO to create BinaryIO object
|
|
225
|
+
file_bytes = elements_file.read()
|
|
226
|
+
binary_data = io.BytesIO(file_bytes)
|
|
223
227
|
self.connection_config.get_client().files.upload(
|
|
224
228
|
file_path=output_path,
|
|
225
|
-
contents=elements_file,
|
|
229
|
+
content=binary_data, # Changed from 'contents' to 'content' in SDK 0.70.0+
|
|
226
230
|
overwrite=True,
|
|
227
231
|
)
|
|
228
232
|
except Exception as e:
|
|
@@ -220,7 +220,10 @@ class WeaviateUploader(VectorDBUploader, ABC):
|
|
|
220
220
|
|
|
221
221
|
def precheck(self) -> None:
|
|
222
222
|
try:
|
|
223
|
-
self.connection_config.get_client()
|
|
223
|
+
with self.connection_config.get_client():
|
|
224
|
+
# Connection test successful - client is available but not needed
|
|
225
|
+
pass
|
|
226
|
+
|
|
224
227
|
# only if collection name populated should we check that it exists
|
|
225
228
|
if self.upload_config.collection and not self._collection_exists():
|
|
226
229
|
raise DestinationConnectionError(
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: unstructured_ingest
|
|
3
|
-
Version: 1.2.19
|
|
3
|
+
Version: 1.2.21
|
|
4
4
|
Summary: Local ETL data pipeline to get data RAG ready
|
|
5
5
|
Author-email: Unstructured Technologies <devops@unstructuredai.io>
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -56,7 +56,7 @@ Provides-Extra: databricks-delta-tables
|
|
|
56
56
|
Requires-Dist: databricks-sql-connector; extra == 'databricks-delta-tables'
|
|
57
57
|
Requires-Dist: pandas; extra == 'databricks-delta-tables'
|
|
58
58
|
Provides-Extra: databricks-volumes
|
|
59
|
-
Requires-Dist: databricks-sdk; extra == 'databricks-volumes'
|
|
59
|
+
Requires-Dist: databricks-sdk>=0.70.0; extra == 'databricks-volumes'
|
|
60
60
|
Provides-Extra: delta-table
|
|
61
61
|
Requires-Dist: boto3; extra == 'delta-table'
|
|
62
62
|
Requires-Dist: deltalake; extra == 'delta-table'
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
|
|
2
|
-
unstructured_ingest/__version__.py,sha256=
|
|
2
|
+
unstructured_ingest/__version__.py,sha256=xjNu-CZa5urpmHhb26SfyioexKsNLKIe5ekLUG349-g,43
|
|
3
3
|
unstructured_ingest/error.py,sha256=chM7zQSTKjaKaQt_2_QkoZDUwY5XPNeACML7JqOWRLY,4036
|
|
4
4
|
unstructured_ingest/errors_v2.py,sha256=chM7zQSTKjaKaQt_2_QkoZDUwY5XPNeACML7JqOWRLY,4036
|
|
5
5
|
unstructured_ingest/logger.py,sha256=7e_7UeK6hVOd5BQ6i9NzRUAPCS_DF839Y8TjUDywraY,1428
|
|
@@ -92,7 +92,7 @@ unstructured_ingest/processes/connectors/assets/__init__.py,sha256=47DEQpj8HBSa-
|
|
|
92
92
|
unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql,sha256=8a9HTcRWA6IuswSD632b_uZSO6Dax_0rUYnflqktcek,226
|
|
93
93
|
unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json,sha256=SJlIO0kXxy866tWQ8bEzvwLwflsoUMIS-OKlxMvHIuE,504
|
|
94
94
|
unstructured_ingest/processes/connectors/databricks/__init__.py,sha256=RtKAPyNtXh6fzEsOQ08pA0-vC1uMr3KqYG6cqiBoo70,2133
|
|
95
|
-
unstructured_ingest/processes/connectors/databricks/volumes.py,sha256=
|
|
95
|
+
unstructured_ingest/processes/connectors/databricks/volumes.py,sha256=2uUdwgCcDO7-R3eV3OzwixmCfQxdQDE6WAnooGzS2KE,8699
|
|
96
96
|
unstructured_ingest/processes/connectors/databricks/volumes_aws.py,sha256=WhGTp6aRTLSdc4GChCL4mz2b-IanderW8j1IqezX6YA,2958
|
|
97
97
|
unstructured_ingest/processes/connectors/databricks/volumes_azure.py,sha256=pF2d6uAIbwJJUeOIG5xknUMCGc5d9Aztmc2776wp-a0,3740
|
|
98
98
|
unstructured_ingest/processes/connectors/databricks/volumes_gcp.py,sha256=y9AvVl6PtnIxlTlrPj_wyHBDBRJNq3uoTOuZwTryNg8,2994
|
|
@@ -214,7 +214,7 @@ unstructured_ingest/processes/connectors/weaviate/__init__.py,sha256=1Vnz8hm_Cf3
|
|
|
214
214
|
unstructured_ingest/processes/connectors/weaviate/cloud.py,sha256=QEUfnrGMaDH7IS-jkxIBynez8F0xpzzVqg0yDOx8D6k,6294
|
|
215
215
|
unstructured_ingest/processes/connectors/weaviate/embedded.py,sha256=buizqBd6PSbd9VgRrOj43GZEorBpDFkUIkE6sN9emhw,3008
|
|
216
216
|
unstructured_ingest/processes/connectors/weaviate/local.py,sha256=4fgZsL9dgnWuaSNqVlKROm-S3Ql3naLmKvigLBgUQdw,2195
|
|
217
|
-
unstructured_ingest/processes/connectors/weaviate/weaviate.py,sha256=
|
|
217
|
+
unstructured_ingest/processes/connectors/weaviate/weaviate.py,sha256=dlnf1J2lRsk7DNIl1EzFDviHced2Lqy_J879TOwi_14,13769
|
|
218
218
|
unstructured_ingest/processes/connectors/zendesk/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
219
219
|
unstructured_ingest/processes/connectors/zendesk/client.py,sha256=21NS12u3ECubqgiyTvfuFUDUQs-zWWz75xXGr_wDGIU,12028
|
|
220
220
|
unstructured_ingest/processes/connectors/zendesk/zendesk.py,sha256=4sM6tKmgtgd2VacBtYlSfkxUF6vDb3raeoh1jHuI-tQ,9364
|
|
@@ -235,8 +235,8 @@ unstructured_ingest/utils/pydantic_models.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3r
|
|
|
235
235
|
unstructured_ingest/utils/string_and_date_utils.py,sha256=oXOI6rxXq-8ncbk7EoJK0WCcTXWj75EzKl8pfQMID3U,2522
|
|
236
236
|
unstructured_ingest/utils/table.py,sha256=WZechczgVFvlodUWFcsnCGvBNh1xRm6hr0VbJTPxKAc,3669
|
|
237
237
|
unstructured_ingest/utils/tls.py,sha256=Ra8Mii1F4VqErRreg76PBI0eAqPBC009l0sSHa8FdnA,448
|
|
238
|
-
unstructured_ingest-1.2.
|
|
239
|
-
unstructured_ingest-1.2.19.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
|
240
|
-
unstructured_ingest-1.2.19.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
|
|
241
|
-
unstructured_ingest-1.2.19.dist-info/licenses/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
|
|
242
|
-
unstructured_ingest-1.2.19.dist-info/RECORD,,
|
|
238
|
+
unstructured_ingest-1.2.21.dist-info/METADATA,sha256=LcUO2yZ_gDlNRHyRxwJYz8QXPACjNYpct0uhhUjLoCE,8897
|
|
239
|
+
unstructured_ingest-1.2.21.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
|
240
|
+
unstructured_ingest-1.2.21.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
|
|
241
|
+
unstructured_ingest-1.2.21.dist-info/licenses/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
|
|
242
|
+
unstructured_ingest-1.2.21.dist-info/RECORD,,
|
|
File without changes
|
{unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
{unstructured_ingest-1.2.19.dist-info → unstructured_ingest-1.2.21.dist-info}/licenses/LICENSE.md
RENAMED
|
File without changes
|