unstructured-ingest 1.0.48__py3-none-any.whl → 1.0.51__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

@@ -1 +1 @@
1
- __version__ = "1.0.48" # pragma: no cover
1
+ __version__ = "1.0.51" # pragma: no cover
@@ -7,7 +7,7 @@ source and destination connectors.
7
7
 
8
8
  To manually run the cli:
9
9
  ```shell
10
- PYTHONPATH=. python unstructured_ingest/v2/main.py --help
10
+ PYTHONPATH=. python unstructured_ingest/main.py --help
11
11
  ```
12
12
 
13
13
  The `main.py` file simply wraps the generated Click command created in `cli.py`.
@@ -90,6 +90,22 @@ class MongoDBConnectionConfig(ConnectionConfig):
90
90
  "server_api": ServerApi(version=SERVER_API_VERSION),
91
91
  }
92
92
  with MongoClient(**client_kwargs) as client:
93
+ # UnsupportedDigestmodError means that SCRAM-SHA-1 is disabled
94
+ # SCRAM-SHA-1 uses MD5, which is unavailable on FIPS images
95
+ try:
96
+ from hashlib import UnsupportedDigestmodError # type: ignore[attr-defined]
97
+ except ImportError:
98
+ from _hashlib import UnsupportedDigestmodError # type: ignore[attr-defined]
99
+
100
+ # Check if the authentication mechanism is supported
101
+ try:
102
+ client.admin.command("ping")
103
+ except UnsupportedDigestmodError as e:
104
+ raise ConnectionError(
105
+ "Authentication using SCRAM-SHA-1 is disabled. "
106
+ "Use SCRAM-SHA-256 instead. "
107
+ "See: https://www.mongodb.com/docs/manual/core/security-scram/"
108
+ ) from e
93
109
  yield client
94
110
 
95
111
 
@@ -117,7 +133,7 @@ class MongoDBIndexer(Indexer):
117
133
  database_names = client.list_database_names()
118
134
  database_name = self.index_config.database
119
135
  if database_name not in database_names:
120
- raise DestinationConnectionError(
136
+ raise SourceConnectionError(
121
137
  "database {} does not exist: {}".format(
122
138
  database_name, ", ".join(database_names)
123
139
  )
@@ -303,7 +319,7 @@ class MongoDBUploader(Uploader):
303
319
  collection_names = database.list_collection_names()
304
320
  collection_name = self.upload_config.collection
305
321
  if collection_name not in collection_names:
306
- raise SourceConnectionError(
322
+ raise DestinationConnectionError(
307
323
  "collection {} does not exist: {}".format(
308
324
  collection_name, ", ".join(collection_names)
309
325
  )
@@ -150,6 +150,7 @@ class SharepointDownloader(OnedriveDownloader):
150
150
  site_drive_item = self.connection_config._get_drive_item(client_site)
151
151
  except ClientRequestException:
152
152
  logger.info("Site not found")
153
+ raise SourceConnectionError(f"Site not found: {self.connection_config.site}")
153
154
  file = site_drive_item.get_by_path(server_relative_path).get().execute_query()
154
155
 
155
156
  if not file:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: unstructured_ingest
3
- Version: 1.0.48
3
+ Version: 1.0.51
4
4
  Summary: Local ETL data pipeline to get data RAG ready
5
5
  Author-email: Unstructured Technologies <devops@unstructuredai.io>
6
6
  License-Expression: Apache-2.0
@@ -1,12 +1,12 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=oxIYGy4gQ782VEa3kKpqmMWHoZ9FUqF1PhsN2QyWE88,43
2
+ unstructured_ingest/__version__.py,sha256=jkcvVBVHKL5jaZGZh7CF4yFZfuGwbHAHHUGV-bTIVBs,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/errors_v2.py,sha256=9RuRCi7lbDxCguDz07y5RiHoQiFIOWwOD7xqzJ2B3Yw,436
5
5
  unstructured_ingest/logger.py,sha256=7e_7UeK6hVOd5BQ6i9NzRUAPCS_DF839Y8TjUDywraY,1428
6
6
  unstructured_ingest/main.py,sha256=82G_7eG4PNhc_xIqj4Y_sFbDV9VI-nwSfsfJQMzovMk,169
7
7
  unstructured_ingest/otel.py,sha256=NsUqOolA0gt69eFhZLABjVpcKoM9aus-AbxIKqWqPTc,4127
8
8
  unstructured_ingest/unstructured_api.py,sha256=4e2ZNWIihk0eje4R3ZQ0NOYNbmMZDv_O-rnJo94kaGE,5127
9
- unstructured_ingest/cli/README.md,sha256=5LfM0ys1aFyCiCjlwZsi_9Mb5Nrq3MmYt3IpmUybnCE,1507
9
+ unstructured_ingest/cli/README.md,sha256=lfsXY2jOO__OuDYcIs8N0yLhZWzrSQ_dyXbSFtEMlQ8,1504
10
10
  unstructured_ingest/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
11
11
  unstructured_ingest/cli/cli.py,sha256=ZeIE9jP8fe7260nE8v7xYgLdqX9OtkQXAXSGWIkHLcA,645
12
12
  unstructured_ingest/cli/cmds.py,sha256=EhDW5UX4V-N8Svjba4w7YWnRYl26__ADwzNXrfFBxM4,483
@@ -77,14 +77,14 @@ unstructured_ingest/processes/connectors/jira.py,sha256=DCP1pSagcjmQP0he1N726WNL
77
77
  unstructured_ingest/processes/connectors/kdbai.py,sha256=XhxYpKSAoFPBsDQWwNuLX03DCxOVr7yquj9VYM55Rtc,5174
78
78
  unstructured_ingest/processes/connectors/local.py,sha256=CesMduUiSPqdJpqIyW28icGvGAo4hfa-4fzbYajmMSo,7450
79
79
  unstructured_ingest/processes/connectors/milvus.py,sha256=L-PM5osheNyNsLGYZmiF3rRmeulp7Ejk92JCoaQ_F9Y,12075
80
- unstructured_ingest/processes/connectors/mongodb.py,sha256=OmbbmE_pSDVjrn1YfjrQMTTs6JhTOJUU5d_jULxgtaM,14545
80
+ unstructured_ingest/processes/connectors/mongodb.py,sha256=idjolwS5TXShcIz2jR_socSgh8HOzJwyOnzE1qLUPBw,15362
81
81
  unstructured_ingest/processes/connectors/neo4j.py,sha256=ztxvI9KY8RF5kYUuMGSzzN5mz7Fu_4Ai9P7dqCpJLc0,20267
82
82
  unstructured_ingest/processes/connectors/onedrive.py,sha256=nZt6hsFMlURgB5-BioFBzJySieRVU8xi99QhOCtorxQ,19343
83
83
  unstructured_ingest/processes/connectors/outlook.py,sha256=6HHubZI_zttEfYp0XNd4Y1vhjsS8uSg7aZ2LBrTjfHk,9376
84
84
  unstructured_ingest/processes/connectors/pinecone.py,sha256=jCabAqKQyBFzaGjphxLMr57y7P0Z15Jd9Jj-JM40YnU,15090
85
85
  unstructured_ingest/processes/connectors/redisdb.py,sha256=rTihbfv0Mlk1eo5Izn-JXRu5Ad5C-KD58nSqeKsaZJ8,8024
86
86
  unstructured_ingest/processes/connectors/salesforce.py,sha256=N_UoebrhzXZNWw-X7lg8_qAziXx5L_d8XHnHWKNNYR8,11767
87
- unstructured_ingest/processes/connectors/sharepoint.py,sha256=vIfLIactYXcdetccHvKlYOay6NOzGj2X0CkXbY0KuRo,6213
87
+ unstructured_ingest/processes/connectors/sharepoint.py,sha256=oGBZ8czM3XwcfhYwqnkb9A9YVAGWTmCvD5vE3Q_vfUs,6303
88
88
  unstructured_ingest/processes/connectors/slack.py,sha256=oboIfX7ayBMK0te5Nv50iyL3FQJFXJbRxZSQaCMp3kM,9318
89
89
  unstructured_ingest/processes/connectors/utils.py,sha256=TAd0hb1f291N-q7-TUe6JKSCGkhqDyo7Ij8zmliBZUc,2071
90
90
  unstructured_ingest/processes/connectors/vectara.py,sha256=xrC6jkgW8BII4UjdzUelDu122xT484cpfMTK2wl-sko,12292
@@ -231,8 +231,8 @@ unstructured_ingest/utils/ndjson.py,sha256=nz8VUOPEgAFdhaDOpuveknvCU4x82fVwqE01q
231
231
  unstructured_ingest/utils/pydantic_models.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3rJn1PHTI_G_A_EHY,1720
232
232
  unstructured_ingest/utils/string_and_date_utils.py,sha256=oXOI6rxXq-8ncbk7EoJK0WCcTXWj75EzKl8pfQMID3U,2522
233
233
  unstructured_ingest/utils/table.py,sha256=WZechczgVFvlodUWFcsnCGvBNh1xRm6hr0VbJTPxKAc,3669
234
- unstructured_ingest-1.0.48.dist-info/METADATA,sha256=mFnSAhVaigxOwDyNbTK1XCVXRwY40tsATd3zYSEQE9k,8842
235
- unstructured_ingest-1.0.48.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
236
- unstructured_ingest-1.0.48.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
237
- unstructured_ingest-1.0.48.dist-info/licenses/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
238
- unstructured_ingest-1.0.48.dist-info/RECORD,,
234
+ unstructured_ingest-1.0.51.dist-info/METADATA,sha256=-YIqizM0jt0c3B2u2Kh9kzTlQ0_FK3JDr0dkuLpbELU,8842
235
+ unstructured_ingest-1.0.51.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
236
+ unstructured_ingest-1.0.51.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
237
+ unstructured_ingest-1.0.51.dist-info/licenses/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
238
+ unstructured_ingest-1.0.51.dist-info/RECORD,,