unstructured-ingest 0.0.21__py3-none-any.whl → 0.0.22__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (41) hide show
  1. unstructured_ingest/__version__.py +1 -1
  2. unstructured_ingest/embed/bedrock.py +56 -19
  3. unstructured_ingest/embed/huggingface.py +22 -22
  4. unstructured_ingest/embed/interfaces.py +11 -4
  5. unstructured_ingest/embed/mixedbreadai.py +17 -17
  6. unstructured_ingest/embed/octoai.py +7 -7
  7. unstructured_ingest/embed/openai.py +15 -20
  8. unstructured_ingest/embed/vertexai.py +25 -17
  9. unstructured_ingest/embed/voyageai.py +22 -17
  10. unstructured_ingest/v2/cli/base/cmd.py +1 -1
  11. unstructured_ingest/v2/interfaces/connector.py +1 -1
  12. unstructured_ingest/v2/pipeline/pipeline.py +3 -1
  13. unstructured_ingest/v2/pipeline/steps/chunk.py +1 -1
  14. unstructured_ingest/v2/pipeline/steps/download.py +6 -2
  15. unstructured_ingest/v2/pipeline/steps/embed.py +1 -1
  16. unstructured_ingest/v2/pipeline/steps/filter.py +1 -1
  17. unstructured_ingest/v2/pipeline/steps/index.py +4 -2
  18. unstructured_ingest/v2/pipeline/steps/partition.py +1 -1
  19. unstructured_ingest/v2/pipeline/steps/stage.py +3 -1
  20. unstructured_ingest/v2/pipeline/steps/uncompress.py +1 -1
  21. unstructured_ingest/v2/pipeline/steps/upload.py +6 -2
  22. unstructured_ingest/v2/processes/connectors/airtable.py +1 -1
  23. unstructured_ingest/v2/processes/connectors/databricks_volumes.py +1 -1
  24. unstructured_ingest/v2/processes/connectors/elasticsearch.py +2 -2
  25. unstructured_ingest/v2/processes/connectors/fsspec/azure.py +31 -5
  26. unstructured_ingest/v2/processes/connectors/fsspec/box.py +31 -2
  27. unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +36 -8
  28. unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +25 -77
  29. unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +30 -1
  30. unstructured_ingest/v2/processes/connectors/fsspec/s3.py +15 -18
  31. unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +22 -1
  32. unstructured_ingest/v2/processes/connectors/milvus.py +2 -2
  33. unstructured_ingest/v2/processes/connectors/opensearch.py +2 -2
  34. unstructured_ingest/v2/utils.py +1 -1
  35. unstructured_ingest-0.0.22.dist-info/METADATA +186 -0
  36. {unstructured_ingest-0.0.21.dist-info → unstructured_ingest-0.0.22.dist-info}/RECORD +40 -40
  37. {unstructured_ingest-0.0.21.dist-info → unstructured_ingest-0.0.22.dist-info}/WHEEL +1 -1
  38. unstructured_ingest-0.0.21.dist-info/METADATA +0 -639
  39. {unstructured_ingest-0.0.21.dist-info → unstructured_ingest-0.0.22.dist-info}/LICENSE.md +0 -0
  40. {unstructured_ingest-0.0.21.dist-info → unstructured_ingest-0.0.22.dist-info}/entry_points.txt +0 -0
  41. {unstructured_ingest-0.0.21.dist-info → unstructured_ingest-0.0.22.dist-info}/top_level.txt +0 -0
@@ -48,8 +48,8 @@ class MilvusConnectionConfig(ConnectionConfig):
48
48
 
49
49
  def get_connection_kwargs(self) -> dict[str, Any]:
50
50
  access_config = self.access_config.get_secret_value()
51
- access_config_dict = access_config.dict()
52
- connection_config_dict = self.dict()
51
+ access_config_dict = access_config.model_dump()
52
+ connection_config_dict = self.model_dump()
53
53
  connection_config_dict.pop("access_config", None)
54
54
  connection_config_dict.update(access_config_dict)
55
55
  # Drop any that were not set explicitly
@@ -101,8 +101,8 @@ class OpenSearchConnectionConfig(ConnectionConfig):
101
101
  if self.username and access_config.password:
102
102
  client_input_kwargs["http_auth"] = (self.username, access_config.password)
103
103
  client_input = OpenSearchClientInput(**client_input_kwargs)
104
- logger.debug(f"opensearch client inputs mapped to: {client_input.dict()}")
105
- client_kwargs = client_input.dict()
104
+ logger.debug(f"opensearch client inputs mapped to: {client_input.model_dump()}")
105
+ client_kwargs = client_input.model_dump()
106
106
  if client_input.http_auth is not None:
107
107
  client_kwargs["http_auth"] = client_input.http_auth.get_secret_value()
108
108
  client_kwargs = {k: v for k, v in client_kwargs.items() if v is not None}
@@ -19,7 +19,7 @@ def is_secret(value: Any) -> bool:
19
19
 
20
20
  def serialize_base_model(model: BaseModel) -> dict:
21
21
  # To get the full serialized dict regardless of if values are marked as Secret
22
- model_dict = model.dict()
22
+ model_dict = model.model_dump()
23
23
  return serialize_base_dict(model_dict=model_dict)
24
24
 
25
25
 
@@ -0,0 +1,186 @@
1
+ Metadata-Version: 2.1
2
+ Name: unstructured-ingest
3
+ Version: 0.0.22
4
+ Summary: A library that prepares raw documents for downstream ML tasks.
5
+ Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
+ Author: Unstructured Technologies
7
+ Author-email: devops@unstructuredai.io
8
+ License: Apache-2.0
9
+ Keywords: NLP PDF HTML CV XML parsing preprocessing
10
+ Classifier: Development Status :: 4 - Beta
11
+ Classifier: Intended Audience :: Developers
12
+ Classifier: Intended Audience :: Education
13
+ Classifier: Intended Audience :: Science/Research
14
+ Classifier: License :: OSI Approved :: Apache Software License
15
+ Classifier: Operating System :: OS Independent
16
+ Classifier: Programming Language :: Python :: 3
17
+ Classifier: Programming Language :: Python :: 3.9
18
+ Classifier: Programming Language :: Python :: 3.10
19
+ Classifier: Programming Language :: Python :: 3.11
20
+ Classifier: Programming Language :: Python :: 3.12
21
+ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
+ Requires-Python: >=3.9.0,<3.13
23
+ Description-Content-Type: text/markdown
24
+ License-File: LICENSE.md
25
+ Requires-Dist: pandas
26
+ Requires-Dist: dataclasses-json
27
+ Requires-Dist: opentelemetry-sdk
28
+ Requires-Dist: python-dateutil
29
+ Requires-Dist: click
30
+ Requires-Dist: tqdm
31
+ Requires-Dist: pydantic>=2.7
32
+ Provides-Extra: airtable
33
+ Requires-Dist: pyairtable; extra == "airtable"
34
+ Provides-Extra: astradb
35
+ Requires-Dist: astrapy; extra == "astradb"
36
+ Provides-Extra: azure
37
+ Requires-Dist: adlfs; extra == "azure"
38
+ Requires-Dist: fsspec; extra == "azure"
39
+ Provides-Extra: azure-cognitive-search
40
+ Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
41
+ Provides-Extra: bedrock
42
+ Requires-Dist: boto3; extra == "bedrock"
43
+ Provides-Extra: biomed
44
+ Requires-Dist: bs4; extra == "biomed"
45
+ Requires-Dist: requests; extra == "biomed"
46
+ Provides-Extra: box
47
+ Requires-Dist: boxfs; extra == "box"
48
+ Requires-Dist: fsspec; extra == "box"
49
+ Provides-Extra: chroma
50
+ Requires-Dist: chromadb; extra == "chroma"
51
+ Provides-Extra: clarifai
52
+ Requires-Dist: clarifai; extra == "clarifai"
53
+ Provides-Extra: confluence
54
+ Requires-Dist: atlassian-python-api; extra == "confluence"
55
+ Requires-Dist: requests; extra == "confluence"
56
+ Provides-Extra: couchbase
57
+ Requires-Dist: couchbase; extra == "couchbase"
58
+ Provides-Extra: csv
59
+ Requires-Dist: unstructured[tsv]; extra == "csv"
60
+ Provides-Extra: databricks-volumes
61
+ Requires-Dist: databricks-sdk; extra == "databricks-volumes"
62
+ Provides-Extra: delta-table
63
+ Requires-Dist: deltalake; extra == "delta-table"
64
+ Requires-Dist: fsspec; extra == "delta-table"
65
+ Provides-Extra: discord
66
+ Requires-Dist: discord-py; extra == "discord"
67
+ Provides-Extra: doc
68
+ Requires-Dist: unstructured[docx]; extra == "doc"
69
+ Provides-Extra: docx
70
+ Requires-Dist: unstructured[docx]; extra == "docx"
71
+ Provides-Extra: dropbox
72
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
73
+ Requires-Dist: fsspec; extra == "dropbox"
74
+ Provides-Extra: elasticsearch
75
+ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
76
+ Provides-Extra: embed-huggingface
77
+ Requires-Dist: sentence-transformers; extra == "embed-huggingface"
78
+ Provides-Extra: embed-mixedbreadai
79
+ Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
80
+ Provides-Extra: embed-octoai
81
+ Requires-Dist: openai; extra == "embed-octoai"
82
+ Requires-Dist: tiktoken; extra == "embed-octoai"
83
+ Provides-Extra: embed-vertexai
84
+ Requires-Dist: vertexai; extra == "embed-vertexai"
85
+ Provides-Extra: embed-voyageai
86
+ Requires-Dist: voyageai; extra == "embed-voyageai"
87
+ Provides-Extra: epub
88
+ Requires-Dist: unstructured[epub]; extra == "epub"
89
+ Provides-Extra: gcs
90
+ Requires-Dist: bs4; extra == "gcs"
91
+ Requires-Dist: gcsfs; extra == "gcs"
92
+ Requires-Dist: fsspec; extra == "gcs"
93
+ Provides-Extra: github
94
+ Requires-Dist: pygithub>1.58.0; extra == "github"
95
+ Requires-Dist: requests; extra == "github"
96
+ Provides-Extra: gitlab
97
+ Requires-Dist: python-gitlab; extra == "gitlab"
98
+ Provides-Extra: google-drive
99
+ Requires-Dist: google-api-python-client; extra == "google-drive"
100
+ Provides-Extra: hubspot
101
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
102
+ Requires-Dist: urllib3; extra == "hubspot"
103
+ Provides-Extra: jira
104
+ Requires-Dist: atlassian-python-api; extra == "jira"
105
+ Provides-Extra: kafka
106
+ Requires-Dist: confluent-kafka; extra == "kafka"
107
+ Provides-Extra: kdbai
108
+ Requires-Dist: kdbai-client; extra == "kdbai"
109
+ Provides-Extra: md
110
+ Requires-Dist: unstructured[md]; extra == "md"
111
+ Provides-Extra: milvus
112
+ Requires-Dist: pymilvus; extra == "milvus"
113
+ Provides-Extra: mongodb
114
+ Requires-Dist: pymongo; extra == "mongodb"
115
+ Provides-Extra: msg
116
+ Requires-Dist: unstructured[msg]; extra == "msg"
117
+ Provides-Extra: notion
118
+ Requires-Dist: httpx; extra == "notion"
119
+ Requires-Dist: notion-client; extra == "notion"
120
+ Requires-Dist: htmlBuilder; extra == "notion"
121
+ Requires-Dist: backoff; extra == "notion"
122
+ Provides-Extra: odt
123
+ Requires-Dist: unstructured[odt]; extra == "odt"
124
+ Provides-Extra: onedrive
125
+ Requires-Dist: msal; extra == "onedrive"
126
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
127
+ Requires-Dist: bs4; extra == "onedrive"
128
+ Provides-Extra: openai
129
+ Requires-Dist: openai; extra == "openai"
130
+ Requires-Dist: tiktoken; extra == "openai"
131
+ Provides-Extra: opensearch
132
+ Requires-Dist: opensearch-py; extra == "opensearch"
133
+ Provides-Extra: org
134
+ Requires-Dist: unstructured[org]; extra == "org"
135
+ Provides-Extra: outlook
136
+ Requires-Dist: msal; extra == "outlook"
137
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
138
+ Provides-Extra: pdf
139
+ Requires-Dist: unstructured[pdf]; extra == "pdf"
140
+ Provides-Extra: pinecone
141
+ Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
142
+ Provides-Extra: postgres
143
+ Requires-Dist: psycopg2-binary; extra == "postgres"
144
+ Provides-Extra: ppt
145
+ Requires-Dist: unstructured[pptx]; extra == "ppt"
146
+ Provides-Extra: pptx
147
+ Requires-Dist: unstructured[pptx]; extra == "pptx"
148
+ Provides-Extra: qdrant
149
+ Requires-Dist: qdrant-client; extra == "qdrant"
150
+ Provides-Extra: reddit
151
+ Requires-Dist: praw; extra == "reddit"
152
+ Provides-Extra: remote
153
+ Requires-Dist: unstructured-client>=0.25.8; extra == "remote"
154
+ Provides-Extra: rst
155
+ Requires-Dist: unstructured[rst]; extra == "rst"
156
+ Provides-Extra: rtf
157
+ Requires-Dist: unstructured[rtf]; extra == "rtf"
158
+ Provides-Extra: s3
159
+ Requires-Dist: s3fs; extra == "s3"
160
+ Requires-Dist: fsspec; extra == "s3"
161
+ Provides-Extra: salesforce
162
+ Requires-Dist: simple-salesforce; extra == "salesforce"
163
+ Provides-Extra: sftp
164
+ Requires-Dist: fsspec; extra == "sftp"
165
+ Requires-Dist: paramiko; extra == "sftp"
166
+ Provides-Extra: sharepoint
167
+ Requires-Dist: msal; extra == "sharepoint"
168
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
169
+ Provides-Extra: singlestore
170
+ Requires-Dist: singlestoredb; extra == "singlestore"
171
+ Provides-Extra: slack
172
+ Requires-Dist: slack-sdk; extra == "slack"
173
+ Provides-Extra: tsv
174
+ Requires-Dist: unstructured[tsv]; extra == "tsv"
175
+ Provides-Extra: vectara
176
+ Requires-Dist: requests; extra == "vectara"
177
+ Provides-Extra: weaviate
178
+ Requires-Dist: weaviate-client; extra == "weaviate"
179
+ Provides-Extra: wikipedia
180
+ Requires-Dist: wikipedia; extra == "wikipedia"
181
+ Provides-Extra: xlsx
182
+ Requires-Dist: unstructured[xlsx]; extra == "xlsx"
183
+
184
+ # Unstructured Ingest
185
+
186
+ For details, see the [Unstructured Ingest overview](https://docs.unstructured.io/ingestion/overview) in the Unstructured documentation.
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=jKsHPdCiaS4Mdql3-_XwS3BGWgrosIEEQ7-K8uTyviU,43
2
+ unstructured_ingest/__version__.py,sha256=s86WG6OgfRK15ii3W6pb0AczHH8T1QB33x5r6twQpCY,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/interfaces.py,sha256=LuY-85clq5iyOtDd9vDABjK2MZCm6wRWK53cdb4SROY,31411
5
5
  unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
@@ -167,14 +167,14 @@ unstructured_ingest/connector/notion/types/database_properties/unique_id.py,sha2
167
167
  unstructured_ingest/connector/notion/types/database_properties/url.py,sha256=iXQ2tVUm9UlKVtDA0NQiFIRJ5PHYW9wOaWt2vFfSVCg,862
168
168
  unstructured_ingest/connector/notion/types/database_properties/verification.py,sha256=J_DLjY-v2T6xDGMQ7FkI0YMKMA6SG6Y3yYW7qUD1hKA,2334
169
169
  unstructured_ingest/embed/__init__.py,sha256=whnTiGsSbNqaLObr058CKG5iGxk5OkN_41IBEtHQYW8,900
170
- unstructured_ingest/embed/bedrock.py,sha256=5uq1S9-7uKaaHiniohm1HXNLhudIYN9TEcctUe2JIpM,2514
171
- unstructured_ingest/embed/huggingface.py,sha256=fHgZ865I2Efs3QT43n57gmccF9sBzI6T4yhcu_r7zwM,2727
172
- unstructured_ingest/embed/interfaces.py,sha256=O_USsEcVHRzE2dpHCJEJWKq04NLfdAnm55ZHHTQ3GO0,900
173
- unstructured_ingest/embed/mixedbreadai.py,sha256=wMdY1a4PyynguIZQ4fPFImKGk9ryqHv0NRL3e3iSPEI,5491
174
- unstructured_ingest/embed/octoai.py,sha256=ERJby6VdqcIO6NLTqLXVHmX7LNIM0Fsmhf3dn10Z4is,2347
175
- unstructured_ingest/embed/openai.py,sha256=zOh3GHg1sPVUd3YzZLS5JIV21emYyrCHGYzqH5MIAiY,2250
176
- unstructured_ingest/embed/vertexai.py,sha256=DuOQNHUzickx9kIobfIz2RjhJ712OsZhIoYJiXxaMco,3309
177
- unstructured_ingest/embed/voyageai.py,sha256=PwyW-_dXZT1AGSkeF3c2heM-pdBxciUxdtP7PluCauY,2430
170
+ unstructured_ingest/embed/bedrock.py,sha256=5-pKWwOEGHKOHa06wYuKOhvT8Xu72ke6nrpCnRtkAaU,3872
171
+ unstructured_ingest/embed/huggingface.py,sha256=ku_JQr72KBG8n5b6KRkXIbeBGzdgLw_KKIEm1dFK3oM,2729
172
+ unstructured_ingest/embed/interfaces.py,sha256=L5WimR69bmEvliIBlZ8wOCH_YDA9DWteCu6QEsKCV5I,1113
173
+ unstructured_ingest/embed/mixedbreadai.py,sha256=NSrAt1_bjphTHLUnlzzWSBU25UBCZlpYaLdWSRSGyqs,5504
174
+ unstructured_ingest/embed/octoai.py,sha256=0zxAUAMzodGkqMwqMkEvSfgWLNHtEnhdvUofvJDQD1A,2368
175
+ unstructured_ingest/embed/openai.py,sha256=4Ee4A2rQ8OlSh_yiJSFmok_qqRDi1A3KyayB5YiPLFw,2058
176
+ unstructured_ingest/embed/vertexai.py,sha256=pclpjjacvGTex74tD_3yZKhR-X5BR0fAHbgZUE62uh0,3608
177
+ unstructured_ingest/embed/voyageai.py,sha256=8l-EGVdOcR9jLoc0DV4aPOvJsvRnInI8w12C9jxiUWA,2664
178
178
  unstructured_ingest/enhanced_dataclass/__init__.py,sha256=gDZOUsv5eo-8jm4Yu7DdDwi101aGbfG7JctTdOYnTOM,151
179
179
  unstructured_ingest/enhanced_dataclass/core.py,sha256=d6aUkDynuKX87cHx9_N5UDUWrvISR4jYRFRTvd_avlI,3038
180
180
  unstructured_ingest/enhanced_dataclass/dataclasses.py,sha256=aZMsoCzAGRb8Rmh3BTSBFtNr6FmFTY93KYGLk3gYJKQ,1949
@@ -266,12 +266,12 @@ unstructured_ingest/v2/logger.py,sha256=wcln4s5Nyp2fjjJux9iM3d6t9aQFNJ2H1IAZXmIk
266
266
  unstructured_ingest/v2/main.py,sha256=WFdLEqEXRy6E9_G-dF20MK2AtgX51Aan1sp_N67U2B8,172
267
267
  unstructured_ingest/v2/otel.py,sha256=2fGj1c7cVcC3J8NwL6MNYhyPEAXiB33DsilvRDkrdLo,4130
268
268
  unstructured_ingest/v2/unstructured_api.py,sha256=1EQVuL-TojmFxWoWFzXr1oCFPEC3IkCQqhjXM8spdTY,3373
269
- unstructured_ingest/v2/utils.py,sha256=9LnhpI8Otpq5HPcN2Dtkp7APD_euq1ylKhIsybuK99Y,1714
269
+ unstructured_ingest/v2/utils.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3rJn1PHTI_G_A_EHY,1720
270
270
  unstructured_ingest/v2/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
271
271
  unstructured_ingest/v2/cli/cli.py,sha256=qHXIs-PcvMgDZhP1AR9iDMxh8FXBMJCEDksPBfiMULE,648
272
272
  unstructured_ingest/v2/cli/cmds.py,sha256=wWUTbvvxEqKAy6bNE6XhPnj0ELMeSbb9_r1NZl58xMM,489
273
273
  unstructured_ingest/v2/cli/base/__init__.py,sha256=zXCa7F4FMqItmzxfUIVmyI-CeGh8X85yF8lRxwX_OYQ,83
274
- unstructured_ingest/v2/cli/base/cmd.py,sha256=a2NE9ZjUfuLIevz0aEs25UsLGCOroJwI-bPc6vBrMCw,11484
274
+ unstructured_ingest/v2/cli/base/cmd.py,sha256=fO1gXvMFgRMoXgVF4Nwk8J-MYU-U59ubchZU_Gx1mK4,11490
275
275
  unstructured_ingest/v2/cli/base/dest.py,sha256=zDjqek7anr0JQ2ptEl8KIAsUXuCuHRnBQnJhoPj4NVM,3198
276
276
  unstructured_ingest/v2/cli/base/importer.py,sha256=nRt0QQ3qpi264-n_mR0l55C2ddM8nowTNzT1jsWaam8,1128
277
277
  unstructured_ingest/v2/cli/base/src.py,sha256=cpQ43qQju4e5s_YSaPxUtA70BaisRkTBdjtlPhqn5Mg,2872
@@ -279,7 +279,7 @@ unstructured_ingest/v2/cli/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRk
279
279
  unstructured_ingest/v2/cli/utils/click.py,sha256=Wn2s3PuvBCKB0lsK-W7X_Y0eYyWnS6Y9wWo1OhVBOzY,6344
280
280
  unstructured_ingest/v2/cli/utils/model_conversion.py,sha256=73DKHQQ6Tm0Lz5NCRduDlyfOhY2KH-MZN1n6jUgrsuU,7480
281
281
  unstructured_ingest/v2/interfaces/__init__.py,sha256=Rfa8crx6De7WNOK-EjsWWwFVpsUfCc6gY8B8tQ3ae9I,899
282
- unstructured_ingest/v2/interfaces/connector.py,sha256=Lm7wJTlKUfVKJjk-BchS0RtZ9_Lo9tzZ62rPtF3HOGY,759
282
+ unstructured_ingest/v2/interfaces/connector.py,sha256=KG0pHdAcpuO5h72xrAkJzADmjxbav31TZ2Wo3PBvwT0,765
283
283
  unstructured_ingest/v2/interfaces/downloader.py,sha256=PKT1kr79Mz1urW_8xCyq9sBuK93gDvyTXg5e4ma4htU,2871
284
284
  unstructured_ingest/v2/interfaces/file_data.py,sha256=ieJK-hqHCEOmoYNGoFbCHziSaZyMtRS9VpSoYbwoKCE,1944
285
285
  unstructured_ingest/v2/interfaces/indexer.py,sha256=Bd1S-gTLsxhJBLEh1lYm_gXqwQLaEZMoqPq9yGxtN_E,713
@@ -290,17 +290,17 @@ unstructured_ingest/v2/interfaces/uploader.py,sha256=JmZDl1blJa5rS61YHCae3Hfet84
290
290
  unstructured_ingest/v2/pipeline/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
291
291
  unstructured_ingest/v2/pipeline/interfaces.py,sha256=-Y6gPnl-SbNxIx5-dQCmiYSPKUMjivrRlBLIKIUWVeM,8658
292
292
  unstructured_ingest/v2/pipeline/otel.py,sha256=K3pQvWVgWzyOWMKCBUofsH7wTZPJ0Ysw5sLjMBLW41I,1088
293
- unstructured_ingest/v2/pipeline/pipeline.py,sha256=GrcQNotpGl1EtKbpauNh2iHZVNm9vigjEOu7svlUOvM,15660
293
+ unstructured_ingest/v2/pipeline/pipeline.py,sha256=x6hanD7Cj7Wd5MBUvb33UwXQMZxubzwlAiYyBCMukuc,15693
294
294
  unstructured_ingest/v2/pipeline/steps/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
295
- unstructured_ingest/v2/pipeline/steps/chunk.py,sha256=gTIxhkK_n6MC3JbLsqnDsrExmYSl1wSnA_CJsOnVZ3w,3124
296
- unstructured_ingest/v2/pipeline/steps/download.py,sha256=Ld2dp1Znt-BqCcSOkBzBtZV-cGI8Kd-w0wN9Ez9h3Y8,8103
297
- unstructured_ingest/v2/pipeline/steps/embed.py,sha256=zsOZ-FZzJWOqdKKRnvGJ6c8h18d3Wkscx8wEdkGxcmw,3102
298
- unstructured_ingest/v2/pipeline/steps/filter.py,sha256=VAob-9p3bsacv_whb3Hb3rUqA6duL1d-zcUsJg7mxJ8,1188
299
- unstructured_ingest/v2/pipeline/steps/index.py,sha256=0LrzRT-T1-dzZp_ot4ibajaavdhlXdsAwBQXvrEQS2I,2632
300
- unstructured_ingest/v2/pipeline/steps/partition.py,sha256=-jhNtIZwru5gFs3-C_fXXtdRz8NE8MX8Y2ih0iKQKdk,3182
301
- unstructured_ingest/v2/pipeline/steps/stage.py,sha256=ZvP-Rz_A5UkhZNoRUvVgciJbGXlP2WIbN5QIZ9wzP8I,2211
302
- unstructured_ingest/v2/pipeline/steps/uncompress.py,sha256=pEu7VU27Fuu53eqBddAmXihV74A6JTwTfnjKeb__edY,1745
303
- unstructured_ingest/v2/pipeline/steps/upload.py,sha256=G9z8QQe9b_WokI5qyr4UOOqaepEVgwFqMn9pWcta9gI,1917
295
+ unstructured_ingest/v2/pipeline/steps/chunk.py,sha256=rYVcHSXeQSzWszg6VmtYlNc66Gsx-22Ti0BxPyQaJak,3135
296
+ unstructured_ingest/v2/pipeline/steps/download.py,sha256=lzvOl5SoUK6OCCVVeG4CzdPIGj6eKKCGdciNo_0RMNk,8173
297
+ unstructured_ingest/v2/pipeline/steps/embed.py,sha256=-YFvmchdsonWiSXxaD7PJfuUUtMLklaQM_8kZCQxCdM,3113
298
+ unstructured_ingest/v2/pipeline/steps/filter.py,sha256=q7bNieaFMprqoF8Mx7w-ZN6jyA5peiGeTGyPtvcV-uw,1199
299
+ unstructured_ingest/v2/pipeline/steps/index.py,sha256=nfDo-wt5sooKtMHKG7sI42m1L44uw-pxErDlDB1engw,2678
300
+ unstructured_ingest/v2/pipeline/steps/partition.py,sha256=9MQViptxK3ALKco8uE4gK9PpEoGq5JjzyU14C_18blU,3193
301
+ unstructured_ingest/v2/pipeline/steps/stage.py,sha256=cphKgHScLz2rNLZRI5Olsb6dAH-MKGu3p6MYS1BEzkA,2246
302
+ unstructured_ingest/v2/pipeline/steps/uncompress.py,sha256=CFSy4tGp6BAvF0oIwWFN8v4zFzh5pRDeESjEn5iP9hE,1756
303
+ unstructured_ingest/v2/pipeline/steps/upload.py,sha256=zlgXgwReX9TBOdfTpS9hETah4SeSmzPB2g8dAGfLIvM,1987
304
304
  unstructured_ingest/v2/processes/__init__.py,sha256=FaHWSCGyc7GWVnAsNEUUj7L8hT8gCVY3_hUE2VzWtUg,462
305
305
  unstructured_ingest/v2/processes/chunker.py,sha256=76PrpCSd8k3DpfdZcl8I10u7vciKzhSV9ZByrrp302g,5476
306
306
  unstructured_ingest/v2/processes/connector_registry.py,sha256=vkEe6jpgdYtZCxMj59s5atWGgmPuxAEXRUoTt-MJ7wc,2198
@@ -309,20 +309,20 @@ unstructured_ingest/v2/processes/filter.py,sha256=kjUmMw2SDq2bme0JCAOxs6cJriIG6T
309
309
  unstructured_ingest/v2/processes/partitioner.py,sha256=bpqmZDsKKi6qtxNWdIWBfQmr1ccQUhU0axecpGAUf_4,7739
310
310
  unstructured_ingest/v2/processes/uncompress.py,sha256=Z_XfsITGdyaRwhtNUc7bMj5Y2jLuBge8KoK4nxhqKag,2425
311
311
  unstructured_ingest/v2/processes/connectors/__init__.py,sha256=6iBdoH6BW8oMK1ZvEi0IgEchuk0cNUPoNIaikpzeML8,4992
312
- unstructured_ingest/v2/processes/connectors/airtable.py,sha256=LLz3qVhbcZrHXeK1xu8lywj828wsDwYDfSsaNB2CwrA,8915
312
+ unstructured_ingest/v2/processes/connectors/airtable.py,sha256=Yi7PEv_FejZ9_y3BPY3gu5YGVfeLh-9YX-qLyQHjJsY,8921
313
313
  unstructured_ingest/v2/processes/connectors/astradb.py,sha256=ZctZRfXcOAMBGPkKgHvhTmV_-2F0YN5vqwfY9UCHIlU,5791
314
314
  unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py,sha256=S55v7TXu30rEdgythMBB_2VcuomyMPmcPtLYykbhw_E,8466
315
315
  unstructured_ingest/v2/processes/connectors/chroma.py,sha256=skrxRPHZ8y3JxNa0dt5SVitHiDQ5WVxLvY_kh2-QUrQ,8029
316
316
  unstructured_ingest/v2/processes/connectors/couchbase.py,sha256=SONLywyEfoAlLc-HPabXeGzoiwKnekMHIbRMXd4CGXs,12146
317
- unstructured_ingest/v2/processes/connectors/databricks_volumes.py,sha256=c5rVY2vrqJw3vINExMhFoANnjBCVnYil0Jm97u_WJ7g,6024
318
- unstructured_ingest/v2/processes/connectors/elasticsearch.py,sha256=H8svPr-Yk3UniHT1O9kUd2QhTfrJdzbqRNLFZIMiITQ,16750
317
+ unstructured_ingest/v2/processes/connectors/databricks_volumes.py,sha256=E_4DzeemC4mhZsVuLmSXtfy4MR1MoU6CNyvpRqsKnJU,6030
318
+ unstructured_ingest/v2/processes/connectors/elasticsearch.py,sha256=ojxMUHkLa6ZG50aTGn2YWhDHZ1n38uFRn5p8_ghAIvM,16762
319
319
  unstructured_ingest/v2/processes/connectors/google_drive.py,sha256=7xOQthcqBd9auJxB0nxZlhh1vdjXpMX_CtQZa6YfZz0,13088
320
320
  unstructured_ingest/v2/processes/connectors/kdbai.py,sha256=D71gt8fsPOXi2-Rir8mATw6dRM3BdzYGnn62qG1iaBw,5586
321
321
  unstructured_ingest/v2/processes/connectors/local.py,sha256=a3stgnIkhBbXPIQD0O-RaRM-Eb-szHj9Yy4Fz881-9c,6723
322
- unstructured_ingest/v2/processes/connectors/milvus.py,sha256=oJCsCHgbMSKZ8AphU_vO_R_4OmGv9Nm7gFdNDUmcu7E,7675
322
+ unstructured_ingest/v2/processes/connectors/milvus.py,sha256=ZUlyAQyTt0U1JoapFYHQW3IIaGYY50b3URDSLEAFjtk,7687
323
323
  unstructured_ingest/v2/processes/connectors/mongodb.py,sha256=2_R_hrEAaTU4vJTCK9oKblWTgv6BKjyUhFtC7uq3q2w,4859
324
324
  unstructured_ingest/v2/processes/connectors/onedrive.py,sha256=ZiUo-dFo1LMOvFwphSLRZiR1PcrN8GWLTHhsh4TU6n0,9207
325
- unstructured_ingest/v2/processes/connectors/opensearch.py,sha256=PNkJGLCCkwxLvxKX6vF_0jy-LC4wKu8PCXzmULEo9sk,6755
325
+ unstructured_ingest/v2/processes/connectors/opensearch.py,sha256=dfDSNrWIEk19wuHdlMJpp_SLMOteNPlkDBPlAwu1LVY,6767
326
326
  unstructured_ingest/v2/processes/connectors/pinecone.py,sha256=gCueI1Px7UkI1flNovLMRvcbPGczHI3IlYhOPYlb3WU,6748
327
327
  unstructured_ingest/v2/processes/connectors/salesforce.py,sha256=2CiO2ZZiZ1Y1-nB7wcDlDVcpW2B7ut9wCj66rkkqho0,11616
328
328
  unstructured_ingest/v2/processes/connectors/sharepoint.py,sha256=hOaV5gBcHFc6N5Rbu3MgM-5Aol1ht-QkNIN4PqjvfxE,19665
@@ -331,17 +331,17 @@ unstructured_ingest/v2/processes/connectors/sql.py,sha256=srj2ECKnkGR_iEFBdpa8sx
331
331
  unstructured_ingest/v2/processes/connectors/utils.py,sha256=8kd0g7lo9NqnpaIkjeO-Ut6erhwUNH_gS9koevpe3WE,878
332
332
  unstructured_ingest/v2/processes/connectors/weaviate.py,sha256=Ss0YyD5T6k-00eJ6dr5lSo2H0LcOjVTMmozehyTvnAo,8866
333
333
  unstructured_ingest/v2/processes/connectors/fsspec/__init__.py,sha256=TtdeImM7Ypl_n6sl7I1JqX6bGSG0t_FqvCqE3Cy24og,1846
334
- unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=dzOuy1RuozGnCCFJ6CiE3brijcv5WHBnUVVJXx75bks,6057
335
- unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=_yOII2D1zCnI-ae_G7Fx7lb5GuTiaELIHtIyfeDOKGE,4343
336
- unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=pjDsOVf-a3ERBL3PVop7fI8wIrJc4-51CHzolivLwY8,4686
337
- unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=Ri1TscAbQyIb3QZXDIC3vYJyGRgFWAOrzaQsngsCl-Q,12785
338
- unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=eKcFYwnUNr3TwEGyriV9lvXRo9AZEOw_dvVyibVD0dM,5915
339
- unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=UfI4MxUd74K0i1odJx9KZOfJtvwixL6n2DWvhLOgkfo,6302
340
- unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=NkcU4U2DQWWuM8UHkez67C3SEOZpVyRtmtNS-z-F0Fw,6056
334
+ unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=Y01BuVRql0Kvzc_cdaZE9dDGYjJzrwJu-etfUrEGcUU,7061
335
+ unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=Cjk0LUxqOCDbme0GmnD_5_b1hfStjI23cKw6BquKNrg,5488
336
+ unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=NNAxIRdOQxUncfwhu7J7SnQRM6BSStNOyQZi-4E51iY,5816
337
+ unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=usLzU2NA5D_a1juhja4jyJP_CzW4h-5rZ22bWVwvZGQ,10853
338
+ unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=-_pYHbsBG9FyRyNIaf_xyFbPiiR7pnWEEg_8mp0rIZ8,7053
339
+ unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=je1BDqFWlyMfPa4oAMMNFQLLQtCY9quuqx3xjTwF8OQ,6251
340
+ unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=dwpyqDq0qceCBWX3zM1hiUlgXB4hzX6ObOr-sh-5CJs,6926
341
341
  unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
342
- unstructured_ingest-0.0.21.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
343
- unstructured_ingest-0.0.21.dist-info/METADATA,sha256=0LbQTW5dTus7hdY_JkPxbeOitzVoAgzQy0ikdF48Sc0,28507
344
- unstructured_ingest-0.0.21.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
345
- unstructured_ingest-0.0.21.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
346
- unstructured_ingest-0.0.21.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
347
- unstructured_ingest-0.0.21.dist-info/RECORD,,
342
+ unstructured_ingest-0.0.22.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
343
+ unstructured_ingest-0.0.22.dist-info/METADATA,sha256=JteQ0j_D7rNBM7XNdb3dSgJMx26-OV8mLUVqubvhSMY,7108
344
+ unstructured_ingest-0.0.22.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
345
+ unstructured_ingest-0.0.22.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
346
+ unstructured_ingest-0.0.22.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
347
+ unstructured_ingest-0.0.22.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: bdist_wheel (0.44.0)
2
+ Generator: setuptools (75.1.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5