unstructured-ingest 0.5.1__py3-none-any.whl → 0.5.3__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (25)
  1. test/integration/connectors/test_google_drive.py +141 -0
  2. test/unit/v2/embedders/test_bedrock.py +1 -1
  3. test/unit/v2/embedders/test_huggingface.py +1 -1
  4. unstructured_ingest/__version__.py +1 -1
  5. unstructured_ingest/embed/azure_openai.py +6 -0
  6. unstructured_ingest/embed/bedrock.py +29 -12
  7. unstructured_ingest/embed/huggingface.py +14 -5
  8. unstructured_ingest/embed/interfaces.py +63 -44
  9. unstructured_ingest/embed/mixedbreadai.py +28 -105
  10. unstructured_ingest/embed/octoai.py +19 -44
  11. unstructured_ingest/embed/openai.py +17 -48
  12. unstructured_ingest/embed/togetherai.py +16 -49
  13. unstructured_ingest/embed/vertexai.py +15 -39
  14. unstructured_ingest/embed/voyageai.py +16 -42
  15. unstructured_ingest/v2/errors.py +7 -0
  16. unstructured_ingest/v2/processes/connectors/google_drive.py +132 -3
  17. unstructured_ingest/v2/processes/connectors/neo4j.py +129 -43
  18. unstructured_ingest/v2/processes/connectors/sql/snowflake.py +53 -3
  19. unstructured_ingest/v2/processes/embedder.py +9 -7
  20. {unstructured_ingest-0.5.1.dist-info → unstructured_ingest-0.5.3.dist-info}/METADATA +99 -87
  21. {unstructured_ingest-0.5.1.dist-info → unstructured_ingest-0.5.3.dist-info}/RECORD +25 -25
  22. {unstructured_ingest-0.5.1.dist-info → unstructured_ingest-0.5.3.dist-info}/WHEEL +1 -1
  23. {unstructured_ingest-0.5.1.dist-info → unstructured_ingest-0.5.3.dist-info}/LICENSE.md +0 -0
  24. {unstructured_ingest-0.5.1.dist-info → unstructured_ingest-0.5.3.dist-info}/entry_points.txt +0 -0
  25. {unstructured_ingest-0.5.1.dist-info → unstructured_ingest-0.5.3.dist-info}/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
- Metadata-Version: 2.1
1
+ Metadata-Version: 2.2
2
2
  Name: unstructured-ingest
3
- Version: 0.5.1
3
+ Version: 0.5.3
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,31 +22,60 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.14
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: dataclasses-json
26
- Requires-Dist: click
27
25
  Requires-Dist: opentelemetry-sdk
26
+ Requires-Dist: click
28
27
  Requires-Dist: pydantic>=2.7
29
28
  Requires-Dist: python-dateutil
29
+ Requires-Dist: dataclasses_json
30
30
  Requires-Dist: pandas
31
31
  Requires-Dist: tqdm
32
+ Provides-Extra: remote
33
+ Requires-Dist: unstructured-client>=0.26.1; extra == "remote"
34
+ Provides-Extra: csv
35
+ Requires-Dist: unstructured[tsv]; extra == "csv"
36
+ Provides-Extra: doc
37
+ Requires-Dist: unstructured[docx]; extra == "doc"
38
+ Provides-Extra: docx
39
+ Requires-Dist: unstructured[docx]; extra == "docx"
40
+ Provides-Extra: epub
41
+ Requires-Dist: unstructured[epub]; extra == "epub"
42
+ Provides-Extra: md
43
+ Requires-Dist: unstructured[md]; extra == "md"
44
+ Provides-Extra: msg
45
+ Requires-Dist: unstructured[msg]; extra == "msg"
46
+ Provides-Extra: odt
47
+ Requires-Dist: unstructured[odt]; extra == "odt"
48
+ Provides-Extra: org
49
+ Requires-Dist: unstructured[org]; extra == "org"
50
+ Provides-Extra: pdf
51
+ Requires-Dist: unstructured[pdf]; extra == "pdf"
52
+ Provides-Extra: ppt
53
+ Requires-Dist: unstructured[pptx]; extra == "ppt"
54
+ Provides-Extra: pptx
55
+ Requires-Dist: unstructured[pptx]; extra == "pptx"
56
+ Provides-Extra: rtf
57
+ Requires-Dist: unstructured[rtf]; extra == "rtf"
58
+ Provides-Extra: rst
59
+ Requires-Dist: unstructured[rst]; extra == "rst"
60
+ Provides-Extra: tsv
61
+ Requires-Dist: unstructured[tsv]; extra == "tsv"
62
+ Provides-Extra: xlsx
63
+ Requires-Dist: unstructured[xlsx]; extra == "xlsx"
32
64
  Provides-Extra: airtable
33
65
  Requires-Dist: pyairtable; extra == "airtable"
34
66
  Provides-Extra: astradb
35
67
  Requires-Dist: astrapy; extra == "astradb"
36
68
  Provides-Extra: azure
37
- Requires-Dist: adlfs; extra == "azure"
38
69
  Requires-Dist: fsspec; extra == "azure"
70
+ Requires-Dist: adlfs; extra == "azure"
39
71
  Provides-Extra: azure-ai-search
40
72
  Requires-Dist: azure-search-documents; extra == "azure-ai-search"
41
- Provides-Extra: bedrock
42
- Requires-Dist: aioboto3; extra == "bedrock"
43
- Requires-Dist: boto3; extra == "bedrock"
44
73
  Provides-Extra: biomed
45
- Requires-Dist: requests; extra == "biomed"
46
74
  Requires-Dist: bs4; extra == "biomed"
75
+ Requires-Dist: requests; extra == "biomed"
47
76
  Provides-Extra: box
48
- Requires-Dist: boxfs; extra == "box"
49
77
  Requires-Dist: fsspec; extra == "box"
78
+ Requires-Dist: boxfs; extra == "box"
50
79
  Provides-Extra: chroma
51
80
  Requires-Dist: chromadb; extra == "chroma"
52
81
  Provides-Extra: clarifai
@@ -56,48 +85,25 @@ Requires-Dist: atlassian-python-api; extra == "confluence"
56
85
  Requires-Dist: requests; extra == "confluence"
57
86
  Provides-Extra: couchbase
58
87
  Requires-Dist: couchbase; extra == "couchbase"
59
- Provides-Extra: csv
60
- Requires-Dist: unstructured[tsv]; extra == "csv"
61
- Provides-Extra: databricks-delta-tables
62
- Requires-Dist: databricks-sql-connector; extra == "databricks-delta-tables"
63
- Provides-Extra: databricks-volumes
64
- Requires-Dist: databricks-sdk; extra == "databricks-volumes"
65
88
  Provides-Extra: delta-table
66
- Requires-Dist: boto3; extra == "delta-table"
67
89
  Requires-Dist: deltalake; extra == "delta-table"
90
+ Requires-Dist: boto3; extra == "delta-table"
68
91
  Provides-Extra: discord
69
92
  Requires-Dist: discord.py; extra == "discord"
70
- Provides-Extra: doc
71
- Requires-Dist: unstructured[docx]; extra == "doc"
72
- Provides-Extra: docx
73
- Requires-Dist: unstructured[docx]; extra == "docx"
74
93
  Provides-Extra: dropbox
75
- Requires-Dist: dropboxdrivefs; extra == "dropbox"
76
94
  Requires-Dist: fsspec; extra == "dropbox"
95
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
77
96
  Provides-Extra: duckdb
78
97
  Requires-Dist: duckdb; extra == "duckdb"
79
98
  Provides-Extra: elasticsearch
80
99
  Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
81
- Provides-Extra: embed-huggingface
82
- Requires-Dist: sentence-transformers; extra == "embed-huggingface"
83
- Provides-Extra: embed-mixedbreadai
84
- Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
85
- Provides-Extra: embed-octoai
86
- Requires-Dist: openai; extra == "embed-octoai"
87
- Requires-Dist: tiktoken; extra == "embed-octoai"
88
- Provides-Extra: embed-vertexai
89
- Requires-Dist: vertexai; extra == "embed-vertexai"
90
- Provides-Extra: embed-voyageai
91
- Requires-Dist: voyageai; extra == "embed-voyageai"
92
- Provides-Extra: epub
93
- Requires-Dist: unstructured[epub]; extra == "epub"
94
100
  Provides-Extra: gcs
95
- Requires-Dist: gcsfs; extra == "gcs"
96
- Requires-Dist: bs4; extra == "gcs"
97
101
  Requires-Dist: fsspec; extra == "gcs"
102
+ Requires-Dist: bs4; extra == "gcs"
103
+ Requires-Dist: gcsfs; extra == "gcs"
98
104
  Provides-Extra: github
99
- Requires-Dist: requests; extra == "github"
100
105
  Requires-Dist: pygithub>1.58.0; extra == "github"
106
+ Requires-Dist: requests; extra == "github"
101
107
  Provides-Extra: gitlab
102
108
  Requires-Dist: python-gitlab; extra == "gitlab"
103
109
  Provides-Extra: google-drive
@@ -113,97 +119,103 @@ Provides-Extra: kdbai
113
119
  Requires-Dist: kdbai-client>=1.4.0; extra == "kdbai"
114
120
  Provides-Extra: lancedb
115
121
  Requires-Dist: lancedb; extra == "lancedb"
116
- Provides-Extra: md
117
- Requires-Dist: unstructured[md]; extra == "md"
118
122
  Provides-Extra: milvus
119
123
  Requires-Dist: pymilvus; extra == "milvus"
120
124
  Provides-Extra: mongodb
121
125
  Requires-Dist: pymongo; extra == "mongodb"
122
- Provides-Extra: msg
123
- Requires-Dist: unstructured[msg]; extra == "msg"
124
126
  Provides-Extra: neo4j
125
- Requires-Dist: neo4j; extra == "neo4j"
127
+ Requires-Dist: neo4j-rust-ext; extra == "neo4j"
126
128
  Requires-Dist: cymple; extra == "neo4j"
127
129
  Requires-Dist: networkx; extra == "neo4j"
128
130
  Provides-Extra: notion
129
- Requires-Dist: backoff; extra == "notion"
130
131
  Requires-Dist: htmlBuilder; extra == "notion"
131
132
  Requires-Dist: httpx; extra == "notion"
133
+ Requires-Dist: backoff; extra == "notion"
132
134
  Requires-Dist: notion-client; extra == "notion"
133
- Provides-Extra: odt
134
- Requires-Dist: unstructured[odt]; extra == "odt"
135
135
  Provides-Extra: onedrive
136
+ Requires-Dist: bs4; extra == "onedrive"
136
137
  Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
137
138
  Requires-Dist: msal; extra == "onedrive"
138
- Requires-Dist: bs4; extra == "onedrive"
139
- Provides-Extra: openai
140
- Requires-Dist: openai; extra == "openai"
141
- Requires-Dist: tiktoken; extra == "openai"
142
139
  Provides-Extra: opensearch
143
140
  Requires-Dist: opensearch-py; extra == "opensearch"
144
- Provides-Extra: org
145
- Requires-Dist: unstructured[org]; extra == "org"
146
141
  Provides-Extra: outlook
147
142
  Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
148
143
  Requires-Dist: msal; extra == "outlook"
149
- Provides-Extra: pdf
150
- Requires-Dist: unstructured[pdf]; extra == "pdf"
151
144
  Provides-Extra: pinecone
152
145
  Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
153
146
  Provides-Extra: postgres
154
147
  Requires-Dist: psycopg2-binary; extra == "postgres"
155
- Provides-Extra: ppt
156
- Requires-Dist: unstructured[pptx]; extra == "ppt"
157
- Provides-Extra: pptx
158
- Requires-Dist: unstructured[pptx]; extra == "pptx"
159
148
  Provides-Extra: qdrant
160
149
  Requires-Dist: qdrant-client; extra == "qdrant"
161
150
  Provides-Extra: reddit
162
151
  Requires-Dist: praw; extra == "reddit"
163
152
  Provides-Extra: redis
164
153
  Requires-Dist: redis; extra == "redis"
165
- Provides-Extra: remote
166
- Requires-Dist: unstructured-client>=0.26.1; extra == "remote"
167
- Provides-Extra: rst
168
- Requires-Dist: unstructured[rst]; extra == "rst"
169
- Provides-Extra: rtf
170
- Requires-Dist: unstructured[rtf]; extra == "rtf"
171
154
  Provides-Extra: s3
172
155
  Requires-Dist: fsspec; extra == "s3"
173
156
  Requires-Dist: s3fs; extra == "s3"
157
+ Provides-Extra: sharepoint
158
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
159
+ Requires-Dist: msal; extra == "sharepoint"
174
160
  Provides-Extra: salesforce
175
161
  Requires-Dist: simple-salesforce; extra == "salesforce"
176
162
  Provides-Extra: sftp
177
- Requires-Dist: paramiko; extra == "sftp"
178
163
  Requires-Dist: fsspec; extra == "sftp"
179
- Provides-Extra: sharepoint
180
- Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
181
- Requires-Dist: msal; extra == "sharepoint"
182
- Provides-Extra: singlestore
183
- Requires-Dist: singlestoredb; extra == "singlestore"
164
+ Requires-Dist: paramiko; extra == "sftp"
184
165
  Provides-Extra: slack
185
- Requires-Dist: slack-sdk[optional]; extra == "slack"
166
+ Requires-Dist: slack_sdk[optional]; extra == "slack"
186
167
  Provides-Extra: snowflake
187
- Requires-Dist: snowflake-connector-python; extra == "snowflake"
188
168
  Requires-Dist: psycopg2-binary; extra == "snowflake"
189
- Provides-Extra: togetherai
190
- Requires-Dist: together; extra == "togetherai"
191
- Provides-Extra: tsv
192
- Requires-Dist: unstructured[tsv]; extra == "tsv"
193
- Provides-Extra: vastdb
194
- Requires-Dist: pyarrow; extra == "vastdb"
195
- Requires-Dist: vastdb; extra == "vastdb"
196
- Requires-Dist: ibis; extra == "vastdb"
169
+ Requires-Dist: snowflake-connector-python; extra == "snowflake"
170
+ Provides-Extra: wikipedia
171
+ Requires-Dist: wikipedia; extra == "wikipedia"
172
+ Provides-Extra: weaviate
173
+ Requires-Dist: weaviate-client; extra == "weaviate"
174
+ Provides-Extra: databricks-volumes
175
+ Requires-Dist: databricks-sdk; extra == "databricks-volumes"
176
+ Provides-Extra: databricks-delta-tables
177
+ Requires-Dist: databricks-sql-connector; extra == "databricks-delta-tables"
178
+ Provides-Extra: singlestore
179
+ Requires-Dist: singlestoredb; extra == "singlestore"
197
180
  Provides-Extra: vectara
181
+ Requires-Dist: aiofiles; extra == "vectara"
198
182
  Requires-Dist: httpx; extra == "vectara"
199
183
  Requires-Dist: requests; extra == "vectara"
200
- Requires-Dist: aiofiles; extra == "vectara"
201
- Provides-Extra: weaviate
202
- Requires-Dist: weaviate-client; extra == "weaviate"
203
- Provides-Extra: wikipedia
204
- Requires-Dist: wikipedia; extra == "wikipedia"
205
- Provides-Extra: xlsx
206
- Requires-Dist: unstructured[xlsx]; extra == "xlsx"
184
+ Provides-Extra: vastdb
185
+ Requires-Dist: pyarrow; extra == "vastdb"
186
+ Requires-Dist: ibis; extra == "vastdb"
187
+ Requires-Dist: vastdb; extra == "vastdb"
188
+ Provides-Extra: embed-huggingface
189
+ Requires-Dist: sentence-transformers; extra == "embed-huggingface"
190
+ Provides-Extra: embed-octoai
191
+ Requires-Dist: openai; extra == "embed-octoai"
192
+ Requires-Dist: tiktoken; extra == "embed-octoai"
193
+ Provides-Extra: embed-vertexai
194
+ Requires-Dist: vertexai; extra == "embed-vertexai"
195
+ Provides-Extra: embed-voyageai
196
+ Requires-Dist: voyageai; extra == "embed-voyageai"
197
+ Provides-Extra: embed-mixedbreadai
198
+ Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
199
+ Provides-Extra: openai
200
+ Requires-Dist: openai; extra == "openai"
201
+ Requires-Dist: tiktoken; extra == "openai"
202
+ Provides-Extra: bedrock
203
+ Requires-Dist: aioboto3; extra == "bedrock"
204
+ Requires-Dist: boto3; extra == "bedrock"
205
+ Provides-Extra: togetherai
206
+ Requires-Dist: together; extra == "togetherai"
207
+ Dynamic: author
208
+ Dynamic: author-email
209
+ Dynamic: classifier
210
+ Dynamic: description
211
+ Dynamic: description-content-type
212
+ Dynamic: home-page
213
+ Dynamic: keywords
214
+ Dynamic: license
215
+ Dynamic: provides-extra
216
+ Dynamic: requires-dist
217
+ Dynamic: requires-python
218
+ Dynamic: summary
207
219
 
208
220
  # Unstructured Ingest
209
221
 
@@ -10,7 +10,7 @@ test/integration/connectors/test_azure_ai_search.py,sha256=MxFwk84vI_HT4taQTGrNp
10
10
  test/integration/connectors/test_chroma.py,sha256=NuQv0PWPM0_LQfdPeUd6IYKqaKKXWmVaHGWjq5aBfOY,3721
11
11
  test/integration/connectors/test_confluence.py,sha256=Ju0gRQbD2g9l9iRf2HDZKi7RyPnBGtFRWcGpsqhO3F8,3588
12
12
  test/integration/connectors/test_delta_table.py,sha256=4qm2Arfc9Eb7SOZOnOlLF-vNpHy6Eqvr5Q45svfX1PY,6911
13
- test/integration/connectors/test_google_drive.py,sha256=0zJZ4UJOq4TkfU-bkc556_abV7q6zVS9ZgIvW9qcTU4,4204
13
+ test/integration/connectors/test_google_drive.py,sha256=ubjn3wvMhgpGHQs-wT_5icGgTIx2coS6hwNkAHOCEI8,10306
14
14
  test/integration/connectors/test_lancedb.py,sha256=8MBxK_CUtOt87-4B7svDDK82NFII5psceo5cNN8HJMs,9228
15
15
  test/integration/connectors/test_milvus.py,sha256=7mI6zznN0PTxDL9DLogH1k3dxx6R8DgGzlpyevsFu2w,7173
16
16
  test/integration/connectors/test_mongodb.py,sha256=0A6DvF-iTCSZzOefisd_i20j9li8uNWTF2wyLGwlhco,12446
@@ -94,8 +94,8 @@ test/unit/v2/connectors/motherduck/test_base.py,sha256=f3W7hppEZ904_I_fKax-5LVDp
94
94
  test/unit/v2/connectors/sql/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
95
95
  test/unit/v2/connectors/sql/test_sql.py,sha256=51-AKUBxw6ThO68bjenLopUUuxM88YZb2rMUV8L6YwY,2464
96
96
  test/unit/v2/embedders/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
97
- test/unit/v2/embedders/test_bedrock.py,sha256=sW-Vv-u3Yiw8rHPOfE5x_reywXlnozxO49rIMx6_xjo,1071
98
- test/unit/v2/embedders/test_huggingface.py,sha256=mkVPym7TZkRJchwHedujgFXWdL9sVMi1W90jpmZ_vxg,1543
97
+ test/unit/v2/embedders/test_bedrock.py,sha256=HMaweO_v_9Y1SE2m5QImXP73cb26vNTUfc1onTBa1-g,1074
98
+ test/unit/v2/embedders/test_huggingface.py,sha256=TOHUKC7hAadl6XTotr8UqOCq28kbQxOIkPSrMxr2PLU,1546
99
99
  test/unit/v2/embedders/test_mixedbread.py,sha256=8yT942TVVXC5EkrT_ReZie1In537BaAD6esRjntgxuU,1021
100
100
  test/unit/v2/embedders/test_octoai.py,sha256=JMfrFz25QfEh0ieB4bJneZd4XtNcdPOnNsN1Fj7gU-Q,1012
101
101
  test/unit/v2/embedders/test_openai.py,sha256=HoEW95289Ijgo3PJ-pEaDOknfdkSjPXTgkXmE6jJomY,1012
@@ -107,7 +107,7 @@ test/unit/v2/partitioners/test_partitioner.py,sha256=iIYg7IpftV3LusoO4H8tr1IHY1U
107
107
  test/unit/v2/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
108
108
  test/unit/v2/utils/data_generator.py,sha256=UoYVNjG4S4wlaA9gceQ82HIpF9_6I1UTHD1_GrQBHp0,973
109
109
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
110
- unstructured_ingest/__version__.py,sha256=LXdgOM6QWErpDu1oCqJrypfmAkBaXzRxVPcjHL8yPrI,42
110
+ unstructured_ingest/__version__.py,sha256=qWgfAaALtcimLu1dKMS-KpBB0Tnw60hH7XF06t-OzjI,42
111
111
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
112
112
  unstructured_ingest/interfaces.py,sha256=7DOnDpGvUNlCoFR7UPRGmOarqH5sFtuUOO5vf8X3oTM,31489
113
113
  unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
@@ -275,16 +275,16 @@ unstructured_ingest/connector/notion/types/database_properties/unique_id.py,sha2
275
275
  unstructured_ingest/connector/notion/types/database_properties/url.py,sha256=iXQ2tVUm9UlKVtDA0NQiFIRJ5PHYW9wOaWt2vFfSVCg,862
276
276
  unstructured_ingest/connector/notion/types/database_properties/verification.py,sha256=J_DLjY-v2T6xDGMQ7FkI0YMKMA6SG6Y3yYW7qUD1hKA,2334
277
277
  unstructured_ingest/embed/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
278
- unstructured_ingest/embed/azure_openai.py,sha256=u9reyZzY6BtsT5U_TdIfS6vH_42lvohVBwKMPQAqvkI,1528
279
- unstructured_ingest/embed/bedrock.py,sha256=50G8PBEdW3ILwyWXAWl4w-gUA9I0AR7LuFq6NLz-sWI,7284
280
- unstructured_ingest/embed/huggingface.py,sha256=Avcc16st9Cp2xGScG6TeNEEd3T8YjjnESNN4OdIlnh0,2119
281
- unstructured_ingest/embed/interfaces.py,sha256=7jsQ3rLOXy1hq__muf-EPcLnv17XzNQaD05AyGbZeNo,3739
282
- unstructured_ingest/embed/mixedbreadai.py,sha256=OhF5cMxWMq8-0mt8_-Xe3ZkjGjf2u6QYzfzgHnOEYtU,6838
283
- unstructured_ingest/embed/octoai.py,sha256=oLNlM02W1CNUYRG_j6qWyI7yE24vYGKYradNzeeP6mE,5062
284
- unstructured_ingest/embed/openai.py,sha256=H1sURGuRvXBUSXJcAVzrLObV5wSCVM29tkaXJ-9ZR30,4727
285
- unstructured_ingest/embed/togetherai.py,sha256=SUd16JEUPlR8aCrd4q_T3CHwMTRUi-1yenq_r1AWlak,4266
286
- unstructured_ingest/embed/vertexai.py,sha256=CPptS7U5W1CgvxIN8CgVz5J1Ia4FctV6BsmpN9c92A0,4890
287
- unstructured_ingest/embed/voyageai.py,sha256=lydMASUDcTuyfWBPS3uIqDJPQbjf95bEI5Kr4tytONs,5111
278
+ unstructured_ingest/embed/azure_openai.py,sha256=_-I-nwd-wdCiKkSdYBL4UKrTZ2UPWsM_0T69fcObs_I,1707
279
+ unstructured_ingest/embed/bedrock.py,sha256=tZumLLXafSr1zIFVjckapRoiiY-7u65GPuWmwsdhY0I,7726
280
+ unstructured_ingest/embed/huggingface.py,sha256=EWU1kd5Cm6ajgCw6hP5w_4pniGSgxnR0wM9vjuPQ6Yk,2334
281
+ unstructured_ingest/embed/interfaces.py,sha256=C_R_RZJafm3gq8Q0T-HJs-OlbnXpUrCKl4D7Ryv9-Ss,4894
282
+ unstructured_ingest/embed/mixedbreadai.py,sha256=-Y0J27G9CL1t3ZTIeNjTjRviErSMAzJRf2zgDgMHUmg,4499
283
+ unstructured_ingest/embed/octoai.py,sha256=hNLEskDEP-2qWExUgVz2Eyw3KTIFwdUE9elbJ5qp4Ao,3855
284
+ unstructured_ingest/embed/openai.py,sha256=Fe_17y-YpkiGcfrOxZFmgjV-Y-u8svhDVYyAjV-GeBM,3279
285
+ unstructured_ingest/embed/togetherai.py,sha256=i1qeX2fwWtUf1vdGOGnpA_bJB__VzU1NQsR8k-KhxIw,2983
286
+ unstructured_ingest/embed/vertexai.py,sha256=EcXhhm1IbCZVq4KA0sbJjyABu8jpF2ZL3JCqmuxPsjo,3688
287
+ unstructured_ingest/embed/voyageai.py,sha256=tuUZ28B_t2sVDVC6EiHdQEQycMEY2nybE3DFcpxSqh0,3992
288
288
  unstructured_ingest/enhanced_dataclass/__init__.py,sha256=gDZOUsv5eo-8jm4Yu7DdDwi101aGbfG7JctTdOYnTOM,151
289
289
  unstructured_ingest/enhanced_dataclass/core.py,sha256=d6aUkDynuKX87cHx9_N5UDUWrvISR4jYRFRTvd_avlI,3038
290
290
  unstructured_ingest/enhanced_dataclass/dataclasses.py,sha256=aZMsoCzAGRb8Rmh3BTSBFtNr6FmFTY93KYGLk3gYJKQ,1949
@@ -375,7 +375,7 @@ unstructured_ingest/utils/string_and_date_utils.py,sha256=kijtPlGAbH376vVjFSo5H_
375
375
  unstructured_ingest/utils/table.py,sha256=aWjcowDVSClNpEAdR6PY3H7khKu4T6T3QqQE6GjmQ_M,3469
376
376
  unstructured_ingest/v2/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
377
377
  unstructured_ingest/v2/constants.py,sha256=pDspTYz-nEojHBqrZNfssGEiujmVa02pIWL63PQP9sU,103
378
- unstructured_ingest/v2/errors.py,sha256=y1tGvobuhQdcR9vw5APuFigiQSfsQKrAYGDr4biGDdw,207
378
+ unstructured_ingest/v2/errors.py,sha256=9RuRCi7lbDxCguDz07y5RiHoQiFIOWwOD7xqzJ2B3Yw,436
379
379
  unstructured_ingest/v2/logger.py,sha256=wcln4s5Nyp2fjjJux9iM3d6t9aQFNJ2H1IAZXmIknjI,4323
380
380
  unstructured_ingest/v2/main.py,sha256=WFdLEqEXRy6E9_G-dF20MK2AtgX51Aan1sp_N67U2B8,172
381
381
  unstructured_ingest/v2/otel.py,sha256=2fGj1c7cVcC3J8NwL6MNYhyPEAXiB33DsilvRDkrdLo,4130
@@ -418,7 +418,7 @@ unstructured_ingest/v2/pipeline/steps/upload.py,sha256=We4OAtStuZwWKKBCOPhfeAz_v
418
418
  unstructured_ingest/v2/processes/__init__.py,sha256=FaHWSCGyc7GWVnAsNEUUj7L8hT8gCVY3_hUE2VzWtUg,462
419
419
  unstructured_ingest/v2/processes/chunker.py,sha256=31-7ojsM2coIt2rMR0KOb82IxLVJfNHbqYUOsDkhxN8,5491
420
420
  unstructured_ingest/v2/processes/connector_registry.py,sha256=vkEe6jpgdYtZCxMj59s5atWGgmPuxAEXRUoTt-MJ7wc,2198
421
- unstructured_ingest/v2/processes/embedder.py,sha256=PTBlRgNbAXkSaLg7JrZzHwAoqpHmopg8jNU1TmaXguU,7804
421
+ unstructured_ingest/v2/processes/embedder.py,sha256=64mWxKMzDtrm0_QWDUA3J8gChPDEVLP6bFnac_JPBRY,7925
422
422
  unstructured_ingest/v2/processes/filter.py,sha256=kjUmMw2SDq2bme0JCAOxs6cJriIG6Ty09KOznS-xz08,2145
423
423
  unstructured_ingest/v2/processes/partitioner.py,sha256=ZC9mt85I3o_SLR4DvE7vPBGphMET994phFkTuT-L9B8,9998
424
424
  unstructured_ingest/v2/processes/uncompress.py,sha256=Z_XfsITGdyaRwhtNUc7bMj5Y2jLuBge8KoK4nxhqKag,2425
@@ -432,12 +432,12 @@ unstructured_ingest/v2/processes/connectors/couchbase.py,sha256=i7vuNKsUkN93JRVm
432
432
  unstructured_ingest/v2/processes/connectors/delta_table.py,sha256=SotSXZQ85_6TO906YvFi3yTml8jE9A_zV6nBJ4oTx8A,7075
433
433
  unstructured_ingest/v2/processes/connectors/discord.py,sha256=-e4-cBK4TnHkknK1qIb86AIVMy81lBgC288_iLpTzM8,5246
434
434
  unstructured_ingest/v2/processes/connectors/gitlab.py,sha256=ufE65Z8q_tC4oppGg5BsGXwSaL7RbEXcaagJQYsylNo,9984
435
- unstructured_ingest/v2/processes/connectors/google_drive.py,sha256=tSbyibwm9RQyXD-HJGZa1Y9lBSCXaEFnvxpf6bHwBSE,13394
435
+ unstructured_ingest/v2/processes/connectors/google_drive.py,sha256=QzcHNelUbnubsDtanFIgDCRzmYTuP-GjJ_g9y8fButE,19623
436
436
  unstructured_ingest/v2/processes/connectors/kdbai.py,sha256=VRDAiou_7oWOIAgQTdOGQWxudzQEDopXM8XkfkQ2j6g,5004
437
437
  unstructured_ingest/v2/processes/connectors/local.py,sha256=ZvWTj6ZYkwnvQMNFsZWoaQyp9zp0WVqAywMaHJ2kcAc,7153
438
438
  unstructured_ingest/v2/processes/connectors/milvus.py,sha256=wmcu9NVy3gYlQGT25inN5w_QrhFoL8-hRq0pJFSNw8g,8866
439
439
  unstructured_ingest/v2/processes/connectors/mongodb.py,sha256=cL0QUQZF_s2brh3nNNeAywXVpaIiND4b5JTAFlYjLjw,14273
440
- unstructured_ingest/v2/processes/connectors/neo4j.py,sha256=HU1IwchTM7Q1kkeIFVe-Lg6gInMItBpgkDkVwuTvkGY,14259
440
+ unstructured_ingest/v2/processes/connectors/neo4j.py,sha256=sjwQWp6gPP_MR8vh4aaMJUzPmkGT_3FODTlB5-7tVh0,17525
441
441
  unstructured_ingest/v2/processes/connectors/onedrive.py,sha256=EM9fq67RsiudZvZbi6nDXkS-i6W0xLvbkNvD0G-Ni5E,17779
442
442
  unstructured_ingest/v2/processes/connectors/outlook.py,sha256=KgNGM8hImRhy6_SpswRP2VwRD4VOrqqJoySgxf2oduI,9290
443
443
  unstructured_ingest/v2/processes/connectors/pinecone.py,sha256=U5gSa8S08JvCwmAhE8aV0yxGTIFnUlKVsQDybE8Fqb8,10746
@@ -558,7 +558,7 @@ unstructured_ingest/v2/processes/connectors/sql/__init__.py,sha256=NSEZwJDHh_9kF
558
558
  unstructured_ingest/v2/processes/connectors/sql/databricks_delta_tables.py,sha256=xbZ90rmehiCnBoqFXMz-3ZMXeYb0PzWB6iobCNSHTmQ,8955
559
559
  unstructured_ingest/v2/processes/connectors/sql/postgres.py,sha256=BATfX1PQGT2kl8jAbdNKXTojYKJxh3pJV9-h3OBnHGo,5124
560
560
  unstructured_ingest/v2/processes/connectors/sql/singlestore.py,sha256=OPBDQ2c_5KjWHEFfqXxf3pQ2tWC-N4MtslMulMgP1Wc,5503
561
- unstructured_ingest/v2/processes/connectors/sql/snowflake.py,sha256=QE-WBqrPVjCgcxR5EdVD9iTHBjgDSSSQgWYvq5N61qU,7746
561
+ unstructured_ingest/v2/processes/connectors/sql/snowflake.py,sha256=0hfiX_u7V38k_RfoeDmXJp8WIHZ19ilIHnrgZVSleKw,9270
562
562
  unstructured_ingest/v2/processes/connectors/sql/sql.py,sha256=F5PPUxt2W8JaAQGfz5Od0FvKqYa15RfwMIlnrdJu1nk,15317
563
563
  unstructured_ingest/v2/processes/connectors/sql/sqlite.py,sha256=PRjN_S7UQv0k4ZpSyclW1AJrsrugyxbR-GoOrHvBpks,5200
564
564
  unstructured_ingest/v2/processes/connectors/sql/vastdb.py,sha256=0rxrb1ByXIefB9umzMTEJbpvzdTttXHK5DjRY97-GG8,9618
@@ -567,9 +567,9 @@ unstructured_ingest/v2/processes/connectors/weaviate/cloud.py,sha256=bXtfEYLquR-
567
567
  unstructured_ingest/v2/processes/connectors/weaviate/embedded.py,sha256=S8Zg8StuZT-k7tCg1D5YShO1-vJYYk9-M1bE1fIqx64,3014
568
568
  unstructured_ingest/v2/processes/connectors/weaviate/local.py,sha256=LuTBKPseVewsz8VqxRPRLfGEm3BeI9nBZxpy7ZU5tOA,2201
569
569
  unstructured_ingest/v2/processes/connectors/weaviate/weaviate.py,sha256=yJza_jBSEFnzZRq5L6vJ0Mm3uS1uxkOiKIimPpUyQds,12418
570
- unstructured_ingest-0.5.1.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
571
- unstructured_ingest-0.5.1.dist-info/METADATA,sha256=4fo4K5ac0RNRlWGGyNumZ5gXJf-0PwknZWjS6HvAD6w,8051
572
- unstructured_ingest-0.5.1.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
573
- unstructured_ingest-0.5.1.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
574
- unstructured_ingest-0.5.1.dist-info/top_level.txt,sha256=DMuDMHZRMdeay8v8Kdi855muIv92F0OkutvBCaBEW6M,25
575
- unstructured_ingest-0.5.1.dist-info/RECORD,,
570
+ unstructured_ingest-0.5.3.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
571
+ unstructured_ingest-0.5.3.dist-info/METADATA,sha256=Ypb6HJHp4T_Y7kfL2hmU03MfYFJYe8LptQZ4JzzRFEY,8316
572
+ unstructured_ingest-0.5.3.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
573
+ unstructured_ingest-0.5.3.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
574
+ unstructured_ingest-0.5.3.dist-info/top_level.txt,sha256=DMuDMHZRMdeay8v8Kdi855muIv92F0OkutvBCaBEW6M,25
575
+ unstructured_ingest-0.5.3.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (75.1.0)
2
+ Generator: setuptools (75.8.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5