unstructured-ingest 0.0.19__py3-none-any.whl → 0.0.22__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (47) hide show
  1. unstructured_ingest/__version__.py +1 -1
  2. unstructured_ingest/cli/cmds/astradb.py +2 -2
  3. unstructured_ingest/connector/astradb.py +54 -24
  4. unstructured_ingest/embed/bedrock.py +56 -19
  5. unstructured_ingest/embed/huggingface.py +22 -22
  6. unstructured_ingest/embed/interfaces.py +11 -4
  7. unstructured_ingest/embed/mixedbreadai.py +17 -17
  8. unstructured_ingest/embed/octoai.py +7 -7
  9. unstructured_ingest/embed/openai.py +15 -20
  10. unstructured_ingest/embed/vertexai.py +25 -17
  11. unstructured_ingest/embed/voyageai.py +22 -17
  12. unstructured_ingest/v2/cli/base/cmd.py +1 -1
  13. unstructured_ingest/v2/interfaces/connector.py +1 -1
  14. unstructured_ingest/v2/pipeline/pipeline.py +3 -1
  15. unstructured_ingest/v2/pipeline/steps/chunk.py +1 -1
  16. unstructured_ingest/v2/pipeline/steps/download.py +6 -2
  17. unstructured_ingest/v2/pipeline/steps/embed.py +1 -1
  18. unstructured_ingest/v2/pipeline/steps/filter.py +1 -1
  19. unstructured_ingest/v2/pipeline/steps/index.py +4 -2
  20. unstructured_ingest/v2/pipeline/steps/partition.py +1 -1
  21. unstructured_ingest/v2/pipeline/steps/stage.py +3 -1
  22. unstructured_ingest/v2/pipeline/steps/uncompress.py +1 -1
  23. unstructured_ingest/v2/pipeline/steps/upload.py +6 -2
  24. unstructured_ingest/v2/processes/chunker.py +8 -29
  25. unstructured_ingest/v2/processes/connectors/airtable.py +1 -1
  26. unstructured_ingest/v2/processes/connectors/astradb.py +26 -19
  27. unstructured_ingest/v2/processes/connectors/databricks_volumes.py +11 -8
  28. unstructured_ingest/v2/processes/connectors/elasticsearch.py +2 -2
  29. unstructured_ingest/v2/processes/connectors/fsspec/azure.py +31 -5
  30. unstructured_ingest/v2/processes/connectors/fsspec/box.py +31 -2
  31. unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +36 -8
  32. unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +25 -77
  33. unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +30 -1
  34. unstructured_ingest/v2/processes/connectors/fsspec/s3.py +15 -18
  35. unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +22 -1
  36. unstructured_ingest/v2/processes/connectors/milvus.py +2 -2
  37. unstructured_ingest/v2/processes/connectors/opensearch.py +2 -2
  38. unstructured_ingest/v2/processes/partitioner.py +9 -55
  39. unstructured_ingest/v2/unstructured_api.py +87 -0
  40. unstructured_ingest/v2/utils.py +1 -1
  41. unstructured_ingest-0.0.22.dist-info/METADATA +186 -0
  42. {unstructured_ingest-0.0.19.dist-info → unstructured_ingest-0.0.22.dist-info}/RECORD +46 -45
  43. {unstructured_ingest-0.0.19.dist-info → unstructured_ingest-0.0.22.dist-info}/WHEEL +1 -1
  44. unstructured_ingest-0.0.19.dist-info/METADATA +0 -639
  45. {unstructured_ingest-0.0.19.dist-info → unstructured_ingest-0.0.22.dist-info}/LICENSE.md +0 -0
  46. {unstructured_ingest-0.0.19.dist-info → unstructured_ingest-0.0.22.dist-info}/entry_points.txt +0 -0
  47. {unstructured_ingest-0.0.19.dist-info → unstructured_ingest-0.0.22.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,186 @@
1
+ Metadata-Version: 2.1
2
+ Name: unstructured-ingest
3
+ Version: 0.0.22
4
+ Summary: A library that prepares raw documents for downstream ML tasks.
5
+ Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
+ Author: Unstructured Technologies
7
+ Author-email: devops@unstructuredai.io
8
+ License: Apache-2.0
9
+ Keywords: NLP PDF HTML CV XML parsing preprocessing
10
+ Classifier: Development Status :: 4 - Beta
11
+ Classifier: Intended Audience :: Developers
12
+ Classifier: Intended Audience :: Education
13
+ Classifier: Intended Audience :: Science/Research
14
+ Classifier: License :: OSI Approved :: Apache Software License
15
+ Classifier: Operating System :: OS Independent
16
+ Classifier: Programming Language :: Python :: 3
17
+ Classifier: Programming Language :: Python :: 3.9
18
+ Classifier: Programming Language :: Python :: 3.10
19
+ Classifier: Programming Language :: Python :: 3.11
20
+ Classifier: Programming Language :: Python :: 3.12
21
+ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
+ Requires-Python: >=3.9.0,<3.13
23
+ Description-Content-Type: text/markdown
24
+ License-File: LICENSE.md
25
+ Requires-Dist: pandas
26
+ Requires-Dist: dataclasses-json
27
+ Requires-Dist: opentelemetry-sdk
28
+ Requires-Dist: python-dateutil
29
+ Requires-Dist: click
30
+ Requires-Dist: tqdm
31
+ Requires-Dist: pydantic>=2.7
32
+ Provides-Extra: airtable
33
+ Requires-Dist: pyairtable; extra == "airtable"
34
+ Provides-Extra: astradb
35
+ Requires-Dist: astrapy; extra == "astradb"
36
+ Provides-Extra: azure
37
+ Requires-Dist: adlfs; extra == "azure"
38
+ Requires-Dist: fsspec; extra == "azure"
39
+ Provides-Extra: azure-cognitive-search
40
+ Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
41
+ Provides-Extra: bedrock
42
+ Requires-Dist: boto3; extra == "bedrock"
43
+ Provides-Extra: biomed
44
+ Requires-Dist: bs4; extra == "biomed"
45
+ Requires-Dist: requests; extra == "biomed"
46
+ Provides-Extra: box
47
+ Requires-Dist: boxfs; extra == "box"
48
+ Requires-Dist: fsspec; extra == "box"
49
+ Provides-Extra: chroma
50
+ Requires-Dist: chromadb; extra == "chroma"
51
+ Provides-Extra: clarifai
52
+ Requires-Dist: clarifai; extra == "clarifai"
53
+ Provides-Extra: confluence
54
+ Requires-Dist: atlassian-python-api; extra == "confluence"
55
+ Requires-Dist: requests; extra == "confluence"
56
+ Provides-Extra: couchbase
57
+ Requires-Dist: couchbase; extra == "couchbase"
58
+ Provides-Extra: csv
59
+ Requires-Dist: unstructured[tsv]; extra == "csv"
60
+ Provides-Extra: databricks-volumes
61
+ Requires-Dist: databricks-sdk; extra == "databricks-volumes"
62
+ Provides-Extra: delta-table
63
+ Requires-Dist: deltalake; extra == "delta-table"
64
+ Requires-Dist: fsspec; extra == "delta-table"
65
+ Provides-Extra: discord
66
+ Requires-Dist: discord-py; extra == "discord"
67
+ Provides-Extra: doc
68
+ Requires-Dist: unstructured[docx]; extra == "doc"
69
+ Provides-Extra: docx
70
+ Requires-Dist: unstructured[docx]; extra == "docx"
71
+ Provides-Extra: dropbox
72
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
73
+ Requires-Dist: fsspec; extra == "dropbox"
74
+ Provides-Extra: elasticsearch
75
+ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
76
+ Provides-Extra: embed-huggingface
77
+ Requires-Dist: sentence-transformers; extra == "embed-huggingface"
78
+ Provides-Extra: embed-mixedbreadai
79
+ Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
80
+ Provides-Extra: embed-octoai
81
+ Requires-Dist: openai; extra == "embed-octoai"
82
+ Requires-Dist: tiktoken; extra == "embed-octoai"
83
+ Provides-Extra: embed-vertexai
84
+ Requires-Dist: vertexai; extra == "embed-vertexai"
85
+ Provides-Extra: embed-voyageai
86
+ Requires-Dist: voyageai; extra == "embed-voyageai"
87
+ Provides-Extra: epub
88
+ Requires-Dist: unstructured[epub]; extra == "epub"
89
+ Provides-Extra: gcs
90
+ Requires-Dist: bs4; extra == "gcs"
91
+ Requires-Dist: gcsfs; extra == "gcs"
92
+ Requires-Dist: fsspec; extra == "gcs"
93
+ Provides-Extra: github
94
+ Requires-Dist: pygithub>1.58.0; extra == "github"
95
+ Requires-Dist: requests; extra == "github"
96
+ Provides-Extra: gitlab
97
+ Requires-Dist: python-gitlab; extra == "gitlab"
98
+ Provides-Extra: google-drive
99
+ Requires-Dist: google-api-python-client; extra == "google-drive"
100
+ Provides-Extra: hubspot
101
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
102
+ Requires-Dist: urllib3; extra == "hubspot"
103
+ Provides-Extra: jira
104
+ Requires-Dist: atlassian-python-api; extra == "jira"
105
+ Provides-Extra: kafka
106
+ Requires-Dist: confluent-kafka; extra == "kafka"
107
+ Provides-Extra: kdbai
108
+ Requires-Dist: kdbai-client; extra == "kdbai"
109
+ Provides-Extra: md
110
+ Requires-Dist: unstructured[md]; extra == "md"
111
+ Provides-Extra: milvus
112
+ Requires-Dist: pymilvus; extra == "milvus"
113
+ Provides-Extra: mongodb
114
+ Requires-Dist: pymongo; extra == "mongodb"
115
+ Provides-Extra: msg
116
+ Requires-Dist: unstructured[msg]; extra == "msg"
117
+ Provides-Extra: notion
118
+ Requires-Dist: httpx; extra == "notion"
119
+ Requires-Dist: notion-client; extra == "notion"
120
+ Requires-Dist: htmlBuilder; extra == "notion"
121
+ Requires-Dist: backoff; extra == "notion"
122
+ Provides-Extra: odt
123
+ Requires-Dist: unstructured[odt]; extra == "odt"
124
+ Provides-Extra: onedrive
125
+ Requires-Dist: msal; extra == "onedrive"
126
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
127
+ Requires-Dist: bs4; extra == "onedrive"
128
+ Provides-Extra: openai
129
+ Requires-Dist: openai; extra == "openai"
130
+ Requires-Dist: tiktoken; extra == "openai"
131
+ Provides-Extra: opensearch
132
+ Requires-Dist: opensearch-py; extra == "opensearch"
133
+ Provides-Extra: org
134
+ Requires-Dist: unstructured[org]; extra == "org"
135
+ Provides-Extra: outlook
136
+ Requires-Dist: msal; extra == "outlook"
137
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
138
+ Provides-Extra: pdf
139
+ Requires-Dist: unstructured[pdf]; extra == "pdf"
140
+ Provides-Extra: pinecone
141
+ Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
142
+ Provides-Extra: postgres
143
+ Requires-Dist: psycopg2-binary; extra == "postgres"
144
+ Provides-Extra: ppt
145
+ Requires-Dist: unstructured[pptx]; extra == "ppt"
146
+ Provides-Extra: pptx
147
+ Requires-Dist: unstructured[pptx]; extra == "pptx"
148
+ Provides-Extra: qdrant
149
+ Requires-Dist: qdrant-client; extra == "qdrant"
150
+ Provides-Extra: reddit
151
+ Requires-Dist: praw; extra == "reddit"
152
+ Provides-Extra: remote
153
+ Requires-Dist: unstructured-client>=0.25.8; extra == "remote"
154
+ Provides-Extra: rst
155
+ Requires-Dist: unstructured[rst]; extra == "rst"
156
+ Provides-Extra: rtf
157
+ Requires-Dist: unstructured[rtf]; extra == "rtf"
158
+ Provides-Extra: s3
159
+ Requires-Dist: s3fs; extra == "s3"
160
+ Requires-Dist: fsspec; extra == "s3"
161
+ Provides-Extra: salesforce
162
+ Requires-Dist: simple-salesforce; extra == "salesforce"
163
+ Provides-Extra: sftp
164
+ Requires-Dist: fsspec; extra == "sftp"
165
+ Requires-Dist: paramiko; extra == "sftp"
166
+ Provides-Extra: sharepoint
167
+ Requires-Dist: msal; extra == "sharepoint"
168
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
169
+ Provides-Extra: singlestore
170
+ Requires-Dist: singlestoredb; extra == "singlestore"
171
+ Provides-Extra: slack
172
+ Requires-Dist: slack-sdk; extra == "slack"
173
+ Provides-Extra: tsv
174
+ Requires-Dist: unstructured[tsv]; extra == "tsv"
175
+ Provides-Extra: vectara
176
+ Requires-Dist: requests; extra == "vectara"
177
+ Provides-Extra: weaviate
178
+ Requires-Dist: weaviate-client; extra == "weaviate"
179
+ Provides-Extra: wikipedia
180
+ Requires-Dist: wikipedia; extra == "wikipedia"
181
+ Provides-Extra: xlsx
182
+ Requires-Dist: unstructured[xlsx]; extra == "xlsx"
183
+
184
+ # Unstructured Ingest
185
+
186
+ For details, see the [Unstructured Ingest overview](https://docs.unstructured.io/ingestion/overview) in the Unstructured documentation.
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=UrqvjMtyRqmfxHactmUZmtzBzqFVCEoTlMEeH_VmexE,43
2
+ unstructured_ingest/__version__.py,sha256=s86WG6OgfRK15ii3W6pb0AczHH8T1QB33x5r6twQpCY,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/interfaces.py,sha256=LuY-85clq5iyOtDd9vDABjK2MZCm6wRWK53cdb4SROY,31411
5
5
  unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
@@ -17,7 +17,7 @@ unstructured_ingest/cli/base/dest.py,sha256=uN44l7kPErm_BQqKFUgaiz_Xu6UKk-mnB1B8
17
17
  unstructured_ingest/cli/base/src.py,sha256=gDLZlBuOCEGMAAFCLkoURFQKmrmE34WQ5DbT0w1ssy4,2179
18
18
  unstructured_ingest/cli/cmds/__init__.py,sha256=TtVhAdlPv7e1DKYZ_D2q0wauE-1IjF-AtHp0RIskoD8,5932
19
19
  unstructured_ingest/cli/cmds/airtable.py,sha256=SgdUztUCFbabWP3K937TwdYlhrdY2PUtE4TXUHfBGtw,2629
20
- unstructured_ingest/cli/cmds/astradb.py,sha256=T5Ccz29BDNewuHlL1PN5MDnBggQ93o2lGZgxDgTNtys,2931
20
+ unstructured_ingest/cli/cmds/astradb.py,sha256=2subkQvVHOxSs98Zu3bPKtIUl-uzjNEMarcYQaPYCh0,2929
21
21
  unstructured_ingest/cli/cmds/azure_cognitive_search.py,sha256=PcM55PtpRMHbP69trW0JCTz-gx6tKMLUaMU4GGXv0g8,1927
22
22
  unstructured_ingest/cli/cmds/biomed.py,sha256=M2jc7_-EvbAeDtDwtZNrPI48QJ1Tm401LcSUD0Ayd20,1442
23
23
  unstructured_ingest/cli/cmds/chroma.py,sha256=zO17L7LgUaDfKutfQjSE-QjZJcREyeSpWZetja243lE,3267
@@ -59,7 +59,7 @@ unstructured_ingest/cli/cmds/fsspec/s3.py,sha256=v-24oFxhabdShryK2dhP4cDBvVyoQ-8
59
59
  unstructured_ingest/cli/cmds/fsspec/sftp.py,sha256=TCB7sf_GYoifryQbbttknYSt9Q1kRCPtu8B8QgXl3lw,1537
60
60
  unstructured_ingest/connector/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
61
61
  unstructured_ingest/connector/airtable.py,sha256=KcLt-FEabO9D5ev5E4xUf06VYHpYpypP-adTVyhGcb8,10585
62
- unstructured_ingest/connector/astradb.py,sha256=kDDcITwmUqgZ2y0cYMxMIsEr3c7s8SXrRI1LplTRlos,8635
62
+ unstructured_ingest/connector/astradb.py,sha256=jU2rS5Xips6eNNrHvNIxIYD-2u7wwPzW08aMc5NKZOE,9814
63
63
  unstructured_ingest/connector/azure_cognitive_search.py,sha256=cqQdAaEzt4coU7sxnl4GY8Em4a6azFLyAKM6enkmjBA,5850
64
64
  unstructured_ingest/connector/biomed.py,sha256=uwtBuKzpHfxbJckHAHcsnKo4dTCdag66tCDtCqKNSZM,10847
65
65
  unstructured_ingest/connector/chroma.py,sha256=Nma6HebQxNY7CCWwWArkX3kMXf2xVv6L-jrfRjMi9LE,5713
@@ -167,14 +167,14 @@ unstructured_ingest/connector/notion/types/database_properties/unique_id.py,sha2
167
167
  unstructured_ingest/connector/notion/types/database_properties/url.py,sha256=iXQ2tVUm9UlKVtDA0NQiFIRJ5PHYW9wOaWt2vFfSVCg,862
168
168
  unstructured_ingest/connector/notion/types/database_properties/verification.py,sha256=J_DLjY-v2T6xDGMQ7FkI0YMKMA6SG6Y3yYW7qUD1hKA,2334
169
169
  unstructured_ingest/embed/__init__.py,sha256=whnTiGsSbNqaLObr058CKG5iGxk5OkN_41IBEtHQYW8,900
170
- unstructured_ingest/embed/bedrock.py,sha256=5uq1S9-7uKaaHiniohm1HXNLhudIYN9TEcctUe2JIpM,2514
171
- unstructured_ingest/embed/huggingface.py,sha256=fHgZ865I2Efs3QT43n57gmccF9sBzI6T4yhcu_r7zwM,2727
172
- unstructured_ingest/embed/interfaces.py,sha256=O_USsEcVHRzE2dpHCJEJWKq04NLfdAnm55ZHHTQ3GO0,900
173
- unstructured_ingest/embed/mixedbreadai.py,sha256=wMdY1a4PyynguIZQ4fPFImKGk9ryqHv0NRL3e3iSPEI,5491
174
- unstructured_ingest/embed/octoai.py,sha256=ERJby6VdqcIO6NLTqLXVHmX7LNIM0Fsmhf3dn10Z4is,2347
175
- unstructured_ingest/embed/openai.py,sha256=zOh3GHg1sPVUd3YzZLS5JIV21emYyrCHGYzqH5MIAiY,2250
176
- unstructured_ingest/embed/vertexai.py,sha256=DuOQNHUzickx9kIobfIz2RjhJ712OsZhIoYJiXxaMco,3309
177
- unstructured_ingest/embed/voyageai.py,sha256=PwyW-_dXZT1AGSkeF3c2heM-pdBxciUxdtP7PluCauY,2430
170
+ unstructured_ingest/embed/bedrock.py,sha256=5-pKWwOEGHKOHa06wYuKOhvT8Xu72ke6nrpCnRtkAaU,3872
171
+ unstructured_ingest/embed/huggingface.py,sha256=ku_JQr72KBG8n5b6KRkXIbeBGzdgLw_KKIEm1dFK3oM,2729
172
+ unstructured_ingest/embed/interfaces.py,sha256=L5WimR69bmEvliIBlZ8wOCH_YDA9DWteCu6QEsKCV5I,1113
173
+ unstructured_ingest/embed/mixedbreadai.py,sha256=NSrAt1_bjphTHLUnlzzWSBU25UBCZlpYaLdWSRSGyqs,5504
174
+ unstructured_ingest/embed/octoai.py,sha256=0zxAUAMzodGkqMwqMkEvSfgWLNHtEnhdvUofvJDQD1A,2368
175
+ unstructured_ingest/embed/openai.py,sha256=4Ee4A2rQ8OlSh_yiJSFmok_qqRDi1A3KyayB5YiPLFw,2058
176
+ unstructured_ingest/embed/vertexai.py,sha256=pclpjjacvGTex74tD_3yZKhR-X5BR0fAHbgZUE62uh0,3608
177
+ unstructured_ingest/embed/voyageai.py,sha256=8l-EGVdOcR9jLoc0DV4aPOvJsvRnInI8w12C9jxiUWA,2664
178
178
  unstructured_ingest/enhanced_dataclass/__init__.py,sha256=gDZOUsv5eo-8jm4Yu7DdDwi101aGbfG7JctTdOYnTOM,151
179
179
  unstructured_ingest/enhanced_dataclass/core.py,sha256=d6aUkDynuKX87cHx9_N5UDUWrvISR4jYRFRTvd_avlI,3038
180
180
  unstructured_ingest/enhanced_dataclass/dataclasses.py,sha256=aZMsoCzAGRb8Rmh3BTSBFtNr6FmFTY93KYGLk3gYJKQ,1949
@@ -265,12 +265,13 @@ unstructured_ingest/v2/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LG
265
265
  unstructured_ingest/v2/logger.py,sha256=wcln4s5Nyp2fjjJux9iM3d6t9aQFNJ2H1IAZXmIknjI,4323
266
266
  unstructured_ingest/v2/main.py,sha256=WFdLEqEXRy6E9_G-dF20MK2AtgX51Aan1sp_N67U2B8,172
267
267
  unstructured_ingest/v2/otel.py,sha256=2fGj1c7cVcC3J8NwL6MNYhyPEAXiB33DsilvRDkrdLo,4130
268
- unstructured_ingest/v2/utils.py,sha256=9LnhpI8Otpq5HPcN2Dtkp7APD_euq1ylKhIsybuK99Y,1714
268
+ unstructured_ingest/v2/unstructured_api.py,sha256=1EQVuL-TojmFxWoWFzXr1oCFPEC3IkCQqhjXM8spdTY,3373
269
+ unstructured_ingest/v2/utils.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3rJn1PHTI_G_A_EHY,1720
269
270
  unstructured_ingest/v2/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
270
271
  unstructured_ingest/v2/cli/cli.py,sha256=qHXIs-PcvMgDZhP1AR9iDMxh8FXBMJCEDksPBfiMULE,648
271
272
  unstructured_ingest/v2/cli/cmds.py,sha256=wWUTbvvxEqKAy6bNE6XhPnj0ELMeSbb9_r1NZl58xMM,489
272
273
  unstructured_ingest/v2/cli/base/__init__.py,sha256=zXCa7F4FMqItmzxfUIVmyI-CeGh8X85yF8lRxwX_OYQ,83
273
- unstructured_ingest/v2/cli/base/cmd.py,sha256=a2NE9ZjUfuLIevz0aEs25UsLGCOroJwI-bPc6vBrMCw,11484
274
+ unstructured_ingest/v2/cli/base/cmd.py,sha256=fO1gXvMFgRMoXgVF4Nwk8J-MYU-U59ubchZU_Gx1mK4,11490
274
275
  unstructured_ingest/v2/cli/base/dest.py,sha256=zDjqek7anr0JQ2ptEl8KIAsUXuCuHRnBQnJhoPj4NVM,3198
275
276
  unstructured_ingest/v2/cli/base/importer.py,sha256=nRt0QQ3qpi264-n_mR0l55C2ddM8nowTNzT1jsWaam8,1128
276
277
  unstructured_ingest/v2/cli/base/src.py,sha256=cpQ43qQju4e5s_YSaPxUtA70BaisRkTBdjtlPhqn5Mg,2872
@@ -278,7 +279,7 @@ unstructured_ingest/v2/cli/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRk
278
279
  unstructured_ingest/v2/cli/utils/click.py,sha256=Wn2s3PuvBCKB0lsK-W7X_Y0eYyWnS6Y9wWo1OhVBOzY,6344
279
280
  unstructured_ingest/v2/cli/utils/model_conversion.py,sha256=73DKHQQ6Tm0Lz5NCRduDlyfOhY2KH-MZN1n6jUgrsuU,7480
280
281
  unstructured_ingest/v2/interfaces/__init__.py,sha256=Rfa8crx6De7WNOK-EjsWWwFVpsUfCc6gY8B8tQ3ae9I,899
281
- unstructured_ingest/v2/interfaces/connector.py,sha256=Lm7wJTlKUfVKJjk-BchS0RtZ9_Lo9tzZ62rPtF3HOGY,759
282
+ unstructured_ingest/v2/interfaces/connector.py,sha256=KG0pHdAcpuO5h72xrAkJzADmjxbav31TZ2Wo3PBvwT0,765
282
283
  unstructured_ingest/v2/interfaces/downloader.py,sha256=PKT1kr79Mz1urW_8xCyq9sBuK93gDvyTXg5e4ma4htU,2871
283
284
  unstructured_ingest/v2/interfaces/file_data.py,sha256=ieJK-hqHCEOmoYNGoFbCHziSaZyMtRS9VpSoYbwoKCE,1944
284
285
  unstructured_ingest/v2/interfaces/indexer.py,sha256=Bd1S-gTLsxhJBLEh1lYm_gXqwQLaEZMoqPq9yGxtN_E,713
@@ -289,39 +290,39 @@ unstructured_ingest/v2/interfaces/uploader.py,sha256=JmZDl1blJa5rS61YHCae3Hfet84
289
290
  unstructured_ingest/v2/pipeline/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
290
291
  unstructured_ingest/v2/pipeline/interfaces.py,sha256=-Y6gPnl-SbNxIx5-dQCmiYSPKUMjivrRlBLIKIUWVeM,8658
291
292
  unstructured_ingest/v2/pipeline/otel.py,sha256=K3pQvWVgWzyOWMKCBUofsH7wTZPJ0Ysw5sLjMBLW41I,1088
292
- unstructured_ingest/v2/pipeline/pipeline.py,sha256=GrcQNotpGl1EtKbpauNh2iHZVNm9vigjEOu7svlUOvM,15660
293
+ unstructured_ingest/v2/pipeline/pipeline.py,sha256=x6hanD7Cj7Wd5MBUvb33UwXQMZxubzwlAiYyBCMukuc,15693
293
294
  unstructured_ingest/v2/pipeline/steps/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
294
- unstructured_ingest/v2/pipeline/steps/chunk.py,sha256=gTIxhkK_n6MC3JbLsqnDsrExmYSl1wSnA_CJsOnVZ3w,3124
295
- unstructured_ingest/v2/pipeline/steps/download.py,sha256=Ld2dp1Znt-BqCcSOkBzBtZV-cGI8Kd-w0wN9Ez9h3Y8,8103
296
- unstructured_ingest/v2/pipeline/steps/embed.py,sha256=zsOZ-FZzJWOqdKKRnvGJ6c8h18d3Wkscx8wEdkGxcmw,3102
297
- unstructured_ingest/v2/pipeline/steps/filter.py,sha256=VAob-9p3bsacv_whb3Hb3rUqA6duL1d-zcUsJg7mxJ8,1188
298
- unstructured_ingest/v2/pipeline/steps/index.py,sha256=0LrzRT-T1-dzZp_ot4ibajaavdhlXdsAwBQXvrEQS2I,2632
299
- unstructured_ingest/v2/pipeline/steps/partition.py,sha256=-jhNtIZwru5gFs3-C_fXXtdRz8NE8MX8Y2ih0iKQKdk,3182
300
- unstructured_ingest/v2/pipeline/steps/stage.py,sha256=ZvP-Rz_A5UkhZNoRUvVgciJbGXlP2WIbN5QIZ9wzP8I,2211
301
- unstructured_ingest/v2/pipeline/steps/uncompress.py,sha256=pEu7VU27Fuu53eqBddAmXihV74A6JTwTfnjKeb__edY,1745
302
- unstructured_ingest/v2/pipeline/steps/upload.py,sha256=G9z8QQe9b_WokI5qyr4UOOqaepEVgwFqMn9pWcta9gI,1917
295
+ unstructured_ingest/v2/pipeline/steps/chunk.py,sha256=rYVcHSXeQSzWszg6VmtYlNc66Gsx-22Ti0BxPyQaJak,3135
296
+ unstructured_ingest/v2/pipeline/steps/download.py,sha256=lzvOl5SoUK6OCCVVeG4CzdPIGj6eKKCGdciNo_0RMNk,8173
297
+ unstructured_ingest/v2/pipeline/steps/embed.py,sha256=-YFvmchdsonWiSXxaD7PJfuUUtMLklaQM_8kZCQxCdM,3113
298
+ unstructured_ingest/v2/pipeline/steps/filter.py,sha256=q7bNieaFMprqoF8Mx7w-ZN6jyA5peiGeTGyPtvcV-uw,1199
299
+ unstructured_ingest/v2/pipeline/steps/index.py,sha256=nfDo-wt5sooKtMHKG7sI42m1L44uw-pxErDlDB1engw,2678
300
+ unstructured_ingest/v2/pipeline/steps/partition.py,sha256=9MQViptxK3ALKco8uE4gK9PpEoGq5JjzyU14C_18blU,3193
301
+ unstructured_ingest/v2/pipeline/steps/stage.py,sha256=cphKgHScLz2rNLZRI5Olsb6dAH-MKGu3p6MYS1BEzkA,2246
302
+ unstructured_ingest/v2/pipeline/steps/uncompress.py,sha256=CFSy4tGp6BAvF0oIwWFN8v4zFzh5pRDeESjEn5iP9hE,1756
303
+ unstructured_ingest/v2/pipeline/steps/upload.py,sha256=zlgXgwReX9TBOdfTpS9hETah4SeSmzPB2g8dAGfLIvM,1987
303
304
  unstructured_ingest/v2/processes/__init__.py,sha256=FaHWSCGyc7GWVnAsNEUUj7L8hT8gCVY3_hUE2VzWtUg,462
304
- unstructured_ingest/v2/processes/chunker.py,sha256=W2qPIddT-QEhHTKpA1krUhBrR0UFOq4nuko2eBjlG_I,6675
305
+ unstructured_ingest/v2/processes/chunker.py,sha256=76PrpCSd8k3DpfdZcl8I10u7vciKzhSV9ZByrrp302g,5476
305
306
  unstructured_ingest/v2/processes/connector_registry.py,sha256=vkEe6jpgdYtZCxMj59s5atWGgmPuxAEXRUoTt-MJ7wc,2198
306
307
  unstructured_ingest/v2/processes/embedder.py,sha256=ZBCIm0oHxWmtUEQYyAjXACqTYPt3LnvXLtoFhu6mu8A,6077
307
308
  unstructured_ingest/v2/processes/filter.py,sha256=kjUmMw2SDq2bme0JCAOxs6cJriIG6Ty09KOznS-xz08,2145
308
- unstructured_ingest/v2/processes/partitioner.py,sha256=KyWCo7qOQb1wyU8GJ2krejWSNE1vWRHvhEl1V_oDEU8,10040
309
+ unstructured_ingest/v2/processes/partitioner.py,sha256=bpqmZDsKKi6qtxNWdIWBfQmr1ccQUhU0axecpGAUf_4,7739
309
310
  unstructured_ingest/v2/processes/uncompress.py,sha256=Z_XfsITGdyaRwhtNUc7bMj5Y2jLuBge8KoK4nxhqKag,2425
310
311
  unstructured_ingest/v2/processes/connectors/__init__.py,sha256=6iBdoH6BW8oMK1ZvEi0IgEchuk0cNUPoNIaikpzeML8,4992
311
- unstructured_ingest/v2/processes/connectors/airtable.py,sha256=LLz3qVhbcZrHXeK1xu8lywj828wsDwYDfSsaNB2CwrA,8915
312
- unstructured_ingest/v2/processes/connectors/astradb.py,sha256=bjlzJVNANnpTxRm8Ba8ZS0KetJ_yxmEyEoPJDwUkcOw,5774
312
+ unstructured_ingest/v2/processes/connectors/airtable.py,sha256=Yi7PEv_FejZ9_y3BPY3gu5YGVfeLh-9YX-qLyQHjJsY,8921
313
+ unstructured_ingest/v2/processes/connectors/astradb.py,sha256=ZctZRfXcOAMBGPkKgHvhTmV_-2F0YN5vqwfY9UCHIlU,5791
313
314
  unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py,sha256=S55v7TXu30rEdgythMBB_2VcuomyMPmcPtLYykbhw_E,8466
314
315
  unstructured_ingest/v2/processes/connectors/chroma.py,sha256=skrxRPHZ8y3JxNa0dt5SVitHiDQ5WVxLvY_kh2-QUrQ,8029
315
316
  unstructured_ingest/v2/processes/connectors/couchbase.py,sha256=SONLywyEfoAlLc-HPabXeGzoiwKnekMHIbRMXd4CGXs,12146
316
- unstructured_ingest/v2/processes/connectors/databricks_volumes.py,sha256=UL_tAMP9uFzU_BQArFlx0RtrR_Z6P6Ksqg5bonxPt4E,5843
317
- unstructured_ingest/v2/processes/connectors/elasticsearch.py,sha256=H8svPr-Yk3UniHT1O9kUd2QhTfrJdzbqRNLFZIMiITQ,16750
317
+ unstructured_ingest/v2/processes/connectors/databricks_volumes.py,sha256=E_4DzeemC4mhZsVuLmSXtfy4MR1MoU6CNyvpRqsKnJU,6030
318
+ unstructured_ingest/v2/processes/connectors/elasticsearch.py,sha256=ojxMUHkLa6ZG50aTGn2YWhDHZ1n38uFRn5p8_ghAIvM,16762
318
319
  unstructured_ingest/v2/processes/connectors/google_drive.py,sha256=7xOQthcqBd9auJxB0nxZlhh1vdjXpMX_CtQZa6YfZz0,13088
319
320
  unstructured_ingest/v2/processes/connectors/kdbai.py,sha256=D71gt8fsPOXi2-Rir8mATw6dRM3BdzYGnn62qG1iaBw,5586
320
321
  unstructured_ingest/v2/processes/connectors/local.py,sha256=a3stgnIkhBbXPIQD0O-RaRM-Eb-szHj9Yy4Fz881-9c,6723
321
- unstructured_ingest/v2/processes/connectors/milvus.py,sha256=oJCsCHgbMSKZ8AphU_vO_R_4OmGv9Nm7gFdNDUmcu7E,7675
322
+ unstructured_ingest/v2/processes/connectors/milvus.py,sha256=ZUlyAQyTt0U1JoapFYHQW3IIaGYY50b3URDSLEAFjtk,7687
322
323
  unstructured_ingest/v2/processes/connectors/mongodb.py,sha256=2_R_hrEAaTU4vJTCK9oKblWTgv6BKjyUhFtC7uq3q2w,4859
323
324
  unstructured_ingest/v2/processes/connectors/onedrive.py,sha256=ZiUo-dFo1LMOvFwphSLRZiR1PcrN8GWLTHhsh4TU6n0,9207
324
- unstructured_ingest/v2/processes/connectors/opensearch.py,sha256=PNkJGLCCkwxLvxKX6vF_0jy-LC4wKu8PCXzmULEo9sk,6755
325
+ unstructured_ingest/v2/processes/connectors/opensearch.py,sha256=dfDSNrWIEk19wuHdlMJpp_SLMOteNPlkDBPlAwu1LVY,6767
325
326
  unstructured_ingest/v2/processes/connectors/pinecone.py,sha256=gCueI1Px7UkI1flNovLMRvcbPGczHI3IlYhOPYlb3WU,6748
326
327
  unstructured_ingest/v2/processes/connectors/salesforce.py,sha256=2CiO2ZZiZ1Y1-nB7wcDlDVcpW2B7ut9wCj66rkkqho0,11616
327
328
  unstructured_ingest/v2/processes/connectors/sharepoint.py,sha256=hOaV5gBcHFc6N5Rbu3MgM-5Aol1ht-QkNIN4PqjvfxE,19665
@@ -330,17 +331,17 @@ unstructured_ingest/v2/processes/connectors/sql.py,sha256=srj2ECKnkGR_iEFBdpa8sx
330
331
  unstructured_ingest/v2/processes/connectors/utils.py,sha256=8kd0g7lo9NqnpaIkjeO-Ut6erhwUNH_gS9koevpe3WE,878
331
332
  unstructured_ingest/v2/processes/connectors/weaviate.py,sha256=Ss0YyD5T6k-00eJ6dr5lSo2H0LcOjVTMmozehyTvnAo,8866
332
333
  unstructured_ingest/v2/processes/connectors/fsspec/__init__.py,sha256=TtdeImM7Ypl_n6sl7I1JqX6bGSG0t_FqvCqE3Cy24og,1846
333
- unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=dzOuy1RuozGnCCFJ6CiE3brijcv5WHBnUVVJXx75bks,6057
334
- unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=_yOII2D1zCnI-ae_G7Fx7lb5GuTiaELIHtIyfeDOKGE,4343
335
- unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=pjDsOVf-a3ERBL3PVop7fI8wIrJc4-51CHzolivLwY8,4686
336
- unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=Ri1TscAbQyIb3QZXDIC3vYJyGRgFWAOrzaQsngsCl-Q,12785
337
- unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=eKcFYwnUNr3TwEGyriV9lvXRo9AZEOw_dvVyibVD0dM,5915
338
- unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=UfI4MxUd74K0i1odJx9KZOfJtvwixL6n2DWvhLOgkfo,6302
339
- unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=NkcU4U2DQWWuM8UHkez67C3SEOZpVyRtmtNS-z-F0Fw,6056
334
+ unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=Y01BuVRql0Kvzc_cdaZE9dDGYjJzrwJu-etfUrEGcUU,7061
335
+ unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=Cjk0LUxqOCDbme0GmnD_5_b1hfStjI23cKw6BquKNrg,5488
336
+ unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=NNAxIRdOQxUncfwhu7J7SnQRM6BSStNOyQZi-4E51iY,5816
337
+ unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=usLzU2NA5D_a1juhja4jyJP_CzW4h-5rZ22bWVwvZGQ,10853
338
+ unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=-_pYHbsBG9FyRyNIaf_xyFbPiiR7pnWEEg_8mp0rIZ8,7053
339
+ unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=je1BDqFWlyMfPa4oAMMNFQLLQtCY9quuqx3xjTwF8OQ,6251
340
+ unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=dwpyqDq0qceCBWX3zM1hiUlgXB4hzX6ObOr-sh-5CJs,6926
340
341
  unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
341
- unstructured_ingest-0.0.19.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
342
- unstructured_ingest-0.0.19.dist-info/METADATA,sha256=zKtqMpSxKXmy-fe4FBx70-JgASRdcxPXXYq9r22FlZI,28507
343
- unstructured_ingest-0.0.19.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
344
- unstructured_ingest-0.0.19.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
345
- unstructured_ingest-0.0.19.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
346
- unstructured_ingest-0.0.19.dist-info/RECORD,,
342
+ unstructured_ingest-0.0.22.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
343
+ unstructured_ingest-0.0.22.dist-info/METADATA,sha256=JteQ0j_D7rNBM7XNdb3dSgJMx26-OV8mLUVqubvhSMY,7108
344
+ unstructured_ingest-0.0.22.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
345
+ unstructured_ingest-0.0.22.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
346
+ unstructured_ingest-0.0.22.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
347
+ unstructured_ingest-0.0.22.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: bdist_wheel (0.44.0)
2
+ Generator: setuptools (75.1.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5