unstructured-ingest 0.7.0__py3-none-any.whl → 0.7.1__py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

@@ -1 +1 @@
1
- __version__ = "0.7.0" # pragma: no cover
1
+ __version__ = "0.7.1" # pragma: no cover
@@ -53,11 +53,14 @@ MAX_BYTES_SIZE = 512_000_000
53
53
 
54
54
  class OnedriveAccessConfig(AccessConfig):
55
55
  client_cred: str = Field(description="Microsoft App client secret")
56
+ password: Optional[str] = Field(description="Service account password", default=None)
56
57
 
57
58
 
58
59
  class OnedriveConnectionConfig(ConnectionConfig):
59
60
  client_id: str = Field(description="Microsoft app client ID")
60
- user_pname: str = Field(description="User principal name, usually is your Azure AD email.")
61
+ user_pname: str = Field(
62
+ description="User principal name or service account, usually your Azure AD email."
63
+ )
61
64
  tenant: str = Field(
62
65
  repr=False, description="ID or domain name associated with your Azure AD instance"
63
66
  )
@@ -74,25 +77,50 @@ class OnedriveConnectionConfig(ConnectionConfig):
74
77
  drive = client.users[self.user_pname].drive
75
78
  return drive
76
79
 
77
- @requires_dependencies(["msal"], extras="onedrive")
80
+ @requires_dependencies(["msal", "requests"], extras="onedrive")
78
81
  def get_token(self):
79
82
  from msal import ConfidentialClientApplication
83
+ from requests import post
84
+
85
+ if self.access_config.get_secret_value().password:
86
+ url = f"https://login.microsoftonline.com/{self.tenant}/oauth2/v2.0/token"
87
+ headers = {"Content-Type": "application/x-www-form-urlencoded"}
88
+ data = {
89
+ "grant_type": "password",
90
+ "username": self.user_pname,
91
+ "password": self.access_config.get_secret_value().password,
92
+ "client_id": self.client_id,
93
+ "client_secret": self.access_config.get_secret_value().client_cred,
94
+ "scope": "https://graph.microsoft.com/.default",
95
+ }
96
+ response = post(url, headers=headers, data=data)
97
+ if response.status_code == 200:
98
+ return response.json()
99
+ else:
100
+ raise SourceConnectionError(
101
+ f"Oauth2 authentication failed with {response.status_code}: {response.text}"
102
+ )
80
103
 
81
- try:
82
- app = ConfidentialClientApplication(
83
- authority=f"{self.authority_url}/{self.tenant}",
84
- client_id=self.client_id,
85
- client_credential=self.access_config.get_secret_value().client_cred,
86
- )
87
- token = app.acquire_token_for_client(scopes=["https://graph.microsoft.com/.default"])
88
- except ValueError as exc:
89
- logger.error("Couldn't set up credentials for OneDrive")
90
- raise exc
91
- if "error" in token:
92
- raise SourceConnectionNetworkError(
93
- "failed to fetch token, {}: {}".format(token["error"], token["error_description"])
94
- )
95
- return token
104
+ else:
105
+ try:
106
+ app = ConfidentialClientApplication(
107
+ authority=f"{self.authority_url}/{self.tenant}",
108
+ client_id=self.client_id,
109
+ client_credential=self.access_config.get_secret_value().client_cred,
110
+ )
111
+ token = app.acquire_token_for_client(
112
+ scopes=["https://graph.microsoft.com/.default"]
113
+ )
114
+ except ValueError as exc:
115
+ logger.error("Couldn't set up credentials.")
116
+ raise exc
117
+ if "error" in token:
118
+ raise SourceConnectionNetworkError(
119
+ "failed to fetch token, {}: {}".format(
120
+ token["error"], token["error_description"]
121
+ )
122
+ )
123
+ return token
96
124
 
97
125
  @requires_dependencies(["office365"], extras="onedrive")
98
126
  def get_client(self) -> "GraphClient":
@@ -100,7 +100,7 @@ class SharepointDownloader(OnedriveDownloader):
100
100
  connector_type: str = CONNECTOR_TYPE
101
101
 
102
102
  @SourceConnectionNetworkError.wrap
103
- @requires_dependencies(["office365"], extras="onedrive")
103
+ @requires_dependencies(["office365"], extras="sharepoint")
104
104
  def _fetch_file(self, file_data: FileData) -> DriveItem:
105
105
  from office365.runtime.client_request_exception import ClientRequestException
106
106
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: unstructured-ingest
3
- Version: 0.7.0
3
+ Version: 0.7.1
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,348 +22,349 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.14
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: click
26
- Requires-Dist: python-dateutil
27
- Requires-Dist: pydantic>=2.7
28
25
  Requires-Dist: opentelemetry-sdk
29
- Requires-Dist: tqdm
30
26
  Requires-Dist: dataclasses_json
31
- Requires-Dist: numpy
27
+ Requires-Dist: click
28
+ Requires-Dist: tqdm
29
+ Requires-Dist: pydantic>=2.7
30
+ Requires-Dist: python-dateutil
32
31
  Requires-Dist: pandas
32
+ Requires-Dist: numpy
33
33
  Provides-Extra: remote
34
34
  Requires-Dist: unstructured-client>=0.30.0; extra == "remote"
35
- Requires-Dist: numpy; extra == "remote"
36
35
  Requires-Dist: pandas; extra == "remote"
36
+ Requires-Dist: numpy; extra == "remote"
37
37
  Provides-Extra: csv
38
38
  Requires-Dist: unstructured[tsv]; extra == "csv"
39
- Requires-Dist: numpy; extra == "csv"
40
39
  Requires-Dist: pandas; extra == "csv"
40
+ Requires-Dist: numpy; extra == "csv"
41
41
  Provides-Extra: doc
42
42
  Requires-Dist: unstructured[docx]; extra == "doc"
43
- Requires-Dist: numpy; extra == "doc"
44
43
  Requires-Dist: pandas; extra == "doc"
44
+ Requires-Dist: numpy; extra == "doc"
45
45
  Provides-Extra: docx
46
46
  Requires-Dist: unstructured[docx]; extra == "docx"
47
- Requires-Dist: numpy; extra == "docx"
48
47
  Requires-Dist: pandas; extra == "docx"
48
+ Requires-Dist: numpy; extra == "docx"
49
49
  Provides-Extra: epub
50
50
  Requires-Dist: unstructured[epub]; extra == "epub"
51
- Requires-Dist: numpy; extra == "epub"
52
51
  Requires-Dist: pandas; extra == "epub"
52
+ Requires-Dist: numpy; extra == "epub"
53
53
  Provides-Extra: md
54
54
  Requires-Dist: unstructured[md]; extra == "md"
55
- Requires-Dist: numpy; extra == "md"
56
55
  Requires-Dist: pandas; extra == "md"
56
+ Requires-Dist: numpy; extra == "md"
57
57
  Provides-Extra: msg
58
58
  Requires-Dist: unstructured[msg]; extra == "msg"
59
- Requires-Dist: numpy; extra == "msg"
60
59
  Requires-Dist: pandas; extra == "msg"
60
+ Requires-Dist: numpy; extra == "msg"
61
61
  Provides-Extra: odt
62
62
  Requires-Dist: unstructured[odt]; extra == "odt"
63
- Requires-Dist: numpy; extra == "odt"
64
63
  Requires-Dist: pandas; extra == "odt"
64
+ Requires-Dist: numpy; extra == "odt"
65
65
  Provides-Extra: org
66
66
  Requires-Dist: unstructured[org]; extra == "org"
67
- Requires-Dist: numpy; extra == "org"
68
67
  Requires-Dist: pandas; extra == "org"
68
+ Requires-Dist: numpy; extra == "org"
69
69
  Provides-Extra: pdf
70
70
  Requires-Dist: unstructured[pdf]; extra == "pdf"
71
- Requires-Dist: numpy; extra == "pdf"
72
71
  Requires-Dist: pandas; extra == "pdf"
72
+ Requires-Dist: numpy; extra == "pdf"
73
73
  Provides-Extra: ppt
74
74
  Requires-Dist: unstructured[pptx]; extra == "ppt"
75
- Requires-Dist: numpy; extra == "ppt"
76
75
  Requires-Dist: pandas; extra == "ppt"
76
+ Requires-Dist: numpy; extra == "ppt"
77
77
  Provides-Extra: pptx
78
78
  Requires-Dist: unstructured[pptx]; extra == "pptx"
79
- Requires-Dist: numpy; extra == "pptx"
80
79
  Requires-Dist: pandas; extra == "pptx"
80
+ Requires-Dist: numpy; extra == "pptx"
81
81
  Provides-Extra: rtf
82
82
  Requires-Dist: unstructured[rtf]; extra == "rtf"
83
- Requires-Dist: numpy; extra == "rtf"
84
83
  Requires-Dist: pandas; extra == "rtf"
84
+ Requires-Dist: numpy; extra == "rtf"
85
85
  Provides-Extra: rst
86
86
  Requires-Dist: unstructured[rst]; extra == "rst"
87
- Requires-Dist: numpy; extra == "rst"
88
87
  Requires-Dist: pandas; extra == "rst"
88
+ Requires-Dist: numpy; extra == "rst"
89
89
  Provides-Extra: tsv
90
90
  Requires-Dist: unstructured[tsv]; extra == "tsv"
91
- Requires-Dist: numpy; extra == "tsv"
92
91
  Requires-Dist: pandas; extra == "tsv"
92
+ Requires-Dist: numpy; extra == "tsv"
93
93
  Provides-Extra: xlsx
94
94
  Requires-Dist: unstructured[xlsx]; extra == "xlsx"
95
- Requires-Dist: numpy; extra == "xlsx"
96
95
  Requires-Dist: pandas; extra == "xlsx"
96
+ Requires-Dist: numpy; extra == "xlsx"
97
97
  Provides-Extra: airtable
98
98
  Requires-Dist: pyairtable; extra == "airtable"
99
- Requires-Dist: numpy; extra == "airtable"
100
99
  Requires-Dist: pandas; extra == "airtable"
100
+ Requires-Dist: numpy; extra == "airtable"
101
101
  Provides-Extra: astradb
102
102
  Requires-Dist: astrapy; extra == "astradb"
103
- Requires-Dist: numpy; extra == "astradb"
104
103
  Requires-Dist: pandas; extra == "astradb"
104
+ Requires-Dist: numpy; extra == "astradb"
105
105
  Provides-Extra: azure
106
106
  Requires-Dist: fsspec; extra == "azure"
107
107
  Requires-Dist: adlfs; extra == "azure"
108
- Requires-Dist: numpy; extra == "azure"
109
108
  Requires-Dist: pandas; extra == "azure"
109
+ Requires-Dist: numpy; extra == "azure"
110
110
  Provides-Extra: azure-ai-search
111
111
  Requires-Dist: azure-search-documents; extra == "azure-ai-search"
112
- Requires-Dist: numpy; extra == "azure-ai-search"
113
112
  Requires-Dist: pandas; extra == "azure-ai-search"
113
+ Requires-Dist: numpy; extra == "azure-ai-search"
114
114
  Provides-Extra: biomed
115
115
  Requires-Dist: bs4; extra == "biomed"
116
116
  Requires-Dist: requests; extra == "biomed"
117
- Requires-Dist: numpy; extra == "biomed"
118
117
  Requires-Dist: pandas; extra == "biomed"
118
+ Requires-Dist: numpy; extra == "biomed"
119
119
  Provides-Extra: box
120
- Requires-Dist: boxfs; extra == "box"
121
120
  Requires-Dist: fsspec; extra == "box"
122
- Requires-Dist: numpy; extra == "box"
121
+ Requires-Dist: boxfs; extra == "box"
123
122
  Requires-Dist: pandas; extra == "box"
123
+ Requires-Dist: numpy; extra == "box"
124
124
  Provides-Extra: chroma
125
125
  Requires-Dist: chromadb; extra == "chroma"
126
- Requires-Dist: numpy; extra == "chroma"
127
126
  Requires-Dist: pandas; extra == "chroma"
127
+ Requires-Dist: numpy; extra == "chroma"
128
128
  Provides-Extra: clarifai
129
129
  Requires-Dist: clarifai; extra == "clarifai"
130
- Requires-Dist: numpy; extra == "clarifai"
131
130
  Requires-Dist: pandas; extra == "clarifai"
131
+ Requires-Dist: numpy; extra == "clarifai"
132
132
  Provides-Extra: confluence
133
- Requires-Dist: atlassian-python-api; extra == "confluence"
134
133
  Requires-Dist: requests; extra == "confluence"
135
- Requires-Dist: numpy; extra == "confluence"
134
+ Requires-Dist: atlassian-python-api; extra == "confluence"
136
135
  Requires-Dist: pandas; extra == "confluence"
136
+ Requires-Dist: numpy; extra == "confluence"
137
137
  Provides-Extra: couchbase
138
138
  Requires-Dist: couchbase; extra == "couchbase"
139
- Requires-Dist: numpy; extra == "couchbase"
140
139
  Requires-Dist: pandas; extra == "couchbase"
140
+ Requires-Dist: numpy; extra == "couchbase"
141
141
  Provides-Extra: delta-table
142
- Requires-Dist: boto3; extra == "delta-table"
143
142
  Requires-Dist: deltalake; extra == "delta-table"
144
- Requires-Dist: numpy; extra == "delta-table"
143
+ Requires-Dist: boto3; extra == "delta-table"
145
144
  Requires-Dist: pandas; extra == "delta-table"
145
+ Requires-Dist: numpy; extra == "delta-table"
146
146
  Provides-Extra: discord
147
147
  Requires-Dist: discord.py; extra == "discord"
148
- Requires-Dist: numpy; extra == "discord"
149
148
  Requires-Dist: pandas; extra == "discord"
149
+ Requires-Dist: numpy; extra == "discord"
150
150
  Provides-Extra: dropbox
151
- Requires-Dist: fsspec; extra == "dropbox"
152
151
  Requires-Dist: dropboxdrivefs; extra == "dropbox"
153
- Requires-Dist: numpy; extra == "dropbox"
152
+ Requires-Dist: fsspec; extra == "dropbox"
154
153
  Requires-Dist: pandas; extra == "dropbox"
154
+ Requires-Dist: numpy; extra == "dropbox"
155
155
  Provides-Extra: duckdb
156
156
  Requires-Dist: duckdb; extra == "duckdb"
157
- Requires-Dist: numpy; extra == "duckdb"
158
157
  Requires-Dist: pandas; extra == "duckdb"
158
+ Requires-Dist: numpy; extra == "duckdb"
159
159
  Provides-Extra: elasticsearch
160
160
  Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
161
- Requires-Dist: numpy; extra == "elasticsearch"
162
161
  Requires-Dist: pandas; extra == "elasticsearch"
162
+ Requires-Dist: numpy; extra == "elasticsearch"
163
163
  Provides-Extra: gcs
164
- Requires-Dist: fsspec; extra == "gcs"
165
164
  Requires-Dist: bs4; extra == "gcs"
165
+ Requires-Dist: fsspec; extra == "gcs"
166
166
  Requires-Dist: gcsfs; extra == "gcs"
167
- Requires-Dist: numpy; extra == "gcs"
168
167
  Requires-Dist: pandas; extra == "gcs"
168
+ Requires-Dist: numpy; extra == "gcs"
169
169
  Provides-Extra: github
170
- Requires-Dist: pygithub>1.58.0; extra == "github"
171
170
  Requires-Dist: requests; extra == "github"
172
- Requires-Dist: numpy; extra == "github"
171
+ Requires-Dist: pygithub>1.58.0; extra == "github"
173
172
  Requires-Dist: pandas; extra == "github"
173
+ Requires-Dist: numpy; extra == "github"
174
174
  Provides-Extra: gitlab
175
175
  Requires-Dist: python-gitlab; extra == "gitlab"
176
- Requires-Dist: numpy; extra == "gitlab"
177
176
  Requires-Dist: pandas; extra == "gitlab"
177
+ Requires-Dist: numpy; extra == "gitlab"
178
178
  Provides-Extra: google-drive
179
179
  Requires-Dist: google-api-python-client; extra == "google-drive"
180
- Requires-Dist: numpy; extra == "google-drive"
181
180
  Requires-Dist: pandas; extra == "google-drive"
181
+ Requires-Dist: numpy; extra == "google-drive"
182
182
  Provides-Extra: hubspot
183
183
  Requires-Dist: hubspot-api-client; extra == "hubspot"
184
184
  Requires-Dist: urllib3; extra == "hubspot"
185
- Requires-Dist: numpy; extra == "hubspot"
186
185
  Requires-Dist: pandas; extra == "hubspot"
186
+ Requires-Dist: numpy; extra == "hubspot"
187
187
  Provides-Extra: ibm-watsonx-s3
188
- Requires-Dist: pyarrow; extra == "ibm-watsonx-s3"
189
- Requires-Dist: httpx; extra == "ibm-watsonx-s3"
190
188
  Requires-Dist: tenacity; extra == "ibm-watsonx-s3"
189
+ Requires-Dist: httpx; extra == "ibm-watsonx-s3"
190
+ Requires-Dist: pyarrow; extra == "ibm-watsonx-s3"
191
191
  Requires-Dist: pyiceberg; extra == "ibm-watsonx-s3"
192
- Requires-Dist: numpy; extra == "ibm-watsonx-s3"
193
192
  Requires-Dist: pandas; extra == "ibm-watsonx-s3"
193
+ Requires-Dist: numpy; extra == "ibm-watsonx-s3"
194
194
  Provides-Extra: jira
195
195
  Requires-Dist: atlassian-python-api; extra == "jira"
196
- Requires-Dist: numpy; extra == "jira"
197
196
  Requires-Dist: pandas; extra == "jira"
197
+ Requires-Dist: numpy; extra == "jira"
198
198
  Provides-Extra: kafka
199
199
  Requires-Dist: confluent-kafka; extra == "kafka"
200
- Requires-Dist: numpy; extra == "kafka"
201
200
  Requires-Dist: pandas; extra == "kafka"
201
+ Requires-Dist: numpy; extra == "kafka"
202
202
  Provides-Extra: kdbai
203
203
  Requires-Dist: kdbai-client>=1.4.0; extra == "kdbai"
204
- Requires-Dist: numpy; extra == "kdbai"
205
204
  Requires-Dist: pandas; extra == "kdbai"
205
+ Requires-Dist: numpy; extra == "kdbai"
206
206
  Provides-Extra: lancedb
207
207
  Requires-Dist: lancedb; extra == "lancedb"
208
- Requires-Dist: numpy; extra == "lancedb"
209
208
  Requires-Dist: pandas; extra == "lancedb"
209
+ Requires-Dist: numpy; extra == "lancedb"
210
210
  Provides-Extra: milvus
211
211
  Requires-Dist: pymilvus; extra == "milvus"
212
- Requires-Dist: numpy; extra == "milvus"
213
212
  Requires-Dist: pandas; extra == "milvus"
213
+ Requires-Dist: numpy; extra == "milvus"
214
214
  Provides-Extra: mongodb
215
215
  Requires-Dist: pymongo; extra == "mongodb"
216
- Requires-Dist: numpy; extra == "mongodb"
217
216
  Requires-Dist: pandas; extra == "mongodb"
217
+ Requires-Dist: numpy; extra == "mongodb"
218
218
  Provides-Extra: neo4j
219
- Requires-Dist: networkx; extra == "neo4j"
220
219
  Requires-Dist: cymple; extra == "neo4j"
221
220
  Requires-Dist: neo4j-rust-ext; extra == "neo4j"
222
- Requires-Dist: numpy; extra == "neo4j"
221
+ Requires-Dist: networkx; extra == "neo4j"
223
222
  Requires-Dist: pandas; extra == "neo4j"
223
+ Requires-Dist: numpy; extra == "neo4j"
224
224
  Provides-Extra: notion
225
- Requires-Dist: htmlBuilder; extra == "notion"
226
- Requires-Dist: httpx; extra == "notion"
227
225
  Requires-Dist: notion-client; extra == "notion"
228
226
  Requires-Dist: backoff; extra == "notion"
229
- Requires-Dist: numpy; extra == "notion"
227
+ Requires-Dist: httpx; extra == "notion"
228
+ Requires-Dist: htmlBuilder; extra == "notion"
230
229
  Requires-Dist: pandas; extra == "notion"
230
+ Requires-Dist: numpy; extra == "notion"
231
231
  Provides-Extra: onedrive
232
- Requires-Dist: bs4; extra == "onedrive"
233
232
  Requires-Dist: msal; extra == "onedrive"
234
233
  Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
235
- Requires-Dist: numpy; extra == "onedrive"
234
+ Requires-Dist: requests; extra == "onedrive"
236
235
  Requires-Dist: pandas; extra == "onedrive"
236
+ Requires-Dist: numpy; extra == "onedrive"
237
237
  Provides-Extra: opensearch
238
238
  Requires-Dist: opensearch-py; extra == "opensearch"
239
- Requires-Dist: numpy; extra == "opensearch"
240
239
  Requires-Dist: pandas; extra == "opensearch"
240
+ Requires-Dist: numpy; extra == "opensearch"
241
241
  Provides-Extra: outlook
242
242
  Requires-Dist: msal; extra == "outlook"
243
243
  Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
244
- Requires-Dist: numpy; extra == "outlook"
245
244
  Requires-Dist: pandas; extra == "outlook"
245
+ Requires-Dist: numpy; extra == "outlook"
246
246
  Provides-Extra: pinecone
247
247
  Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
248
- Requires-Dist: numpy; extra == "pinecone"
249
248
  Requires-Dist: pandas; extra == "pinecone"
249
+ Requires-Dist: numpy; extra == "pinecone"
250
250
  Provides-Extra: postgres
251
251
  Requires-Dist: psycopg2-binary; extra == "postgres"
252
- Requires-Dist: numpy; extra == "postgres"
253
252
  Requires-Dist: pandas; extra == "postgres"
253
+ Requires-Dist: numpy; extra == "postgres"
254
254
  Provides-Extra: qdrant
255
255
  Requires-Dist: qdrant-client; extra == "qdrant"
256
- Requires-Dist: numpy; extra == "qdrant"
257
256
  Requires-Dist: pandas; extra == "qdrant"
257
+ Requires-Dist: numpy; extra == "qdrant"
258
258
  Provides-Extra: reddit
259
259
  Requires-Dist: praw; extra == "reddit"
260
- Requires-Dist: numpy; extra == "reddit"
261
260
  Requires-Dist: pandas; extra == "reddit"
261
+ Requires-Dist: numpy; extra == "reddit"
262
262
  Provides-Extra: redis
263
263
  Requires-Dist: redis; extra == "redis"
264
- Requires-Dist: numpy; extra == "redis"
265
264
  Requires-Dist: pandas; extra == "redis"
265
+ Requires-Dist: numpy; extra == "redis"
266
266
  Provides-Extra: s3
267
267
  Requires-Dist: fsspec; extra == "s3"
268
268
  Requires-Dist: s3fs; extra == "s3"
269
- Requires-Dist: numpy; extra == "s3"
270
269
  Requires-Dist: pandas; extra == "s3"
270
+ Requires-Dist: numpy; extra == "s3"
271
271
  Provides-Extra: sharepoint
272
272
  Requires-Dist: msal; extra == "sharepoint"
273
273
  Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
274
- Requires-Dist: numpy; extra == "sharepoint"
274
+ Requires-Dist: requests; extra == "sharepoint"
275
275
  Requires-Dist: pandas; extra == "sharepoint"
276
+ Requires-Dist: numpy; extra == "sharepoint"
276
277
  Provides-Extra: salesforce
277
278
  Requires-Dist: simple-salesforce; extra == "salesforce"
278
- Requires-Dist: numpy; extra == "salesforce"
279
279
  Requires-Dist: pandas; extra == "salesforce"
280
+ Requires-Dist: numpy; extra == "salesforce"
280
281
  Provides-Extra: sftp
281
- Requires-Dist: fsspec; extra == "sftp"
282
282
  Requires-Dist: paramiko; extra == "sftp"
283
- Requires-Dist: numpy; extra == "sftp"
283
+ Requires-Dist: fsspec; extra == "sftp"
284
284
  Requires-Dist: pandas; extra == "sftp"
285
+ Requires-Dist: numpy; extra == "sftp"
285
286
  Provides-Extra: slack
286
287
  Requires-Dist: slack_sdk[optional]; extra == "slack"
287
- Requires-Dist: numpy; extra == "slack"
288
288
  Requires-Dist: pandas; extra == "slack"
289
+ Requires-Dist: numpy; extra == "slack"
289
290
  Provides-Extra: snowflake
290
291
  Requires-Dist: snowflake-connector-python; extra == "snowflake"
291
292
  Requires-Dist: psycopg2-binary; extra == "snowflake"
292
- Requires-Dist: numpy; extra == "snowflake"
293
293
  Requires-Dist: pandas; extra == "snowflake"
294
+ Requires-Dist: numpy; extra == "snowflake"
294
295
  Provides-Extra: wikipedia
295
296
  Requires-Dist: wikipedia; extra == "wikipedia"
296
- Requires-Dist: numpy; extra == "wikipedia"
297
297
  Requires-Dist: pandas; extra == "wikipedia"
298
+ Requires-Dist: numpy; extra == "wikipedia"
298
299
  Provides-Extra: weaviate
299
300
  Requires-Dist: weaviate-client; extra == "weaviate"
300
- Requires-Dist: numpy; extra == "weaviate"
301
301
  Requires-Dist: pandas; extra == "weaviate"
302
+ Requires-Dist: numpy; extra == "weaviate"
302
303
  Provides-Extra: databricks-volumes
303
304
  Requires-Dist: databricks-sdk; extra == "databricks-volumes"
304
- Requires-Dist: numpy; extra == "databricks-volumes"
305
305
  Requires-Dist: pandas; extra == "databricks-volumes"
306
+ Requires-Dist: numpy; extra == "databricks-volumes"
306
307
  Provides-Extra: databricks-delta-tables
307
308
  Requires-Dist: databricks-sql-connector; extra == "databricks-delta-tables"
308
- Requires-Dist: numpy; extra == "databricks-delta-tables"
309
309
  Requires-Dist: pandas; extra == "databricks-delta-tables"
310
+ Requires-Dist: numpy; extra == "databricks-delta-tables"
310
311
  Provides-Extra: singlestore
311
312
  Requires-Dist: singlestoredb; extra == "singlestore"
312
- Requires-Dist: numpy; extra == "singlestore"
313
313
  Requires-Dist: pandas; extra == "singlestore"
314
+ Requires-Dist: numpy; extra == "singlestore"
314
315
  Provides-Extra: vectara
315
- Requires-Dist: httpx; extra == "vectara"
316
316
  Requires-Dist: requests; extra == "vectara"
317
+ Requires-Dist: httpx; extra == "vectara"
317
318
  Requires-Dist: aiofiles; extra == "vectara"
318
- Requires-Dist: numpy; extra == "vectara"
319
319
  Requires-Dist: pandas; extra == "vectara"
320
+ Requires-Dist: numpy; extra == "vectara"
320
321
  Provides-Extra: vastdb
321
322
  Requires-Dist: ibis; extra == "vastdb"
322
- Requires-Dist: pyarrow; extra == "vastdb"
323
323
  Requires-Dist: vastdb; extra == "vastdb"
324
- Requires-Dist: numpy; extra == "vastdb"
324
+ Requires-Dist: pyarrow; extra == "vastdb"
325
325
  Requires-Dist: pandas; extra == "vastdb"
326
+ Requires-Dist: numpy; extra == "vastdb"
326
327
  Provides-Extra: zendesk
327
328
  Requires-Dist: bs4; extra == "zendesk"
328
329
  Requires-Dist: httpx; extra == "zendesk"
329
330
  Requires-Dist: aiofiles; extra == "zendesk"
330
- Requires-Dist: numpy; extra == "zendesk"
331
331
  Requires-Dist: pandas; extra == "zendesk"
332
+ Requires-Dist: numpy; extra == "zendesk"
332
333
  Provides-Extra: embed-huggingface
333
334
  Requires-Dist: sentence-transformers; extra == "embed-huggingface"
334
- Requires-Dist: numpy; extra == "embed-huggingface"
335
335
  Requires-Dist: pandas; extra == "embed-huggingface"
336
+ Requires-Dist: numpy; extra == "embed-huggingface"
336
337
  Provides-Extra: embed-octoai
337
338
  Requires-Dist: tiktoken; extra == "embed-octoai"
338
339
  Requires-Dist: openai; extra == "embed-octoai"
339
- Requires-Dist: numpy; extra == "embed-octoai"
340
340
  Requires-Dist: pandas; extra == "embed-octoai"
341
+ Requires-Dist: numpy; extra == "embed-octoai"
341
342
  Provides-Extra: embed-vertexai
342
343
  Requires-Dist: vertexai; extra == "embed-vertexai"
343
- Requires-Dist: numpy; extra == "embed-vertexai"
344
344
  Requires-Dist: pandas; extra == "embed-vertexai"
345
+ Requires-Dist: numpy; extra == "embed-vertexai"
345
346
  Provides-Extra: embed-voyageai
346
347
  Requires-Dist: voyageai; extra == "embed-voyageai"
347
- Requires-Dist: numpy; extra == "embed-voyageai"
348
348
  Requires-Dist: pandas; extra == "embed-voyageai"
349
+ Requires-Dist: numpy; extra == "embed-voyageai"
349
350
  Provides-Extra: embed-mixedbreadai
350
351
  Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
351
- Requires-Dist: numpy; extra == "embed-mixedbreadai"
352
352
  Requires-Dist: pandas; extra == "embed-mixedbreadai"
353
+ Requires-Dist: numpy; extra == "embed-mixedbreadai"
353
354
  Provides-Extra: openai
354
355
  Requires-Dist: tiktoken; extra == "openai"
355
356
  Requires-Dist: openai; extra == "openai"
356
- Requires-Dist: numpy; extra == "openai"
357
357
  Requires-Dist: pandas; extra == "openai"
358
+ Requires-Dist: numpy; extra == "openai"
358
359
  Provides-Extra: bedrock
359
360
  Requires-Dist: boto3; extra == "bedrock"
360
361
  Requires-Dist: aioboto3; extra == "bedrock"
361
- Requires-Dist: numpy; extra == "bedrock"
362
362
  Requires-Dist: pandas; extra == "bedrock"
363
+ Requires-Dist: numpy; extra == "bedrock"
363
364
  Provides-Extra: togetherai
364
365
  Requires-Dist: together; extra == "togetherai"
365
- Requires-Dist: numpy; extra == "togetherai"
366
366
  Requires-Dist: pandas; extra == "togetherai"
367
+ Requires-Dist: numpy; extra == "togetherai"
367
368
  Dynamic: author
368
369
  Dynamic: author-email
369
370
  Dynamic: classifier
@@ -134,7 +134,7 @@ test/unit/partitioners/test_partitioner.py,sha256=eJoUDbiKtweyU1WYfsY5KqVqoPjbx1
134
134
  test/unit/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
135
135
  test/unit/utils/data_generator.py,sha256=UoYVNjG4S4wlaA9gceQ82HIpF9_6I1UTHD1_GrQBHp0,973
136
136
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
137
- unstructured_ingest/__version__.py,sha256=bNFs6PBmjE3W8Yh7mMRTUVysaeHwLGXC2y6p_RXYa08,42
137
+ unstructured_ingest/__version__.py,sha256=YP5dlQlaTHZ-KOck8o_UzdjIFae7iENB5d3AMIKlZ3M,42
138
138
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
139
139
  unstructured_ingest/errors_v2.py,sha256=9RuRCi7lbDxCguDz07y5RiHoQiFIOWwOD7xqzJ2B3Yw,436
140
140
  unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
@@ -212,12 +212,12 @@ unstructured_ingest/processes/connectors/local.py,sha256=LluTLKv4g7FbJb4A6vuSxI9
212
212
  unstructured_ingest/processes/connectors/milvus.py,sha256=Jr9cul7By03tGAPFnFBoqncnNWwbhKd-qbmkuqnin8U,8908
213
213
  unstructured_ingest/processes/connectors/mongodb.py,sha256=1g_5bfbS6lah3nsOXqLAanR3zNYJ47_Njw_uV-uj3_U,14324
214
214
  unstructured_ingest/processes/connectors/neo4j.py,sha256=eAM2XWSLA5caKJmbcd7ctn2TapreIJEXRoHoxT1OZwA,18718
215
- unstructured_ingest/processes/connectors/onedrive.py,sha256=4uin_BBgxNUrcjob4txQn2NTFEhWXuWY9uLeQJ4lRbs,18047
215
+ unstructured_ingest/processes/connectors/onedrive.py,sha256=VBkKlbJgR7uKlKTnjNybAw6ZawLKflDPpy2uVvgWYWw,19296
216
216
  unstructured_ingest/processes/connectors/outlook.py,sha256=FfHV9OfajGbj5VQZccqHsSyYJ0f6a4CLGQJi1s9UJjo,9294
217
217
  unstructured_ingest/processes/connectors/pinecone.py,sha256=TG-1hVfOsKFepxPfy2MCwEVBEZF4msg8lfNQZBpo35Y,13980
218
218
  unstructured_ingest/processes/connectors/redisdb.py,sha256=5LX6KtuNCzqjHqnJPw0zdKLE0iLx7Dk5RN9e_KT-up4,6975
219
219
  unstructured_ingest/processes/connectors/salesforce.py,sha256=a2Erx5pXbxKIj--oJWTGk2TeOcdmipuxgleazbD62o4,11664
220
- unstructured_ingest/processes/connectors/sharepoint.py,sha256=E_oKMz3rdn2HumlDUnDyVVmQLSBLB_3gqI48O6oZfTc,4825
220
+ unstructured_ingest/processes/connectors/sharepoint.py,sha256=PowaqMzWr-VCW1rnwcAeRhHyE55kJ9J9FCVlrmtzN0E,4827
221
221
  unstructured_ingest/processes/connectors/slack.py,sha256=e4ntATdht_olAPsco1DKwlrOkpKLyDznPO1NJmsr0A8,9243
222
222
  unstructured_ingest/processes/connectors/utils.py,sha256=TAd0hb1f291N-q7-TUe6JKSCGkhqDyo7Ij8zmliBZUc,2071
223
223
  unstructured_ingest/processes/connectors/vectara.py,sha256=frKJkc7ffstQhXD9-HkAGoQAofGkl6AsnKJhGcl8LgA,12294
@@ -362,9 +362,9 @@ unstructured_ingest/utils/ndjson.py,sha256=nz8VUOPEgAFdhaDOpuveknvCU4x82fVwqE01q
362
362
  unstructured_ingest/utils/pydantic_models.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3rJn1PHTI_G_A_EHY,1720
363
363
  unstructured_ingest/utils/string_and_date_utils.py,sha256=QBj8HXZGvDZQSULLOQwJ8tb3r2aYrTBQ71rkiV6gZdI,2519
364
364
  unstructured_ingest/utils/table.py,sha256=WZechczgVFvlodUWFcsnCGvBNh1xRm6hr0VbJTPxKAc,3669
365
- unstructured_ingest-0.7.0.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
366
- unstructured_ingest-0.7.0.dist-info/METADATA,sha256=Ovs5cLsehNodHgRKxapQvTYZatKSYKWkbeXwK_iSXQo,14998
367
- unstructured_ingest-0.7.0.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
368
- unstructured_ingest-0.7.0.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
369
- unstructured_ingest-0.7.0.dist-info/top_level.txt,sha256=85vUyT6fV2A5eCEM3M3FPRUUI9vZOVK1xVZt7eo1oV8,34
370
- unstructured_ingest-0.7.0.dist-info/RECORD,,
365
+ unstructured_ingest-0.7.1.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
366
+ unstructured_ingest-0.7.1.dist-info/METADATA,sha256=Ex_8EkItZzbGEoRJwR7Fqm_t0aajIZLVdtzwL7XBsQw,15050
367
+ unstructured_ingest-0.7.1.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
368
+ unstructured_ingest-0.7.1.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
369
+ unstructured_ingest-0.7.1.dist-info/top_level.txt,sha256=85vUyT6fV2A5eCEM3M3FPRUUI9vZOVK1xVZt7eo1oV8,34
370
+ unstructured_ingest-0.7.1.dist-info/RECORD,,