unstructured-ingest 0.0.16__py3-none-any.whl → 0.0.18__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

@@ -1 +1 @@
1
- __version__ = "0.0.16" # pragma: no cover
1
+ __version__ = "0.0.18" # pragma: no cover
@@ -2,12 +2,12 @@
2
2
  import json
3
3
  import os
4
4
  from dataclasses import dataclass
5
+ from pathlib import Path
5
6
  from typing import TYPE_CHECKING, Annotated, Any, List, Optional
6
7
 
7
8
  import numpy as np
8
9
  from pydantic import Field, Secret, ValidationError
9
10
  from pydantic.functional_validators import BeforeValidator
10
- from unstructured.utils import FileHandler
11
11
 
12
12
  from unstructured_ingest.embed.interfaces import BaseEmbeddingEncoder, EmbeddingConfig
13
13
  from unstructured_ingest.utils.dep_check import requires_dependencies
@@ -35,10 +35,10 @@ class VertexAIEmbeddingConfig(EmbeddingConfig):
35
35
 
36
36
  def register_application_credentials(self):
37
37
  # TODO look into passing credentials in directly, rather than via env var and tmp file
38
- application_credentials_path = os.path.join("/tmp", "google-vertex-app-credentials.json")
39
- credentials_file = FileHandler(application_credentials_path)
40
- credentials_file.write_file(json.dumps(self.api_key.get_secret_value()))
41
- os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = application_credentials_path
38
+ application_credentials_path = Path("/tmp") / "google-vertex-app-credentials.json"
39
+ with application_credentials_path.open("w+") as credentials_file:
40
+ json.dump(self.api_key.get_secret_value(), credentials_file)
41
+ os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = str(application_credentials_path)
42
42
 
43
43
  @requires_dependencies(
44
44
  ["langchain", "langchain_google_vertexai"],
@@ -102,7 +102,13 @@ class FsspecIndexer(Indexer):
102
102
  fs = get_filesystem_class(self.index_config.protocol)(
103
103
  **self.connection_config.get_access_config(),
104
104
  )
105
- fs.ls(path=self.index_config.path_without_protocol, detail=False)
105
+ files = fs.ls(path=self.index_config.path_without_protocol, detail=True)
106
+ valid_files = [x.get("name") for x in files if x.get("type") == "file"]
107
+ if not valid_files:
108
+ return
109
+ file_to_sample = valid_files[0]
110
+ logger.debug(f"attempting to make HEAD request for file: {file_to_sample}")
111
+ self.fs.head(path=file_to_sample)
106
112
  except Exception as e:
107
113
  logger.error(f"failed to validate connection: {e}", exc_info=True)
108
114
  raise SourceConnectionError(f"failed to validate connection: {e}")
@@ -299,8 +305,8 @@ class FsspecUploader(Uploader):
299
305
  fs = get_filesystem_class(self.upload_config.protocol)(
300
306
  **self.connection_config.get_access_config(),
301
307
  )
302
- root_dir = self.upload_config.path_without_protocol.split("/")[0]
303
- fs.ls(path=root_dir, detail=False)
308
+ upload_path = Path(self.upload_config.path_without_protocol) / "_empty"
309
+ fs.write_bytes(path=str(upload_path), value=b"")
304
310
  except Exception as e:
305
311
  logger.error(f"failed to validate connection: {e}", exc_info=True)
306
312
  raise DestinationConnectionError(f"failed to validate connection: {e}")
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.16
3
+ Version: 0.0.18
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,617 +22,617 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.13
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: tqdm
26
25
  Requires-Dist: python-dateutil
27
- Requires-Dist: pydantic>=2.7
28
26
  Requires-Dist: pandas
27
+ Requires-Dist: pydantic>=2.7
29
28
  Requires-Dist: click
30
- Requires-Dist: dataclasses-json
31
29
  Requires-Dist: opentelemetry-sdk
30
+ Requires-Dist: dataclasses-json
31
+ Requires-Dist: tqdm
32
32
  Provides-Extra: airtable
33
33
  Requires-Dist: pyairtable; extra == "airtable"
34
- Requires-Dist: dataclasses-json; extra == "airtable"
35
- Requires-Dist: tqdm; extra == "airtable"
36
- Requires-Dist: pydantic>=2.7; extra == "airtable"
34
+ Requires-Dist: python-dateutil; extra == "airtable"
37
35
  Requires-Dist: pandas; extra == "airtable"
36
+ Requires-Dist: pydantic>=2.7; extra == "airtable"
38
37
  Requires-Dist: click; extra == "airtable"
39
- Requires-Dist: python-dateutil; extra == "airtable"
40
38
  Requires-Dist: opentelemetry-sdk; extra == "airtable"
39
+ Requires-Dist: dataclasses-json; extra == "airtable"
40
+ Requires-Dist: tqdm; extra == "airtable"
41
41
  Provides-Extra: astradb
42
- Requires-Dist: dataclasses-json; extra == "astradb"
43
42
  Requires-Dist: astrapy; extra == "astradb"
44
- Requires-Dist: tqdm; extra == "astradb"
45
- Requires-Dist: pydantic>=2.7; extra == "astradb"
43
+ Requires-Dist: python-dateutil; extra == "astradb"
46
44
  Requires-Dist: pandas; extra == "astradb"
45
+ Requires-Dist: pydantic>=2.7; extra == "astradb"
47
46
  Requires-Dist: click; extra == "astradb"
48
- Requires-Dist: python-dateutil; extra == "astradb"
49
47
  Requires-Dist: opentelemetry-sdk; extra == "astradb"
48
+ Requires-Dist: dataclasses-json; extra == "astradb"
49
+ Requires-Dist: tqdm; extra == "astradb"
50
50
  Provides-Extra: azure
51
51
  Requires-Dist: fsspec; extra == "azure"
52
+ Requires-Dist: python-dateutil; extra == "azure"
52
53
  Requires-Dist: adlfs; extra == "azure"
53
- Requires-Dist: dataclasses-json; extra == "azure"
54
- Requires-Dist: tqdm; extra == "azure"
55
- Requires-Dist: pydantic>=2.7; extra == "azure"
56
54
  Requires-Dist: pandas; extra == "azure"
55
+ Requires-Dist: pydantic>=2.7; extra == "azure"
57
56
  Requires-Dist: click; extra == "azure"
58
- Requires-Dist: python-dateutil; extra == "azure"
59
57
  Requires-Dist: opentelemetry-sdk; extra == "azure"
58
+ Requires-Dist: dataclasses-json; extra == "azure"
59
+ Requires-Dist: tqdm; extra == "azure"
60
60
  Provides-Extra: azure-cognitive-search
61
- Requires-Dist: dataclasses-json; extra == "azure-cognitive-search"
62
- Requires-Dist: tqdm; extra == "azure-cognitive-search"
63
- Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
64
- Requires-Dist: pydantic>=2.7; extra == "azure-cognitive-search"
61
+ Requires-Dist: python-dateutil; extra == "azure-cognitive-search"
65
62
  Requires-Dist: pandas; extra == "azure-cognitive-search"
63
+ Requires-Dist: pydantic>=2.7; extra == "azure-cognitive-search"
64
+ Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
66
65
  Requires-Dist: click; extra == "azure-cognitive-search"
67
- Requires-Dist: python-dateutil; extra == "azure-cognitive-search"
68
66
  Requires-Dist: opentelemetry-sdk; extra == "azure-cognitive-search"
67
+ Requires-Dist: dataclasses-json; extra == "azure-cognitive-search"
68
+ Requires-Dist: tqdm; extra == "azure-cognitive-search"
69
69
  Provides-Extra: bedrock
70
- Requires-Dist: boto3; extra == "bedrock"
71
- Requires-Dist: dataclasses-json; extra == "bedrock"
72
- Requires-Dist: tqdm; extra == "bedrock"
73
- Requires-Dist: pydantic>=2.7; extra == "bedrock"
74
- Requires-Dist: pandas; extra == "bedrock"
70
+ Requires-Dist: python-dateutil; extra == "bedrock"
75
71
  Requires-Dist: langchain-community; extra == "bedrock"
72
+ Requires-Dist: pandas; extra == "bedrock"
73
+ Requires-Dist: pydantic>=2.7; extra == "bedrock"
74
+ Requires-Dist: boto3; extra == "bedrock"
76
75
  Requires-Dist: click; extra == "bedrock"
77
- Requires-Dist: python-dateutil; extra == "bedrock"
78
76
  Requires-Dist: opentelemetry-sdk; extra == "bedrock"
77
+ Requires-Dist: dataclasses-json; extra == "bedrock"
78
+ Requires-Dist: tqdm; extra == "bedrock"
79
79
  Provides-Extra: biomed
80
- Requires-Dist: dataclasses-json; extra == "biomed"
81
- Requires-Dist: tqdm; extra == "biomed"
80
+ Requires-Dist: python-dateutil; extra == "biomed"
81
+ Requires-Dist: requests; extra == "biomed"
82
82
  Requires-Dist: bs4; extra == "biomed"
83
83
  Requires-Dist: pydantic>=2.7; extra == "biomed"
84
84
  Requires-Dist: pandas; extra == "biomed"
85
85
  Requires-Dist: click; extra == "biomed"
86
- Requires-Dist: python-dateutil; extra == "biomed"
87
- Requires-Dist: requests; extra == "biomed"
88
86
  Requires-Dist: opentelemetry-sdk; extra == "biomed"
87
+ Requires-Dist: dataclasses-json; extra == "biomed"
88
+ Requires-Dist: tqdm; extra == "biomed"
89
89
  Provides-Extra: box
90
90
  Requires-Dist: fsspec; extra == "box"
91
- Requires-Dist: dataclasses-json; extra == "box"
92
- Requires-Dist: tqdm; extra == "box"
93
- Requires-Dist: pydantic>=2.7; extra == "box"
91
+ Requires-Dist: python-dateutil; extra == "box"
94
92
  Requires-Dist: pandas; extra == "box"
93
+ Requires-Dist: pydantic>=2.7; extra == "box"
95
94
  Requires-Dist: click; extra == "box"
96
95
  Requires-Dist: opentelemetry-sdk; extra == "box"
97
- Requires-Dist: python-dateutil; extra == "box"
96
+ Requires-Dist: dataclasses-json; extra == "box"
98
97
  Requires-Dist: boxfs; extra == "box"
98
+ Requires-Dist: tqdm; extra == "box"
99
99
  Provides-Extra: chroma
100
- Requires-Dist: chromadb; extra == "chroma"
101
- Requires-Dist: dataclasses-json; extra == "chroma"
102
- Requires-Dist: tqdm; extra == "chroma"
103
- Requires-Dist: pydantic>=2.7; extra == "chroma"
100
+ Requires-Dist: python-dateutil; extra == "chroma"
104
101
  Requires-Dist: pandas; extra == "chroma"
102
+ Requires-Dist: pydantic>=2.7; extra == "chroma"
105
103
  Requires-Dist: click; extra == "chroma"
106
- Requires-Dist: python-dateutil; extra == "chroma"
107
104
  Requires-Dist: opentelemetry-sdk; extra == "chroma"
105
+ Requires-Dist: chromadb; extra == "chroma"
106
+ Requires-Dist: dataclasses-json; extra == "chroma"
107
+ Requires-Dist: tqdm; extra == "chroma"
108
108
  Provides-Extra: clarifai
109
109
  Requires-Dist: clarifai; extra == "clarifai"
110
- Requires-Dist: dataclasses-json; extra == "clarifai"
111
- Requires-Dist: tqdm; extra == "clarifai"
112
- Requires-Dist: pydantic>=2.7; extra == "clarifai"
110
+ Requires-Dist: python-dateutil; extra == "clarifai"
113
111
  Requires-Dist: pandas; extra == "clarifai"
112
+ Requires-Dist: pydantic>=2.7; extra == "clarifai"
114
113
  Requires-Dist: click; extra == "clarifai"
115
- Requires-Dist: python-dateutil; extra == "clarifai"
116
114
  Requires-Dist: opentelemetry-sdk; extra == "clarifai"
115
+ Requires-Dist: dataclasses-json; extra == "clarifai"
116
+ Requires-Dist: tqdm; extra == "clarifai"
117
117
  Provides-Extra: confluence
118
- Requires-Dist: atlassian-python-api; extra == "confluence"
119
- Requires-Dist: dataclasses-json; extra == "confluence"
120
- Requires-Dist: tqdm; extra == "confluence"
121
- Requires-Dist: pydantic>=2.7; extra == "confluence"
122
- Requires-Dist: pandas; extra == "confluence"
123
- Requires-Dist: click; extra == "confluence"
124
118
  Requires-Dist: python-dateutil; extra == "confluence"
125
119
  Requires-Dist: requests; extra == "confluence"
120
+ Requires-Dist: pandas; extra == "confluence"
121
+ Requires-Dist: pydantic>=2.7; extra == "confluence"
122
+ Requires-Dist: click; extra == "confluence"
126
123
  Requires-Dist: opentelemetry-sdk; extra == "confluence"
124
+ Requires-Dist: atlassian-python-api; extra == "confluence"
125
+ Requires-Dist: dataclasses-json; extra == "confluence"
126
+ Requires-Dist: tqdm; extra == "confluence"
127
127
  Provides-Extra: couchbase
128
- Requires-Dist: couchbase; extra == "couchbase"
129
- Requires-Dist: dataclasses-json; extra == "couchbase"
130
- Requires-Dist: tqdm; extra == "couchbase"
131
- Requires-Dist: pydantic>=2.7; extra == "couchbase"
128
+ Requires-Dist: python-dateutil; extra == "couchbase"
132
129
  Requires-Dist: pandas; extra == "couchbase"
130
+ Requires-Dist: pydantic>=2.7; extra == "couchbase"
133
131
  Requires-Dist: click; extra == "couchbase"
134
- Requires-Dist: python-dateutil; extra == "couchbase"
135
132
  Requires-Dist: opentelemetry-sdk; extra == "couchbase"
133
+ Requires-Dist: dataclasses-json; extra == "couchbase"
134
+ Requires-Dist: couchbase; extra == "couchbase"
135
+ Requires-Dist: tqdm; extra == "couchbase"
136
136
  Provides-Extra: csv
137
- Requires-Dist: unstructured[tsv]; extra == "csv"
138
- Requires-Dist: dataclasses-json; extra == "csv"
139
- Requires-Dist: tqdm; extra == "csv"
140
- Requires-Dist: pydantic>=2.7; extra == "csv"
137
+ Requires-Dist: python-dateutil; extra == "csv"
141
138
  Requires-Dist: pandas; extra == "csv"
139
+ Requires-Dist: pydantic>=2.7; extra == "csv"
142
140
  Requires-Dist: click; extra == "csv"
143
- Requires-Dist: python-dateutil; extra == "csv"
144
141
  Requires-Dist: opentelemetry-sdk; extra == "csv"
142
+ Requires-Dist: dataclasses-json; extra == "csv"
143
+ Requires-Dist: unstructured[tsv]; extra == "csv"
144
+ Requires-Dist: tqdm; extra == "csv"
145
145
  Provides-Extra: databricks-volumes
146
- Requires-Dist: dataclasses-json; extra == "databricks-volumes"
147
- Requires-Dist: tqdm; extra == "databricks-volumes"
148
- Requires-Dist: pydantic>=2.7; extra == "databricks-volumes"
146
+ Requires-Dist: python-dateutil; extra == "databricks-volumes"
149
147
  Requires-Dist: pandas; extra == "databricks-volumes"
148
+ Requires-Dist: pydantic>=2.7; extra == "databricks-volumes"
150
149
  Requires-Dist: click; extra == "databricks-volumes"
151
- Requires-Dist: databricks-sdk; extra == "databricks-volumes"
152
- Requires-Dist: python-dateutil; extra == "databricks-volumes"
153
150
  Requires-Dist: opentelemetry-sdk; extra == "databricks-volumes"
151
+ Requires-Dist: dataclasses-json; extra == "databricks-volumes"
152
+ Requires-Dist: databricks-sdk; extra == "databricks-volumes"
153
+ Requires-Dist: tqdm; extra == "databricks-volumes"
154
154
  Provides-Extra: delta-table
155
155
  Requires-Dist: fsspec; extra == "delta-table"
156
- Requires-Dist: dataclasses-json; extra == "delta-table"
157
- Requires-Dist: tqdm; extra == "delta-table"
158
- Requires-Dist: deltalake; extra == "delta-table"
159
- Requires-Dist: pydantic>=2.7; extra == "delta-table"
156
+ Requires-Dist: python-dateutil; extra == "delta-table"
160
157
  Requires-Dist: pandas; extra == "delta-table"
158
+ Requires-Dist: pydantic>=2.7; extra == "delta-table"
161
159
  Requires-Dist: click; extra == "delta-table"
162
- Requires-Dist: python-dateutil; extra == "delta-table"
163
160
  Requires-Dist: opentelemetry-sdk; extra == "delta-table"
161
+ Requires-Dist: dataclasses-json; extra == "delta-table"
162
+ Requires-Dist: deltalake; extra == "delta-table"
163
+ Requires-Dist: tqdm; extra == "delta-table"
164
164
  Provides-Extra: discord
165
- Requires-Dist: dataclasses-json; extra == "discord"
166
- Requires-Dist: tqdm; extra == "discord"
167
- Requires-Dist: pydantic>=2.7; extra == "discord"
165
+ Requires-Dist: python-dateutil; extra == "discord"
168
166
  Requires-Dist: pandas; extra == "discord"
167
+ Requires-Dist: pydantic>=2.7; extra == "discord"
169
168
  Requires-Dist: click; extra == "discord"
170
- Requires-Dist: python-dateutil; extra == "discord"
171
- Requires-Dist: discord-py; extra == "discord"
172
169
  Requires-Dist: opentelemetry-sdk; extra == "discord"
170
+ Requires-Dist: discord-py; extra == "discord"
171
+ Requires-Dist: dataclasses-json; extra == "discord"
172
+ Requires-Dist: tqdm; extra == "discord"
173
173
  Provides-Extra: doc
174
- Requires-Dist: unstructured[docx]; extra == "doc"
175
- Requires-Dist: dataclasses-json; extra == "doc"
176
- Requires-Dist: tqdm; extra == "doc"
177
- Requires-Dist: pydantic>=2.7; extra == "doc"
174
+ Requires-Dist: python-dateutil; extra == "doc"
178
175
  Requires-Dist: pandas; extra == "doc"
176
+ Requires-Dist: pydantic>=2.7; extra == "doc"
179
177
  Requires-Dist: click; extra == "doc"
180
- Requires-Dist: python-dateutil; extra == "doc"
181
178
  Requires-Dist: opentelemetry-sdk; extra == "doc"
179
+ Requires-Dist: unstructured[docx]; extra == "doc"
180
+ Requires-Dist: dataclasses-json; extra == "doc"
181
+ Requires-Dist: tqdm; extra == "doc"
182
182
  Provides-Extra: docx
183
- Requires-Dist: unstructured[docx]; extra == "docx"
184
- Requires-Dist: dataclasses-json; extra == "docx"
185
- Requires-Dist: tqdm; extra == "docx"
186
- Requires-Dist: pydantic>=2.7; extra == "docx"
183
+ Requires-Dist: python-dateutil; extra == "docx"
187
184
  Requires-Dist: pandas; extra == "docx"
185
+ Requires-Dist: pydantic>=2.7; extra == "docx"
188
186
  Requires-Dist: click; extra == "docx"
189
- Requires-Dist: python-dateutil; extra == "docx"
190
187
  Requires-Dist: opentelemetry-sdk; extra == "docx"
188
+ Requires-Dist: unstructured[docx]; extra == "docx"
189
+ Requires-Dist: dataclasses-json; extra == "docx"
190
+ Requires-Dist: tqdm; extra == "docx"
191
191
  Provides-Extra: dropbox
192
192
  Requires-Dist: fsspec; extra == "dropbox"
193
- Requires-Dist: dropboxdrivefs; extra == "dropbox"
194
- Requires-Dist: dataclasses-json; extra == "dropbox"
195
- Requires-Dist: tqdm; extra == "dropbox"
196
- Requires-Dist: pydantic>=2.7; extra == "dropbox"
193
+ Requires-Dist: python-dateutil; extra == "dropbox"
197
194
  Requires-Dist: pandas; extra == "dropbox"
195
+ Requires-Dist: pydantic>=2.7; extra == "dropbox"
198
196
  Requires-Dist: click; extra == "dropbox"
199
- Requires-Dist: python-dateutil; extra == "dropbox"
200
197
  Requires-Dist: opentelemetry-sdk; extra == "dropbox"
198
+ Requires-Dist: dataclasses-json; extra == "dropbox"
199
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
200
+ Requires-Dist: tqdm; extra == "dropbox"
201
201
  Provides-Extra: elasticsearch
202
- Requires-Dist: dataclasses-json; extra == "elasticsearch"
203
- Requires-Dist: tqdm; extra == "elasticsearch"
204
- Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
205
- Requires-Dist: pydantic>=2.7; extra == "elasticsearch"
202
+ Requires-Dist: python-dateutil; extra == "elasticsearch"
206
203
  Requires-Dist: pandas; extra == "elasticsearch"
204
+ Requires-Dist: pydantic>=2.7; extra == "elasticsearch"
205
+ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
207
206
  Requires-Dist: click; extra == "elasticsearch"
208
- Requires-Dist: python-dateutil; extra == "elasticsearch"
209
207
  Requires-Dist: opentelemetry-sdk; extra == "elasticsearch"
208
+ Requires-Dist: dataclasses-json; extra == "elasticsearch"
209
+ Requires-Dist: tqdm; extra == "elasticsearch"
210
210
  Provides-Extra: embed-huggingface
211
+ Requires-Dist: python-dateutil; extra == "embed-huggingface"
211
212
  Requires-Dist: langchain-huggingface; extra == "embed-huggingface"
212
- Requires-Dist: dataclasses-json; extra == "embed-huggingface"
213
- Requires-Dist: tqdm; extra == "embed-huggingface"
214
- Requires-Dist: pydantic>=2.7; extra == "embed-huggingface"
215
213
  Requires-Dist: pandas; extra == "embed-huggingface"
214
+ Requires-Dist: pydantic>=2.7; extra == "embed-huggingface"
216
215
  Requires-Dist: click; extra == "embed-huggingface"
217
- Requires-Dist: python-dateutil; extra == "embed-huggingface"
218
216
  Requires-Dist: opentelemetry-sdk; extra == "embed-huggingface"
217
+ Requires-Dist: dataclasses-json; extra == "embed-huggingface"
218
+ Requires-Dist: tqdm; extra == "embed-huggingface"
219
219
  Provides-Extra: embed-mixedbreadai
220
- Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
221
- Requires-Dist: tqdm; extra == "embed-mixedbreadai"
222
- Requires-Dist: dataclasses-json; extra == "embed-mixedbreadai"
223
- Requires-Dist: pydantic>=2.7; extra == "embed-mixedbreadai"
220
+ Requires-Dist: python-dateutil; extra == "embed-mixedbreadai"
224
221
  Requires-Dist: pandas; extra == "embed-mixedbreadai"
222
+ Requires-Dist: pydantic>=2.7; extra == "embed-mixedbreadai"
225
223
  Requires-Dist: click; extra == "embed-mixedbreadai"
226
- Requires-Dist: python-dateutil; extra == "embed-mixedbreadai"
227
224
  Requires-Dist: opentelemetry-sdk; extra == "embed-mixedbreadai"
225
+ Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
226
+ Requires-Dist: dataclasses-json; extra == "embed-mixedbreadai"
227
+ Requires-Dist: tqdm; extra == "embed-mixedbreadai"
228
228
  Provides-Extra: embed-octoai
229
- Requires-Dist: dataclasses-json; extra == "embed-octoai"
230
- Requires-Dist: tqdm; extra == "embed-octoai"
231
- Requires-Dist: openai; extra == "embed-octoai"
232
- Requires-Dist: tiktoken; extra == "embed-octoai"
233
- Requires-Dist: pydantic>=2.7; extra == "embed-octoai"
229
+ Requires-Dist: python-dateutil; extra == "embed-octoai"
234
230
  Requires-Dist: pandas; extra == "embed-octoai"
231
+ Requires-Dist: pydantic>=2.7; extra == "embed-octoai"
235
232
  Requires-Dist: click; extra == "embed-octoai"
236
- Requires-Dist: python-dateutil; extra == "embed-octoai"
237
233
  Requires-Dist: opentelemetry-sdk; extra == "embed-octoai"
234
+ Requires-Dist: openai; extra == "embed-octoai"
235
+ Requires-Dist: dataclasses-json; extra == "embed-octoai"
236
+ Requires-Dist: tiktoken; extra == "embed-octoai"
237
+ Requires-Dist: tqdm; extra == "embed-octoai"
238
238
  Provides-Extra: embed-vertexai
239
- Requires-Dist: langchain-google-vertexai; extra == "embed-vertexai"
240
- Requires-Dist: dataclasses-json; extra == "embed-vertexai"
241
- Requires-Dist: tqdm; extra == "embed-vertexai"
242
- Requires-Dist: pydantic>=2.7; extra == "embed-vertexai"
243
- Requires-Dist: pandas; extra == "embed-vertexai"
239
+ Requires-Dist: langchain; extra == "embed-vertexai"
240
+ Requires-Dist: python-dateutil; extra == "embed-vertexai"
244
241
  Requires-Dist: langchain-community; extra == "embed-vertexai"
242
+ Requires-Dist: pandas; extra == "embed-vertexai"
243
+ Requires-Dist: pydantic>=2.7; extra == "embed-vertexai"
245
244
  Requires-Dist: click; extra == "embed-vertexai"
246
- Requires-Dist: python-dateutil; extra == "embed-vertexai"
247
- Requires-Dist: langchain; extra == "embed-vertexai"
245
+ Requires-Dist: langchain-google-vertexai; extra == "embed-vertexai"
248
246
  Requires-Dist: opentelemetry-sdk; extra == "embed-vertexai"
247
+ Requires-Dist: dataclasses-json; extra == "embed-vertexai"
248
+ Requires-Dist: tqdm; extra == "embed-vertexai"
249
249
  Provides-Extra: embed-voyageai
250
- Requires-Dist: dataclasses-json; extra == "embed-voyageai"
251
- Requires-Dist: tqdm; extra == "embed-voyageai"
252
- Requires-Dist: pydantic>=2.7; extra == "embed-voyageai"
253
- Requires-Dist: pandas; extra == "embed-voyageai"
254
- Requires-Dist: click; extra == "embed-voyageai"
255
250
  Requires-Dist: langchain-voyageai; extra == "embed-voyageai"
256
- Requires-Dist: python-dateutil; extra == "embed-voyageai"
257
251
  Requires-Dist: langchain; extra == "embed-voyageai"
252
+ Requires-Dist: python-dateutil; extra == "embed-voyageai"
253
+ Requires-Dist: pandas; extra == "embed-voyageai"
254
+ Requires-Dist: pydantic>=2.7; extra == "embed-voyageai"
255
+ Requires-Dist: click; extra == "embed-voyageai"
258
256
  Requires-Dist: opentelemetry-sdk; extra == "embed-voyageai"
257
+ Requires-Dist: dataclasses-json; extra == "embed-voyageai"
258
+ Requires-Dist: tqdm; extra == "embed-voyageai"
259
259
  Provides-Extra: epub
260
- Requires-Dist: dataclasses-json; extra == "epub"
261
- Requires-Dist: tqdm; extra == "epub"
260
+ Requires-Dist: python-dateutil; extra == "epub"
262
261
  Requires-Dist: unstructured[epub]; extra == "epub"
263
- Requires-Dist: pydantic>=2.7; extra == "epub"
264
262
  Requires-Dist: pandas; extra == "epub"
263
+ Requires-Dist: pydantic>=2.7; extra == "epub"
265
264
  Requires-Dist: click; extra == "epub"
266
- Requires-Dist: python-dateutil; extra == "epub"
267
265
  Requires-Dist: opentelemetry-sdk; extra == "epub"
266
+ Requires-Dist: dataclasses-json; extra == "epub"
267
+ Requires-Dist: tqdm; extra == "epub"
268
268
  Provides-Extra: gcs
269
269
  Requires-Dist: fsspec; extra == "gcs"
270
- Requires-Dist: dataclasses-json; extra == "gcs"
271
- Requires-Dist: tqdm; extra == "gcs"
270
+ Requires-Dist: python-dateutil; extra == "gcs"
272
271
  Requires-Dist: bs4; extra == "gcs"
273
- Requires-Dist: gcsfs; extra == "gcs"
274
- Requires-Dist: pydantic>=2.7; extra == "gcs"
275
272
  Requires-Dist: pandas; extra == "gcs"
273
+ Requires-Dist: pydantic>=2.7; extra == "gcs"
276
274
  Requires-Dist: click; extra == "gcs"
277
- Requires-Dist: python-dateutil; extra == "gcs"
278
275
  Requires-Dist: opentelemetry-sdk; extra == "gcs"
276
+ Requires-Dist: dataclasses-json; extra == "gcs"
277
+ Requires-Dist: gcsfs; extra == "gcs"
278
+ Requires-Dist: tqdm; extra == "gcs"
279
279
  Provides-Extra: github
280
- Requires-Dist: dataclasses-json; extra == "github"
281
- Requires-Dist: tqdm; extra == "github"
282
- Requires-Dist: pydantic>=2.7; extra == "github"
283
- Requires-Dist: pandas; extra == "github"
284
- Requires-Dist: pygithub>1.58.0; extra == "github"
285
- Requires-Dist: click; extra == "github"
286
280
  Requires-Dist: python-dateutil; extra == "github"
287
281
  Requires-Dist: requests; extra == "github"
282
+ Requires-Dist: pandas; extra == "github"
283
+ Requires-Dist: pydantic>=2.7; extra == "github"
284
+ Requires-Dist: click; extra == "github"
288
285
  Requires-Dist: opentelemetry-sdk; extra == "github"
286
+ Requires-Dist: dataclasses-json; extra == "github"
287
+ Requires-Dist: pygithub>1.58.0; extra == "github"
288
+ Requires-Dist: tqdm; extra == "github"
289
289
  Provides-Extra: gitlab
290
- Requires-Dist: dataclasses-json; extra == "gitlab"
291
- Requires-Dist: tqdm; extra == "gitlab"
292
- Requires-Dist: pydantic>=2.7; extra == "gitlab"
290
+ Requires-Dist: python-dateutil; extra == "gitlab"
293
291
  Requires-Dist: pandas; extra == "gitlab"
292
+ Requires-Dist: pydantic>=2.7; extra == "gitlab"
294
293
  Requires-Dist: click; extra == "gitlab"
295
294
  Requires-Dist: opentelemetry-sdk; extra == "gitlab"
296
- Requires-Dist: python-dateutil; extra == "gitlab"
295
+ Requires-Dist: tqdm; extra == "gitlab"
296
+ Requires-Dist: dataclasses-json; extra == "gitlab"
297
297
  Requires-Dist: python-gitlab; extra == "gitlab"
298
298
  Provides-Extra: google-drive
299
- Requires-Dist: dataclasses-json; extra == "google-drive"
300
- Requires-Dist: tqdm; extra == "google-drive"
301
- Requires-Dist: pydantic>=2.7; extra == "google-drive"
299
+ Requires-Dist: python-dateutil; extra == "google-drive"
302
300
  Requires-Dist: pandas; extra == "google-drive"
303
- Requires-Dist: google-api-python-client; extra == "google-drive"
301
+ Requires-Dist: pydantic>=2.7; extra == "google-drive"
304
302
  Requires-Dist: click; extra == "google-drive"
305
- Requires-Dist: python-dateutil; extra == "google-drive"
303
+ Requires-Dist: google-api-python-client; extra == "google-drive"
306
304
  Requires-Dist: opentelemetry-sdk; extra == "google-drive"
305
+ Requires-Dist: dataclasses-json; extra == "google-drive"
306
+ Requires-Dist: tqdm; extra == "google-drive"
307
307
  Provides-Extra: hubspot
308
+ Requires-Dist: python-dateutil; extra == "hubspot"
308
309
  Requires-Dist: urllib3; extra == "hubspot"
309
- Requires-Dist: tqdm; extra == "hubspot"
310
- Requires-Dist: hubspot-api-client; extra == "hubspot"
311
- Requires-Dist: dataclasses-json; extra == "hubspot"
312
- Requires-Dist: pydantic>=2.7; extra == "hubspot"
313
310
  Requires-Dist: pandas; extra == "hubspot"
311
+ Requires-Dist: pydantic>=2.7; extra == "hubspot"
314
312
  Requires-Dist: click; extra == "hubspot"
315
- Requires-Dist: python-dateutil; extra == "hubspot"
316
313
  Requires-Dist: opentelemetry-sdk; extra == "hubspot"
314
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
315
+ Requires-Dist: dataclasses-json; extra == "hubspot"
316
+ Requires-Dist: tqdm; extra == "hubspot"
317
317
  Provides-Extra: jira
318
- Requires-Dist: atlassian-python-api; extra == "jira"
319
- Requires-Dist: dataclasses-json; extra == "jira"
320
- Requires-Dist: tqdm; extra == "jira"
321
- Requires-Dist: pydantic>=2.7; extra == "jira"
318
+ Requires-Dist: python-dateutil; extra == "jira"
322
319
  Requires-Dist: pandas; extra == "jira"
320
+ Requires-Dist: pydantic>=2.7; extra == "jira"
323
321
  Requires-Dist: click; extra == "jira"
324
- Requires-Dist: python-dateutil; extra == "jira"
325
322
  Requires-Dist: opentelemetry-sdk; extra == "jira"
323
+ Requires-Dist: atlassian-python-api; extra == "jira"
324
+ Requires-Dist: dataclasses-json; extra == "jira"
325
+ Requires-Dist: tqdm; extra == "jira"
326
326
  Provides-Extra: kafka
327
- Requires-Dist: confluent-kafka; extra == "kafka"
328
- Requires-Dist: dataclasses-json; extra == "kafka"
329
- Requires-Dist: tqdm; extra == "kafka"
330
- Requires-Dist: pydantic>=2.7; extra == "kafka"
327
+ Requires-Dist: python-dateutil; extra == "kafka"
331
328
  Requires-Dist: pandas; extra == "kafka"
329
+ Requires-Dist: pydantic>=2.7; extra == "kafka"
332
330
  Requires-Dist: click; extra == "kafka"
333
- Requires-Dist: python-dateutil; extra == "kafka"
334
331
  Requires-Dist: opentelemetry-sdk; extra == "kafka"
332
+ Requires-Dist: dataclasses-json; extra == "kafka"
333
+ Requires-Dist: confluent-kafka; extra == "kafka"
334
+ Requires-Dist: tqdm; extra == "kafka"
335
335
  Provides-Extra: kdbai
336
336
  Requires-Dist: kdbai-client; extra == "kdbai"
337
337
  Provides-Extra: md
338
- Requires-Dist: unstructured[md]; extra == "md"
339
- Requires-Dist: dataclasses-json; extra == "md"
340
- Requires-Dist: tqdm; extra == "md"
341
- Requires-Dist: pydantic>=2.7; extra == "md"
338
+ Requires-Dist: python-dateutil; extra == "md"
342
339
  Requires-Dist: pandas; extra == "md"
340
+ Requires-Dist: pydantic>=2.7; extra == "md"
341
+ Requires-Dist: unstructured[md]; extra == "md"
343
342
  Requires-Dist: click; extra == "md"
344
- Requires-Dist: python-dateutil; extra == "md"
345
343
  Requires-Dist: opentelemetry-sdk; extra == "md"
344
+ Requires-Dist: dataclasses-json; extra == "md"
345
+ Requires-Dist: tqdm; extra == "md"
346
346
  Provides-Extra: milvus
347
- Requires-Dist: dataclasses-json; extra == "milvus"
348
- Requires-Dist: tqdm; extra == "milvus"
349
347
  Requires-Dist: pymilvus; extra == "milvus"
350
- Requires-Dist: pydantic>=2.7; extra == "milvus"
348
+ Requires-Dist: python-dateutil; extra == "milvus"
351
349
  Requires-Dist: pandas; extra == "milvus"
350
+ Requires-Dist: pydantic>=2.7; extra == "milvus"
352
351
  Requires-Dist: click; extra == "milvus"
353
- Requires-Dist: python-dateutil; extra == "milvus"
354
352
  Requires-Dist: opentelemetry-sdk; extra == "milvus"
353
+ Requires-Dist: dataclasses-json; extra == "milvus"
354
+ Requires-Dist: tqdm; extra == "milvus"
355
355
  Provides-Extra: mongodb
356
+ Requires-Dist: python-dateutil; extra == "mongodb"
356
357
  Requires-Dist: pymongo; extra == "mongodb"
357
- Requires-Dist: dataclasses-json; extra == "mongodb"
358
- Requires-Dist: tqdm; extra == "mongodb"
359
- Requires-Dist: pydantic>=2.7; extra == "mongodb"
360
358
  Requires-Dist: pandas; extra == "mongodb"
359
+ Requires-Dist: pydantic>=2.7; extra == "mongodb"
361
360
  Requires-Dist: click; extra == "mongodb"
362
- Requires-Dist: python-dateutil; extra == "mongodb"
363
361
  Requires-Dist: opentelemetry-sdk; extra == "mongodb"
362
+ Requires-Dist: dataclasses-json; extra == "mongodb"
363
+ Requires-Dist: tqdm; extra == "mongodb"
364
364
  Provides-Extra: msg
365
- Requires-Dist: dataclasses-json; extra == "msg"
366
- Requires-Dist: tqdm; extra == "msg"
367
- Requires-Dist: pydantic>=2.7; extra == "msg"
365
+ Requires-Dist: python-dateutil; extra == "msg"
368
366
  Requires-Dist: pandas; extra == "msg"
367
+ Requires-Dist: pydantic>=2.7; extra == "msg"
369
368
  Requires-Dist: click; extra == "msg"
370
- Requires-Dist: python-dateutil; extra == "msg"
371
- Requires-Dist: unstructured[msg]; extra == "msg"
372
369
  Requires-Dist: opentelemetry-sdk; extra == "msg"
370
+ Requires-Dist: dataclasses-json; extra == "msg"
371
+ Requires-Dist: unstructured[msg]; extra == "msg"
372
+ Requires-Dist: tqdm; extra == "msg"
373
373
  Provides-Extra: notion
374
- Requires-Dist: htmlBuilder; extra == "notion"
375
- Requires-Dist: dataclasses-json; extra == "notion"
376
- Requires-Dist: tqdm; extra == "notion"
377
- Requires-Dist: httpx; extra == "notion"
374
+ Requires-Dist: notion-client; extra == "notion"
378
375
  Requires-Dist: python-dateutil; extra == "notion"
379
- Requires-Dist: pydantic>=2.7; extra == "notion"
376
+ Requires-Dist: httpx; extra == "notion"
380
377
  Requires-Dist: pandas; extra == "notion"
378
+ Requires-Dist: pydantic>=2.7; extra == "notion"
381
379
  Requires-Dist: click; extra == "notion"
382
- Requires-Dist: backoff; extra == "notion"
383
- Requires-Dist: notion-client; extra == "notion"
384
380
  Requires-Dist: opentelemetry-sdk; extra == "notion"
381
+ Requires-Dist: dataclasses-json; extra == "notion"
382
+ Requires-Dist: backoff; extra == "notion"
383
+ Requires-Dist: htmlBuilder; extra == "notion"
384
+ Requires-Dist: tqdm; extra == "notion"
385
385
  Provides-Extra: odt
386
- Requires-Dist: dataclasses-json; extra == "odt"
387
- Requires-Dist: tqdm; extra == "odt"
388
386
  Requires-Dist: unstructured[odt]; extra == "odt"
389
- Requires-Dist: pydantic>=2.7; extra == "odt"
387
+ Requires-Dist: python-dateutil; extra == "odt"
390
388
  Requires-Dist: pandas; extra == "odt"
389
+ Requires-Dist: pydantic>=2.7; extra == "odt"
391
390
  Requires-Dist: click; extra == "odt"
392
- Requires-Dist: python-dateutil; extra == "odt"
393
391
  Requires-Dist: opentelemetry-sdk; extra == "odt"
392
+ Requires-Dist: dataclasses-json; extra == "odt"
393
+ Requires-Dist: tqdm; extra == "odt"
394
394
  Provides-Extra: onedrive
395
- Requires-Dist: dataclasses-json; extra == "onedrive"
396
- Requires-Dist: tqdm; extra == "onedrive"
397
- Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
395
+ Requires-Dist: python-dateutil; extra == "onedrive"
398
396
  Requires-Dist: bs4; extra == "onedrive"
399
- Requires-Dist: pydantic>=2.7; extra == "onedrive"
400
397
  Requires-Dist: pandas; extra == "onedrive"
398
+ Requires-Dist: pydantic>=2.7; extra == "onedrive"
401
399
  Requires-Dist: click; extra == "onedrive"
402
- Requires-Dist: msal; extra == "onedrive"
403
- Requires-Dist: python-dateutil; extra == "onedrive"
404
400
  Requires-Dist: opentelemetry-sdk; extra == "onedrive"
401
+ Requires-Dist: dataclasses-json; extra == "onedrive"
402
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
403
+ Requires-Dist: msal; extra == "onedrive"
404
+ Requires-Dist: tqdm; extra == "onedrive"
405
405
  Provides-Extra: openai
406
- Requires-Dist: dataclasses-json; extra == "openai"
407
- Requires-Dist: tqdm; extra == "openai"
408
- Requires-Dist: openai; extra == "openai"
409
- Requires-Dist: tiktoken; extra == "openai"
410
- Requires-Dist: pydantic>=2.7; extra == "openai"
411
- Requires-Dist: pandas; extra == "openai"
406
+ Requires-Dist: python-dateutil; extra == "openai"
412
407
  Requires-Dist: langchain-community; extra == "openai"
408
+ Requires-Dist: pandas; extra == "openai"
409
+ Requires-Dist: pydantic>=2.7; extra == "openai"
413
410
  Requires-Dist: click; extra == "openai"
414
- Requires-Dist: python-dateutil; extra == "openai"
415
411
  Requires-Dist: opentelemetry-sdk; extra == "openai"
412
+ Requires-Dist: openai; extra == "openai"
413
+ Requires-Dist: dataclasses-json; extra == "openai"
414
+ Requires-Dist: tiktoken; extra == "openai"
415
+ Requires-Dist: tqdm; extra == "openai"
416
416
  Provides-Extra: opensearch
417
- Requires-Dist: dataclasses-json; extra == "opensearch"
418
- Requires-Dist: tqdm; extra == "opensearch"
417
+ Requires-Dist: python-dateutil; extra == "opensearch"
418
+ Requires-Dist: opensearch-py; extra == "opensearch"
419
419
  Requires-Dist: pydantic>=2.7; extra == "opensearch"
420
420
  Requires-Dist: pandas; extra == "opensearch"
421
421
  Requires-Dist: click; extra == "opensearch"
422
- Requires-Dist: python-dateutil; extra == "opensearch"
423
- Requires-Dist: opensearch-py; extra == "opensearch"
424
422
  Requires-Dist: opentelemetry-sdk; extra == "opensearch"
423
+ Requires-Dist: dataclasses-json; extra == "opensearch"
424
+ Requires-Dist: tqdm; extra == "opensearch"
425
425
  Provides-Extra: org
426
- Requires-Dist: dataclasses-json; extra == "org"
427
- Requires-Dist: tqdm; extra == "org"
428
- Requires-Dist: unstructured[org]; extra == "org"
429
- Requires-Dist: pydantic>=2.7; extra == "org"
426
+ Requires-Dist: python-dateutil; extra == "org"
430
427
  Requires-Dist: pandas; extra == "org"
428
+ Requires-Dist: pydantic>=2.7; extra == "org"
431
429
  Requires-Dist: click; extra == "org"
432
- Requires-Dist: python-dateutil; extra == "org"
433
430
  Requires-Dist: opentelemetry-sdk; extra == "org"
431
+ Requires-Dist: dataclasses-json; extra == "org"
432
+ Requires-Dist: unstructured[org]; extra == "org"
433
+ Requires-Dist: tqdm; extra == "org"
434
434
  Provides-Extra: outlook
435
- Requires-Dist: dataclasses-json; extra == "outlook"
436
- Requires-Dist: tqdm; extra == "outlook"
437
- Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
438
- Requires-Dist: pydantic>=2.7; extra == "outlook"
435
+ Requires-Dist: python-dateutil; extra == "outlook"
439
436
  Requires-Dist: pandas; extra == "outlook"
437
+ Requires-Dist: pydantic>=2.7; extra == "outlook"
440
438
  Requires-Dist: click; extra == "outlook"
441
- Requires-Dist: msal; extra == "outlook"
442
- Requires-Dist: python-dateutil; extra == "outlook"
443
439
  Requires-Dist: opentelemetry-sdk; extra == "outlook"
440
+ Requires-Dist: dataclasses-json; extra == "outlook"
441
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
442
+ Requires-Dist: msal; extra == "outlook"
443
+ Requires-Dist: tqdm; extra == "outlook"
444
444
  Provides-Extra: pdf
445
- Requires-Dist: dataclasses-json; extra == "pdf"
446
- Requires-Dist: tqdm; extra == "pdf"
447
- Requires-Dist: unstructured[pdf]; extra == "pdf"
448
- Requires-Dist: pydantic>=2.7; extra == "pdf"
445
+ Requires-Dist: python-dateutil; extra == "pdf"
449
446
  Requires-Dist: pandas; extra == "pdf"
447
+ Requires-Dist: pydantic>=2.7; extra == "pdf"
448
+ Requires-Dist: unstructured[pdf]; extra == "pdf"
450
449
  Requires-Dist: click; extra == "pdf"
451
- Requires-Dist: python-dateutil; extra == "pdf"
452
450
  Requires-Dist: opentelemetry-sdk; extra == "pdf"
451
+ Requires-Dist: dataclasses-json; extra == "pdf"
452
+ Requires-Dist: tqdm; extra == "pdf"
453
453
  Provides-Extra: pinecone
454
- Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
455
- Requires-Dist: dataclasses-json; extra == "pinecone"
456
- Requires-Dist: tqdm; extra == "pinecone"
457
- Requires-Dist: pydantic>=2.7; extra == "pinecone"
454
+ Requires-Dist: python-dateutil; extra == "pinecone"
458
455
  Requires-Dist: pandas; extra == "pinecone"
456
+ Requires-Dist: pydantic>=2.7; extra == "pinecone"
459
457
  Requires-Dist: click; extra == "pinecone"
460
- Requires-Dist: python-dateutil; extra == "pinecone"
461
458
  Requires-Dist: opentelemetry-sdk; extra == "pinecone"
459
+ Requires-Dist: dataclasses-json; extra == "pinecone"
460
+ Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
461
+ Requires-Dist: tqdm; extra == "pinecone"
462
462
  Provides-Extra: postgres
463
- Requires-Dist: dataclasses-json; extra == "postgres"
464
- Requires-Dist: tqdm; extra == "postgres"
465
- Requires-Dist: pydantic>=2.7; extra == "postgres"
463
+ Requires-Dist: python-dateutil; extra == "postgres"
466
464
  Requires-Dist: pandas; extra == "postgres"
465
+ Requires-Dist: pydantic>=2.7; extra == "postgres"
467
466
  Requires-Dist: click; extra == "postgres"
468
467
  Requires-Dist: opentelemetry-sdk; extra == "postgres"
469
- Requires-Dist: python-dateutil; extra == "postgres"
468
+ Requires-Dist: dataclasses-json; extra == "postgres"
470
469
  Requires-Dist: psycopg2-binary; extra == "postgres"
470
+ Requires-Dist: tqdm; extra == "postgres"
471
471
  Provides-Extra: ppt
472
472
  Requires-Dist: unstructured[pptx]; extra == "ppt"
473
- Requires-Dist: tqdm; extra == "ppt"
474
- Requires-Dist: dataclasses-json; extra == "ppt"
475
- Requires-Dist: pydantic>=2.7; extra == "ppt"
473
+ Requires-Dist: python-dateutil; extra == "ppt"
476
474
  Requires-Dist: pandas; extra == "ppt"
475
+ Requires-Dist: pydantic>=2.7; extra == "ppt"
477
476
  Requires-Dist: click; extra == "ppt"
478
- Requires-Dist: python-dateutil; extra == "ppt"
479
477
  Requires-Dist: opentelemetry-sdk; extra == "ppt"
478
+ Requires-Dist: dataclasses-json; extra == "ppt"
479
+ Requires-Dist: tqdm; extra == "ppt"
480
480
  Provides-Extra: pptx
481
481
  Requires-Dist: unstructured[pptx]; extra == "pptx"
482
- Requires-Dist: tqdm; extra == "pptx"
483
- Requires-Dist: dataclasses-json; extra == "pptx"
484
- Requires-Dist: pydantic>=2.7; extra == "pptx"
482
+ Requires-Dist: python-dateutil; extra == "pptx"
485
483
  Requires-Dist: pandas; extra == "pptx"
484
+ Requires-Dist: pydantic>=2.7; extra == "pptx"
486
485
  Requires-Dist: click; extra == "pptx"
487
- Requires-Dist: python-dateutil; extra == "pptx"
488
486
  Requires-Dist: opentelemetry-sdk; extra == "pptx"
487
+ Requires-Dist: dataclasses-json; extra == "pptx"
488
+ Requires-Dist: tqdm; extra == "pptx"
489
489
  Provides-Extra: qdrant
490
- Requires-Dist: dataclasses-json; extra == "qdrant"
491
- Requires-Dist: tqdm; extra == "qdrant"
492
- Requires-Dist: qdrant-client; extra == "qdrant"
493
- Requires-Dist: pydantic>=2.7; extra == "qdrant"
490
+ Requires-Dist: python-dateutil; extra == "qdrant"
494
491
  Requires-Dist: pandas; extra == "qdrant"
492
+ Requires-Dist: pydantic>=2.7; extra == "qdrant"
495
493
  Requires-Dist: click; extra == "qdrant"
496
- Requires-Dist: python-dateutil; extra == "qdrant"
497
494
  Requires-Dist: opentelemetry-sdk; extra == "qdrant"
495
+ Requires-Dist: dataclasses-json; extra == "qdrant"
496
+ Requires-Dist: qdrant-client; extra == "qdrant"
497
+ Requires-Dist: tqdm; extra == "qdrant"
498
498
  Provides-Extra: reddit
499
- Requires-Dist: dataclasses-json; extra == "reddit"
500
- Requires-Dist: tqdm; extra == "reddit"
501
- Requires-Dist: pydantic>=2.7; extra == "reddit"
499
+ Requires-Dist: python-dateutil; extra == "reddit"
502
500
  Requires-Dist: pandas; extra == "reddit"
501
+ Requires-Dist: pydantic>=2.7; extra == "reddit"
503
502
  Requires-Dist: click; extra == "reddit"
504
- Requires-Dist: python-dateutil; extra == "reddit"
505
- Requires-Dist: praw; extra == "reddit"
506
503
  Requires-Dist: opentelemetry-sdk; extra == "reddit"
504
+ Requires-Dist: dataclasses-json; extra == "reddit"
505
+ Requires-Dist: praw; extra == "reddit"
506
+ Requires-Dist: tqdm; extra == "reddit"
507
507
  Provides-Extra: remote
508
- Requires-Dist: dataclasses-json; extra == "remote"
509
- Requires-Dist: tqdm; extra == "remote"
508
+ Requires-Dist: python-dateutil; extra == "remote"
510
509
  Requires-Dist: unstructured-client>=0.25.8; extra == "remote"
511
- Requires-Dist: pydantic>=2.7; extra == "remote"
512
510
  Requires-Dist: pandas; extra == "remote"
511
+ Requires-Dist: pydantic>=2.7; extra == "remote"
513
512
  Requires-Dist: click; extra == "remote"
514
- Requires-Dist: python-dateutil; extra == "remote"
515
513
  Requires-Dist: opentelemetry-sdk; extra == "remote"
514
+ Requires-Dist: dataclasses-json; extra == "remote"
515
+ Requires-Dist: tqdm; extra == "remote"
516
516
  Provides-Extra: rst
517
517
  Requires-Dist: unstructured[rst]; extra == "rst"
518
- Requires-Dist: dataclasses-json; extra == "rst"
519
- Requires-Dist: tqdm; extra == "rst"
520
- Requires-Dist: pydantic>=2.7; extra == "rst"
518
+ Requires-Dist: python-dateutil; extra == "rst"
521
519
  Requires-Dist: pandas; extra == "rst"
520
+ Requires-Dist: pydantic>=2.7; extra == "rst"
522
521
  Requires-Dist: click; extra == "rst"
523
- Requires-Dist: python-dateutil; extra == "rst"
524
522
  Requires-Dist: opentelemetry-sdk; extra == "rst"
523
+ Requires-Dist: dataclasses-json; extra == "rst"
524
+ Requires-Dist: tqdm; extra == "rst"
525
525
  Provides-Extra: rtf
526
- Requires-Dist: unstructured[rtf]; extra == "rtf"
527
- Requires-Dist: tqdm; extra == "rtf"
528
- Requires-Dist: dataclasses-json; extra == "rtf"
529
- Requires-Dist: pydantic>=2.7; extra == "rtf"
526
+ Requires-Dist: python-dateutil; extra == "rtf"
530
527
  Requires-Dist: pandas; extra == "rtf"
528
+ Requires-Dist: pydantic>=2.7; extra == "rtf"
531
529
  Requires-Dist: click; extra == "rtf"
532
- Requires-Dist: python-dateutil; extra == "rtf"
533
530
  Requires-Dist: opentelemetry-sdk; extra == "rtf"
531
+ Requires-Dist: dataclasses-json; extra == "rtf"
532
+ Requires-Dist: unstructured[rtf]; extra == "rtf"
533
+ Requires-Dist: tqdm; extra == "rtf"
534
534
  Provides-Extra: s3
535
535
  Requires-Dist: fsspec; extra == "s3"
536
- Requires-Dist: dataclasses-json; extra == "s3"
537
- Requires-Dist: tqdm; extra == "s3"
538
- Requires-Dist: pydantic>=2.7; extra == "s3"
539
- Requires-Dist: s3fs; extra == "s3"
536
+ Requires-Dist: python-dateutil; extra == "s3"
540
537
  Requires-Dist: pandas; extra == "s3"
538
+ Requires-Dist: pydantic>=2.7; extra == "s3"
541
539
  Requires-Dist: click; extra == "s3"
542
- Requires-Dist: python-dateutil; extra == "s3"
543
540
  Requires-Dist: opentelemetry-sdk; extra == "s3"
541
+ Requires-Dist: dataclasses-json; extra == "s3"
542
+ Requires-Dist: s3fs; extra == "s3"
543
+ Requires-Dist: tqdm; extra == "s3"
544
544
  Provides-Extra: salesforce
545
- Requires-Dist: simple-salesforce; extra == "salesforce"
546
- Requires-Dist: dataclasses-json; extra == "salesforce"
547
- Requires-Dist: tqdm; extra == "salesforce"
548
- Requires-Dist: pydantic>=2.7; extra == "salesforce"
545
+ Requires-Dist: python-dateutil; extra == "salesforce"
549
546
  Requires-Dist: pandas; extra == "salesforce"
547
+ Requires-Dist: pydantic>=2.7; extra == "salesforce"
550
548
  Requires-Dist: click; extra == "salesforce"
551
- Requires-Dist: python-dateutil; extra == "salesforce"
552
549
  Requires-Dist: opentelemetry-sdk; extra == "salesforce"
550
+ Requires-Dist: dataclasses-json; extra == "salesforce"
551
+ Requires-Dist: simple-salesforce; extra == "salesforce"
552
+ Requires-Dist: tqdm; extra == "salesforce"
553
553
  Provides-Extra: sftp
554
554
  Requires-Dist: fsspec; extra == "sftp"
555
- Requires-Dist: dataclasses-json; extra == "sftp"
556
- Requires-Dist: tqdm; extra == "sftp"
557
- Requires-Dist: pydantic>=2.7; extra == "sftp"
555
+ Requires-Dist: python-dateutil; extra == "sftp"
558
556
  Requires-Dist: pandas; extra == "sftp"
559
- Requires-Dist: paramiko; extra == "sftp"
557
+ Requires-Dist: pydantic>=2.7; extra == "sftp"
560
558
  Requires-Dist: click; extra == "sftp"
561
- Requires-Dist: python-dateutil; extra == "sftp"
562
559
  Requires-Dist: opentelemetry-sdk; extra == "sftp"
560
+ Requires-Dist: dataclasses-json; extra == "sftp"
561
+ Requires-Dist: paramiko; extra == "sftp"
562
+ Requires-Dist: tqdm; extra == "sftp"
563
563
  Provides-Extra: sharepoint
564
- Requires-Dist: dataclasses-json; extra == "sharepoint"
565
- Requires-Dist: tqdm; extra == "sharepoint"
566
- Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
567
- Requires-Dist: pydantic>=2.7; extra == "sharepoint"
564
+ Requires-Dist: python-dateutil; extra == "sharepoint"
568
565
  Requires-Dist: pandas; extra == "sharepoint"
566
+ Requires-Dist: pydantic>=2.7; extra == "sharepoint"
569
567
  Requires-Dist: click; extra == "sharepoint"
570
- Requires-Dist: msal; extra == "sharepoint"
571
- Requires-Dist: python-dateutil; extra == "sharepoint"
572
568
  Requires-Dist: opentelemetry-sdk; extra == "sharepoint"
569
+ Requires-Dist: dataclasses-json; extra == "sharepoint"
570
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
571
+ Requires-Dist: msal; extra == "sharepoint"
572
+ Requires-Dist: tqdm; extra == "sharepoint"
573
573
  Provides-Extra: singlestore
574
- Requires-Dist: singlestoredb; extra == "singlestore"
575
- Requires-Dist: dataclasses-json; extra == "singlestore"
576
- Requires-Dist: tqdm; extra == "singlestore"
577
- Requires-Dist: pydantic>=2.7; extra == "singlestore"
574
+ Requires-Dist: python-dateutil; extra == "singlestore"
578
575
  Requires-Dist: pandas; extra == "singlestore"
576
+ Requires-Dist: pydantic>=2.7; extra == "singlestore"
579
577
  Requires-Dist: click; extra == "singlestore"
580
- Requires-Dist: python-dateutil; extra == "singlestore"
581
578
  Requires-Dist: opentelemetry-sdk; extra == "singlestore"
579
+ Requires-Dist: tqdm; extra == "singlestore"
580
+ Requires-Dist: dataclasses-json; extra == "singlestore"
581
+ Requires-Dist: singlestoredb; extra == "singlestore"
582
582
  Provides-Extra: slack
583
- Requires-Dist: dataclasses-json; extra == "slack"
584
- Requires-Dist: tqdm; extra == "slack"
585
- Requires-Dist: slack-sdk; extra == "slack"
586
- Requires-Dist: pydantic>=2.7; extra == "slack"
583
+ Requires-Dist: python-dateutil; extra == "slack"
587
584
  Requires-Dist: pandas; extra == "slack"
585
+ Requires-Dist: pydantic>=2.7; extra == "slack"
588
586
  Requires-Dist: click; extra == "slack"
589
- Requires-Dist: python-dateutil; extra == "slack"
587
+ Requires-Dist: slack-sdk; extra == "slack"
590
588
  Requires-Dist: opentelemetry-sdk; extra == "slack"
589
+ Requires-Dist: dataclasses-json; extra == "slack"
590
+ Requires-Dist: tqdm; extra == "slack"
591
591
  Provides-Extra: tsv
592
- Requires-Dist: unstructured[tsv]; extra == "tsv"
593
- Requires-Dist: dataclasses-json; extra == "tsv"
594
- Requires-Dist: tqdm; extra == "tsv"
595
- Requires-Dist: pydantic>=2.7; extra == "tsv"
592
+ Requires-Dist: python-dateutil; extra == "tsv"
596
593
  Requires-Dist: pandas; extra == "tsv"
594
+ Requires-Dist: pydantic>=2.7; extra == "tsv"
597
595
  Requires-Dist: click; extra == "tsv"
598
- Requires-Dist: python-dateutil; extra == "tsv"
599
596
  Requires-Dist: opentelemetry-sdk; extra == "tsv"
597
+ Requires-Dist: dataclasses-json; extra == "tsv"
598
+ Requires-Dist: unstructured[tsv]; extra == "tsv"
599
+ Requires-Dist: tqdm; extra == "tsv"
600
600
  Provides-Extra: vectara
601
- Requires-Dist: dataclasses-json; extra == "vectara"
602
- Requires-Dist: tqdm; extra == "vectara"
603
- Requires-Dist: pydantic>=2.7; extra == "vectara"
604
- Requires-Dist: pandas; extra == "vectara"
605
- Requires-Dist: click; extra == "vectara"
606
601
  Requires-Dist: python-dateutil; extra == "vectara"
607
602
  Requires-Dist: requests; extra == "vectara"
603
+ Requires-Dist: pandas; extra == "vectara"
604
+ Requires-Dist: pydantic>=2.7; extra == "vectara"
605
+ Requires-Dist: click; extra == "vectara"
608
606
  Requires-Dist: opentelemetry-sdk; extra == "vectara"
607
+ Requires-Dist: dataclasses-json; extra == "vectara"
608
+ Requires-Dist: tqdm; extra == "vectara"
609
609
  Provides-Extra: weaviate
610
- Requires-Dist: dataclasses-json; extra == "weaviate"
611
- Requires-Dist: tqdm; extra == "weaviate"
612
- Requires-Dist: weaviate-client; extra == "weaviate"
613
- Requires-Dist: pydantic>=2.7; extra == "weaviate"
610
+ Requires-Dist: python-dateutil; extra == "weaviate"
614
611
  Requires-Dist: pandas; extra == "weaviate"
612
+ Requires-Dist: pydantic>=2.7; extra == "weaviate"
615
613
  Requires-Dist: click; extra == "weaviate"
616
- Requires-Dist: python-dateutil; extra == "weaviate"
617
614
  Requires-Dist: opentelemetry-sdk; extra == "weaviate"
615
+ Requires-Dist: weaviate-client; extra == "weaviate"
616
+ Requires-Dist: dataclasses-json; extra == "weaviate"
617
+ Requires-Dist: tqdm; extra == "weaviate"
618
618
  Provides-Extra: wikipedia
619
- Requires-Dist: dataclasses-json; extra == "wikipedia"
620
- Requires-Dist: tqdm; extra == "wikipedia"
621
- Requires-Dist: wikipedia; extra == "wikipedia"
622
- Requires-Dist: pydantic>=2.7; extra == "wikipedia"
619
+ Requires-Dist: python-dateutil; extra == "wikipedia"
623
620
  Requires-Dist: pandas; extra == "wikipedia"
621
+ Requires-Dist: pydantic>=2.7; extra == "wikipedia"
624
622
  Requires-Dist: click; extra == "wikipedia"
625
- Requires-Dist: python-dateutil; extra == "wikipedia"
626
623
  Requires-Dist: opentelemetry-sdk; extra == "wikipedia"
624
+ Requires-Dist: dataclasses-json; extra == "wikipedia"
625
+ Requires-Dist: wikipedia; extra == "wikipedia"
626
+ Requires-Dist: tqdm; extra == "wikipedia"
627
627
  Provides-Extra: xlsx
628
- Requires-Dist: dataclasses-json; extra == "xlsx"
629
- Requires-Dist: tqdm; extra == "xlsx"
630
- Requires-Dist: unstructured[xlsx]; extra == "xlsx"
631
- Requires-Dist: pydantic>=2.7; extra == "xlsx"
628
+ Requires-Dist: python-dateutil; extra == "xlsx"
632
629
  Requires-Dist: pandas; extra == "xlsx"
630
+ Requires-Dist: pydantic>=2.7; extra == "xlsx"
633
631
  Requires-Dist: click; extra == "xlsx"
634
- Requires-Dist: python-dateutil; extra == "xlsx"
635
632
  Requires-Dist: opentelemetry-sdk; extra == "xlsx"
633
+ Requires-Dist: dataclasses-json; extra == "xlsx"
634
+ Requires-Dist: unstructured[xlsx]; extra == "xlsx"
635
+ Requires-Dist: tqdm; extra == "xlsx"
636
636
 
637
637
  # Unstructured Ingest
638
638
 
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=lCtX0MMAdwcQmclRZsJB-JMGsL5l4lSBsmyXt8YWrDA,43
2
+ unstructured_ingest/__version__.py,sha256=bJ5C3mWqhuWY5BAH5bAUzjjkW54gcd2KffrdBiGTVK0,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/interfaces.py,sha256=LuY-85clq5iyOtDd9vDABjK2MZCm6wRWK53cdb4SROY,31411
5
5
  unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
@@ -173,7 +173,7 @@ unstructured_ingest/embed/interfaces.py,sha256=O_USsEcVHRzE2dpHCJEJWKq04NLfdAnm5
173
173
  unstructured_ingest/embed/mixedbreadai.py,sha256=wMdY1a4PyynguIZQ4fPFImKGk9ryqHv0NRL3e3iSPEI,5491
174
174
  unstructured_ingest/embed/octoai.py,sha256=ERJby6VdqcIO6NLTqLXVHmX7LNIM0Fsmhf3dn10Z4is,2347
175
175
  unstructured_ingest/embed/openai.py,sha256=zOh3GHg1sPVUd3YzZLS5JIV21emYyrCHGYzqH5MIAiY,2250
176
- unstructured_ingest/embed/vertexai.py,sha256=6IJlNFMW5GKb5r28aM97YUokHMXIlefjpplJxzgpOZc,3332
176
+ unstructured_ingest/embed/vertexai.py,sha256=DuOQNHUzickx9kIobfIz2RjhJ712OsZhIoYJiXxaMco,3309
177
177
  unstructured_ingest/embed/voyageai.py,sha256=PwyW-_dXZT1AGSkeF3c2heM-pdBxciUxdtP7PluCauY,2430
178
178
  unstructured_ingest/enhanced_dataclass/__init__.py,sha256=gDZOUsv5eo-8jm4Yu7DdDwi101aGbfG7JctTdOYnTOM,151
179
179
  unstructured_ingest/enhanced_dataclass/core.py,sha256=d6aUkDynuKX87cHx9_N5UDUWrvISR4jYRFRTvd_avlI,3038
@@ -333,14 +333,14 @@ unstructured_ingest/v2/processes/connectors/fsspec/__init__.py,sha256=TtdeImM7Yp
333
333
  unstructured_ingest/v2/processes/connectors/fsspec/azure.py,sha256=GrC44PnA8PLHUJQ4aH3gETxL8v8UvknbKptxiXweqdc,6214
334
334
  unstructured_ingest/v2/processes/connectors/fsspec/box.py,sha256=JgSgF7f4UOx_JUV8zghgykyBA4rKvqkErRm6zYXO1XA,4434
335
335
  unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py,sha256=ZnoSGAZ4wtOhyg8G3PLYFMpbMVsBffvW-qp5jWwEDuA,4775
336
- unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=HptjVCGfGLOFoVwx8eYK_34sLb41ebCPbmSb5rCF10o,12441
336
+ unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py,sha256=Ri1TscAbQyIb3QZXDIC3vYJyGRgFWAOrzaQsngsCl-Q,12785
337
337
  unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=O1j0hIYWI4lPpTQ5hsEKV8usDCrUm-t1qVcSNKsJQd0,6006
338
338
  unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=cOMvMh0C9rtyEPJ0X59Fn-qb11LFUMRfeUgsi3QRWUk,6390
339
339
  unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=NkcU4U2DQWWuM8UHkez67C3SEOZpVyRtmtNS-z-F0Fw,6056
340
340
  unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
341
- unstructured_ingest-0.0.16.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
342
- unstructured_ingest-0.0.16.dist-info/METADATA,sha256=TKFqD-HE2ZCSxOyoO6Swo36JMSTla4W91IiaXa3lJMg,28507
343
- unstructured_ingest-0.0.16.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
344
- unstructured_ingest-0.0.16.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
345
- unstructured_ingest-0.0.16.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
346
- unstructured_ingest-0.0.16.dist-info/RECORD,,
341
+ unstructured_ingest-0.0.18.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
342
+ unstructured_ingest-0.0.18.dist-info/METADATA,sha256=rKqUHDyuaADzZishCNkNG8JlnkxswaTljDIBPzAs7_Q,28507
343
+ unstructured_ingest-0.0.18.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
344
+ unstructured_ingest-0.0.18.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
345
+ unstructured_ingest-0.0.18.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
346
+ unstructured_ingest-0.0.18.dist-info/RECORD,,