unstructured-ingest 0.0.9__py3-none-any.whl → 0.0.10__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1 +1 @@
1
- __version__ = "0.0.9" # pragma: no cover
1
+ __version__ = "0.0.10" # pragma: no cover
@@ -63,7 +63,8 @@ def uncompress_tar_file(tar_filename: str, path: Optional[str] = None) -> str:
63
63
 
64
64
  path = path if path else os.path.join(head, f"{tail}-tar-uncompressed")
65
65
  logger.info(f"extracting tar {tar_filename} -> {path}")
66
- with tarfile.open(tar_filename, "r:gz") as tfile:
66
+ # NOTE: "r:*" mode opens both compressed (e.g ".tar.gz") and uncompressed ".tar" archives
67
+ with tarfile.open(tar_filename, "r:*") as tfile:
67
68
  # NOTE(robinson: Mitigate against malicious content being extracted from the tar file.
68
69
  # This was added in Python 3.12
69
70
  # Ref: https://docs.python.org/3/library/tarfile.html#extraction-filters
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.9
3
+ Version: 0.0.10
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,616 +22,616 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.13
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: tqdm
26
25
  Requires-Dist: pandas
27
- Requires-Dist: opentelemetry-sdk
28
- Requires-Dist: pydantic
29
26
  Requires-Dist: dataclasses-json
30
- Requires-Dist: python-dateutil
27
+ Requires-Dist: pydantic
31
28
  Requires-Dist: click
29
+ Requires-Dist: tqdm
30
+ Requires-Dist: opentelemetry-sdk
31
+ Requires-Dist: python-dateutil
32
32
  Provides-Extra: airtable
33
- Requires-Dist: tqdm; extra == "airtable"
34
33
  Requires-Dist: pandas; extra == "airtable"
35
- Requires-Dist: opentelemetry-sdk; extra == "airtable"
36
- Requires-Dist: pydantic; extra == "airtable"
37
34
  Requires-Dist: dataclasses-json; extra == "airtable"
38
- Requires-Dist: python-dateutil; extra == "airtable"
39
- Requires-Dist: pyairtable; extra == "airtable"
35
+ Requires-Dist: pydantic; extra == "airtable"
40
36
  Requires-Dist: click; extra == "airtable"
37
+ Requires-Dist: pyairtable; extra == "airtable"
38
+ Requires-Dist: tqdm; extra == "airtable"
39
+ Requires-Dist: opentelemetry-sdk; extra == "airtable"
40
+ Requires-Dist: python-dateutil; extra == "airtable"
41
41
  Provides-Extra: astradb
42
- Requires-Dist: tqdm; extra == "astradb"
43
42
  Requires-Dist: pandas; extra == "astradb"
44
- Requires-Dist: opentelemetry-sdk; extra == "astradb"
45
- Requires-Dist: pydantic; extra == "astradb"
46
- Requires-Dist: python-dateutil; extra == "astradb"
47
43
  Requires-Dist: dataclasses-json; extra == "astradb"
48
44
  Requires-Dist: astrapy; extra == "astradb"
45
+ Requires-Dist: pydantic; extra == "astradb"
49
46
  Requires-Dist: click; extra == "astradb"
47
+ Requires-Dist: tqdm; extra == "astradb"
48
+ Requires-Dist: opentelemetry-sdk; extra == "astradb"
49
+ Requires-Dist: python-dateutil; extra == "astradb"
50
50
  Provides-Extra: azure
51
- Requires-Dist: fsspec; extra == "azure"
52
- Requires-Dist: tqdm; extra == "azure"
53
51
  Requires-Dist: pandas; extra == "azure"
54
- Requires-Dist: opentelemetry-sdk; extra == "azure"
55
- Requires-Dist: pydantic; extra == "azure"
56
52
  Requires-Dist: dataclasses-json; extra == "azure"
53
+ Requires-Dist: fsspec; extra == "azure"
57
54
  Requires-Dist: adlfs; extra == "azure"
58
- Requires-Dist: python-dateutil; extra == "azure"
55
+ Requires-Dist: pydantic; extra == "azure"
59
56
  Requires-Dist: click; extra == "azure"
57
+ Requires-Dist: tqdm; extra == "azure"
58
+ Requires-Dist: opentelemetry-sdk; extra == "azure"
59
+ Requires-Dist: python-dateutil; extra == "azure"
60
60
  Provides-Extra: azure-cognitive-search
61
- Requires-Dist: tqdm; extra == "azure-cognitive-search"
62
- Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
63
61
  Requires-Dist: pandas; extra == "azure-cognitive-search"
64
- Requires-Dist: opentelemetry-sdk; extra == "azure-cognitive-search"
65
- Requires-Dist: pydantic; extra == "azure-cognitive-search"
66
62
  Requires-Dist: dataclasses-json; extra == "azure-cognitive-search"
67
- Requires-Dist: python-dateutil; extra == "azure-cognitive-search"
63
+ Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
64
+ Requires-Dist: pydantic; extra == "azure-cognitive-search"
68
65
  Requires-Dist: click; extra == "azure-cognitive-search"
66
+ Requires-Dist: tqdm; extra == "azure-cognitive-search"
67
+ Requires-Dist: opentelemetry-sdk; extra == "azure-cognitive-search"
68
+ Requires-Dist: python-dateutil; extra == "azure-cognitive-search"
69
69
  Provides-Extra: bedrock
70
- Requires-Dist: boto3; extra == "bedrock"
71
- Requires-Dist: tqdm; extra == "bedrock"
72
70
  Requires-Dist: pandas; extra == "bedrock"
73
- Requires-Dist: opentelemetry-sdk; extra == "bedrock"
74
- Requires-Dist: pydantic; extra == "bedrock"
75
- Requires-Dist: langchain-community; extra == "bedrock"
76
71
  Requires-Dist: dataclasses-json; extra == "bedrock"
72
+ Requires-Dist: boto3; extra == "bedrock"
77
73
  Requires-Dist: unstructured; extra == "bedrock"
78
- Requires-Dist: python-dateutil; extra == "bedrock"
74
+ Requires-Dist: pydantic; extra == "bedrock"
79
75
  Requires-Dist: click; extra == "bedrock"
76
+ Requires-Dist: python-dateutil; extra == "bedrock"
77
+ Requires-Dist: tqdm; extra == "bedrock"
78
+ Requires-Dist: opentelemetry-sdk; extra == "bedrock"
79
+ Requires-Dist: langchain-community; extra == "bedrock"
80
80
  Provides-Extra: biomed
81
- Requires-Dist: bs4; extra == "biomed"
82
- Requires-Dist: tqdm; extra == "biomed"
83
81
  Requires-Dist: pandas; extra == "biomed"
84
- Requires-Dist: opentelemetry-sdk; extra == "biomed"
85
- Requires-Dist: pydantic; extra == "biomed"
82
+ Requires-Dist: bs4; extra == "biomed"
86
83
  Requires-Dist: requests; extra == "biomed"
87
84
  Requires-Dist: dataclasses-json; extra == "biomed"
88
- Requires-Dist: python-dateutil; extra == "biomed"
85
+ Requires-Dist: pydantic; extra == "biomed"
89
86
  Requires-Dist: click; extra == "biomed"
87
+ Requires-Dist: tqdm; extra == "biomed"
88
+ Requires-Dist: opentelemetry-sdk; extra == "biomed"
89
+ Requires-Dist: python-dateutil; extra == "biomed"
90
90
  Provides-Extra: box
91
+ Requires-Dist: pandas; extra == "box"
92
+ Requires-Dist: dataclasses-json; extra == "box"
93
+ Requires-Dist: boxfs; extra == "box"
91
94
  Requires-Dist: fsspec; extra == "box"
95
+ Requires-Dist: pydantic; extra == "box"
96
+ Requires-Dist: click; extra == "box"
92
97
  Requires-Dist: tqdm; extra == "box"
93
- Requires-Dist: pandas; extra == "box"
94
98
  Requires-Dist: opentelemetry-sdk; extra == "box"
95
- Requires-Dist: pydantic; extra == "box"
96
- Requires-Dist: boxfs; extra == "box"
97
- Requires-Dist: dataclasses-json; extra == "box"
98
99
  Requires-Dist: python-dateutil; extra == "box"
99
- Requires-Dist: click; extra == "box"
100
100
  Provides-Extra: chroma
101
+ Requires-Dist: typer<=0.9.0; extra == "chroma"
101
102
  Requires-Dist: chromadb; extra == "chroma"
102
- Requires-Dist: tqdm; extra == "chroma"
103
103
  Requires-Dist: pandas; extra == "chroma"
104
- Requires-Dist: opentelemetry-sdk; extra == "chroma"
104
+ Requires-Dist: dataclasses-json; extra == "chroma"
105
105
  Requires-Dist: importlib-metadata>=7.1.0; extra == "chroma"
106
- Requires-Dist: typer<=0.9.0; extra == "chroma"
107
106
  Requires-Dist: pydantic; extra == "chroma"
108
- Requires-Dist: dataclasses-json; extra == "chroma"
109
- Requires-Dist: python-dateutil; extra == "chroma"
110
107
  Requires-Dist: click; extra == "chroma"
108
+ Requires-Dist: tqdm; extra == "chroma"
109
+ Requires-Dist: opentelemetry-sdk; extra == "chroma"
110
+ Requires-Dist: python-dateutil; extra == "chroma"
111
111
  Provides-Extra: clarifai
112
- Requires-Dist: tqdm; extra == "clarifai"
113
112
  Requires-Dist: pandas; extra == "clarifai"
114
- Requires-Dist: opentelemetry-sdk; extra == "clarifai"
115
- Requires-Dist: pydantic; extra == "clarifai"
116
- Requires-Dist: clarifai; extra == "clarifai"
117
113
  Requires-Dist: dataclasses-json; extra == "clarifai"
118
- Requires-Dist: python-dateutil; extra == "clarifai"
114
+ Requires-Dist: clarifai; extra == "clarifai"
115
+ Requires-Dist: pydantic; extra == "clarifai"
119
116
  Requires-Dist: click; extra == "clarifai"
117
+ Requires-Dist: tqdm; extra == "clarifai"
118
+ Requires-Dist: opentelemetry-sdk; extra == "clarifai"
119
+ Requires-Dist: python-dateutil; extra == "clarifai"
120
120
  Provides-Extra: confluence
121
- Requires-Dist: atlassian-python-api; extra == "confluence"
122
- Requires-Dist: tqdm; extra == "confluence"
123
121
  Requires-Dist: pandas; extra == "confluence"
124
- Requires-Dist: opentelemetry-sdk; extra == "confluence"
125
- Requires-Dist: pydantic; extra == "confluence"
126
122
  Requires-Dist: requests; extra == "confluence"
127
123
  Requires-Dist: dataclasses-json; extra == "confluence"
128
- Requires-Dist: python-dateutil; extra == "confluence"
124
+ Requires-Dist: pydantic; extra == "confluence"
129
125
  Requires-Dist: click; extra == "confluence"
126
+ Requires-Dist: atlassian-python-api; extra == "confluence"
127
+ Requires-Dist: tqdm; extra == "confluence"
128
+ Requires-Dist: opentelemetry-sdk; extra == "confluence"
129
+ Requires-Dist: python-dateutil; extra == "confluence"
130
130
  Provides-Extra: couchbase
131
- Requires-Dist: tqdm; extra == "couchbase"
132
131
  Requires-Dist: pandas; extra == "couchbase"
133
- Requires-Dist: opentelemetry-sdk; extra == "couchbase"
134
- Requires-Dist: pydantic; extra == "couchbase"
135
132
  Requires-Dist: dataclasses-json; extra == "couchbase"
136
- Requires-Dist: python-dateutil; extra == "couchbase"
137
- Requires-Dist: couchbase; extra == "couchbase"
133
+ Requires-Dist: tqdm; extra == "couchbase"
134
+ Requires-Dist: pydantic; extra == "couchbase"
138
135
  Requires-Dist: click; extra == "couchbase"
136
+ Requires-Dist: couchbase; extra == "couchbase"
137
+ Requires-Dist: opentelemetry-sdk; extra == "couchbase"
138
+ Requires-Dist: python-dateutil; extra == "couchbase"
139
139
  Provides-Extra: csv
140
140
  Requires-Dist: unstructured[tsv]; extra == "csv"
141
- Requires-Dist: tqdm; extra == "csv"
142
141
  Requires-Dist: pandas; extra == "csv"
143
- Requires-Dist: opentelemetry-sdk; extra == "csv"
144
- Requires-Dist: pydantic; extra == "csv"
145
142
  Requires-Dist: dataclasses-json; extra == "csv"
146
- Requires-Dist: python-dateutil; extra == "csv"
143
+ Requires-Dist: pydantic; extra == "csv"
147
144
  Requires-Dist: click; extra == "csv"
145
+ Requires-Dist: tqdm; extra == "csv"
146
+ Requires-Dist: opentelemetry-sdk; extra == "csv"
147
+ Requires-Dist: python-dateutil; extra == "csv"
148
148
  Provides-Extra: databricks-volumes
149
- Requires-Dist: tqdm; extra == "databricks-volumes"
150
149
  Requires-Dist: pandas; extra == "databricks-volumes"
151
- Requires-Dist: opentelemetry-sdk; extra == "databricks-volumes"
152
- Requires-Dist: pydantic; extra == "databricks-volumes"
153
150
  Requires-Dist: dataclasses-json; extra == "databricks-volumes"
151
+ Requires-Dist: tqdm; extra == "databricks-volumes"
152
+ Requires-Dist: pydantic; extra == "databricks-volumes"
153
+ Requires-Dist: click; extra == "databricks-volumes"
154
154
  Requires-Dist: databricks-sdk; extra == "databricks-volumes"
155
+ Requires-Dist: opentelemetry-sdk; extra == "databricks-volumes"
155
156
  Requires-Dist: python-dateutil; extra == "databricks-volumes"
156
- Requires-Dist: click; extra == "databricks-volumes"
157
157
  Provides-Extra: delta-table
158
+ Requires-Dist: pandas; extra == "delta-table"
159
+ Requires-Dist: dataclasses-json; extra == "delta-table"
158
160
  Requires-Dist: fsspec; extra == "delta-table"
159
161
  Requires-Dist: deltalake; extra == "delta-table"
162
+ Requires-Dist: pydantic; extra == "delta-table"
163
+ Requires-Dist: click; extra == "delta-table"
160
164
  Requires-Dist: tqdm; extra == "delta-table"
161
- Requires-Dist: pandas; extra == "delta-table"
162
165
  Requires-Dist: opentelemetry-sdk; extra == "delta-table"
163
- Requires-Dist: pydantic; extra == "delta-table"
164
- Requires-Dist: dataclasses-json; extra == "delta-table"
165
166
  Requires-Dist: python-dateutil; extra == "delta-table"
166
- Requires-Dist: click; extra == "delta-table"
167
167
  Provides-Extra: discord
168
- Requires-Dist: tqdm; extra == "discord"
169
168
  Requires-Dist: pandas; extra == "discord"
170
- Requires-Dist: opentelemetry-sdk; extra == "discord"
169
+ Requires-Dist: dataclasses-json; extra == "discord"
171
170
  Requires-Dist: pydantic; extra == "discord"
172
171
  Requires-Dist: discord-py; extra == "discord"
173
- Requires-Dist: dataclasses-json; extra == "discord"
174
- Requires-Dist: python-dateutil; extra == "discord"
175
172
  Requires-Dist: click; extra == "discord"
173
+ Requires-Dist: tqdm; extra == "discord"
174
+ Requires-Dist: opentelemetry-sdk; extra == "discord"
175
+ Requires-Dist: python-dateutil; extra == "discord"
176
176
  Provides-Extra: doc
177
- Requires-Dist: tqdm; extra == "doc"
178
- Requires-Dist: unstructured[docx]; extra == "doc"
179
177
  Requires-Dist: pandas; extra == "doc"
180
- Requires-Dist: opentelemetry-sdk; extra == "doc"
181
- Requires-Dist: pydantic; extra == "doc"
182
178
  Requires-Dist: dataclasses-json; extra == "doc"
183
- Requires-Dist: python-dateutil; extra == "doc"
179
+ Requires-Dist: pydantic; extra == "doc"
184
180
  Requires-Dist: click; extra == "doc"
181
+ Requires-Dist: unstructured[docx]; extra == "doc"
182
+ Requires-Dist: tqdm; extra == "doc"
183
+ Requires-Dist: opentelemetry-sdk; extra == "doc"
184
+ Requires-Dist: python-dateutil; extra == "doc"
185
185
  Provides-Extra: docx
186
- Requires-Dist: tqdm; extra == "docx"
187
- Requires-Dist: unstructured[docx]; extra == "docx"
188
186
  Requires-Dist: pandas; extra == "docx"
189
- Requires-Dist: opentelemetry-sdk; extra == "docx"
190
- Requires-Dist: pydantic; extra == "docx"
191
187
  Requires-Dist: dataclasses-json; extra == "docx"
192
- Requires-Dist: python-dateutil; extra == "docx"
188
+ Requires-Dist: pydantic; extra == "docx"
193
189
  Requires-Dist: click; extra == "docx"
190
+ Requires-Dist: unstructured[docx]; extra == "docx"
191
+ Requires-Dist: tqdm; extra == "docx"
192
+ Requires-Dist: opentelemetry-sdk; extra == "docx"
193
+ Requires-Dist: python-dateutil; extra == "docx"
194
194
  Provides-Extra: dropbox
195
+ Requires-Dist: pandas; extra == "dropbox"
196
+ Requires-Dist: dataclasses-json; extra == "dropbox"
195
197
  Requires-Dist: fsspec; extra == "dropbox"
198
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
199
+ Requires-Dist: pydantic; extra == "dropbox"
200
+ Requires-Dist: click; extra == "dropbox"
196
201
  Requires-Dist: tqdm; extra == "dropbox"
197
- Requires-Dist: pandas; extra == "dropbox"
198
202
  Requires-Dist: opentelemetry-sdk; extra == "dropbox"
199
- Requires-Dist: pydantic; extra == "dropbox"
200
- Requires-Dist: dropboxdrivefs; extra == "dropbox"
201
- Requires-Dist: dataclasses-json; extra == "dropbox"
202
203
  Requires-Dist: python-dateutil; extra == "dropbox"
203
- Requires-Dist: click; extra == "dropbox"
204
204
  Provides-Extra: elasticsearch
205
- Requires-Dist: tqdm; extra == "elasticsearch"
206
205
  Requires-Dist: pandas; extra == "elasticsearch"
207
- Requires-Dist: opentelemetry-sdk; extra == "elasticsearch"
208
- Requires-Dist: pydantic; extra == "elasticsearch"
209
- Requires-Dist: dataclasses-json; extra == "elasticsearch"
210
206
  Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
211
- Requires-Dist: python-dateutil; extra == "elasticsearch"
207
+ Requires-Dist: dataclasses-json; extra == "elasticsearch"
208
+ Requires-Dist: pydantic; extra == "elasticsearch"
212
209
  Requires-Dist: click; extra == "elasticsearch"
210
+ Requires-Dist: tqdm; extra == "elasticsearch"
211
+ Requires-Dist: opentelemetry-sdk; extra == "elasticsearch"
212
+ Requires-Dist: python-dateutil; extra == "elasticsearch"
213
213
  Provides-Extra: embed-huggingface
214
- Requires-Dist: tqdm; extra == "embed-huggingface"
215
- Requires-Dist: langchain-huggingface; extra == "embed-huggingface"
216
214
  Requires-Dist: pandas; extra == "embed-huggingface"
217
- Requires-Dist: opentelemetry-sdk; extra == "embed-huggingface"
218
- Requires-Dist: pydantic; extra == "embed-huggingface"
219
215
  Requires-Dist: dataclasses-json; extra == "embed-huggingface"
216
+ Requires-Dist: langchain-huggingface; extra == "embed-huggingface"
220
217
  Requires-Dist: unstructured; extra == "embed-huggingface"
221
- Requires-Dist: python-dateutil; extra == "embed-huggingface"
218
+ Requires-Dist: pydantic; extra == "embed-huggingface"
222
219
  Requires-Dist: click; extra == "embed-huggingface"
220
+ Requires-Dist: tqdm; extra == "embed-huggingface"
221
+ Requires-Dist: opentelemetry-sdk; extra == "embed-huggingface"
222
+ Requires-Dist: python-dateutil; extra == "embed-huggingface"
223
223
  Provides-Extra: embed-octoai
224
- Requires-Dist: openai; extra == "embed-octoai"
225
- Requires-Dist: tqdm; extra == "embed-octoai"
226
224
  Requires-Dist: pandas; extra == "embed-octoai"
227
- Requires-Dist: opentelemetry-sdk; extra == "embed-octoai"
228
- Requires-Dist: pydantic; extra == "embed-octoai"
229
- Requires-Dist: tiktoken; extra == "embed-octoai"
230
225
  Requires-Dist: dataclasses-json; extra == "embed-octoai"
226
+ Requires-Dist: openai; extra == "embed-octoai"
231
227
  Requires-Dist: unstructured; extra == "embed-octoai"
232
- Requires-Dist: python-dateutil; extra == "embed-octoai"
228
+ Requires-Dist: pydantic; extra == "embed-octoai"
229
+ Requires-Dist: tiktoken; extra == "embed-octoai"
233
230
  Requires-Dist: click; extra == "embed-octoai"
231
+ Requires-Dist: tqdm; extra == "embed-octoai"
232
+ Requires-Dist: opentelemetry-sdk; extra == "embed-octoai"
233
+ Requires-Dist: python-dateutil; extra == "embed-octoai"
234
234
  Provides-Extra: embed-vertexai
235
235
  Requires-Dist: langchain; extra == "embed-vertexai"
236
- Requires-Dist: tqdm; extra == "embed-vertexai"
237
236
  Requires-Dist: pandas; extra == "embed-vertexai"
238
- Requires-Dist: opentelemetry-sdk; extra == "embed-vertexai"
239
- Requires-Dist: pydantic; extra == "embed-vertexai"
240
- Requires-Dist: langchain-google-vertexai; extra == "embed-vertexai"
241
- Requires-Dist: langchain-community; extra == "embed-vertexai"
242
237
  Requires-Dist: dataclasses-json; extra == "embed-vertexai"
243
238
  Requires-Dist: unstructured; extra == "embed-vertexai"
244
- Requires-Dist: python-dateutil; extra == "embed-vertexai"
239
+ Requires-Dist: langchain-google-vertexai; extra == "embed-vertexai"
240
+ Requires-Dist: pydantic; extra == "embed-vertexai"
245
241
  Requires-Dist: click; extra == "embed-vertexai"
242
+ Requires-Dist: python-dateutil; extra == "embed-vertexai"
243
+ Requires-Dist: tqdm; extra == "embed-vertexai"
244
+ Requires-Dist: opentelemetry-sdk; extra == "embed-vertexai"
245
+ Requires-Dist: langchain-community; extra == "embed-vertexai"
246
246
  Provides-Extra: embed-voyageai
247
247
  Requires-Dist: langchain; extra == "embed-voyageai"
248
- Requires-Dist: tqdm; extra == "embed-voyageai"
249
248
  Requires-Dist: pandas; extra == "embed-voyageai"
250
- Requires-Dist: opentelemetry-sdk; extra == "embed-voyageai"
251
- Requires-Dist: pydantic; extra == "embed-voyageai"
252
249
  Requires-Dist: dataclasses-json; extra == "embed-voyageai"
253
- Requires-Dist: langchain-voyageai; extra == "embed-voyageai"
254
250
  Requires-Dist: unstructured; extra == "embed-voyageai"
255
- Requires-Dist: python-dateutil; extra == "embed-voyageai"
251
+ Requires-Dist: pydantic; extra == "embed-voyageai"
256
252
  Requires-Dist: click; extra == "embed-voyageai"
253
+ Requires-Dist: tqdm; extra == "embed-voyageai"
254
+ Requires-Dist: langchain-voyageai; extra == "embed-voyageai"
255
+ Requires-Dist: opentelemetry-sdk; extra == "embed-voyageai"
256
+ Requires-Dist: python-dateutil; extra == "embed-voyageai"
257
257
  Provides-Extra: epub
258
- Requires-Dist: tqdm; extra == "epub"
259
258
  Requires-Dist: pandas; extra == "epub"
260
- Requires-Dist: opentelemetry-sdk; extra == "epub"
261
- Requires-Dist: pydantic; extra == "epub"
262
259
  Requires-Dist: dataclasses-json; extra == "epub"
263
- Requires-Dist: python-dateutil; extra == "epub"
264
260
  Requires-Dist: unstructured[epub]; extra == "epub"
261
+ Requires-Dist: pydantic; extra == "epub"
265
262
  Requires-Dist: click; extra == "epub"
263
+ Requires-Dist: tqdm; extra == "epub"
264
+ Requires-Dist: opentelemetry-sdk; extra == "epub"
265
+ Requires-Dist: python-dateutil; extra == "epub"
266
266
  Provides-Extra: gcs
267
- Requires-Dist: fsspec; extra == "gcs"
267
+ Requires-Dist: pandas; extra == "gcs"
268
268
  Requires-Dist: bs4; extra == "gcs"
269
+ Requires-Dist: dataclasses-json; extra == "gcs"
270
+ Requires-Dist: fsspec; extra == "gcs"
271
+ Requires-Dist: pydantic; extra == "gcs"
272
+ Requires-Dist: click; extra == "gcs"
269
273
  Requires-Dist: tqdm; extra == "gcs"
270
274
  Requires-Dist: gcsfs; extra == "gcs"
271
- Requires-Dist: pandas; extra == "gcs"
272
275
  Requires-Dist: opentelemetry-sdk; extra == "gcs"
273
- Requires-Dist: pydantic; extra == "gcs"
274
- Requires-Dist: dataclasses-json; extra == "gcs"
275
276
  Requires-Dist: python-dateutil; extra == "gcs"
276
- Requires-Dist: click; extra == "gcs"
277
277
  Provides-Extra: github
278
- Requires-Dist: pygithub>1.58.0; extra == "github"
279
- Requires-Dist: tqdm; extra == "github"
280
278
  Requires-Dist: pandas; extra == "github"
281
- Requires-Dist: opentelemetry-sdk; extra == "github"
282
- Requires-Dist: pydantic; extra == "github"
283
279
  Requires-Dist: requests; extra == "github"
284
280
  Requires-Dist: dataclasses-json; extra == "github"
285
- Requires-Dist: python-dateutil; extra == "github"
281
+ Requires-Dist: pygithub>1.58.0; extra == "github"
282
+ Requires-Dist: pydantic; extra == "github"
286
283
  Requires-Dist: click; extra == "github"
284
+ Requires-Dist: tqdm; extra == "github"
285
+ Requires-Dist: opentelemetry-sdk; extra == "github"
286
+ Requires-Dist: python-dateutil; extra == "github"
287
287
  Provides-Extra: gitlab
288
- Requires-Dist: tqdm; extra == "gitlab"
289
288
  Requires-Dist: pandas; extra == "gitlab"
290
- Requires-Dist: opentelemetry-sdk; extra == "gitlab"
289
+ Requires-Dist: dataclasses-json; extra == "gitlab"
291
290
  Requires-Dist: pydantic; extra == "gitlab"
291
+ Requires-Dist: click; extra == "gitlab"
292
+ Requires-Dist: tqdm; extra == "gitlab"
292
293
  Requires-Dist: python-gitlab; extra == "gitlab"
293
- Requires-Dist: dataclasses-json; extra == "gitlab"
294
+ Requires-Dist: opentelemetry-sdk; extra == "gitlab"
294
295
  Requires-Dist: python-dateutil; extra == "gitlab"
295
- Requires-Dist: click; extra == "gitlab"
296
296
  Provides-Extra: google-drive
297
- Requires-Dist: tqdm; extra == "google-drive"
298
297
  Requires-Dist: pandas; extra == "google-drive"
299
- Requires-Dist: opentelemetry-sdk; extra == "google-drive"
300
- Requires-Dist: pydantic; extra == "google-drive"
301
298
  Requires-Dist: dataclasses-json; extra == "google-drive"
302
299
  Requires-Dist: google-api-python-client; extra == "google-drive"
303
- Requires-Dist: python-dateutil; extra == "google-drive"
300
+ Requires-Dist: pydantic; extra == "google-drive"
304
301
  Requires-Dist: click; extra == "google-drive"
302
+ Requires-Dist: tqdm; extra == "google-drive"
303
+ Requires-Dist: opentelemetry-sdk; extra == "google-drive"
304
+ Requires-Dist: python-dateutil; extra == "google-drive"
305
305
  Provides-Extra: hubspot
306
- Requires-Dist: tqdm; extra == "hubspot"
307
- Requires-Dist: urllib3; extra == "hubspot"
308
306
  Requires-Dist: pandas; extra == "hubspot"
309
- Requires-Dist: opentelemetry-sdk; extra == "hubspot"
310
- Requires-Dist: pydantic; extra == "hubspot"
311
307
  Requires-Dist: dataclasses-json; extra == "hubspot"
312
308
  Requires-Dist: hubspot-api-client; extra == "hubspot"
313
- Requires-Dist: python-dateutil; extra == "hubspot"
309
+ Requires-Dist: pydantic; extra == "hubspot"
314
310
  Requires-Dist: click; extra == "hubspot"
311
+ Requires-Dist: tqdm; extra == "hubspot"
312
+ Requires-Dist: urllib3; extra == "hubspot"
313
+ Requires-Dist: opentelemetry-sdk; extra == "hubspot"
314
+ Requires-Dist: python-dateutil; extra == "hubspot"
315
315
  Provides-Extra: jira
316
+ Requires-Dist: pandas; extra == "jira"
317
+ Requires-Dist: dataclasses-json; extra == "jira"
318
+ Requires-Dist: pydantic; extra == "jira"
319
+ Requires-Dist: click; extra == "jira"
316
320
  Requires-Dist: atlassian-python-api; extra == "jira"
317
321
  Requires-Dist: tqdm; extra == "jira"
318
- Requires-Dist: pandas; extra == "jira"
319
322
  Requires-Dist: opentelemetry-sdk; extra == "jira"
320
- Requires-Dist: pydantic; extra == "jira"
321
- Requires-Dist: dataclasses-json; extra == "jira"
322
323
  Requires-Dist: python-dateutil; extra == "jira"
323
- Requires-Dist: click; extra == "jira"
324
324
  Provides-Extra: kafka
325
- Requires-Dist: tqdm; extra == "kafka"
326
- Requires-Dist: confluent-kafka; extra == "kafka"
327
325
  Requires-Dist: pandas; extra == "kafka"
328
- Requires-Dist: opentelemetry-sdk; extra == "kafka"
329
- Requires-Dist: pydantic; extra == "kafka"
330
326
  Requires-Dist: dataclasses-json; extra == "kafka"
331
- Requires-Dist: python-dateutil; extra == "kafka"
327
+ Requires-Dist: pydantic; extra == "kafka"
332
328
  Requires-Dist: click; extra == "kafka"
329
+ Requires-Dist: tqdm; extra == "kafka"
330
+ Requires-Dist: opentelemetry-sdk; extra == "kafka"
331
+ Requires-Dist: python-dateutil; extra == "kafka"
332
+ Requires-Dist: confluent-kafka; extra == "kafka"
333
333
  Provides-Extra: kdbai
334
334
  Requires-Dist: kdbai-client; extra == "kdbai"
335
335
  Provides-Extra: md
336
- Requires-Dist: tqdm; extra == "md"
337
336
  Requires-Dist: pandas; extra == "md"
338
- Requires-Dist: opentelemetry-sdk; extra == "md"
339
- Requires-Dist: pydantic; extra == "md"
340
337
  Requires-Dist: dataclasses-json; extra == "md"
341
- Requires-Dist: unstructured[md]; extra == "md"
342
- Requires-Dist: python-dateutil; extra == "md"
338
+ Requires-Dist: pydantic; extra == "md"
343
339
  Requires-Dist: click; extra == "md"
340
+ Requires-Dist: tqdm; extra == "md"
341
+ Requires-Dist: opentelemetry-sdk; extra == "md"
342
+ Requires-Dist: python-dateutil; extra == "md"
343
+ Requires-Dist: unstructured[md]; extra == "md"
344
344
  Provides-Extra: milvus
345
- Requires-Dist: tqdm; extra == "milvus"
346
345
  Requires-Dist: pymilvus; extra == "milvus"
347
346
  Requires-Dist: pandas; extra == "milvus"
348
- Requires-Dist: opentelemetry-sdk; extra == "milvus"
349
- Requires-Dist: pydantic; extra == "milvus"
350
347
  Requires-Dist: dataclasses-json; extra == "milvus"
351
- Requires-Dist: python-dateutil; extra == "milvus"
348
+ Requires-Dist: pydantic; extra == "milvus"
352
349
  Requires-Dist: click; extra == "milvus"
350
+ Requires-Dist: tqdm; extra == "milvus"
351
+ Requires-Dist: opentelemetry-sdk; extra == "milvus"
352
+ Requires-Dist: python-dateutil; extra == "milvus"
353
353
  Provides-Extra: mongodb
354
- Requires-Dist: tqdm; extra == "mongodb"
355
354
  Requires-Dist: pandas; extra == "mongodb"
356
- Requires-Dist: opentelemetry-sdk; extra == "mongodb"
357
- Requires-Dist: pydantic; extra == "mongodb"
358
355
  Requires-Dist: dataclasses-json; extra == "mongodb"
359
- Requires-Dist: python-dateutil; extra == "mongodb"
360
356
  Requires-Dist: pymongo; extra == "mongodb"
357
+ Requires-Dist: pydantic; extra == "mongodb"
361
358
  Requires-Dist: click; extra == "mongodb"
359
+ Requires-Dist: tqdm; extra == "mongodb"
360
+ Requires-Dist: opentelemetry-sdk; extra == "mongodb"
361
+ Requires-Dist: python-dateutil; extra == "mongodb"
362
362
  Provides-Extra: msg
363
- Requires-Dist: tqdm; extra == "msg"
364
363
  Requires-Dist: pandas; extra == "msg"
365
- Requires-Dist: opentelemetry-sdk; extra == "msg"
366
- Requires-Dist: pydantic; extra == "msg"
367
364
  Requires-Dist: dataclasses-json; extra == "msg"
368
- Requires-Dist: python-dateutil; extra == "msg"
369
- Requires-Dist: unstructured[msg]; extra == "msg"
365
+ Requires-Dist: pydantic; extra == "msg"
370
366
  Requires-Dist: click; extra == "msg"
367
+ Requires-Dist: tqdm; extra == "msg"
368
+ Requires-Dist: unstructured[msg]; extra == "msg"
369
+ Requires-Dist: opentelemetry-sdk; extra == "msg"
370
+ Requires-Dist: python-dateutil; extra == "msg"
371
371
  Provides-Extra: notion
372
+ Requires-Dist: httpx; extra == "notion"
373
+ Requires-Dist: pandas; extra == "notion"
374
+ Requires-Dist: dataclasses-json; extra == "notion"
375
+ Requires-Dist: backoff; extra == "notion"
372
376
  Requires-Dist: htmlBuilder; extra == "notion"
373
- Requires-Dist: tqdm; extra == "notion"
377
+ Requires-Dist: pydantic; extra == "notion"
374
378
  Requires-Dist: notion-client; extra == "notion"
375
- Requires-Dist: backoff; extra == "notion"
376
- Requires-Dist: pandas; extra == "notion"
379
+ Requires-Dist: click; extra == "notion"
380
+ Requires-Dist: tqdm; extra == "notion"
377
381
  Requires-Dist: opentelemetry-sdk; extra == "notion"
378
- Requires-Dist: pydantic; extra == "notion"
379
- Requires-Dist: dataclasses-json; extra == "notion"
380
- Requires-Dist: httpx; extra == "notion"
381
382
  Requires-Dist: python-dateutil; extra == "notion"
382
- Requires-Dist: click; extra == "notion"
383
383
  Provides-Extra: odt
384
- Requires-Dist: tqdm; extra == "odt"
385
- Requires-Dist: click; extra == "odt"
386
384
  Requires-Dist: pandas; extra == "odt"
387
- Requires-Dist: opentelemetry-sdk; extra == "odt"
388
- Requires-Dist: pydantic; extra == "odt"
389
385
  Requires-Dist: dataclasses-json; extra == "odt"
390
- Requires-Dist: python-dateutil; extra == "odt"
391
386
  Requires-Dist: unstructured[odt]; extra == "odt"
387
+ Requires-Dist: pydantic; extra == "odt"
388
+ Requires-Dist: click; extra == "odt"
389
+ Requires-Dist: tqdm; extra == "odt"
390
+ Requires-Dist: opentelemetry-sdk; extra == "odt"
391
+ Requires-Dist: python-dateutil; extra == "odt"
392
392
  Provides-Extra: onedrive
393
- Requires-Dist: bs4; extra == "onedrive"
394
- Requires-Dist: tqdm; extra == "onedrive"
395
393
  Requires-Dist: msal; extra == "onedrive"
394
+ Requires-Dist: bs4; extra == "onedrive"
396
395
  Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
397
396
  Requires-Dist: pandas; extra == "onedrive"
398
- Requires-Dist: opentelemetry-sdk; extra == "onedrive"
399
- Requires-Dist: pydantic; extra == "onedrive"
400
397
  Requires-Dist: dataclasses-json; extra == "onedrive"
401
- Requires-Dist: python-dateutil; extra == "onedrive"
398
+ Requires-Dist: pydantic; extra == "onedrive"
402
399
  Requires-Dist: click; extra == "onedrive"
400
+ Requires-Dist: tqdm; extra == "onedrive"
401
+ Requires-Dist: opentelemetry-sdk; extra == "onedrive"
402
+ Requires-Dist: python-dateutil; extra == "onedrive"
403
403
  Provides-Extra: openai
404
- Requires-Dist: openai; extra == "openai"
405
- Requires-Dist: tqdm; extra == "openai"
406
404
  Requires-Dist: pandas; extra == "openai"
407
- Requires-Dist: opentelemetry-sdk; extra == "openai"
408
- Requires-Dist: pydantic; extra == "openai"
409
- Requires-Dist: tiktoken; extra == "openai"
410
- Requires-Dist: langchain-community; extra == "openai"
411
405
  Requires-Dist: dataclasses-json; extra == "openai"
406
+ Requires-Dist: openai; extra == "openai"
412
407
  Requires-Dist: unstructured; extra == "openai"
413
- Requires-Dist: python-dateutil; extra == "openai"
408
+ Requires-Dist: tiktoken; extra == "openai"
409
+ Requires-Dist: pydantic; extra == "openai"
414
410
  Requires-Dist: click; extra == "openai"
411
+ Requires-Dist: tqdm; extra == "openai"
412
+ Requires-Dist: python-dateutil; extra == "openai"
413
+ Requires-Dist: opentelemetry-sdk; extra == "openai"
414
+ Requires-Dist: langchain-community; extra == "openai"
415
415
  Provides-Extra: opensearch
416
- Requires-Dist: tqdm; extra == "opensearch"
417
416
  Requires-Dist: pandas; extra == "opensearch"
418
- Requires-Dist: opentelemetry-sdk; extra == "opensearch"
419
- Requires-Dist: pydantic; extra == "opensearch"
420
417
  Requires-Dist: dataclasses-json; extra == "opensearch"
421
418
  Requires-Dist: opensearch-py; extra == "opensearch"
422
- Requires-Dist: python-dateutil; extra == "opensearch"
419
+ Requires-Dist: pydantic; extra == "opensearch"
423
420
  Requires-Dist: click; extra == "opensearch"
421
+ Requires-Dist: tqdm; extra == "opensearch"
422
+ Requires-Dist: opentelemetry-sdk; extra == "opensearch"
423
+ Requires-Dist: python-dateutil; extra == "opensearch"
424
424
  Provides-Extra: org
425
+ Requires-Dist: pandas; extra == "org"
426
+ Requires-Dist: dataclasses-json; extra == "org"
425
427
  Requires-Dist: unstructured[org]; extra == "org"
428
+ Requires-Dist: pydantic; extra == "org"
429
+ Requires-Dist: click; extra == "org"
426
430
  Requires-Dist: tqdm; extra == "org"
427
- Requires-Dist: pandas; extra == "org"
428
431
  Requires-Dist: opentelemetry-sdk; extra == "org"
429
- Requires-Dist: pydantic; extra == "org"
430
- Requires-Dist: dataclasses-json; extra == "org"
431
432
  Requires-Dist: python-dateutil; extra == "org"
432
- Requires-Dist: click; extra == "org"
433
433
  Provides-Extra: outlook
434
- Requires-Dist: tqdm; extra == "outlook"
435
434
  Requires-Dist: msal; extra == "outlook"
435
+ Requires-Dist: dataclasses-json; extra == "outlook"
436
436
  Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
437
437
  Requires-Dist: pandas; extra == "outlook"
438
- Requires-Dist: opentelemetry-sdk; extra == "outlook"
439
438
  Requires-Dist: pydantic; extra == "outlook"
440
- Requires-Dist: dataclasses-json; extra == "outlook"
441
- Requires-Dist: python-dateutil; extra == "outlook"
442
439
  Requires-Dist: click; extra == "outlook"
440
+ Requires-Dist: tqdm; extra == "outlook"
441
+ Requires-Dist: opentelemetry-sdk; extra == "outlook"
442
+ Requires-Dist: python-dateutil; extra == "outlook"
443
443
  Provides-Extra: pdf
444
- Requires-Dist: tqdm; extra == "pdf"
445
444
  Requires-Dist: pandas; extra == "pdf"
446
- Requires-Dist: opentelemetry-sdk; extra == "pdf"
447
- Requires-Dist: pydantic; extra == "pdf"
448
445
  Requires-Dist: dataclasses-json; extra == "pdf"
449
- Requires-Dist: python-dateutil; extra == "pdf"
450
446
  Requires-Dist: unstructured[pdf]; extra == "pdf"
447
+ Requires-Dist: pydantic; extra == "pdf"
451
448
  Requires-Dist: click; extra == "pdf"
449
+ Requires-Dist: tqdm; extra == "pdf"
450
+ Requires-Dist: opentelemetry-sdk; extra == "pdf"
451
+ Requires-Dist: python-dateutil; extra == "pdf"
452
452
  Provides-Extra: pinecone
453
- Requires-Dist: tqdm; extra == "pinecone"
454
- Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
455
453
  Requires-Dist: pandas; extra == "pinecone"
456
- Requires-Dist: opentelemetry-sdk; extra == "pinecone"
457
- Requires-Dist: pydantic; extra == "pinecone"
458
454
  Requires-Dist: dataclasses-json; extra == "pinecone"
459
- Requires-Dist: python-dateutil; extra == "pinecone"
455
+ Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
456
+ Requires-Dist: pydantic; extra == "pinecone"
460
457
  Requires-Dist: click; extra == "pinecone"
458
+ Requires-Dist: tqdm; extra == "pinecone"
459
+ Requires-Dist: opentelemetry-sdk; extra == "pinecone"
460
+ Requires-Dist: python-dateutil; extra == "pinecone"
461
461
  Provides-Extra: postgres
462
- Requires-Dist: tqdm; extra == "postgres"
463
462
  Requires-Dist: pandas; extra == "postgres"
464
- Requires-Dist: opentelemetry-sdk; extra == "postgres"
465
- Requires-Dist: pydantic; extra == "postgres"
466
463
  Requires-Dist: dataclasses-json; extra == "postgres"
464
+ Requires-Dist: pydantic; extra == "postgres"
465
+ Requires-Dist: click; extra == "postgres"
466
+ Requires-Dist: tqdm; extra == "postgres"
467
467
  Requires-Dist: psycopg2-binary; extra == "postgres"
468
+ Requires-Dist: opentelemetry-sdk; extra == "postgres"
468
469
  Requires-Dist: python-dateutil; extra == "postgres"
469
- Requires-Dist: click; extra == "postgres"
470
470
  Provides-Extra: ppt
471
- Requires-Dist: tqdm; extra == "ppt"
472
- Requires-Dist: unstructured[pptx]; extra == "ppt"
473
471
  Requires-Dist: pandas; extra == "ppt"
474
- Requires-Dist: opentelemetry-sdk; extra == "ppt"
475
- Requires-Dist: pydantic; extra == "ppt"
476
472
  Requires-Dist: dataclasses-json; extra == "ppt"
477
- Requires-Dist: python-dateutil; extra == "ppt"
473
+ Requires-Dist: pydantic; extra == "ppt"
478
474
  Requires-Dist: click; extra == "ppt"
475
+ Requires-Dist: tqdm; extra == "ppt"
476
+ Requires-Dist: opentelemetry-sdk; extra == "ppt"
477
+ Requires-Dist: python-dateutil; extra == "ppt"
478
+ Requires-Dist: unstructured[pptx]; extra == "ppt"
479
479
  Provides-Extra: pptx
480
- Requires-Dist: tqdm; extra == "pptx"
481
- Requires-Dist: unstructured[pptx]; extra == "pptx"
482
480
  Requires-Dist: pandas; extra == "pptx"
483
- Requires-Dist: opentelemetry-sdk; extra == "pptx"
484
- Requires-Dist: pydantic; extra == "pptx"
485
481
  Requires-Dist: dataclasses-json; extra == "pptx"
486
- Requires-Dist: python-dateutil; extra == "pptx"
482
+ Requires-Dist: pydantic; extra == "pptx"
487
483
  Requires-Dist: click; extra == "pptx"
484
+ Requires-Dist: tqdm; extra == "pptx"
485
+ Requires-Dist: opentelemetry-sdk; extra == "pptx"
486
+ Requires-Dist: python-dateutil; extra == "pptx"
487
+ Requires-Dist: unstructured[pptx]; extra == "pptx"
488
488
  Provides-Extra: qdrant
489
- Requires-Dist: tqdm; extra == "qdrant"
490
- Requires-Dist: qdrant-client; extra == "qdrant"
491
489
  Requires-Dist: pandas; extra == "qdrant"
492
- Requires-Dist: opentelemetry-sdk; extra == "qdrant"
493
- Requires-Dist: pydantic; extra == "qdrant"
494
490
  Requires-Dist: dataclasses-json; extra == "qdrant"
495
- Requires-Dist: python-dateutil; extra == "qdrant"
491
+ Requires-Dist: pydantic; extra == "qdrant"
496
492
  Requires-Dist: click; extra == "qdrant"
493
+ Requires-Dist: tqdm; extra == "qdrant"
494
+ Requires-Dist: opentelemetry-sdk; extra == "qdrant"
495
+ Requires-Dist: python-dateutil; extra == "qdrant"
496
+ Requires-Dist: qdrant-client; extra == "qdrant"
497
497
  Provides-Extra: reddit
498
- Requires-Dist: tqdm; extra == "reddit"
499
- Requires-Dist: praw; extra == "reddit"
500
498
  Requires-Dist: pandas; extra == "reddit"
501
- Requires-Dist: opentelemetry-sdk; extra == "reddit"
502
- Requires-Dist: pydantic; extra == "reddit"
503
499
  Requires-Dist: dataclasses-json; extra == "reddit"
504
- Requires-Dist: python-dateutil; extra == "reddit"
500
+ Requires-Dist: pydantic; extra == "reddit"
505
501
  Requires-Dist: click; extra == "reddit"
502
+ Requires-Dist: praw; extra == "reddit"
503
+ Requires-Dist: tqdm; extra == "reddit"
504
+ Requires-Dist: opentelemetry-sdk; extra == "reddit"
505
+ Requires-Dist: python-dateutil; extra == "reddit"
506
506
  Provides-Extra: remote
507
+ Requires-Dist: pandas; extra == "remote"
508
+ Requires-Dist: dataclasses-json; extra == "remote"
507
509
  Requires-Dist: tqdm; extra == "remote"
510
+ Requires-Dist: pydantic; extra == "remote"
511
+ Requires-Dist: click; extra == "remote"
508
512
  Requires-Dist: unstructured-client>=0.23.0; extra == "remote"
509
- Requires-Dist: pandas; extra == "remote"
510
513
  Requires-Dist: opentelemetry-sdk; extra == "remote"
511
- Requires-Dist: pydantic; extra == "remote"
512
- Requires-Dist: dataclasses-json; extra == "remote"
513
514
  Requires-Dist: python-dateutil; extra == "remote"
514
- Requires-Dist: click; extra == "remote"
515
515
  Provides-Extra: rst
516
- Requires-Dist: tqdm; extra == "rst"
517
516
  Requires-Dist: pandas; extra == "rst"
518
- Requires-Dist: opentelemetry-sdk; extra == "rst"
519
- Requires-Dist: pydantic; extra == "rst"
520
- Requires-Dist: unstructured[rst]; extra == "rst"
521
517
  Requires-Dist: dataclasses-json; extra == "rst"
522
- Requires-Dist: python-dateutil; extra == "rst"
518
+ Requires-Dist: unstructured[rst]; extra == "rst"
519
+ Requires-Dist: pydantic; extra == "rst"
523
520
  Requires-Dist: click; extra == "rst"
521
+ Requires-Dist: tqdm; extra == "rst"
522
+ Requires-Dist: opentelemetry-sdk; extra == "rst"
523
+ Requires-Dist: python-dateutil; extra == "rst"
524
524
  Provides-Extra: rtf
525
- Requires-Dist: tqdm; extra == "rtf"
526
525
  Requires-Dist: pandas; extra == "rtf"
527
- Requires-Dist: opentelemetry-sdk; extra == "rtf"
526
+ Requires-Dist: dataclasses-json; extra == "rtf"
528
527
  Requires-Dist: unstructured[rtf]; extra == "rtf"
529
528
  Requires-Dist: pydantic; extra == "rtf"
530
- Requires-Dist: dataclasses-json; extra == "rtf"
531
- Requires-Dist: python-dateutil; extra == "rtf"
532
529
  Requires-Dist: click; extra == "rtf"
530
+ Requires-Dist: tqdm; extra == "rtf"
531
+ Requires-Dist: opentelemetry-sdk; extra == "rtf"
532
+ Requires-Dist: python-dateutil; extra == "rtf"
533
533
  Provides-Extra: s3
534
+ Requires-Dist: pandas; extra == "s3"
535
+ Requires-Dist: dataclasses-json; extra == "s3"
536
+ Requires-Dist: s3fs; extra == "s3"
534
537
  Requires-Dist: fsspec; extra == "s3"
538
+ Requires-Dist: pydantic; extra == "s3"
539
+ Requires-Dist: click; extra == "s3"
535
540
  Requires-Dist: tqdm; extra == "s3"
536
- Requires-Dist: pandas; extra == "s3"
537
541
  Requires-Dist: opentelemetry-sdk; extra == "s3"
538
- Requires-Dist: pydantic; extra == "s3"
539
- Requires-Dist: s3fs; extra == "s3"
540
- Requires-Dist: dataclasses-json; extra == "s3"
541
542
  Requires-Dist: python-dateutil; extra == "s3"
542
- Requires-Dist: click; extra == "s3"
543
543
  Provides-Extra: salesforce
544
- Requires-Dist: tqdm; extra == "salesforce"
545
544
  Requires-Dist: simple-salesforce; extra == "salesforce"
545
+ Requires-Dist: dataclasses-json; extra == "salesforce"
546
546
  Requires-Dist: pandas; extra == "salesforce"
547
- Requires-Dist: opentelemetry-sdk; extra == "salesforce"
548
547
  Requires-Dist: pydantic; extra == "salesforce"
549
- Requires-Dist: dataclasses-json; extra == "salesforce"
550
- Requires-Dist: python-dateutil; extra == "salesforce"
551
548
  Requires-Dist: click; extra == "salesforce"
549
+ Requires-Dist: tqdm; extra == "salesforce"
550
+ Requires-Dist: opentelemetry-sdk; extra == "salesforce"
551
+ Requires-Dist: python-dateutil; extra == "salesforce"
552
552
  Provides-Extra: sftp
553
- Requires-Dist: fsspec; extra == "sftp"
554
- Requires-Dist: tqdm; extra == "sftp"
555
- Requires-Dist: paramiko; extra == "sftp"
556
553
  Requires-Dist: pandas; extra == "sftp"
557
- Requires-Dist: opentelemetry-sdk; extra == "sftp"
558
- Requires-Dist: pydantic; extra == "sftp"
559
554
  Requires-Dist: dataclasses-json; extra == "sftp"
560
- Requires-Dist: python-dateutil; extra == "sftp"
555
+ Requires-Dist: fsspec; extra == "sftp"
556
+ Requires-Dist: pydantic; extra == "sftp"
561
557
  Requires-Dist: click; extra == "sftp"
558
+ Requires-Dist: python-dateutil; extra == "sftp"
559
+ Requires-Dist: tqdm; extra == "sftp"
560
+ Requires-Dist: opentelemetry-sdk; extra == "sftp"
561
+ Requires-Dist: paramiko; extra == "sftp"
562
562
  Provides-Extra: sharepoint
563
- Requires-Dist: tqdm; extra == "sharepoint"
564
563
  Requires-Dist: msal; extra == "sharepoint"
564
+ Requires-Dist: dataclasses-json; extra == "sharepoint"
565
565
  Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
566
566
  Requires-Dist: pandas; extra == "sharepoint"
567
- Requires-Dist: opentelemetry-sdk; extra == "sharepoint"
568
567
  Requires-Dist: pydantic; extra == "sharepoint"
569
- Requires-Dist: dataclasses-json; extra == "sharepoint"
570
- Requires-Dist: python-dateutil; extra == "sharepoint"
571
568
  Requires-Dist: click; extra == "sharepoint"
569
+ Requires-Dist: tqdm; extra == "sharepoint"
570
+ Requires-Dist: opentelemetry-sdk; extra == "sharepoint"
571
+ Requires-Dist: python-dateutil; extra == "sharepoint"
572
572
  Provides-Extra: singlestore
573
- Requires-Dist: tqdm; extra == "singlestore"
574
573
  Requires-Dist: pandas; extra == "singlestore"
575
- Requires-Dist: opentelemetry-sdk; extra == "singlestore"
576
- Requires-Dist: pydantic; extra == "singlestore"
577
- Requires-Dist: singlestoredb; extra == "singlestore"
578
574
  Requires-Dist: dataclasses-json; extra == "singlestore"
579
- Requires-Dist: python-dateutil; extra == "singlestore"
575
+ Requires-Dist: singlestoredb; extra == "singlestore"
576
+ Requires-Dist: pydantic; extra == "singlestore"
580
577
  Requires-Dist: click; extra == "singlestore"
578
+ Requires-Dist: tqdm; extra == "singlestore"
579
+ Requires-Dist: opentelemetry-sdk; extra == "singlestore"
580
+ Requires-Dist: python-dateutil; extra == "singlestore"
581
581
  Provides-Extra: slack
582
- Requires-Dist: tqdm; extra == "slack"
583
582
  Requires-Dist: pandas; extra == "slack"
584
- Requires-Dist: opentelemetry-sdk; extra == "slack"
583
+ Requires-Dist: dataclasses-json; extra == "slack"
585
584
  Requires-Dist: pydantic; extra == "slack"
585
+ Requires-Dist: click; extra == "slack"
586
586
  Requires-Dist: slack-sdk; extra == "slack"
587
- Requires-Dist: dataclasses-json; extra == "slack"
587
+ Requires-Dist: tqdm; extra == "slack"
588
+ Requires-Dist: opentelemetry-sdk; extra == "slack"
588
589
  Requires-Dist: python-dateutil; extra == "slack"
589
- Requires-Dist: click; extra == "slack"
590
590
  Provides-Extra: tsv
591
591
  Requires-Dist: unstructured[tsv]; extra == "tsv"
592
- Requires-Dist: tqdm; extra == "tsv"
593
592
  Requires-Dist: pandas; extra == "tsv"
594
- Requires-Dist: opentelemetry-sdk; extra == "tsv"
595
- Requires-Dist: pydantic; extra == "tsv"
596
593
  Requires-Dist: dataclasses-json; extra == "tsv"
597
- Requires-Dist: python-dateutil; extra == "tsv"
594
+ Requires-Dist: pydantic; extra == "tsv"
598
595
  Requires-Dist: click; extra == "tsv"
596
+ Requires-Dist: tqdm; extra == "tsv"
597
+ Requires-Dist: opentelemetry-sdk; extra == "tsv"
598
+ Requires-Dist: python-dateutil; extra == "tsv"
599
599
  Provides-Extra: vectara
600
- Requires-Dist: tqdm; extra == "vectara"
601
600
  Requires-Dist: pandas; extra == "vectara"
602
- Requires-Dist: opentelemetry-sdk; extra == "vectara"
603
- Requires-Dist: pydantic; extra == "vectara"
604
601
  Requires-Dist: requests; extra == "vectara"
605
602
  Requires-Dist: dataclasses-json; extra == "vectara"
606
- Requires-Dist: python-dateutil; extra == "vectara"
603
+ Requires-Dist: pydantic; extra == "vectara"
607
604
  Requires-Dist: click; extra == "vectara"
605
+ Requires-Dist: tqdm; extra == "vectara"
606
+ Requires-Dist: opentelemetry-sdk; extra == "vectara"
607
+ Requires-Dist: python-dateutil; extra == "vectara"
608
608
  Provides-Extra: weaviate
609
- Requires-Dist: tqdm; extra == "weaviate"
610
609
  Requires-Dist: pandas; extra == "weaviate"
611
- Requires-Dist: opentelemetry-sdk; extra == "weaviate"
612
- Requires-Dist: pydantic; extra == "weaviate"
613
- Requires-Dist: weaviate-client; extra == "weaviate"
614
610
  Requires-Dist: dataclasses-json; extra == "weaviate"
615
- Requires-Dist: python-dateutil; extra == "weaviate"
611
+ Requires-Dist: weaviate-client; extra == "weaviate"
612
+ Requires-Dist: pydantic; extra == "weaviate"
616
613
  Requires-Dist: click; extra == "weaviate"
614
+ Requires-Dist: tqdm; extra == "weaviate"
615
+ Requires-Dist: opentelemetry-sdk; extra == "weaviate"
616
+ Requires-Dist: python-dateutil; extra == "weaviate"
617
617
  Provides-Extra: wikipedia
618
+ Requires-Dist: pandas; extra == "wikipedia"
619
+ Requires-Dist: dataclasses-json; extra == "wikipedia"
618
620
  Requires-Dist: wikipedia; extra == "wikipedia"
621
+ Requires-Dist: pydantic; extra == "wikipedia"
622
+ Requires-Dist: click; extra == "wikipedia"
619
623
  Requires-Dist: tqdm; extra == "wikipedia"
620
- Requires-Dist: pandas; extra == "wikipedia"
621
624
  Requires-Dist: opentelemetry-sdk; extra == "wikipedia"
622
- Requires-Dist: pydantic; extra == "wikipedia"
623
- Requires-Dist: dataclasses-json; extra == "wikipedia"
624
625
  Requires-Dist: python-dateutil; extra == "wikipedia"
625
- Requires-Dist: click; extra == "wikipedia"
626
626
  Provides-Extra: xlsx
627
- Requires-Dist: tqdm; extra == "xlsx"
628
- Requires-Dist: pandas; extra == "xlsx"
629
- Requires-Dist: opentelemetry-sdk; extra == "xlsx"
630
627
  Requires-Dist: unstructured[xlsx]; extra == "xlsx"
631
- Requires-Dist: pydantic; extra == "xlsx"
632
628
  Requires-Dist: dataclasses-json; extra == "xlsx"
633
- Requires-Dist: python-dateutil; extra == "xlsx"
629
+ Requires-Dist: pandas; extra == "xlsx"
630
+ Requires-Dist: pydantic; extra == "xlsx"
634
631
  Requires-Dist: click; extra == "xlsx"
632
+ Requires-Dist: tqdm; extra == "xlsx"
633
+ Requires-Dist: opentelemetry-sdk; extra == "xlsx"
634
+ Requires-Dist: python-dateutil; extra == "xlsx"
635
635
 
636
636
  # Unstructured Ingest
637
637
 
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=Ku8DcDzvBk86e8J7KB72YMZJCZ5U1RYp2FNQ17mXors,42
2
+ unstructured_ingest/__version__.py,sha256=AGLzGoXiCZqjaKy2UooViVI5-HB2c17dSBEa2hb1LMA,43
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/evaluate.py,sha256=R-mKLFXbVX1xQ1tjGsLHjdP-TbSSV-925IHzggW_bIg,9793
5
5
  unstructured_ingest/interfaces.py,sha256=AeEywcSKCMA5AiEdENLpu_yPcXp_c6wpvESePfC00yo,31214
@@ -247,7 +247,7 @@ unstructured_ingest/runner/writers/fsspec/gcs.py,sha256=ia-gconOz1kWI1jmYeB9NY6c
247
247
  unstructured_ingest/runner/writers/fsspec/s3.py,sha256=kHJq2O3864QBd_tL2SKb0mdywczOCr2VI5e_bVms-Vw,622
248
248
  unstructured_ingest/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
249
249
  unstructured_ingest/utils/chunking.py,sha256=efWEfMcCukG5zASZrXhkNgAX8AzHa6t3rClMzm2TwFE,1521
250
- unstructured_ingest/utils/compression.py,sha256=ZzJQeNn1a6oseKo-oDwaLggBzi32oqPL5Z9I_Y-YYy8,4340
250
+ unstructured_ingest/utils/compression.py,sha256=mgndeNULGH7stoC51hhT4B9HwqMUSL0jhphcia6F_bw,4433
251
251
  unstructured_ingest/utils/data_prep.py,sha256=oizt8xZ15hExZ_8xacMG0j1LSH4ILreQpXJUYm2Bb_M,3917
252
252
  unstructured_ingest/utils/dep_check.py,sha256=cVEqZtMwji8BIt7pjtUOMtEmN7KaNXRXwelEKFpOdW8,1914
253
253
  unstructured_ingest/utils/google_filetype.py,sha256=YVspEkiiBrRUSGVeVbsavvLvTmizdy2e6TsjigXTSRU,468
@@ -329,9 +329,9 @@ unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=O1j0hIYWI4lPpTQ
329
329
  unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=cOMvMh0C9rtyEPJ0X59Fn-qb11LFUMRfeUgsi3QRWUk,6390
330
330
  unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=NkcU4U2DQWWuM8UHkez67C3SEOZpVyRtmtNS-z-F0Fw,6056
331
331
  unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
332
- unstructured_ingest-0.0.9.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
333
- unstructured_ingest-0.0.9.dist-info/METADATA,sha256=cMGo-6_uYAZFhWQGTkfNVMxeT-h7QudXo3O00GbMUm8,28109
334
- unstructured_ingest-0.0.9.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
335
- unstructured_ingest-0.0.9.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
336
- unstructured_ingest-0.0.9.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
337
- unstructured_ingest-0.0.9.dist-info/RECORD,,
332
+ unstructured_ingest-0.0.10.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
333
+ unstructured_ingest-0.0.10.dist-info/METADATA,sha256=2j3kp-lp2IbhVpbtZSgVRqom9ZUbcIqKFsWyw3ueGuM,28110
334
+ unstructured_ingest-0.0.10.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
335
+ unstructured_ingest-0.0.10.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
336
+ unstructured_ingest-0.0.10.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
337
+ unstructured_ingest-0.0.10.dist-info/RECORD,,