unstructured-ingest 0.0.7__py3-none-any.whl → 0.0.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

@@ -1 +1 @@
1
- __version__ = "0.0.7" # pragma: no cover
1
+ __version__ = "0.0.8" # pragma: no cover
@@ -67,7 +67,15 @@ class MilvusConnectionConfig(ConnectionConfig):
67
67
 
68
68
 
69
69
  class MilvusUploadStagerConfig(UploadStagerConfig):
70
- pass
70
+
71
+ fields_to_include: Optional[list[str]] = None
72
+ """If set - list of fields to include in the output.
73
+ Unspecified fields are removed from the elements.
74
+ This action takes place after metadata flattening.
75
+ Missing fields will cause the stager to raise KeyError."""
76
+
77
+ flatten_metadata: bool = True
78
+ """If set - flatten "metadata" key and put contents directly into data"""
71
79
 
72
80
 
73
81
  @dataclass
@@ -85,8 +93,26 @@ class MilvusUploadStager(UploadStager):
85
93
  pass
86
94
  return parser.parse(date_string).timestamp()
87
95
 
88
- @classmethod
89
- def conform_dict(cls, data: dict) -> None:
96
+ def conform_dict(self, data: dict) -> None:
97
+ if self.upload_stager_config.flatten_metadata and (metadata := data.pop("metadata", None)):
98
+ data.update(flatten_dict(metadata, keys_to_omit=["data_source_record_locator"]))
99
+
100
+ # TODO: milvus sdk doesn't seem to support defaults via the schema yet,
101
+ # remove once that gets updated
102
+ defaults = {"is_continuation": False}
103
+ for default in defaults:
104
+ if default not in data:
105
+ data[default] = defaults[default]
106
+
107
+ if self.upload_stager_config.fields_to_include:
108
+ data_keys = set(data.keys())
109
+ for data_key in data_keys:
110
+ if data_key not in self.upload_stager_config.fields_to_include:
111
+ data.pop(data_key)
112
+ for field_include_key in self.upload_stager_config.fields_to_include:
113
+ if field_include_key not in data:
114
+ raise KeyError(f"Field '{field_include_key}' is missing in data!")
115
+
90
116
  datetime_columns = [
91
117
  "data_source_date_created",
92
118
  "data_source_date_modified",
@@ -96,21 +122,12 @@ class MilvusUploadStager(UploadStager):
96
122
 
97
123
  json_dumps_fields = ["languages", "data_source_permissions_data"]
98
124
 
99
- # TODO: milvus sdk doesn't seem to support defaults via the schema yet,
100
- # remove once that gets updated
101
- defaults = {"is_continuation": False}
102
-
103
- if metadata := data.pop("metadata", None):
104
- data.update(flatten_dict(metadata, keys_to_omit=["data_source_record_locator"]))
105
125
  for datetime_column in datetime_columns:
106
126
  if datetime_column in data:
107
- data[datetime_column] = cls.parse_date_string(data[datetime_column])
127
+ data[datetime_column] = self.parse_date_string(data[datetime_column])
108
128
  for json_dumps_field in json_dumps_fields:
109
129
  if json_dumps_field in data:
110
130
  data[json_dumps_field] = json.dumps(data[json_dumps_field])
111
- for default in defaults:
112
- if default not in data:
113
- data[default] = defaults[default]
114
131
 
115
132
  def run(
116
133
  self,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.7
3
+ Version: 0.0.8
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,616 +22,616 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.13
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: opentelemetry-sdk
26
- Requires-Dist: click
27
- Requires-Dist: dataclasses-json
28
25
  Requires-Dist: tqdm
29
- Requires-Dist: pandas
30
26
  Requires-Dist: python-dateutil
27
+ Requires-Dist: dataclasses-json
28
+ Requires-Dist: click
31
29
  Requires-Dist: pydantic
30
+ Requires-Dist: pandas
31
+ Requires-Dist: opentelemetry-sdk
32
32
  Provides-Extra: airtable
33
- Requires-Dist: opentelemetry-sdk; extra == "airtable"
34
- Requires-Dist: pyairtable; extra == "airtable"
35
- Requires-Dist: click; extra == "airtable"
36
- Requires-Dist: dataclasses-json; extra == "airtable"
37
33
  Requires-Dist: tqdm; extra == "airtable"
38
- Requires-Dist: pandas; extra == "airtable"
39
34
  Requires-Dist: python-dateutil; extra == "airtable"
35
+ Requires-Dist: dataclasses-json; extra == "airtable"
36
+ Requires-Dist: click; extra == "airtable"
37
+ Requires-Dist: pyairtable; extra == "airtable"
40
38
  Requires-Dist: pydantic; extra == "airtable"
39
+ Requires-Dist: pandas; extra == "airtable"
40
+ Requires-Dist: opentelemetry-sdk; extra == "airtable"
41
41
  Provides-Extra: astradb
42
- Requires-Dist: opentelemetry-sdk; extra == "astradb"
43
- Requires-Dist: click; extra == "astradb"
44
42
  Requires-Dist: astrapy; extra == "astradb"
45
- Requires-Dist: dataclasses-json; extra == "astradb"
46
43
  Requires-Dist: tqdm; extra == "astradb"
47
- Requires-Dist: pandas; extra == "astradb"
48
44
  Requires-Dist: python-dateutil; extra == "astradb"
45
+ Requires-Dist: dataclasses-json; extra == "astradb"
46
+ Requires-Dist: click; extra == "astradb"
49
47
  Requires-Dist: pydantic; extra == "astradb"
48
+ Requires-Dist: pandas; extra == "astradb"
49
+ Requires-Dist: opentelemetry-sdk; extra == "astradb"
50
50
  Provides-Extra: azure
51
- Requires-Dist: opentelemetry-sdk; extra == "azure"
51
+ Requires-Dist: fsspec; extra == "azure"
52
+ Requires-Dist: tqdm; extra == "azure"
53
+ Requires-Dist: python-dateutil; extra == "azure"
54
+ Requires-Dist: adlfs; extra == "azure"
55
+ Requires-Dist: dataclasses-json; extra == "azure"
52
56
  Requires-Dist: click; extra == "azure"
53
57
  Requires-Dist: pydantic; extra == "azure"
54
- Requires-Dist: dataclasses-json; extra == "azure"
55
- Requires-Dist: tqdm; extra == "azure"
56
58
  Requires-Dist: pandas; extra == "azure"
57
- Requires-Dist: adlfs; extra == "azure"
58
- Requires-Dist: python-dateutil; extra == "azure"
59
- Requires-Dist: fsspec; extra == "azure"
59
+ Requires-Dist: opentelemetry-sdk; extra == "azure"
60
60
  Provides-Extra: azure-cognitive-search
61
- Requires-Dist: opentelemetry-sdk; extra == "azure-cognitive-search"
62
- Requires-Dist: click; extra == "azure-cognitive-search"
63
- Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
64
- Requires-Dist: dataclasses-json; extra == "azure-cognitive-search"
65
61
  Requires-Dist: tqdm; extra == "azure-cognitive-search"
66
- Requires-Dist: pandas; extra == "azure-cognitive-search"
67
62
  Requires-Dist: python-dateutil; extra == "azure-cognitive-search"
63
+ Requires-Dist: dataclasses-json; extra == "azure-cognitive-search"
64
+ Requires-Dist: click; extra == "azure-cognitive-search"
68
65
  Requires-Dist: pydantic; extra == "azure-cognitive-search"
66
+ Requires-Dist: pandas; extra == "azure-cognitive-search"
67
+ Requires-Dist: opentelemetry-sdk; extra == "azure-cognitive-search"
68
+ Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
69
69
  Provides-Extra: bedrock
70
- Requires-Dist: opentelemetry-sdk; extra == "bedrock"
71
- Requires-Dist: click; extra == "bedrock"
72
- Requires-Dist: langchain-community; extra == "bedrock"
73
- Requires-Dist: dataclasses-json; extra == "bedrock"
74
70
  Requires-Dist: tqdm; extra == "bedrock"
75
- Requires-Dist: pandas; extra == "bedrock"
76
- Requires-Dist: boto3; extra == "bedrock"
77
71
  Requires-Dist: python-dateutil; extra == "bedrock"
72
+ Requires-Dist: dataclasses-json; extra == "bedrock"
73
+ Requires-Dist: boto3; extra == "bedrock"
74
+ Requires-Dist: click; extra == "bedrock"
78
75
  Requires-Dist: unstructured; extra == "bedrock"
79
76
  Requires-Dist: pydantic; extra == "bedrock"
77
+ Requires-Dist: pandas; extra == "bedrock"
78
+ Requires-Dist: opentelemetry-sdk; extra == "bedrock"
79
+ Requires-Dist: langchain-community; extra == "bedrock"
80
80
  Provides-Extra: biomed
81
- Requires-Dist: opentelemetry-sdk; extra == "biomed"
82
- Requires-Dist: click; extra == "biomed"
83
- Requires-Dist: dataclasses-json; extra == "biomed"
84
- Requires-Dist: requests; extra == "biomed"
85
81
  Requires-Dist: tqdm; extra == "biomed"
86
- Requires-Dist: pandas; extra == "biomed"
87
82
  Requires-Dist: python-dateutil; extra == "biomed"
88
83
  Requires-Dist: bs4; extra == "biomed"
84
+ Requires-Dist: dataclasses-json; extra == "biomed"
85
+ Requires-Dist: click; extra == "biomed"
86
+ Requires-Dist: requests; extra == "biomed"
89
87
  Requires-Dist: pydantic; extra == "biomed"
88
+ Requires-Dist: pandas; extra == "biomed"
89
+ Requires-Dist: opentelemetry-sdk; extra == "biomed"
90
90
  Provides-Extra: box
91
- Requires-Dist: opentelemetry-sdk; extra == "box"
92
- Requires-Dist: click; extra == "box"
93
91
  Requires-Dist: boxfs; extra == "box"
94
- Requires-Dist: pydantic; extra == "box"
95
- Requires-Dist: dataclasses-json; extra == "box"
92
+ Requires-Dist: fsspec; extra == "box"
96
93
  Requires-Dist: tqdm; extra == "box"
97
- Requires-Dist: pandas; extra == "box"
98
94
  Requires-Dist: python-dateutil; extra == "box"
99
- Requires-Dist: fsspec; extra == "box"
95
+ Requires-Dist: dataclasses-json; extra == "box"
96
+ Requires-Dist: click; extra == "box"
97
+ Requires-Dist: pydantic; extra == "box"
98
+ Requires-Dist: pandas; extra == "box"
99
+ Requires-Dist: opentelemetry-sdk; extra == "box"
100
100
  Provides-Extra: chroma
101
- Requires-Dist: opentelemetry-sdk; extra == "chroma"
102
- Requires-Dist: click; extra == "chroma"
103
- Requires-Dist: dataclasses-json; extra == "chroma"
104
- Requires-Dist: importlib-metadata>=7.1.0; extra == "chroma"
105
101
  Requires-Dist: tqdm; extra == "chroma"
106
- Requires-Dist: pandas; extra == "chroma"
107
- Requires-Dist: typer<=0.9.0; extra == "chroma"
108
102
  Requires-Dist: python-dateutil; extra == "chroma"
103
+ Requires-Dist: typer<=0.9.0; extra == "chroma"
104
+ Requires-Dist: dataclasses-json; extra == "chroma"
105
+ Requires-Dist: click; extra == "chroma"
109
106
  Requires-Dist: pydantic; extra == "chroma"
107
+ Requires-Dist: pandas; extra == "chroma"
108
+ Requires-Dist: opentelemetry-sdk; extra == "chroma"
109
+ Requires-Dist: importlib-metadata>=7.1.0; extra == "chroma"
110
110
  Requires-Dist: chromadb; extra == "chroma"
111
111
  Provides-Extra: clarifai
112
- Requires-Dist: opentelemetry-sdk; extra == "clarifai"
112
+ Requires-Dist: tqdm; extra == "clarifai"
113
+ Requires-Dist: python-dateutil; extra == "clarifai"
114
+ Requires-Dist: dataclasses-json; extra == "clarifai"
113
115
  Requires-Dist: click; extra == "clarifai"
114
116
  Requires-Dist: pydantic; extra == "clarifai"
115
- Requires-Dist: dataclasses-json; extra == "clarifai"
116
- Requires-Dist: tqdm; extra == "clarifai"
117
117
  Requires-Dist: pandas; extra == "clarifai"
118
- Requires-Dist: python-dateutil; extra == "clarifai"
118
+ Requires-Dist: opentelemetry-sdk; extra == "clarifai"
119
119
  Requires-Dist: clarifai; extra == "clarifai"
120
120
  Provides-Extra: confluence
121
- Requires-Dist: opentelemetry-sdk; extra == "confluence"
122
- Requires-Dist: click; extra == "confluence"
123
- Requires-Dist: atlassian-python-api; extra == "confluence"
124
- Requires-Dist: dataclasses-json; extra == "confluence"
125
- Requires-Dist: requests; extra == "confluence"
126
121
  Requires-Dist: tqdm; extra == "confluence"
127
- Requires-Dist: pandas; extra == "confluence"
128
122
  Requires-Dist: python-dateutil; extra == "confluence"
123
+ Requires-Dist: dataclasses-json; extra == "confluence"
124
+ Requires-Dist: click; extra == "confluence"
125
+ Requires-Dist: requests; extra == "confluence"
126
+ Requires-Dist: atlassian-python-api; extra == "confluence"
129
127
  Requires-Dist: pydantic; extra == "confluence"
128
+ Requires-Dist: pandas; extra == "confluence"
129
+ Requires-Dist: opentelemetry-sdk; extra == "confluence"
130
130
  Provides-Extra: couchbase
131
- Requires-Dist: opentelemetry-sdk; extra == "couchbase"
132
- Requires-Dist: click; extra == "couchbase"
133
- Requires-Dist: dataclasses-json; extra == "couchbase"
131
+ Requires-Dist: couchbase; extra == "couchbase"
134
132
  Requires-Dist: tqdm; extra == "couchbase"
135
- Requires-Dist: pandas; extra == "couchbase"
136
133
  Requires-Dist: python-dateutil; extra == "couchbase"
134
+ Requires-Dist: dataclasses-json; extra == "couchbase"
135
+ Requires-Dist: click; extra == "couchbase"
137
136
  Requires-Dist: pydantic; extra == "couchbase"
138
- Requires-Dist: couchbase; extra == "couchbase"
137
+ Requires-Dist: pandas; extra == "couchbase"
138
+ Requires-Dist: opentelemetry-sdk; extra == "couchbase"
139
139
  Provides-Extra: csv
140
- Requires-Dist: opentelemetry-sdk; extra == "csv"
141
- Requires-Dist: click; extra == "csv"
142
- Requires-Dist: unstructured[tsv]; extra == "csv"
143
- Requires-Dist: dataclasses-json; extra == "csv"
144
140
  Requires-Dist: tqdm; extra == "csv"
145
- Requires-Dist: pandas; extra == "csv"
146
141
  Requires-Dist: python-dateutil; extra == "csv"
142
+ Requires-Dist: dataclasses-json; extra == "csv"
143
+ Requires-Dist: unstructured[tsv]; extra == "csv"
144
+ Requires-Dist: click; extra == "csv"
147
145
  Requires-Dist: pydantic; extra == "csv"
146
+ Requires-Dist: pandas; extra == "csv"
147
+ Requires-Dist: opentelemetry-sdk; extra == "csv"
148
148
  Provides-Extra: databricks-volumes
149
- Requires-Dist: opentelemetry-sdk; extra == "databricks-volumes"
150
- Requires-Dist: click; extra == "databricks-volumes"
151
- Requires-Dist: databricks-sdk; extra == "databricks-volumes"
152
- Requires-Dist: dataclasses-json; extra == "databricks-volumes"
153
149
  Requires-Dist: tqdm; extra == "databricks-volumes"
154
- Requires-Dist: pandas; extra == "databricks-volumes"
155
150
  Requires-Dist: python-dateutil; extra == "databricks-volumes"
151
+ Requires-Dist: dataclasses-json; extra == "databricks-volumes"
152
+ Requires-Dist: click; extra == "databricks-volumes"
156
153
  Requires-Dist: pydantic; extra == "databricks-volumes"
154
+ Requires-Dist: pandas; extra == "databricks-volumes"
155
+ Requires-Dist: databricks-sdk; extra == "databricks-volumes"
156
+ Requires-Dist: opentelemetry-sdk; extra == "databricks-volumes"
157
157
  Provides-Extra: delta-table
158
- Requires-Dist: opentelemetry-sdk; extra == "delta-table"
158
+ Requires-Dist: deltalake; extra == "delta-table"
159
+ Requires-Dist: tqdm; extra == "delta-table"
160
+ Requires-Dist: fsspec; extra == "delta-table"
161
+ Requires-Dist: python-dateutil; extra == "delta-table"
162
+ Requires-Dist: dataclasses-json; extra == "delta-table"
159
163
  Requires-Dist: click; extra == "delta-table"
160
164
  Requires-Dist: pydantic; extra == "delta-table"
161
- Requires-Dist: dataclasses-json; extra == "delta-table"
162
- Requires-Dist: tqdm; extra == "delta-table"
163
165
  Requires-Dist: pandas; extra == "delta-table"
164
- Requires-Dist: deltalake; extra == "delta-table"
165
- Requires-Dist: python-dateutil; extra == "delta-table"
166
- Requires-Dist: fsspec; extra == "delta-table"
166
+ Requires-Dist: opentelemetry-sdk; extra == "delta-table"
167
167
  Provides-Extra: discord
168
- Requires-Dist: opentelemetry-sdk; extra == "discord"
169
- Requires-Dist: discord-py; extra == "discord"
170
- Requires-Dist: click; extra == "discord"
171
- Requires-Dist: dataclasses-json; extra == "discord"
172
168
  Requires-Dist: tqdm; extra == "discord"
173
- Requires-Dist: pandas; extra == "discord"
169
+ Requires-Dist: discord-py; extra == "discord"
174
170
  Requires-Dist: python-dateutil; extra == "discord"
171
+ Requires-Dist: dataclasses-json; extra == "discord"
172
+ Requires-Dist: click; extra == "discord"
175
173
  Requires-Dist: pydantic; extra == "discord"
174
+ Requires-Dist: pandas; extra == "discord"
175
+ Requires-Dist: opentelemetry-sdk; extra == "discord"
176
176
  Provides-Extra: doc
177
- Requires-Dist: opentelemetry-sdk; extra == "doc"
178
- Requires-Dist: click; extra == "doc"
179
- Requires-Dist: dataclasses-json; extra == "doc"
180
177
  Requires-Dist: tqdm; extra == "doc"
181
- Requires-Dist: pandas; extra == "doc"
182
- Requires-Dist: unstructured[docx]; extra == "doc"
183
178
  Requires-Dist: python-dateutil; extra == "doc"
179
+ Requires-Dist: dataclasses-json; extra == "doc"
180
+ Requires-Dist: click; extra == "doc"
184
181
  Requires-Dist: pydantic; extra == "doc"
182
+ Requires-Dist: unstructured[docx]; extra == "doc"
183
+ Requires-Dist: pandas; extra == "doc"
184
+ Requires-Dist: opentelemetry-sdk; extra == "doc"
185
185
  Provides-Extra: docx
186
- Requires-Dist: opentelemetry-sdk; extra == "docx"
187
- Requires-Dist: click; extra == "docx"
188
- Requires-Dist: dataclasses-json; extra == "docx"
189
186
  Requires-Dist: tqdm; extra == "docx"
190
- Requires-Dist: pandas; extra == "docx"
191
- Requires-Dist: unstructured[docx]; extra == "docx"
192
187
  Requires-Dist: python-dateutil; extra == "docx"
188
+ Requires-Dist: dataclasses-json; extra == "docx"
189
+ Requires-Dist: click; extra == "docx"
193
190
  Requires-Dist: pydantic; extra == "docx"
191
+ Requires-Dist: unstructured[docx]; extra == "docx"
192
+ Requires-Dist: pandas; extra == "docx"
193
+ Requires-Dist: opentelemetry-sdk; extra == "docx"
194
194
  Provides-Extra: dropbox
195
- Requires-Dist: opentelemetry-sdk; extra == "dropbox"
195
+ Requires-Dist: fsspec; extra == "dropbox"
196
+ Requires-Dist: tqdm; extra == "dropbox"
197
+ Requires-Dist: python-dateutil; extra == "dropbox"
198
+ Requires-Dist: dataclasses-json; extra == "dropbox"
196
199
  Requires-Dist: dropboxdrivefs; extra == "dropbox"
197
200
  Requires-Dist: click; extra == "dropbox"
198
201
  Requires-Dist: pydantic; extra == "dropbox"
199
- Requires-Dist: dataclasses-json; extra == "dropbox"
200
- Requires-Dist: tqdm; extra == "dropbox"
201
202
  Requires-Dist: pandas; extra == "dropbox"
202
- Requires-Dist: python-dateutil; extra == "dropbox"
203
- Requires-Dist: fsspec; extra == "dropbox"
203
+ Requires-Dist: opentelemetry-sdk; extra == "dropbox"
204
204
  Provides-Extra: elasticsearch
205
- Requires-Dist: opentelemetry-sdk; extra == "elasticsearch"
206
- Requires-Dist: click; extra == "elasticsearch"
207
- Requires-Dist: dataclasses-json; extra == "elasticsearch"
208
205
  Requires-Dist: tqdm; extra == "elasticsearch"
209
- Requires-Dist: pandas; extra == "elasticsearch"
210
206
  Requires-Dist: python-dateutil; extra == "elasticsearch"
211
- Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
207
+ Requires-Dist: dataclasses-json; extra == "elasticsearch"
208
+ Requires-Dist: click; extra == "elasticsearch"
212
209
  Requires-Dist: pydantic; extra == "elasticsearch"
210
+ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
211
+ Requires-Dist: pandas; extra == "elasticsearch"
212
+ Requires-Dist: opentelemetry-sdk; extra == "elasticsearch"
213
213
  Provides-Extra: embed-huggingface
214
- Requires-Dist: opentelemetry-sdk; extra == "embed-huggingface"
215
- Requires-Dist: click; extra == "embed-huggingface"
216
- Requires-Dist: dataclasses-json; extra == "embed-huggingface"
217
214
  Requires-Dist: langchain-huggingface; extra == "embed-huggingface"
218
215
  Requires-Dist: tqdm; extra == "embed-huggingface"
219
- Requires-Dist: pandas; extra == "embed-huggingface"
220
216
  Requires-Dist: python-dateutil; extra == "embed-huggingface"
217
+ Requires-Dist: dataclasses-json; extra == "embed-huggingface"
218
+ Requires-Dist: click; extra == "embed-huggingface"
221
219
  Requires-Dist: unstructured; extra == "embed-huggingface"
222
220
  Requires-Dist: pydantic; extra == "embed-huggingface"
221
+ Requires-Dist: pandas; extra == "embed-huggingface"
222
+ Requires-Dist: opentelemetry-sdk; extra == "embed-huggingface"
223
223
  Provides-Extra: embed-octoai
224
- Requires-Dist: opentelemetry-sdk; extra == "embed-octoai"
225
- Requires-Dist: click; extra == "embed-octoai"
226
- Requires-Dist: openai; extra == "embed-octoai"
227
- Requires-Dist: dataclasses-json; extra == "embed-octoai"
228
224
  Requires-Dist: tqdm; extra == "embed-octoai"
229
- Requires-Dist: pandas; extra == "embed-octoai"
230
- Requires-Dist: tiktoken; extra == "embed-octoai"
231
225
  Requires-Dist: python-dateutil; extra == "embed-octoai"
226
+ Requires-Dist: tiktoken; extra == "embed-octoai"
227
+ Requires-Dist: dataclasses-json; extra == "embed-octoai"
228
+ Requires-Dist: click; extra == "embed-octoai"
232
229
  Requires-Dist: unstructured; extra == "embed-octoai"
233
230
  Requires-Dist: pydantic; extra == "embed-octoai"
231
+ Requires-Dist: pandas; extra == "embed-octoai"
232
+ Requires-Dist: opentelemetry-sdk; extra == "embed-octoai"
233
+ Requires-Dist: openai; extra == "embed-octoai"
234
234
  Provides-Extra: embed-vertexai
235
- Requires-Dist: opentelemetry-sdk; extra == "embed-vertexai"
236
- Requires-Dist: langchain; extra == "embed-vertexai"
237
- Requires-Dist: click; extra == "embed-vertexai"
238
- Requires-Dist: langchain-community; extra == "embed-vertexai"
239
- Requires-Dist: dataclasses-json; extra == "embed-vertexai"
235
+ Requires-Dist: langchain-google-vertexai; extra == "embed-vertexai"
240
236
  Requires-Dist: tqdm; extra == "embed-vertexai"
241
- Requires-Dist: pandas; extra == "embed-vertexai"
242
237
  Requires-Dist: python-dateutil; extra == "embed-vertexai"
238
+ Requires-Dist: dataclasses-json; extra == "embed-vertexai"
239
+ Requires-Dist: click; extra == "embed-vertexai"
243
240
  Requires-Dist: unstructured; extra == "embed-vertexai"
244
- Requires-Dist: langchain-google-vertexai; extra == "embed-vertexai"
241
+ Requires-Dist: langchain; extra == "embed-vertexai"
245
242
  Requires-Dist: pydantic; extra == "embed-vertexai"
243
+ Requires-Dist: pandas; extra == "embed-vertexai"
244
+ Requires-Dist: opentelemetry-sdk; extra == "embed-vertexai"
245
+ Requires-Dist: langchain-community; extra == "embed-vertexai"
246
246
  Provides-Extra: embed-voyageai
247
- Requires-Dist: opentelemetry-sdk; extra == "embed-voyageai"
248
- Requires-Dist: click; extra == "embed-voyageai"
249
- Requires-Dist: dataclasses-json; extra == "embed-voyageai"
250
- Requires-Dist: langchain-voyageai; extra == "embed-voyageai"
251
247
  Requires-Dist: tqdm; extra == "embed-voyageai"
252
- Requires-Dist: pandas; extra == "embed-voyageai"
253
248
  Requires-Dist: python-dateutil; extra == "embed-voyageai"
249
+ Requires-Dist: dataclasses-json; extra == "embed-voyageai"
250
+ Requires-Dist: click; extra == "embed-voyageai"
254
251
  Requires-Dist: unstructured; extra == "embed-voyageai"
255
252
  Requires-Dist: langchain; extra == "embed-voyageai"
256
253
  Requires-Dist: pydantic; extra == "embed-voyageai"
254
+ Requires-Dist: langchain-voyageai; extra == "embed-voyageai"
255
+ Requires-Dist: pandas; extra == "embed-voyageai"
256
+ Requires-Dist: opentelemetry-sdk; extra == "embed-voyageai"
257
257
  Provides-Extra: epub
258
- Requires-Dist: opentelemetry-sdk; extra == "epub"
259
- Requires-Dist: unstructured[epub]; extra == "epub"
260
- Requires-Dist: click; extra == "epub"
261
- Requires-Dist: dataclasses-json; extra == "epub"
262
258
  Requires-Dist: tqdm; extra == "epub"
263
- Requires-Dist: pandas; extra == "epub"
264
259
  Requires-Dist: python-dateutil; extra == "epub"
265
- Requires-Dist: pydantic; extra == "epub"
260
+ Requires-Dist: dataclasses-json; extra == "epub"
261
+ Requires-Dist: click; extra == "epub"
262
+ Requires-Dist: unstructured[epub]; extra == "epub"
263
+ Requires-Dist: pydantic; extra == "epub"
264
+ Requires-Dist: pandas; extra == "epub"
265
+ Requires-Dist: opentelemetry-sdk; extra == "epub"
266
266
  Provides-Extra: gcs
267
- Requires-Dist: opentelemetry-sdk; extra == "gcs"
268
- Requires-Dist: click; extra == "gcs"
269
- Requires-Dist: pydantic; extra == "gcs"
270
267
  Requires-Dist: gcsfs; extra == "gcs"
271
- Requires-Dist: dataclasses-json; extra == "gcs"
268
+ Requires-Dist: fsspec; extra == "gcs"
272
269
  Requires-Dist: tqdm; extra == "gcs"
273
- Requires-Dist: pandas; extra == "gcs"
274
270
  Requires-Dist: python-dateutil; extra == "gcs"
275
271
  Requires-Dist: bs4; extra == "gcs"
276
- Requires-Dist: fsspec; extra == "gcs"
272
+ Requires-Dist: dataclasses-json; extra == "gcs"
273
+ Requires-Dist: click; extra == "gcs"
274
+ Requires-Dist: pydantic; extra == "gcs"
275
+ Requires-Dist: pandas; extra == "gcs"
276
+ Requires-Dist: opentelemetry-sdk; extra == "gcs"
277
277
  Provides-Extra: github
278
- Requires-Dist: opentelemetry-sdk; extra == "github"
279
- Requires-Dist: click; extra == "github"
278
+ Requires-Dist: tqdm; extra == "github"
279
+ Requires-Dist: python-dateutil; extra == "github"
280
280
  Requires-Dist: dataclasses-json; extra == "github"
281
+ Requires-Dist: click; extra == "github"
281
282
  Requires-Dist: requests; extra == "github"
282
283
  Requires-Dist: pygithub>1.58.0; extra == "github"
283
- Requires-Dist: tqdm; extra == "github"
284
- Requires-Dist: pandas; extra == "github"
285
- Requires-Dist: python-dateutil; extra == "github"
286
284
  Requires-Dist: pydantic; extra == "github"
285
+ Requires-Dist: pandas; extra == "github"
286
+ Requires-Dist: opentelemetry-sdk; extra == "github"
287
287
  Provides-Extra: gitlab
288
- Requires-Dist: opentelemetry-sdk; extra == "gitlab"
289
- Requires-Dist: click; extra == "gitlab"
290
- Requires-Dist: dataclasses-json; extra == "gitlab"
288
+ Requires-Dist: python-gitlab; extra == "gitlab"
291
289
  Requires-Dist: tqdm; extra == "gitlab"
292
- Requires-Dist: pandas; extra == "gitlab"
293
290
  Requires-Dist: python-dateutil; extra == "gitlab"
291
+ Requires-Dist: dataclasses-json; extra == "gitlab"
292
+ Requires-Dist: click; extra == "gitlab"
294
293
  Requires-Dist: pydantic; extra == "gitlab"
295
- Requires-Dist: python-gitlab; extra == "gitlab"
294
+ Requires-Dist: pandas; extra == "gitlab"
295
+ Requires-Dist: opentelemetry-sdk; extra == "gitlab"
296
296
  Provides-Extra: google-drive
297
- Requires-Dist: opentelemetry-sdk; extra == "google-drive"
298
- Requires-Dist: click; extra == "google-drive"
299
- Requires-Dist: dataclasses-json; extra == "google-drive"
300
297
  Requires-Dist: tqdm; extra == "google-drive"
301
- Requires-Dist: pandas; extra == "google-drive"
302
- Requires-Dist: python-dateutil; extra == "google-drive"
303
298
  Requires-Dist: google-api-python-client; extra == "google-drive"
299
+ Requires-Dist: python-dateutil; extra == "google-drive"
300
+ Requires-Dist: dataclasses-json; extra == "google-drive"
301
+ Requires-Dist: click; extra == "google-drive"
304
302
  Requires-Dist: pydantic; extra == "google-drive"
303
+ Requires-Dist: pandas; extra == "google-drive"
304
+ Requires-Dist: opentelemetry-sdk; extra == "google-drive"
305
305
  Provides-Extra: hubspot
306
- Requires-Dist: opentelemetry-sdk; extra == "hubspot"
306
+ Requires-Dist: urllib3; extra == "hubspot"
307
+ Requires-Dist: tqdm; extra == "hubspot"
308
+ Requires-Dist: python-dateutil; extra == "hubspot"
309
+ Requires-Dist: dataclasses-json; extra == "hubspot"
310
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
307
311
  Requires-Dist: click; extra == "hubspot"
308
312
  Requires-Dist: pydantic; extra == "hubspot"
309
- Requires-Dist: dataclasses-json; extra == "hubspot"
310
- Requires-Dist: tqdm; extra == "hubspot"
311
313
  Requires-Dist: pandas; extra == "hubspot"
312
- Requires-Dist: hubspot-api-client; extra == "hubspot"
313
- Requires-Dist: python-dateutil; extra == "hubspot"
314
- Requires-Dist: urllib3; extra == "hubspot"
314
+ Requires-Dist: opentelemetry-sdk; extra == "hubspot"
315
315
  Provides-Extra: jira
316
- Requires-Dist: opentelemetry-sdk; extra == "jira"
317
- Requires-Dist: click; extra == "jira"
318
- Requires-Dist: atlassian-python-api; extra == "jira"
319
- Requires-Dist: dataclasses-json; extra == "jira"
320
316
  Requires-Dist: tqdm; extra == "jira"
321
- Requires-Dist: pandas; extra == "jira"
322
317
  Requires-Dist: python-dateutil; extra == "jira"
318
+ Requires-Dist: dataclasses-json; extra == "jira"
319
+ Requires-Dist: click; extra == "jira"
320
+ Requires-Dist: atlassian-python-api; extra == "jira"
323
321
  Requires-Dist: pydantic; extra == "jira"
322
+ Requires-Dist: pandas; extra == "jira"
323
+ Requires-Dist: opentelemetry-sdk; extra == "jira"
324
324
  Provides-Extra: kafka
325
- Requires-Dist: opentelemetry-sdk; extra == "kafka"
326
- Requires-Dist: click; extra == "kafka"
327
- Requires-Dist: dataclasses-json; extra == "kafka"
328
- Requires-Dist: confluent-kafka; extra == "kafka"
329
325
  Requires-Dist: tqdm; extra == "kafka"
330
- Requires-Dist: pandas; extra == "kafka"
331
326
  Requires-Dist: python-dateutil; extra == "kafka"
327
+ Requires-Dist: dataclasses-json; extra == "kafka"
328
+ Requires-Dist: click; extra == "kafka"
332
329
  Requires-Dist: pydantic; extra == "kafka"
330
+ Requires-Dist: pandas; extra == "kafka"
331
+ Requires-Dist: opentelemetry-sdk; extra == "kafka"
332
+ Requires-Dist: confluent-kafka; extra == "kafka"
333
333
  Provides-Extra: kdbai
334
334
  Requires-Dist: kdbai-client; extra == "kdbai"
335
335
  Provides-Extra: md
336
- Requires-Dist: opentelemetry-sdk; extra == "md"
337
- Requires-Dist: click; extra == "md"
338
- Requires-Dist: dataclasses-json; extra == "md"
339
336
  Requires-Dist: tqdm; extra == "md"
340
- Requires-Dist: pandas; extra == "md"
341
- Requires-Dist: unstructured[md]; extra == "md"
342
337
  Requires-Dist: python-dateutil; extra == "md"
338
+ Requires-Dist: dataclasses-json; extra == "md"
339
+ Requires-Dist: click; extra == "md"
343
340
  Requires-Dist: pydantic; extra == "md"
341
+ Requires-Dist: pandas; extra == "md"
342
+ Requires-Dist: opentelemetry-sdk; extra == "md"
343
+ Requires-Dist: unstructured[md]; extra == "md"
344
344
  Provides-Extra: milvus
345
- Requires-Dist: opentelemetry-sdk; extra == "milvus"
346
- Requires-Dist: click; extra == "milvus"
347
- Requires-Dist: dataclasses-json; extra == "milvus"
348
345
  Requires-Dist: tqdm; extra == "milvus"
349
- Requires-Dist: pandas; extra == "milvus"
350
- Requires-Dist: pymilvus; extra == "milvus"
351
346
  Requires-Dist: python-dateutil; extra == "milvus"
347
+ Requires-Dist: dataclasses-json; extra == "milvus"
348
+ Requires-Dist: click; extra == "milvus"
349
+ Requires-Dist: pymilvus; extra == "milvus"
352
350
  Requires-Dist: pydantic; extra == "milvus"
351
+ Requires-Dist: pandas; extra == "milvus"
352
+ Requires-Dist: opentelemetry-sdk; extra == "milvus"
353
353
  Provides-Extra: mongodb
354
- Requires-Dist: opentelemetry-sdk; extra == "mongodb"
355
- Requires-Dist: click; extra == "mongodb"
356
- Requires-Dist: dataclasses-json; extra == "mongodb"
357
354
  Requires-Dist: tqdm; extra == "mongodb"
358
- Requires-Dist: pandas; extra == "mongodb"
359
355
  Requires-Dist: python-dateutil; extra == "mongodb"
360
- Requires-Dist: pymongo; extra == "mongodb"
356
+ Requires-Dist: dataclasses-json; extra == "mongodb"
357
+ Requires-Dist: click; extra == "mongodb"
361
358
  Requires-Dist: pydantic; extra == "mongodb"
359
+ Requires-Dist: pandas; extra == "mongodb"
360
+ Requires-Dist: opentelemetry-sdk; extra == "mongodb"
361
+ Requires-Dist: pymongo; extra == "mongodb"
362
362
  Provides-Extra: msg
363
- Requires-Dist: opentelemetry-sdk; extra == "msg"
364
- Requires-Dist: click; extra == "msg"
365
- Requires-Dist: dataclasses-json; extra == "msg"
366
363
  Requires-Dist: tqdm; extra == "msg"
367
- Requires-Dist: pandas; extra == "msg"
368
364
  Requires-Dist: python-dateutil; extra == "msg"
365
+ Requires-Dist: dataclasses-json; extra == "msg"
366
+ Requires-Dist: click; extra == "msg"
369
367
  Requires-Dist: pydantic; extra == "msg"
368
+ Requires-Dist: pandas; extra == "msg"
369
+ Requires-Dist: opentelemetry-sdk; extra == "msg"
370
370
  Requires-Dist: unstructured[msg]; extra == "msg"
371
371
  Provides-Extra: notion
372
- Requires-Dist: opentelemetry-sdk; extra == "notion"
373
- Requires-Dist: click; extra == "notion"
374
- Requires-Dist: notion-client; extra == "notion"
375
- Requires-Dist: dataclasses-json; extra == "notion"
376
372
  Requires-Dist: tqdm; extra == "notion"
377
- Requires-Dist: pandas; extra == "notion"
378
- Requires-Dist: backoff; extra == "notion"
379
373
  Requires-Dist: httpx; extra == "notion"
380
374
  Requires-Dist: python-dateutil; extra == "notion"
375
+ Requires-Dist: dataclasses-json; extra == "notion"
376
+ Requires-Dist: click; extra == "notion"
381
377
  Requires-Dist: htmlBuilder; extra == "notion"
378
+ Requires-Dist: notion-client; extra == "notion"
382
379
  Requires-Dist: pydantic; extra == "notion"
380
+ Requires-Dist: pandas; extra == "notion"
381
+ Requires-Dist: opentelemetry-sdk; extra == "notion"
382
+ Requires-Dist: backoff; extra == "notion"
383
383
  Provides-Extra: odt
384
- Requires-Dist: opentelemetry-sdk; extra == "odt"
385
- Requires-Dist: click; extra == "odt"
386
- Requires-Dist: dataclasses-json; extra == "odt"
384
+ Requires-Dist: unstructured[odt]; extra == "odt"
387
385
  Requires-Dist: tqdm; extra == "odt"
388
- Requires-Dist: pandas; extra == "odt"
389
386
  Requires-Dist: python-dateutil; extra == "odt"
390
- Requires-Dist: unstructured[odt]; extra == "odt"
387
+ Requires-Dist: dataclasses-json; extra == "odt"
388
+ Requires-Dist: click; extra == "odt"
391
389
  Requires-Dist: pydantic; extra == "odt"
390
+ Requires-Dist: pandas; extra == "odt"
391
+ Requires-Dist: opentelemetry-sdk; extra == "odt"
392
392
  Provides-Extra: onedrive
393
- Requires-Dist: opentelemetry-sdk; extra == "onedrive"
394
- Requires-Dist: click; extra == "onedrive"
395
- Requires-Dist: dataclasses-json; extra == "onedrive"
396
393
  Requires-Dist: tqdm; extra == "onedrive"
397
- Requires-Dist: pandas; extra == "onedrive"
398
- Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
399
394
  Requires-Dist: python-dateutil; extra == "onedrive"
400
395
  Requires-Dist: bs4; extra == "onedrive"
401
- Requires-Dist: msal; extra == "onedrive"
396
+ Requires-Dist: dataclasses-json; extra == "onedrive"
397
+ Requires-Dist: click; extra == "onedrive"
398
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
402
399
  Requires-Dist: pydantic; extra == "onedrive"
400
+ Requires-Dist: pandas; extra == "onedrive"
401
+ Requires-Dist: opentelemetry-sdk; extra == "onedrive"
402
+ Requires-Dist: msal; extra == "onedrive"
403
403
  Provides-Extra: openai
404
- Requires-Dist: opentelemetry-sdk; extra == "openai"
405
- Requires-Dist: click; extra == "openai"
406
- Requires-Dist: openai; extra == "openai"
407
- Requires-Dist: langchain-community; extra == "openai"
408
- Requires-Dist: dataclasses-json; extra == "openai"
409
404
  Requires-Dist: tqdm; extra == "openai"
410
- Requires-Dist: pandas; extra == "openai"
411
- Requires-Dist: tiktoken; extra == "openai"
412
405
  Requires-Dist: python-dateutil; extra == "openai"
406
+ Requires-Dist: tiktoken; extra == "openai"
407
+ Requires-Dist: dataclasses-json; extra == "openai"
408
+ Requires-Dist: click; extra == "openai"
413
409
  Requires-Dist: unstructured; extra == "openai"
414
410
  Requires-Dist: pydantic; extra == "openai"
411
+ Requires-Dist: pandas; extra == "openai"
412
+ Requires-Dist: opentelemetry-sdk; extra == "openai"
413
+ Requires-Dist: openai; extra == "openai"
414
+ Requires-Dist: langchain-community; extra == "openai"
415
415
  Provides-Extra: opensearch
416
- Requires-Dist: opentelemetry-sdk; extra == "opensearch"
417
- Requires-Dist: click; extra == "opensearch"
418
- Requires-Dist: dataclasses-json; extra == "opensearch"
419
416
  Requires-Dist: tqdm; extra == "opensearch"
420
- Requires-Dist: pandas; extra == "opensearch"
421
- Requires-Dist: opensearch-py; extra == "opensearch"
422
417
  Requires-Dist: python-dateutil; extra == "opensearch"
418
+ Requires-Dist: dataclasses-json; extra == "opensearch"
419
+ Requires-Dist: click; extra == "opensearch"
423
420
  Requires-Dist: pydantic; extra == "opensearch"
421
+ Requires-Dist: pandas; extra == "opensearch"
422
+ Requires-Dist: opentelemetry-sdk; extra == "opensearch"
423
+ Requires-Dist: opensearch-py; extra == "opensearch"
424
424
  Provides-Extra: org
425
- Requires-Dist: opentelemetry-sdk; extra == "org"
426
- Requires-Dist: click; extra == "org"
427
- Requires-Dist: dataclasses-json; extra == "org"
425
+ Requires-Dist: unstructured[org]; extra == "org"
428
426
  Requires-Dist: tqdm; extra == "org"
429
- Requires-Dist: pandas; extra == "org"
430
427
  Requires-Dist: python-dateutil; extra == "org"
431
- Requires-Dist: unstructured[org]; extra == "org"
428
+ Requires-Dist: dataclasses-json; extra == "org"
429
+ Requires-Dist: click; extra == "org"
432
430
  Requires-Dist: pydantic; extra == "org"
431
+ Requires-Dist: pandas; extra == "org"
432
+ Requires-Dist: opentelemetry-sdk; extra == "org"
433
433
  Provides-Extra: outlook
434
- Requires-Dist: opentelemetry-sdk; extra == "outlook"
435
- Requires-Dist: click; extra == "outlook"
436
- Requires-Dist: dataclasses-json; extra == "outlook"
437
434
  Requires-Dist: tqdm; extra == "outlook"
438
- Requires-Dist: pandas; extra == "outlook"
439
- Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
440
435
  Requires-Dist: python-dateutil; extra == "outlook"
441
- Requires-Dist: msal; extra == "outlook"
436
+ Requires-Dist: dataclasses-json; extra == "outlook"
437
+ Requires-Dist: click; extra == "outlook"
438
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
442
439
  Requires-Dist: pydantic; extra == "outlook"
440
+ Requires-Dist: pandas; extra == "outlook"
441
+ Requires-Dist: opentelemetry-sdk; extra == "outlook"
442
+ Requires-Dist: msal; extra == "outlook"
443
443
  Provides-Extra: pdf
444
- Requires-Dist: opentelemetry-sdk; extra == "pdf"
445
- Requires-Dist: click; extra == "pdf"
446
- Requires-Dist: dataclasses-json; extra == "pdf"
447
444
  Requires-Dist: tqdm; extra == "pdf"
448
- Requires-Dist: pandas; extra == "pdf"
449
445
  Requires-Dist: python-dateutil; extra == "pdf"
446
+ Requires-Dist: dataclasses-json; extra == "pdf"
450
447
  Requires-Dist: unstructured[pdf]; extra == "pdf"
448
+ Requires-Dist: click; extra == "pdf"
451
449
  Requires-Dist: pydantic; extra == "pdf"
450
+ Requires-Dist: pandas; extra == "pdf"
451
+ Requires-Dist: opentelemetry-sdk; extra == "pdf"
452
452
  Provides-Extra: pinecone
453
- Requires-Dist: opentelemetry-sdk; extra == "pinecone"
454
- Requires-Dist: click; extra == "pinecone"
455
- Requires-Dist: dataclasses-json; extra == "pinecone"
456
- Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
457
453
  Requires-Dist: tqdm; extra == "pinecone"
458
- Requires-Dist: pandas; extra == "pinecone"
459
454
  Requires-Dist: python-dateutil; extra == "pinecone"
455
+ Requires-Dist: dataclasses-json; extra == "pinecone"
456
+ Requires-Dist: click; extra == "pinecone"
457
+ Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
460
458
  Requires-Dist: pydantic; extra == "pinecone"
459
+ Requires-Dist: pandas; extra == "pinecone"
460
+ Requires-Dist: opentelemetry-sdk; extra == "pinecone"
461
461
  Provides-Extra: postgres
462
- Requires-Dist: opentelemetry-sdk; extra == "postgres"
463
- Requires-Dist: click; extra == "postgres"
464
- Requires-Dist: dataclasses-json; extra == "postgres"
465
- Requires-Dist: tqdm; extra == "postgres"
466
- Requires-Dist: pandas; extra == "postgres"
467
462
  Requires-Dist: psycopg2-binary; extra == "postgres"
463
+ Requires-Dist: tqdm; extra == "postgres"
468
464
  Requires-Dist: python-dateutil; extra == "postgres"
465
+ Requires-Dist: dataclasses-json; extra == "postgres"
466
+ Requires-Dist: click; extra == "postgres"
469
467
  Requires-Dist: pydantic; extra == "postgres"
468
+ Requires-Dist: pandas; extra == "postgres"
469
+ Requires-Dist: opentelemetry-sdk; extra == "postgres"
470
470
  Provides-Extra: ppt
471
- Requires-Dist: opentelemetry-sdk; extra == "ppt"
472
- Requires-Dist: click; extra == "ppt"
473
- Requires-Dist: unstructured[pptx]; extra == "ppt"
474
- Requires-Dist: dataclasses-json; extra == "ppt"
475
471
  Requires-Dist: tqdm; extra == "ppt"
476
- Requires-Dist: pandas; extra == "ppt"
477
472
  Requires-Dist: python-dateutil; extra == "ppt"
473
+ Requires-Dist: dataclasses-json; extra == "ppt"
474
+ Requires-Dist: click; extra == "ppt"
478
475
  Requires-Dist: pydantic; extra == "ppt"
476
+ Requires-Dist: pandas; extra == "ppt"
477
+ Requires-Dist: opentelemetry-sdk; extra == "ppt"
478
+ Requires-Dist: unstructured[pptx]; extra == "ppt"
479
479
  Provides-Extra: pptx
480
- Requires-Dist: opentelemetry-sdk; extra == "pptx"
481
- Requires-Dist: click; extra == "pptx"
482
- Requires-Dist: unstructured[pptx]; extra == "pptx"
483
- Requires-Dist: dataclasses-json; extra == "pptx"
484
480
  Requires-Dist: tqdm; extra == "pptx"
485
- Requires-Dist: pandas; extra == "pptx"
486
481
  Requires-Dist: python-dateutil; extra == "pptx"
482
+ Requires-Dist: dataclasses-json; extra == "pptx"
483
+ Requires-Dist: click; extra == "pptx"
487
484
  Requires-Dist: pydantic; extra == "pptx"
485
+ Requires-Dist: pandas; extra == "pptx"
486
+ Requires-Dist: opentelemetry-sdk; extra == "pptx"
487
+ Requires-Dist: unstructured[pptx]; extra == "pptx"
488
488
  Provides-Extra: qdrant
489
- Requires-Dist: opentelemetry-sdk; extra == "qdrant"
490
- Requires-Dist: click; extra == "qdrant"
491
- Requires-Dist: dataclasses-json; extra == "qdrant"
492
489
  Requires-Dist: tqdm; extra == "qdrant"
493
- Requires-Dist: pandas; extra == "qdrant"
494
490
  Requires-Dist: python-dateutil; extra == "qdrant"
491
+ Requires-Dist: dataclasses-json; extra == "qdrant"
492
+ Requires-Dist: click; extra == "qdrant"
495
493
  Requires-Dist: pydantic; extra == "qdrant"
494
+ Requires-Dist: pandas; extra == "qdrant"
495
+ Requires-Dist: opentelemetry-sdk; extra == "qdrant"
496
496
  Requires-Dist: qdrant-client; extra == "qdrant"
497
497
  Provides-Extra: reddit
498
- Requires-Dist: opentelemetry-sdk; extra == "reddit"
499
- Requires-Dist: click; extra == "reddit"
500
- Requires-Dist: dataclasses-json; extra == "reddit"
501
498
  Requires-Dist: tqdm; extra == "reddit"
502
- Requires-Dist: pandas; extra == "reddit"
503
499
  Requires-Dist: python-dateutil; extra == "reddit"
504
- Requires-Dist: praw; extra == "reddit"
500
+ Requires-Dist: dataclasses-json; extra == "reddit"
501
+ Requires-Dist: click; extra == "reddit"
505
502
  Requires-Dist: pydantic; extra == "reddit"
503
+ Requires-Dist: pandas; extra == "reddit"
504
+ Requires-Dist: opentelemetry-sdk; extra == "reddit"
505
+ Requires-Dist: praw; extra == "reddit"
506
506
  Provides-Extra: remote
507
- Requires-Dist: opentelemetry-sdk; extra == "remote"
508
- Requires-Dist: click; extra == "remote"
509
- Requires-Dist: unstructured-client>=0.23.0; extra == "remote"
510
- Requires-Dist: dataclasses-json; extra == "remote"
511
507
  Requires-Dist: tqdm; extra == "remote"
512
- Requires-Dist: pandas; extra == "remote"
513
508
  Requires-Dist: python-dateutil; extra == "remote"
509
+ Requires-Dist: dataclasses-json; extra == "remote"
510
+ Requires-Dist: click; extra == "remote"
514
511
  Requires-Dist: pydantic; extra == "remote"
512
+ Requires-Dist: pandas; extra == "remote"
513
+ Requires-Dist: opentelemetry-sdk; extra == "remote"
514
+ Requires-Dist: unstructured-client>=0.23.0; extra == "remote"
515
515
  Provides-Extra: rst
516
- Requires-Dist: opentelemetry-sdk; extra == "rst"
517
- Requires-Dist: click; extra == "rst"
518
- Requires-Dist: dataclasses-json; extra == "rst"
519
516
  Requires-Dist: tqdm; extra == "rst"
520
- Requires-Dist: pandas; extra == "rst"
521
- Requires-Dist: unstructured[rst]; extra == "rst"
522
517
  Requires-Dist: python-dateutil; extra == "rst"
518
+ Requires-Dist: dataclasses-json; extra == "rst"
519
+ Requires-Dist: unstructured[rst]; extra == "rst"
520
+ Requires-Dist: click; extra == "rst"
523
521
  Requires-Dist: pydantic; extra == "rst"
522
+ Requires-Dist: pandas; extra == "rst"
523
+ Requires-Dist: opentelemetry-sdk; extra == "rst"
524
524
  Provides-Extra: rtf
525
- Requires-Dist: opentelemetry-sdk; extra == "rtf"
526
- Requires-Dist: click; extra == "rtf"
527
- Requires-Dist: dataclasses-json; extra == "rtf"
528
525
  Requires-Dist: tqdm; extra == "rtf"
529
- Requires-Dist: pandas; extra == "rtf"
530
526
  Requires-Dist: python-dateutil; extra == "rtf"
527
+ Requires-Dist: dataclasses-json; extra == "rtf"
528
+ Requires-Dist: click; extra == "rtf"
531
529
  Requires-Dist: pydantic; extra == "rtf"
530
+ Requires-Dist: pandas; extra == "rtf"
531
+ Requires-Dist: opentelemetry-sdk; extra == "rtf"
532
532
  Requires-Dist: unstructured[rtf]; extra == "rtf"
533
533
  Provides-Extra: s3
534
- Requires-Dist: opentelemetry-sdk; extra == "s3"
534
+ Requires-Dist: s3fs; extra == "s3"
535
+ Requires-Dist: fsspec; extra == "s3"
536
+ Requires-Dist: tqdm; extra == "s3"
537
+ Requires-Dist: python-dateutil; extra == "s3"
538
+ Requires-Dist: dataclasses-json; extra == "s3"
535
539
  Requires-Dist: click; extra == "s3"
536
540
  Requires-Dist: pydantic; extra == "s3"
537
- Requires-Dist: dataclasses-json; extra == "s3"
538
- Requires-Dist: tqdm; extra == "s3"
539
541
  Requires-Dist: pandas; extra == "s3"
540
- Requires-Dist: s3fs; extra == "s3"
541
- Requires-Dist: python-dateutil; extra == "s3"
542
- Requires-Dist: fsspec; extra == "s3"
542
+ Requires-Dist: opentelemetry-sdk; extra == "s3"
543
543
  Provides-Extra: salesforce
544
- Requires-Dist: opentelemetry-sdk; extra == "salesforce"
545
- Requires-Dist: click; extra == "salesforce"
546
- Requires-Dist: dataclasses-json; extra == "salesforce"
547
544
  Requires-Dist: tqdm; extra == "salesforce"
548
- Requires-Dist: pandas; extra == "salesforce"
549
545
  Requires-Dist: python-dateutil; extra == "salesforce"
550
546
  Requires-Dist: simple-salesforce; extra == "salesforce"
547
+ Requires-Dist: dataclasses-json; extra == "salesforce"
548
+ Requires-Dist: click; extra == "salesforce"
551
549
  Requires-Dist: pydantic; extra == "salesforce"
550
+ Requires-Dist: pandas; extra == "salesforce"
551
+ Requires-Dist: opentelemetry-sdk; extra == "salesforce"
552
552
  Provides-Extra: sftp
553
- Requires-Dist: opentelemetry-sdk; extra == "sftp"
554
- Requires-Dist: paramiko; extra == "sftp"
553
+ Requires-Dist: fsspec; extra == "sftp"
554
+ Requires-Dist: tqdm; extra == "sftp"
555
+ Requires-Dist: python-dateutil; extra == "sftp"
556
+ Requires-Dist: dataclasses-json; extra == "sftp"
555
557
  Requires-Dist: click; extra == "sftp"
558
+ Requires-Dist: paramiko; extra == "sftp"
556
559
  Requires-Dist: pydantic; extra == "sftp"
557
- Requires-Dist: dataclasses-json; extra == "sftp"
558
- Requires-Dist: tqdm; extra == "sftp"
559
560
  Requires-Dist: pandas; extra == "sftp"
560
- Requires-Dist: python-dateutil; extra == "sftp"
561
- Requires-Dist: fsspec; extra == "sftp"
561
+ Requires-Dist: opentelemetry-sdk; extra == "sftp"
562
562
  Provides-Extra: sharepoint
563
- Requires-Dist: opentelemetry-sdk; extra == "sharepoint"
564
- Requires-Dist: click; extra == "sharepoint"
565
- Requires-Dist: dataclasses-json; extra == "sharepoint"
566
563
  Requires-Dist: tqdm; extra == "sharepoint"
567
- Requires-Dist: pandas; extra == "sharepoint"
568
- Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
569
564
  Requires-Dist: python-dateutil; extra == "sharepoint"
570
- Requires-Dist: msal; extra == "sharepoint"
565
+ Requires-Dist: dataclasses-json; extra == "sharepoint"
566
+ Requires-Dist: click; extra == "sharepoint"
567
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
571
568
  Requires-Dist: pydantic; extra == "sharepoint"
569
+ Requires-Dist: pandas; extra == "sharepoint"
570
+ Requires-Dist: opentelemetry-sdk; extra == "sharepoint"
571
+ Requires-Dist: msal; extra == "sharepoint"
572
572
  Provides-Extra: singlestore
573
- Requires-Dist: opentelemetry-sdk; extra == "singlestore"
574
- Requires-Dist: click; extra == "singlestore"
575
- Requires-Dist: dataclasses-json; extra == "singlestore"
576
573
  Requires-Dist: tqdm; extra == "singlestore"
577
- Requires-Dist: pandas; extra == "singlestore"
578
- Requires-Dist: singlestoredb; extra == "singlestore"
579
574
  Requires-Dist: python-dateutil; extra == "singlestore"
575
+ Requires-Dist: dataclasses-json; extra == "singlestore"
576
+ Requires-Dist: click; extra == "singlestore"
577
+ Requires-Dist: singlestoredb; extra == "singlestore"
580
578
  Requires-Dist: pydantic; extra == "singlestore"
579
+ Requires-Dist: pandas; extra == "singlestore"
580
+ Requires-Dist: opentelemetry-sdk; extra == "singlestore"
581
581
  Provides-Extra: slack
582
- Requires-Dist: opentelemetry-sdk; extra == "slack"
583
- Requires-Dist: click; extra == "slack"
584
- Requires-Dist: dataclasses-json; extra == "slack"
582
+ Requires-Dist: slack-sdk; extra == "slack"
585
583
  Requires-Dist: tqdm; extra == "slack"
586
- Requires-Dist: pandas; extra == "slack"
587
584
  Requires-Dist: python-dateutil; extra == "slack"
585
+ Requires-Dist: dataclasses-json; extra == "slack"
586
+ Requires-Dist: click; extra == "slack"
588
587
  Requires-Dist: pydantic; extra == "slack"
589
- Requires-Dist: slack-sdk; extra == "slack"
588
+ Requires-Dist: pandas; extra == "slack"
589
+ Requires-Dist: opentelemetry-sdk; extra == "slack"
590
590
  Provides-Extra: tsv
591
- Requires-Dist: opentelemetry-sdk; extra == "tsv"
592
- Requires-Dist: click; extra == "tsv"
593
- Requires-Dist: unstructured[tsv]; extra == "tsv"
594
- Requires-Dist: dataclasses-json; extra == "tsv"
595
591
  Requires-Dist: tqdm; extra == "tsv"
596
- Requires-Dist: pandas; extra == "tsv"
597
592
  Requires-Dist: python-dateutil; extra == "tsv"
593
+ Requires-Dist: dataclasses-json; extra == "tsv"
594
+ Requires-Dist: unstructured[tsv]; extra == "tsv"
595
+ Requires-Dist: click; extra == "tsv"
598
596
  Requires-Dist: pydantic; extra == "tsv"
597
+ Requires-Dist: pandas; extra == "tsv"
598
+ Requires-Dist: opentelemetry-sdk; extra == "tsv"
599
599
  Provides-Extra: vectara
600
- Requires-Dist: opentelemetry-sdk; extra == "vectara"
601
- Requires-Dist: click; extra == "vectara"
602
- Requires-Dist: dataclasses-json; extra == "vectara"
603
- Requires-Dist: requests; extra == "vectara"
604
600
  Requires-Dist: tqdm; extra == "vectara"
605
- Requires-Dist: pandas; extra == "vectara"
606
601
  Requires-Dist: python-dateutil; extra == "vectara"
602
+ Requires-Dist: dataclasses-json; extra == "vectara"
603
+ Requires-Dist: click; extra == "vectara"
604
+ Requires-Dist: requests; extra == "vectara"
607
605
  Requires-Dist: pydantic; extra == "vectara"
606
+ Requires-Dist: pandas; extra == "vectara"
607
+ Requires-Dist: opentelemetry-sdk; extra == "vectara"
608
608
  Provides-Extra: weaviate
609
- Requires-Dist: opentelemetry-sdk; extra == "weaviate"
610
- Requires-Dist: click; extra == "weaviate"
611
- Requires-Dist: dataclasses-json; extra == "weaviate"
612
609
  Requires-Dist: tqdm; extra == "weaviate"
613
- Requires-Dist: pandas; extra == "weaviate"
614
- Requires-Dist: weaviate-client; extra == "weaviate"
615
610
  Requires-Dist: python-dateutil; extra == "weaviate"
611
+ Requires-Dist: dataclasses-json; extra == "weaviate"
612
+ Requires-Dist: click; extra == "weaviate"
616
613
  Requires-Dist: pydantic; extra == "weaviate"
614
+ Requires-Dist: pandas; extra == "weaviate"
615
+ Requires-Dist: opentelemetry-sdk; extra == "weaviate"
616
+ Requires-Dist: weaviate-client; extra == "weaviate"
617
617
  Provides-Extra: wikipedia
618
- Requires-Dist: opentelemetry-sdk; extra == "wikipedia"
619
- Requires-Dist: click; extra == "wikipedia"
620
- Requires-Dist: dataclasses-json; extra == "wikipedia"
621
- Requires-Dist: wikipedia; extra == "wikipedia"
622
618
  Requires-Dist: tqdm; extra == "wikipedia"
623
- Requires-Dist: pandas; extra == "wikipedia"
624
619
  Requires-Dist: python-dateutil; extra == "wikipedia"
620
+ Requires-Dist: wikipedia; extra == "wikipedia"
621
+ Requires-Dist: dataclasses-json; extra == "wikipedia"
622
+ Requires-Dist: click; extra == "wikipedia"
625
623
  Requires-Dist: pydantic; extra == "wikipedia"
624
+ Requires-Dist: pandas; extra == "wikipedia"
625
+ Requires-Dist: opentelemetry-sdk; extra == "wikipedia"
626
626
  Provides-Extra: xlsx
627
- Requires-Dist: opentelemetry-sdk; extra == "xlsx"
627
+ Requires-Dist: unstructured[xlsx]; extra == "xlsx"
628
+ Requires-Dist: tqdm; extra == "xlsx"
629
+ Requires-Dist: python-dateutil; extra == "xlsx"
630
+ Requires-Dist: dataclasses-json; extra == "xlsx"
628
631
  Requires-Dist: click; extra == "xlsx"
629
632
  Requires-Dist: pydantic; extra == "xlsx"
630
- Requires-Dist: dataclasses-json; extra == "xlsx"
631
- Requires-Dist: tqdm; extra == "xlsx"
632
633
  Requires-Dist: pandas; extra == "xlsx"
633
- Requires-Dist: python-dateutil; extra == "xlsx"
634
- Requires-Dist: unstructured[xlsx]; extra == "xlsx"
634
+ Requires-Dist: opentelemetry-sdk; extra == "xlsx"
635
635
 
636
636
  # Unstructured Ingest
637
637
 
@@ -1,5 +1,5 @@
1
1
  unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
2
- unstructured_ingest/__version__.py,sha256=9_yNWUxyxaaKHXO3q2QY_s0mmWikO7bg69Xm4jGu4hQ,41
2
+ unstructured_ingest/__version__.py,sha256=mhrX1cgjjM8K7dLNNIYu3tS3ABCdK59YLgH5zvk67BI,42
3
3
  unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
4
4
  unstructured_ingest/evaluate.py,sha256=R-mKLFXbVX1xQ1tjGsLHjdP-TbSSV-925IHzggW_bIg,9793
5
5
  unstructured_ingest/interfaces.py,sha256=AeEywcSKCMA5AiEdENLpu_yPcXp_c6wpvESePfC00yo,31214
@@ -309,7 +309,7 @@ unstructured_ingest/v2/processes/connectors/elasticsearch.py,sha256=0O7l5LTIKw5b
309
309
  unstructured_ingest/v2/processes/connectors/google_drive.py,sha256=zRhhBCDFF4QzBpT2Ij1uXd5jdKTc_JR9WwfSLV9ynQc,12890
310
310
  unstructured_ingest/v2/processes/connectors/kdbai.py,sha256=vF-Owg2ZDI4nC7sk-Ied-5o_qkfwJzDr3uztOeS8kC0,5653
311
311
  unstructured_ingest/v2/processes/connectors/local.py,sha256=sXO-t_HZbq3rE3RzPUiWPnlrCHDixcSxz6epg4XgyYo,6786
312
- unstructured_ingest/v2/processes/connectors/milvus.py,sha256=9vCe-U_-wvmUohS56nLyeyHop7b4gVGuAakQtGTmdQk,6871
312
+ unstructured_ingest/v2/processes/connectors/milvus.py,sha256=hNMtjdNF6Nv8E_0n5uDpki1kAFdtPplq_5N0W92rrVs,7761
313
313
  unstructured_ingest/v2/processes/connectors/mongodb.py,sha256=q_GRuG2RQ5-8ajefifKuhFO52wCVhtU9j4ZIEf5hNas,4948
314
314
  unstructured_ingest/v2/processes/connectors/onedrive.py,sha256=-B8ELr0rnspzrTy6HBvgbvuiF1eEKRQyCT1ocwmET5Q,9145
315
315
  unstructured_ingest/v2/processes/connectors/opensearch.py,sha256=dEj4yYCgdhCD6376kuhKH7NVO5v-vsrN8dbULjEXfss,6811
@@ -329,9 +329,9 @@ unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=O1j0hIYWI4lPpTQ
329
329
  unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=cOMvMh0C9rtyEPJ0X59Fn-qb11LFUMRfeUgsi3QRWUk,6390
330
330
  unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=NkcU4U2DQWWuM8UHkez67C3SEOZpVyRtmtNS-z-F0Fw,6056
331
331
  unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
332
- unstructured_ingest-0.0.7.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
333
- unstructured_ingest-0.0.7.dist-info/METADATA,sha256=zcBWenMe64xmdQNwKMvyoGuiVpjg1Bwrz7v0RoGME5c,28109
334
- unstructured_ingest-0.0.7.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
335
- unstructured_ingest-0.0.7.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
336
- unstructured_ingest-0.0.7.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
337
- unstructured_ingest-0.0.7.dist-info/RECORD,,
332
+ unstructured_ingest-0.0.8.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
333
+ unstructured_ingest-0.0.8.dist-info/METADATA,sha256=ooohUbW_ADaqx0TqLjxrj-T8wj6Q9r4xdMu380kvQ5k,28109
334
+ unstructured_ingest-0.0.8.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
335
+ unstructured_ingest-0.0.8.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
336
+ unstructured_ingest-0.0.8.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
337
+ unstructured_ingest-0.0.8.dist-info/RECORD,,