unstructured-ingest 0.0.22__py3-none-any.whl → 0.0.23__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of unstructured-ingest might be problematic. Click here for more details.
- unstructured_ingest/__version__.py +1 -1
- unstructured_ingest/cli/interfaces.py +5 -5
- unstructured_ingest/embed/__init__.py +0 -17
- unstructured_ingest/embed/vertexai.py +1 -1
- unstructured_ingest/embed/voyageai.py +2 -2
- unstructured_ingest/interfaces.py +5 -5
- unstructured_ingest/v2/processes/embedder.py +10 -10
- {unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/METADATA +17 -17
- {unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/RECORD +13 -13
- {unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/LICENSE.md +0 -0
- {unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/WHEEL +0 -0
- {unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/entry_points.txt +0 -0
- {unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/top_level.txt +0 -0
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "0.0.22" # pragma: no cover
|
|
1
|
+
__version__ = "0.0.23" # pragma: no cover
|
|
@@ -415,11 +415,11 @@ class CliEmbeddingConfig(EmbeddingConfig, CliMixin):
|
|
|
415
415
|
@staticmethod
|
|
416
416
|
def get_cli_options() -> t.List[click.Option]:
|
|
417
417
|
embed_providers = [
|
|
418
|
-
"
|
|
419
|
-
"
|
|
420
|
-
"
|
|
421
|
-
"
|
|
422
|
-
"
|
|
418
|
+
"openai",
|
|
419
|
+
"huggingface",
|
|
420
|
+
"aws-bedrock",
|
|
421
|
+
"vertexai",
|
|
422
|
+
"voyageai",
|
|
423
423
|
"octoai",
|
|
424
424
|
]
|
|
425
425
|
options = [
|
|
@@ -1,17 +0,0 @@
|
|
|
1
|
-
from unstructured_ingest.embed.bedrock import BedrockEmbeddingEncoder
|
|
2
|
-
from unstructured_ingest.embed.huggingface import HuggingFaceEmbeddingEncoder
|
|
3
|
-
from unstructured_ingest.embed.mixedbreadai import MixedbreadAIEmbeddingEncoder
|
|
4
|
-
from unstructured_ingest.embed.octoai import OctoAIEmbeddingEncoder
|
|
5
|
-
from unstructured_ingest.embed.openai import OpenAIEmbeddingEncoder
|
|
6
|
-
from unstructured_ingest.embed.vertexai import VertexAIEmbeddingEncoder
|
|
7
|
-
from unstructured_ingest.embed.voyageai import VoyageAIEmbeddingEncoder
|
|
8
|
-
|
|
9
|
-
EMBEDDING_PROVIDER_TO_CLASS_MAP = {
|
|
10
|
-
"langchain-openai": OpenAIEmbeddingEncoder,
|
|
11
|
-
"langchain-huggingface": HuggingFaceEmbeddingEncoder,
|
|
12
|
-
"langchain-aws-bedrock": BedrockEmbeddingEncoder,
|
|
13
|
-
"langchain-vertexai": VertexAIEmbeddingEncoder,
|
|
14
|
-
"langchain-voyageai": VoyageAIEmbeddingEncoder,
|
|
15
|
-
"mixedbread-ai": MixedbreadAIEmbeddingEncoder,
|
|
16
|
-
"octoai": OctoAIEmbeddingEncoder,
|
|
17
|
-
}
|
|
@@ -45,7 +45,7 @@ class VertexAIEmbeddingConfig(EmbeddingConfig):
|
|
|
45
45
|
extras="embed-vertexai",
|
|
46
46
|
)
|
|
47
47
|
def get_client(self) -> "TextEmbeddingModel":
|
|
48
|
-
"""Creates a
|
|
48
|
+
"""Creates a VertexAI python client to embed elements."""
|
|
49
49
|
from vertexai.language_models import TextEmbeddingModel
|
|
50
50
|
|
|
51
51
|
self.register_application_credentials()
|
|
@@ -20,11 +20,11 @@ class VoyageAIEmbeddingConfig(EmbeddingConfig):
|
|
|
20
20
|
timeout_in_seconds: Optional[int] = None
|
|
21
21
|
|
|
22
22
|
@requires_dependencies(
|
|
23
|
-
["
|
|
23
|
+
["voyageai"],
|
|
24
24
|
extras="embed-voyageai",
|
|
25
25
|
)
|
|
26
26
|
def get_client(self) -> "VoyageAIClient":
|
|
27
|
-
"""Creates a
|
|
27
|
+
"""Creates a VoyageAI python client to embed elements."""
|
|
28
28
|
from voyageai import Client as VoyageAIClient
|
|
29
29
|
|
|
30
30
|
client = VoyageAIClient(
|
|
@@ -204,14 +204,14 @@ class EmbeddingConfig(BaseConfig):
|
|
|
204
204
|
if self.model_name:
|
|
205
205
|
kwargs["model_name"] = self.model_name
|
|
206
206
|
# TODO make this more dynamic to map to encoder configs
|
|
207
|
-
if self.provider == "
|
|
207
|
+
if self.provider == "openai":
|
|
208
208
|
from unstructured_ingest.embed.openai import (
|
|
209
209
|
OpenAIEmbeddingConfig,
|
|
210
210
|
OpenAIEmbeddingEncoder,
|
|
211
211
|
)
|
|
212
212
|
|
|
213
213
|
return OpenAIEmbeddingEncoder(config=OpenAIEmbeddingConfig(**kwargs))
|
|
214
|
-
elif self.provider == "
|
|
214
|
+
elif self.provider == "huggingface":
|
|
215
215
|
from unstructured_ingest.embed.huggingface import (
|
|
216
216
|
HuggingFaceEmbeddingConfig,
|
|
217
217
|
HuggingFaceEmbeddingEncoder,
|
|
@@ -225,7 +225,7 @@ class EmbeddingConfig(BaseConfig):
|
|
|
225
225
|
)
|
|
226
226
|
|
|
227
227
|
return OctoAIEmbeddingEncoder(config=OctoAiEmbeddingConfig(**kwargs))
|
|
228
|
-
elif self.provider == "
|
|
228
|
+
elif self.provider == "aws-bedrock":
|
|
229
229
|
from unstructured_ingest.embed.bedrock import (
|
|
230
230
|
BedrockEmbeddingConfig,
|
|
231
231
|
BedrockEmbeddingEncoder,
|
|
@@ -238,14 +238,14 @@ class EmbeddingConfig(BaseConfig):
|
|
|
238
238
|
region_name=self.aws_region,
|
|
239
239
|
)
|
|
240
240
|
)
|
|
241
|
-
elif self.provider == "
|
|
241
|
+
elif self.provider == "vertexai":
|
|
242
242
|
from unstructured_ingest.embed.vertexai import (
|
|
243
243
|
VertexAIEmbeddingConfig,
|
|
244
244
|
VertexAIEmbeddingEncoder,
|
|
245
245
|
)
|
|
246
246
|
|
|
247
247
|
return VertexAIEmbeddingEncoder(config=VertexAIEmbeddingConfig(**kwargs))
|
|
248
|
-
elif self.provider == "
|
|
248
|
+
elif self.provider == "voyageai":
|
|
249
249
|
from unstructured_ingest.embed.voyageai import (
|
|
250
250
|
VoyageAIEmbeddingConfig,
|
|
251
251
|
VoyageAIEmbeddingEncoder,
|
|
@@ -15,11 +15,11 @@ if TYPE_CHECKING:
|
|
|
15
15
|
class EmbedderConfig(BaseModel):
|
|
16
16
|
embedding_provider: Optional[
|
|
17
17
|
Literal[
|
|
18
|
-
"
|
|
19
|
-
"
|
|
20
|
-
"
|
|
21
|
-
"
|
|
22
|
-
"
|
|
18
|
+
"openai",
|
|
19
|
+
"huggingface",
|
|
20
|
+
"aws-bedrock",
|
|
21
|
+
"vertexai",
|
|
22
|
+
"voyageai",
|
|
23
23
|
"octoai",
|
|
24
24
|
"mixedbread-ai",
|
|
25
25
|
]
|
|
@@ -114,22 +114,22 @@ class EmbedderConfig(BaseModel):
|
|
|
114
114
|
if self.embedding_model_name:
|
|
115
115
|
kwargs["model_name"] = self.embedding_model_name
|
|
116
116
|
# TODO make this more dynamic to map to encoder configs
|
|
117
|
-
if self.embedding_provider == "
|
|
117
|
+
if self.embedding_provider == "openai":
|
|
118
118
|
return self.get_openai_embedder(embedding_kwargs=kwargs)
|
|
119
119
|
|
|
120
|
-
if self.embedding_provider == "
|
|
120
|
+
if self.embedding_provider == "huggingface":
|
|
121
121
|
return self.get_huggingface_embedder(embedding_kwargs=kwargs)
|
|
122
122
|
|
|
123
123
|
if self.embedding_provider == "octoai":
|
|
124
124
|
return self.get_octoai_embedder(embedding_kwargs=kwargs)
|
|
125
125
|
|
|
126
|
-
if self.embedding_provider == "
|
|
126
|
+
if self.embedding_provider == "aws-bedrock":
|
|
127
127
|
return self.get_bedrock_embedder()
|
|
128
128
|
|
|
129
|
-
if self.embedding_provider == "
|
|
129
|
+
if self.embedding_provider == "vertexai":
|
|
130
130
|
return self.get_vertexai_embedder(embedding_kwargs=kwargs)
|
|
131
131
|
|
|
132
|
-
if self.embedding_provider == "
|
|
132
|
+
if self.embedding_provider == "voyageai":
|
|
133
133
|
return self.get_voyageai_embedder(embedding_kwargs=kwargs)
|
|
134
134
|
if self.embedding_provider == "mixedbread-ai":
|
|
135
135
|
return self.get_mixedbread_embedder(embedding_kwargs=kwargs)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: unstructured-ingest
|
|
3
|
-
Version: 0.0.22
|
|
3
|
+
Version: 0.0.23
|
|
4
4
|
Summary: A library that prepares raw documents for downstream ML tasks.
|
|
5
5
|
Home-page: https://github.com/Unstructured-IO/unstructured-ingest
|
|
6
6
|
Author: Unstructured Technologies
|
|
@@ -22,20 +22,20 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
|
22
22
|
Requires-Python: >=3.9.0,<3.13
|
|
23
23
|
Description-Content-Type: text/markdown
|
|
24
24
|
License-File: LICENSE.md
|
|
25
|
-
Requires-Dist:
|
|
26
|
-
Requires-Dist: dataclasses-json
|
|
27
|
-
Requires-Dist: opentelemetry-sdk
|
|
25
|
+
Requires-Dist: pydantic>=2.7
|
|
28
26
|
Requires-Dist: python-dateutil
|
|
29
27
|
Requires-Dist: click
|
|
28
|
+
Requires-Dist: opentelemetry-sdk
|
|
29
|
+
Requires-Dist: pandas
|
|
30
|
+
Requires-Dist: dataclasses-json
|
|
30
31
|
Requires-Dist: tqdm
|
|
31
|
-
Requires-Dist: pydantic>=2.7
|
|
32
32
|
Provides-Extra: airtable
|
|
33
33
|
Requires-Dist: pyairtable; extra == "airtable"
|
|
34
34
|
Provides-Extra: astradb
|
|
35
35
|
Requires-Dist: astrapy; extra == "astradb"
|
|
36
36
|
Provides-Extra: azure
|
|
37
|
-
Requires-Dist: adlfs; extra == "azure"
|
|
38
37
|
Requires-Dist: fsspec; extra == "azure"
|
|
38
|
+
Requires-Dist: adlfs; extra == "azure"
|
|
39
39
|
Provides-Extra: azure-cognitive-search
|
|
40
40
|
Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
|
|
41
41
|
Provides-Extra: bedrock
|
|
@@ -44,8 +44,8 @@ Provides-Extra: biomed
|
|
|
44
44
|
Requires-Dist: bs4; extra == "biomed"
|
|
45
45
|
Requires-Dist: requests; extra == "biomed"
|
|
46
46
|
Provides-Extra: box
|
|
47
|
-
Requires-Dist: boxfs; extra == "box"
|
|
48
47
|
Requires-Dist: fsspec; extra == "box"
|
|
48
|
+
Requires-Dist: boxfs; extra == "box"
|
|
49
49
|
Provides-Extra: chroma
|
|
50
50
|
Requires-Dist: chromadb; extra == "chroma"
|
|
51
51
|
Provides-Extra: clarifai
|
|
@@ -60,8 +60,8 @@ Requires-Dist: unstructured[tsv]; extra == "csv"
|
|
|
60
60
|
Provides-Extra: databricks-volumes
|
|
61
61
|
Requires-Dist: databricks-sdk; extra == "databricks-volumes"
|
|
62
62
|
Provides-Extra: delta-table
|
|
63
|
-
Requires-Dist: deltalake; extra == "delta-table"
|
|
64
63
|
Requires-Dist: fsspec; extra == "delta-table"
|
|
64
|
+
Requires-Dist: deltalake; extra == "delta-table"
|
|
65
65
|
Provides-Extra: discord
|
|
66
66
|
Requires-Dist: discord-py; extra == "discord"
|
|
67
67
|
Provides-Extra: doc
|
|
@@ -69,8 +69,8 @@ Requires-Dist: unstructured[docx]; extra == "doc"
|
|
|
69
69
|
Provides-Extra: docx
|
|
70
70
|
Requires-Dist: unstructured[docx]; extra == "docx"
|
|
71
71
|
Provides-Extra: dropbox
|
|
72
|
-
Requires-Dist: dropboxdrivefs; extra == "dropbox"
|
|
73
72
|
Requires-Dist: fsspec; extra == "dropbox"
|
|
73
|
+
Requires-Dist: dropboxdrivefs; extra == "dropbox"
|
|
74
74
|
Provides-Extra: elasticsearch
|
|
75
75
|
Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
|
|
76
76
|
Provides-Extra: embed-huggingface
|
|
@@ -88,18 +88,18 @@ Provides-Extra: epub
|
|
|
88
88
|
Requires-Dist: unstructured[epub]; extra == "epub"
|
|
89
89
|
Provides-Extra: gcs
|
|
90
90
|
Requires-Dist: bs4; extra == "gcs"
|
|
91
|
-
Requires-Dist: gcsfs; extra == "gcs"
|
|
92
91
|
Requires-Dist: fsspec; extra == "gcs"
|
|
92
|
+
Requires-Dist: gcsfs; extra == "gcs"
|
|
93
93
|
Provides-Extra: github
|
|
94
|
-
Requires-Dist: pygithub>1.58.0; extra == "github"
|
|
95
94
|
Requires-Dist: requests; extra == "github"
|
|
95
|
+
Requires-Dist: pygithub>1.58.0; extra == "github"
|
|
96
96
|
Provides-Extra: gitlab
|
|
97
97
|
Requires-Dist: python-gitlab; extra == "gitlab"
|
|
98
98
|
Provides-Extra: google-drive
|
|
99
99
|
Requires-Dist: google-api-python-client; extra == "google-drive"
|
|
100
100
|
Provides-Extra: hubspot
|
|
101
|
-
Requires-Dist: hubspot-api-client; extra == "hubspot"
|
|
102
101
|
Requires-Dist: urllib3; extra == "hubspot"
|
|
102
|
+
Requires-Dist: hubspot-api-client; extra == "hubspot"
|
|
103
103
|
Provides-Extra: jira
|
|
104
104
|
Requires-Dist: atlassian-python-api; extra == "jira"
|
|
105
105
|
Provides-Extra: kafka
|
|
@@ -115,16 +115,16 @@ Requires-Dist: pymongo; extra == "mongodb"
|
|
|
115
115
|
Provides-Extra: msg
|
|
116
116
|
Requires-Dist: unstructured[msg]; extra == "msg"
|
|
117
117
|
Provides-Extra: notion
|
|
118
|
+
Requires-Dist: backoff; extra == "notion"
|
|
118
119
|
Requires-Dist: httpx; extra == "notion"
|
|
119
|
-
Requires-Dist: notion-client; extra == "notion"
|
|
120
120
|
Requires-Dist: htmlBuilder; extra == "notion"
|
|
121
|
-
Requires-Dist:
|
|
121
|
+
Requires-Dist: notion-client; extra == "notion"
|
|
122
122
|
Provides-Extra: odt
|
|
123
123
|
Requires-Dist: unstructured[odt]; extra == "odt"
|
|
124
124
|
Provides-Extra: onedrive
|
|
125
|
+
Requires-Dist: bs4; extra == "onedrive"
|
|
125
126
|
Requires-Dist: msal; extra == "onedrive"
|
|
126
127
|
Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
|
|
127
|
-
Requires-Dist: bs4; extra == "onedrive"
|
|
128
128
|
Provides-Extra: openai
|
|
129
129
|
Requires-Dist: openai; extra == "openai"
|
|
130
130
|
Requires-Dist: tiktoken; extra == "openai"
|
|
@@ -156,13 +156,13 @@ Requires-Dist: unstructured[rst]; extra == "rst"
|
|
|
156
156
|
Provides-Extra: rtf
|
|
157
157
|
Requires-Dist: unstructured[rtf]; extra == "rtf"
|
|
158
158
|
Provides-Extra: s3
|
|
159
|
-
Requires-Dist: s3fs; extra == "s3"
|
|
160
159
|
Requires-Dist: fsspec; extra == "s3"
|
|
160
|
+
Requires-Dist: s3fs; extra == "s3"
|
|
161
161
|
Provides-Extra: salesforce
|
|
162
162
|
Requires-Dist: simple-salesforce; extra == "salesforce"
|
|
163
163
|
Provides-Extra: sftp
|
|
164
|
-
Requires-Dist: fsspec; extra == "sftp"
|
|
165
164
|
Requires-Dist: paramiko; extra == "sftp"
|
|
165
|
+
Requires-Dist: fsspec; extra == "sftp"
|
|
166
166
|
Provides-Extra: sharepoint
|
|
167
167
|
Requires-Dist: msal; extra == "sharepoint"
|
|
168
168
|
Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
|
|
2
|
-
unstructured_ingest/__version__.py,sha256=
|
|
2
|
+
unstructured_ingest/__version__.py,sha256=HgbcmBIk6mQp0Bz81M53L-kPIBJnMYIFOGkRL73EChs,43
|
|
3
3
|
unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
|
|
4
|
-
unstructured_ingest/interfaces.py,sha256=
|
|
4
|
+
unstructured_ingest/interfaces.py,sha256=0r0gQoHJQ4DVSQEVbUPBA3N6WyvGMkR1u6U2SwUvoAQ,31361
|
|
5
5
|
unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
|
|
6
6
|
unstructured_ingest/main.py,sha256=82G_7eG4PNhc_xIqj4Y_sFbDV9VI-nwSfsfJQMzovMk,169
|
|
7
7
|
unstructured_ingest/processor.py,sha256=XKKrvbxsb--5cDzz4hB3-GfWZYyIjJ2ah8FpzQKF_DM,2760
|
|
@@ -9,7 +9,7 @@ unstructured_ingest/cli/__init__.py,sha256=9kNcBOHuXON5lB1MJU9QewEhwPmId56vXqB29
|
|
|
9
9
|
unstructured_ingest/cli/cli.py,sha256=LutBTBYMqboKw8cputHVszpenyfnySzcUC15ifwuYyg,1049
|
|
10
10
|
unstructured_ingest/cli/cmd_factory.py,sha256=UdHm1KacTombpF6DxyTSwTCuApsKHUYw_kVu5Nhcy3Y,364
|
|
11
11
|
unstructured_ingest/cli/common.py,sha256=I0El08FHz5kxw7iz0VWOWPrvcJD1rBgXJSwVIpVmmwU,204
|
|
12
|
-
unstructured_ingest/cli/interfaces.py,sha256=
|
|
12
|
+
unstructured_ingest/cli/interfaces.py,sha256=nWZVXAoLEP08eDPj10c2nwHNbd-HXOHFa4YvEdUJ8y8,24084
|
|
13
13
|
unstructured_ingest/cli/utils.py,sha256=KNhkFNKOeEihc8HlvMz_MTbYVQNFklrBKbC8xg9h1xE,7982
|
|
14
14
|
unstructured_ingest/cli/base/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
15
15
|
unstructured_ingest/cli/base/cmd.py,sha256=BbfjA2v203Jh-7DL6bzxQ7fOeNixd5BsBMuzXz6h5IQ,583
|
|
@@ -166,15 +166,15 @@ unstructured_ingest/connector/notion/types/database_properties/title.py,sha256=O
|
|
|
166
166
|
unstructured_ingest/connector/notion/types/database_properties/unique_id.py,sha256=H9lKi8rCDPtKmuu7j9CnJoTUr6YmzIF4oXbv_OxuN9k,1162
|
|
167
167
|
unstructured_ingest/connector/notion/types/database_properties/url.py,sha256=iXQ2tVUm9UlKVtDA0NQiFIRJ5PHYW9wOaWt2vFfSVCg,862
|
|
168
168
|
unstructured_ingest/connector/notion/types/database_properties/verification.py,sha256=J_DLjY-v2T6xDGMQ7FkI0YMKMA6SG6Y3yYW7qUD1hKA,2334
|
|
169
|
-
unstructured_ingest/embed/__init__.py,sha256=
|
|
169
|
+
unstructured_ingest/embed/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
170
170
|
unstructured_ingest/embed/bedrock.py,sha256=5-pKWwOEGHKOHa06wYuKOhvT8Xu72ke6nrpCnRtkAaU,3872
|
|
171
171
|
unstructured_ingest/embed/huggingface.py,sha256=ku_JQr72KBG8n5b6KRkXIbeBGzdgLw_KKIEm1dFK3oM,2729
|
|
172
172
|
unstructured_ingest/embed/interfaces.py,sha256=L5WimR69bmEvliIBlZ8wOCH_YDA9DWteCu6QEsKCV5I,1113
|
|
173
173
|
unstructured_ingest/embed/mixedbreadai.py,sha256=NSrAt1_bjphTHLUnlzzWSBU25UBCZlpYaLdWSRSGyqs,5504
|
|
174
174
|
unstructured_ingest/embed/octoai.py,sha256=0zxAUAMzodGkqMwqMkEvSfgWLNHtEnhdvUofvJDQD1A,2368
|
|
175
175
|
unstructured_ingest/embed/openai.py,sha256=4Ee4A2rQ8OlSh_yiJSFmok_qqRDi1A3KyayB5YiPLFw,2058
|
|
176
|
-
unstructured_ingest/embed/vertexai.py,sha256=
|
|
177
|
-
unstructured_ingest/embed/voyageai.py,sha256=
|
|
176
|
+
unstructured_ingest/embed/vertexai.py,sha256=cgyRyTm_dO_qyedwbIhOQIFvKjCqZBoDh606ykzTYHI,3598
|
|
177
|
+
unstructured_ingest/embed/voyageai.py,sha256=6BWNJUZOqkHSMaO2XPVZVYAVRrAtpMWQZEKp0qgp20Q,2631
|
|
178
178
|
unstructured_ingest/enhanced_dataclass/__init__.py,sha256=gDZOUsv5eo-8jm4Yu7DdDwi101aGbfG7JctTdOYnTOM,151
|
|
179
179
|
unstructured_ingest/enhanced_dataclass/core.py,sha256=d6aUkDynuKX87cHx9_N5UDUWrvISR4jYRFRTvd_avlI,3038
|
|
180
180
|
unstructured_ingest/enhanced_dataclass/dataclasses.py,sha256=aZMsoCzAGRb8Rmh3BTSBFtNr6FmFTY93KYGLk3gYJKQ,1949
|
|
@@ -304,7 +304,7 @@ unstructured_ingest/v2/pipeline/steps/upload.py,sha256=zlgXgwReX9TBOdfTpS9hETah4
|
|
|
304
304
|
unstructured_ingest/v2/processes/__init__.py,sha256=FaHWSCGyc7GWVnAsNEUUj7L8hT8gCVY3_hUE2VzWtUg,462
|
|
305
305
|
unstructured_ingest/v2/processes/chunker.py,sha256=76PrpCSd8k3DpfdZcl8I10u7vciKzhSV9ZByrrp302g,5476
|
|
306
306
|
unstructured_ingest/v2/processes/connector_registry.py,sha256=vkEe6jpgdYtZCxMj59s5atWGgmPuxAEXRUoTt-MJ7wc,2198
|
|
307
|
-
unstructured_ingest/v2/processes/embedder.py,sha256=
|
|
307
|
+
unstructured_ingest/v2/processes/embedder.py,sha256=nFYiOmIJwWLodBt_cC-E5h7zmYB9t3hLu2BWtBStm3g,5977
|
|
308
308
|
unstructured_ingest/v2/processes/filter.py,sha256=kjUmMw2SDq2bme0JCAOxs6cJriIG6Ty09KOznS-xz08,2145
|
|
309
309
|
unstructured_ingest/v2/processes/partitioner.py,sha256=bpqmZDsKKi6qtxNWdIWBfQmr1ccQUhU0axecpGAUf_4,7739
|
|
310
310
|
unstructured_ingest/v2/processes/uncompress.py,sha256=Z_XfsITGdyaRwhtNUc7bMj5Y2jLuBge8KoK4nxhqKag,2425
|
|
@@ -339,9 +339,9 @@ unstructured_ingest/v2/processes/connectors/fsspec/gcs.py,sha256=-_pYHbsBG9FyRyN
|
|
|
339
339
|
unstructured_ingest/v2/processes/connectors/fsspec/s3.py,sha256=je1BDqFWlyMfPa4oAMMNFQLLQtCY9quuqx3xjTwF8OQ,6251
|
|
340
340
|
unstructured_ingest/v2/processes/connectors/fsspec/sftp.py,sha256=dwpyqDq0qceCBWX3zM1hiUlgXB4hzX6ObOr-sh-5CJs,6926
|
|
341
341
|
unstructured_ingest/v2/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
|
|
342
|
-
unstructured_ingest-0.0.
|
|
343
|
-
unstructured_ingest-0.0.
|
|
344
|
-
unstructured_ingest-0.0.
|
|
345
|
-
unstructured_ingest-0.0.
|
|
346
|
-
unstructured_ingest-0.0.
|
|
347
|
-
unstructured_ingest-0.0.
|
|
342
|
+
unstructured_ingest-0.0.23.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
|
|
343
|
+
unstructured_ingest-0.0.23.dist-info/METADATA,sha256=iWfV6hzGvmClCO7_huz8s-h9FST1mJsc-mUHZQaGQU4,7108
|
|
344
|
+
unstructured_ingest-0.0.23.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
|
|
345
|
+
unstructured_ingest-0.0.23.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
|
|
346
|
+
unstructured_ingest-0.0.23.dist-info/top_level.txt,sha256=QaTxTcjfM5Hr9sZJ6weOJvSe5ESQc0F8AWkhHInTCf8,20
|
|
347
|
+
unstructured_ingest-0.0.23.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
{unstructured_ingest-0.0.22.dist-info → unstructured_ingest-0.0.23.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
|
File without changes
|