unstructured-ingest 0.3.15__py3-none-any.whl → 0.4.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of unstructured-ingest might be problematic. Click here for more details.
- test/integration/connectors/test_confluence.py +4 -4
- test/unit/v2/connectors/sql/__init__.py +0 -0
- test/unit/v2/connectors/sql/test_sql.py +72 -0
- test/unit/v2/connectors/test_confluence.py +6 -6
- unstructured_ingest/__version__.py +1 -1
- unstructured_ingest/v2/processes/connectors/confluence.py +30 -10
- unstructured_ingest/v2/processes/connectors/sql/snowflake.py +1 -1
- unstructured_ingest/v2/processes/connectors/sql/sql.py +2 -0
- {unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/METADATA +18 -18
- {unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/RECORD +14 -12
- {unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/LICENSE.md +0 -0
- {unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/WHEEL +0 -0
- {unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/entry_points.txt +0 -0
- {unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/top_level.txt +0 -0
|
@@ -30,10 +30,10 @@ async def test_confluence_source(temp_dir):
|
|
|
30
30
|
spaces = ["testteamsp", "MFS"]
|
|
31
31
|
|
|
32
32
|
# Create connection and indexer configurations
|
|
33
|
-
access_config = ConfluenceAccessConfig(
|
|
33
|
+
access_config = ConfluenceAccessConfig(password=api_token)
|
|
34
34
|
connection_config = ConfluenceConnectionConfig(
|
|
35
35
|
url=confluence_url,
|
|
36
|
-
|
|
36
|
+
username=user_email,
|
|
37
37
|
access_config=access_config,
|
|
38
38
|
)
|
|
39
39
|
index_config = ConfluenceIndexerConfig(
|
|
@@ -77,10 +77,10 @@ async def test_confluence_source_large(temp_dir):
|
|
|
77
77
|
spaces = ["testteamsp1"]
|
|
78
78
|
|
|
79
79
|
# Create connection and indexer configurations
|
|
80
|
-
access_config = ConfluenceAccessConfig(
|
|
80
|
+
access_config = ConfluenceAccessConfig(password=api_token)
|
|
81
81
|
connection_config = ConfluenceConnectionConfig(
|
|
82
82
|
url=confluence_url,
|
|
83
|
-
|
|
83
|
+
username=user_email,
|
|
84
84
|
access_config=access_config,
|
|
85
85
|
)
|
|
86
86
|
index_config = ConfluenceIndexerConfig(
|
|
File without changes
|
|
@@ -0,0 +1,72 @@
|
|
|
1
|
+
from pathlib import Path
|
|
2
|
+
|
|
3
|
+
import pytest
|
|
4
|
+
from pytest_mock import MockerFixture
|
|
5
|
+
|
|
6
|
+
from unstructured_ingest.v2.interfaces.file_data import FileData, SourceIdentifiers
|
|
7
|
+
from unstructured_ingest.v2.processes.connectors.sql.sql import SQLUploadStager
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
@pytest.fixture
|
|
11
|
+
def mock_instance() -> SQLUploadStager:
|
|
12
|
+
return SQLUploadStager()
|
|
13
|
+
|
|
14
|
+
|
|
15
|
+
@pytest.mark.parametrize(
|
|
16
|
+
("input_filepath", "output_filename", "expected"),
|
|
17
|
+
[
|
|
18
|
+
(
|
|
19
|
+
"/path/to/input_file.ndjson",
|
|
20
|
+
"output_file.ndjson",
|
|
21
|
+
"output_file.ndjson",
|
|
22
|
+
),
|
|
23
|
+
("input_file.txt", "output_file.json", "output_file.txt"),
|
|
24
|
+
("/path/to/input_file.json", "output_file", "output_file.json"),
|
|
25
|
+
],
|
|
26
|
+
)
|
|
27
|
+
def test_run_output_filename_suffix(
|
|
28
|
+
mocker: MockerFixture,
|
|
29
|
+
mock_instance: SQLUploadStager,
|
|
30
|
+
input_filepath: str,
|
|
31
|
+
output_filename: str,
|
|
32
|
+
expected: str,
|
|
33
|
+
):
|
|
34
|
+
output_dir = Path("/tmp/test/output_dir")
|
|
35
|
+
|
|
36
|
+
# Mocks
|
|
37
|
+
mock_get_data = mocker.patch(
|
|
38
|
+
"unstructured_ingest.v2.processes.connectors.sql.sql.get_data",
|
|
39
|
+
return_value=[{"key": "value"}, {"key": "value2"}],
|
|
40
|
+
)
|
|
41
|
+
mock_conform_dict = mocker.patch.object(
|
|
42
|
+
SQLUploadStager, "conform_dict", side_effect=lambda element_dict, file_data: element_dict
|
|
43
|
+
)
|
|
44
|
+
mock_conform_dataframe = mocker.patch.object(
|
|
45
|
+
SQLUploadStager, "conform_dataframe", side_effect=lambda df: df
|
|
46
|
+
)
|
|
47
|
+
mock_get_output_path = mocker.patch.object(
|
|
48
|
+
SQLUploadStager, "get_output_path", return_value=output_dir / expected
|
|
49
|
+
)
|
|
50
|
+
mock_write_output = mocker.patch.object(SQLUploadStager, "write_output")
|
|
51
|
+
|
|
52
|
+
# Act
|
|
53
|
+
result = mock_instance.run(
|
|
54
|
+
elements_filepath=Path(input_filepath),
|
|
55
|
+
file_data=FileData(
|
|
56
|
+
identifier="test",
|
|
57
|
+
connector_type="test",
|
|
58
|
+
source_identifiers=SourceIdentifiers(filename=input_filepath, fullpath=input_filepath),
|
|
59
|
+
),
|
|
60
|
+
output_dir=output_dir,
|
|
61
|
+
output_filename=output_filename,
|
|
62
|
+
)
|
|
63
|
+
|
|
64
|
+
# Assert
|
|
65
|
+
mock_get_data.assert_called_once_with(path=Path(input_filepath))
|
|
66
|
+
assert mock_conform_dict.call_count == 2
|
|
67
|
+
mock_conform_dataframe.assert_called_once()
|
|
68
|
+
mock_get_output_path.assert_called_once_with(output_filename=expected, output_dir=output_dir)
|
|
69
|
+
mock_write_output.assert_called_once_with(
|
|
70
|
+
output_path=output_dir / expected, data=[{"key": "value"}, {"key": "value2"}]
|
|
71
|
+
)
|
|
72
|
+
assert result.name == expected
|
|
@@ -11,10 +11,10 @@ def test_connection_config_multiple_auth():
|
|
|
11
11
|
with pytest.raises(ValidationError):
|
|
12
12
|
ConfluenceConnectionConfig(
|
|
13
13
|
access_config=ConfluenceAccessConfig(
|
|
14
|
-
|
|
15
|
-
|
|
14
|
+
password="api_token",
|
|
15
|
+
token="access_token",
|
|
16
16
|
),
|
|
17
|
-
|
|
17
|
+
username="user_email",
|
|
18
18
|
url="url",
|
|
19
19
|
)
|
|
20
20
|
|
|
@@ -26,14 +26,14 @@ def test_connection_config_no_auth():
|
|
|
26
26
|
|
|
27
27
|
def test_connection_config_basic_auth():
|
|
28
28
|
ConfluenceConnectionConfig(
|
|
29
|
-
access_config=ConfluenceAccessConfig(
|
|
29
|
+
access_config=ConfluenceAccessConfig(password="api_token"),
|
|
30
30
|
url="url",
|
|
31
|
-
|
|
31
|
+
username="user_email",
|
|
32
32
|
)
|
|
33
33
|
|
|
34
34
|
|
|
35
35
|
def test_connection_config_pat_auth():
|
|
36
36
|
ConfluenceConnectionConfig(
|
|
37
|
-
access_config=ConfluenceAccessConfig(
|
|
37
|
+
access_config=ConfluenceAccessConfig(token="access_token"),
|
|
38
38
|
url="url",
|
|
39
39
|
)
|
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "0.3.15" # pragma: no cover
|
|
1
|
+
__version__ = "0.4.0" # pragma: no cover
|
|
@@ -30,27 +30,45 @@ CONNECTOR_TYPE = "confluence"
|
|
|
30
30
|
|
|
31
31
|
|
|
32
32
|
class ConfluenceAccessConfig(AccessConfig):
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
33
|
+
password: Optional[str] = Field(
|
|
34
|
+
description="Confluence password or Cloud API token",
|
|
35
|
+
default=None,
|
|
36
|
+
)
|
|
37
|
+
token: Optional[str] = Field(
|
|
38
|
+
description="Confluence Personal Access Token",
|
|
39
|
+
default=None,
|
|
36
40
|
)
|
|
37
41
|
|
|
38
42
|
|
|
39
43
|
class ConfluenceConnectionConfig(ConnectionConfig):
|
|
40
44
|
url: str = Field(description="URL of the Confluence instance")
|
|
41
|
-
|
|
45
|
+
username: Optional[str] = Field(
|
|
46
|
+
description="Username or email for authentication",
|
|
47
|
+
default=None,
|
|
48
|
+
)
|
|
49
|
+
cloud: bool = Field(description="Authenticate to Confluence Cloud", default=False)
|
|
42
50
|
access_config: Secret[ConfluenceAccessConfig] = Field(
|
|
43
51
|
description="Access configuration for Confluence"
|
|
44
52
|
)
|
|
45
53
|
|
|
46
54
|
def model_post_init(self, __context):
|
|
47
55
|
access_configs = self.access_config.get_secret_value()
|
|
48
|
-
basic_auth = self.
|
|
49
|
-
pat_auth = access_configs.
|
|
56
|
+
basic_auth = self.username and access_configs.password
|
|
57
|
+
pat_auth = access_configs.token
|
|
58
|
+
if self.cloud and not basic_auth:
|
|
59
|
+
raise ValueError(
|
|
60
|
+
"cloud authentication requires username and API token (--password), "
|
|
61
|
+
"see: https://atlassian-python-api.readthedocs.io/"
|
|
62
|
+
)
|
|
50
63
|
if basic_auth and pat_auth:
|
|
51
|
-
raise ValueError(
|
|
64
|
+
raise ValueError(
|
|
65
|
+
"both password and token provided, only one allowed, "
|
|
66
|
+
"see: https://atlassian-python-api.readthedocs.io/"
|
|
67
|
+
)
|
|
52
68
|
if not (basic_auth or pat_auth):
|
|
53
|
-
raise ValueError(
|
|
69
|
+
raise ValueError(
|
|
70
|
+
"no form of auth provided, see: https://atlassian-python-api.readthedocs.io/"
|
|
71
|
+
)
|
|
54
72
|
|
|
55
73
|
@requires_dependencies(["atlassian"], extras="confluence")
|
|
56
74
|
def get_client(self) -> "Confluence":
|
|
@@ -59,8 +77,10 @@ class ConfluenceConnectionConfig(ConnectionConfig):
|
|
|
59
77
|
access_configs = self.access_config.get_secret_value()
|
|
60
78
|
return Confluence(
|
|
61
79
|
url=self.url,
|
|
62
|
-
username=self.
|
|
63
|
-
password=access_configs.
|
|
80
|
+
username=self.username,
|
|
81
|
+
password=access_configs.password,
|
|
82
|
+
token=access_configs.token,
|
|
83
|
+
cloud=self.cloud,
|
|
64
84
|
)
|
|
65
85
|
|
|
66
86
|
|
|
@@ -170,7 +170,7 @@ class SnowflakeUploader(SQLUploader):
|
|
|
170
170
|
f"{self.upload_config.record_id_key}, skipping delete"
|
|
171
171
|
)
|
|
172
172
|
df.replace({np.nan: None}, inplace=True)
|
|
173
|
-
self._fit_to_schema(df=df
|
|
173
|
+
self._fit_to_schema(df=df)
|
|
174
174
|
|
|
175
175
|
columns = list(df.columns)
|
|
176
176
|
stmt = "INSERT INTO {table_name} ({columns}) VALUES({values})".format(
|
|
@@ -310,6 +310,8 @@ class SQLUploadStager(UploadStager):
|
|
|
310
310
|
)
|
|
311
311
|
df = self.conform_dataframe(df=df)
|
|
312
312
|
|
|
313
|
+
output_filename_suffix = Path(elements_filepath).suffix
|
|
314
|
+
output_filename = f"{Path(output_filename).stem}{output_filename_suffix}"
|
|
313
315
|
output_path = self.get_output_path(output_filename=output_filename, output_dir=output_dir)
|
|
314
316
|
|
|
315
317
|
self.write_output(output_path=output_path, data=df.to_dict(orient="records"))
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: unstructured-ingest
|
|
3
|
-
Version: 0.3.15
|
|
3
|
+
Version: 0.4.0
|
|
4
4
|
Summary: A library that prepares raw documents for downstream ML tasks.
|
|
5
5
|
Home-page: https://github.com/Unstructured-IO/unstructured-ingest
|
|
6
6
|
Author: Unstructured Technologies
|
|
@@ -22,39 +22,39 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
|
22
22
|
Requires-Python: >=3.9.0,<3.14
|
|
23
23
|
Description-Content-Type: text/markdown
|
|
24
24
|
License-File: LICENSE.md
|
|
25
|
-
Requires-Dist:
|
|
25
|
+
Requires-Dist: click
|
|
26
26
|
Requires-Dist: pydantic>=2.7
|
|
27
27
|
Requires-Dist: pandas
|
|
28
|
-
Requires-Dist:
|
|
29
|
-
Requires-Dist: tqdm
|
|
30
|
-
Requires-Dist: click
|
|
31
|
-
Requires-Dist: python-dateutil
|
|
28
|
+
Requires-Dist: ndjson
|
|
32
29
|
Requires-Dist: opentelemetry-sdk
|
|
30
|
+
Requires-Dist: python-dateutil
|
|
31
|
+
Requires-Dist: tqdm
|
|
32
|
+
Requires-Dist: dataclasses-json
|
|
33
33
|
Provides-Extra: airtable
|
|
34
34
|
Requires-Dist: pyairtable; extra == "airtable"
|
|
35
35
|
Provides-Extra: astradb
|
|
36
36
|
Requires-Dist: astrapy; extra == "astradb"
|
|
37
37
|
Provides-Extra: azure
|
|
38
|
-
Requires-Dist: adlfs; extra == "azure"
|
|
39
38
|
Requires-Dist: fsspec; extra == "azure"
|
|
39
|
+
Requires-Dist: adlfs; extra == "azure"
|
|
40
40
|
Provides-Extra: azure-ai-search
|
|
41
41
|
Requires-Dist: azure-search-documents; extra == "azure-ai-search"
|
|
42
42
|
Provides-Extra: bedrock
|
|
43
|
-
Requires-Dist: aioboto3; extra == "bedrock"
|
|
44
43
|
Requires-Dist: boto3; extra == "bedrock"
|
|
44
|
+
Requires-Dist: aioboto3; extra == "bedrock"
|
|
45
45
|
Provides-Extra: biomed
|
|
46
46
|
Requires-Dist: bs4; extra == "biomed"
|
|
47
47
|
Requires-Dist: requests; extra == "biomed"
|
|
48
48
|
Provides-Extra: box
|
|
49
|
-
Requires-Dist: boxfs; extra == "box"
|
|
50
49
|
Requires-Dist: fsspec; extra == "box"
|
|
50
|
+
Requires-Dist: boxfs; extra == "box"
|
|
51
51
|
Provides-Extra: chroma
|
|
52
52
|
Requires-Dist: chromadb; extra == "chroma"
|
|
53
53
|
Provides-Extra: clarifai
|
|
54
54
|
Requires-Dist: clarifai; extra == "clarifai"
|
|
55
55
|
Provides-Extra: confluence
|
|
56
|
-
Requires-Dist: requests; extra == "confluence"
|
|
57
56
|
Requires-Dist: atlassian-python-api; extra == "confluence"
|
|
57
|
+
Requires-Dist: requests; extra == "confluence"
|
|
58
58
|
Provides-Extra: couchbase
|
|
59
59
|
Requires-Dist: couchbase; extra == "couchbase"
|
|
60
60
|
Provides-Extra: csv
|
|
@@ -73,8 +73,8 @@ Requires-Dist: unstructured[docx]; extra == "doc"
|
|
|
73
73
|
Provides-Extra: docx
|
|
74
74
|
Requires-Dist: unstructured[docx]; extra == "docx"
|
|
75
75
|
Provides-Extra: dropbox
|
|
76
|
-
Requires-Dist: dropboxdrivefs; extra == "dropbox"
|
|
77
76
|
Requires-Dist: fsspec; extra == "dropbox"
|
|
77
|
+
Requires-Dist: dropboxdrivefs; extra == "dropbox"
|
|
78
78
|
Provides-Extra: duckdb
|
|
79
79
|
Requires-Dist: duckdb; extra == "duckdb"
|
|
80
80
|
Provides-Extra: elasticsearch
|
|
@@ -93,9 +93,9 @@ Requires-Dist: voyageai; extra == "embed-voyageai"
|
|
|
93
93
|
Provides-Extra: epub
|
|
94
94
|
Requires-Dist: unstructured[epub]; extra == "epub"
|
|
95
95
|
Provides-Extra: gcs
|
|
96
|
+
Requires-Dist: fsspec; extra == "gcs"
|
|
96
97
|
Requires-Dist: bs4; extra == "gcs"
|
|
97
98
|
Requires-Dist: gcsfs; extra == "gcs"
|
|
98
|
-
Requires-Dist: fsspec; extra == "gcs"
|
|
99
99
|
Provides-Extra: github
|
|
100
100
|
Requires-Dist: pygithub>1.58.0; extra == "github"
|
|
101
101
|
Requires-Dist: requests; extra == "github"
|
|
@@ -104,8 +104,8 @@ Requires-Dist: python-gitlab; extra == "gitlab"
|
|
|
104
104
|
Provides-Extra: google-drive
|
|
105
105
|
Requires-Dist: google-api-python-client; extra == "google-drive"
|
|
106
106
|
Provides-Extra: hubspot
|
|
107
|
-
Requires-Dist: urllib3; extra == "hubspot"
|
|
108
107
|
Requires-Dist: hubspot-api-client; extra == "hubspot"
|
|
108
|
+
Requires-Dist: urllib3; extra == "hubspot"
|
|
109
109
|
Provides-Extra: jira
|
|
110
110
|
Requires-Dist: atlassian-python-api; extra == "jira"
|
|
111
111
|
Provides-Extra: kafka
|
|
@@ -127,15 +127,15 @@ Requires-Dist: cymple; extra == "neo4j"
|
|
|
127
127
|
Requires-Dist: neo4j; extra == "neo4j"
|
|
128
128
|
Requires-Dist: networkx; extra == "neo4j"
|
|
129
129
|
Provides-Extra: notion
|
|
130
|
-
Requires-Dist:
|
|
130
|
+
Requires-Dist: notion-client; extra == "notion"
|
|
131
131
|
Requires-Dist: htmlBuilder; extra == "notion"
|
|
132
132
|
Requires-Dist: backoff; extra == "notion"
|
|
133
|
-
Requires-Dist:
|
|
133
|
+
Requires-Dist: httpx; extra == "notion"
|
|
134
134
|
Provides-Extra: odt
|
|
135
135
|
Requires-Dist: unstructured[odt]; extra == "odt"
|
|
136
136
|
Provides-Extra: onedrive
|
|
137
|
-
Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
|
|
138
137
|
Requires-Dist: bs4; extra == "onedrive"
|
|
138
|
+
Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
|
|
139
139
|
Requires-Dist: msal; extra == "onedrive"
|
|
140
140
|
Provides-Extra: openai
|
|
141
141
|
Requires-Dist: tiktoken; extra == "openai"
|
|
@@ -175,8 +175,8 @@ Requires-Dist: s3fs; extra == "s3"
|
|
|
175
175
|
Provides-Extra: salesforce
|
|
176
176
|
Requires-Dist: simple-salesforce; extra == "salesforce"
|
|
177
177
|
Provides-Extra: sftp
|
|
178
|
-
Requires-Dist: paramiko; extra == "sftp"
|
|
179
178
|
Requires-Dist: fsspec; extra == "sftp"
|
|
179
|
+
Requires-Dist: paramiko; extra == "sftp"
|
|
180
180
|
Provides-Extra: sharepoint
|
|
181
181
|
Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
|
|
182
182
|
Requires-Dist: msal; extra == "sharepoint"
|
|
@@ -193,8 +193,8 @@ Provides-Extra: tsv
|
|
|
193
193
|
Requires-Dist: unstructured[tsv]; extra == "tsv"
|
|
194
194
|
Provides-Extra: vectara
|
|
195
195
|
Requires-Dist: httpx; extra == "vectara"
|
|
196
|
-
Requires-Dist: aiofiles; extra == "vectara"
|
|
197
196
|
Requires-Dist: requests; extra == "vectara"
|
|
197
|
+
Requires-Dist: aiofiles; extra == "vectara"
|
|
198
198
|
Provides-Extra: weaviate
|
|
199
199
|
Requires-Dist: weaviate-client; extra == "weaviate"
|
|
200
200
|
Provides-Extra: wikipedia
|
|
@@ -8,7 +8,7 @@ test/integration/connectors/conftest.py,sha256=vYs4WDlCuieAwwErkJxCk4a1lGvr3qpei
|
|
|
8
8
|
test/integration/connectors/test_astradb.py,sha256=2DNNNum7cTKjsRvYaCu4doAGjhSN8vl-iHprFMDfQgk,7951
|
|
9
9
|
test/integration/connectors/test_azure_ai_search.py,sha256=MxFwk84vI_HT4taQTGrNpJ8ewGPqHSGrx626j8hC_Pw,9695
|
|
10
10
|
test/integration/connectors/test_chroma.py,sha256=NuQv0PWPM0_LQfdPeUd6IYKqaKKXWmVaHGWjq5aBfOY,3721
|
|
11
|
-
test/integration/connectors/test_confluence.py,sha256=
|
|
11
|
+
test/integration/connectors/test_confluence.py,sha256=Ju0gRQbD2g9l9iRf2HDZKi7RyPnBGtFRWcGpsqhO3F8,3588
|
|
12
12
|
test/integration/connectors/test_delta_table.py,sha256=4qm2Arfc9Eb7SOZOnOlLF-vNpHy6Eqvr5Q45svfX1PY,6911
|
|
13
13
|
test/integration/connectors/test_lancedb.py,sha256=8MBxK_CUtOt87-4B7svDDK82NFII5psceo5cNN8HJMs,9228
|
|
14
14
|
test/integration/connectors/test_milvus.py,sha256=7mI6zznN0PTxDL9DLogH1k3dxx6R8DgGzlpyevsFu2w,7173
|
|
@@ -82,7 +82,9 @@ test/unit/v2/test_utils.py,sha256=TWVAeE0OrcHgPyzGPtEnQakICsVrDeVhIKPMRQPX554,26
|
|
|
82
82
|
test/unit/v2/chunkers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
83
83
|
test/unit/v2/chunkers/test_chunkers.py,sha256=HSr3_lsoMw1nkDhkjO0-NOTEomRdR9oxCrSXvcMFecE,1772
|
|
84
84
|
test/unit/v2/connectors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
85
|
-
test/unit/v2/connectors/test_confluence.py,sha256=
|
|
85
|
+
test/unit/v2/connectors/test_confluence.py,sha256=bXrn_kRb4IQdqkk4rc-P2gJAtPba7n7pNplQgfbqZDY,1047
|
|
86
|
+
test/unit/v2/connectors/sql/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
87
|
+
test/unit/v2/connectors/sql/test_sql.py,sha256=6BfOxNqIvf6OoxGmCSucEqDkUOmaKgA6E1FvwOyB9pc,2412
|
|
86
88
|
test/unit/v2/embedders/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
87
89
|
test/unit/v2/embedders/test_bedrock.py,sha256=sW-Vv-u3Yiw8rHPOfE5x_reywXlnozxO49rIMx6_xjo,1071
|
|
88
90
|
test/unit/v2/embedders/test_huggingface.py,sha256=mkVPym7TZkRJchwHedujgFXWdL9sVMi1W90jpmZ_vxg,1543
|
|
@@ -97,7 +99,7 @@ test/unit/v2/partitioners/test_partitioner.py,sha256=iIYg7IpftV3LusoO4H8tr1IHY1U
|
|
|
97
99
|
test/unit/v2/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
98
100
|
test/unit/v2/utils/data_generator.py,sha256=UoYVNjG4S4wlaA9gceQ82HIpF9_6I1UTHD1_GrQBHp0,973
|
|
99
101
|
unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
|
|
100
|
-
unstructured_ingest/__version__.py,sha256=
|
|
102
|
+
unstructured_ingest/__version__.py,sha256=uG7rkjX1YTBF6-J_mvj3gBQn-ZgW3qMoKBfjt0oZDS8,42
|
|
101
103
|
unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
|
|
102
104
|
unstructured_ingest/interfaces.py,sha256=OYVUP0bzBJpT-Lz92BDyz_hLBvyfxkuSwWHhUdnUayA,31493
|
|
103
105
|
unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
|
|
@@ -415,7 +417,7 @@ unstructured_ingest/v2/processes/connectors/airtable.py,sha256=eeZJe-bBNxt5Sa-XE
|
|
|
415
417
|
unstructured_ingest/v2/processes/connectors/astradb.py,sha256=xhUMoUdnrfAY1isZGqsV4lZUsnZNpbvgLyQWQbR4hVo,14814
|
|
416
418
|
unstructured_ingest/v2/processes/connectors/azure_ai_search.py,sha256=ngPDpU0oZ6m5sxIlB6u5ebQpqCS_SJ-_amCC1KQ03EQ,11529
|
|
417
419
|
unstructured_ingest/v2/processes/connectors/chroma.py,sha256=VHCnM56qNXuHzovJihrNfJnZbWLJShOe8j12PJFrbL0,7219
|
|
418
|
-
unstructured_ingest/v2/processes/connectors/confluence.py,sha256
|
|
420
|
+
unstructured_ingest/v2/processes/connectors/confluence.py,sha256=dE2kEQJT2QamFLsdCHpac_D5G4zTN7RIFRIEvt6XBPc,8238
|
|
419
421
|
unstructured_ingest/v2/processes/connectors/couchbase.py,sha256=i7vuNKsUkN93JRVmg4--MO0ZgbjvhIqt46oYqk9zFSQ,12250
|
|
420
422
|
unstructured_ingest/v2/processes/connectors/delta_table.py,sha256=SotSXZQ85_6TO906YvFi3yTml8jE9A_zV6nBJ4oTx8A,7075
|
|
421
423
|
unstructured_ingest/v2/processes/connectors/discord.py,sha256=-e4-cBK4TnHkknK1qIb86AIVMy81lBgC288_iLpTzM8,5246
|
|
@@ -544,17 +546,17 @@ unstructured_ingest/v2/processes/connectors/sql/__init__.py,sha256=mxcrncrjeP-C2
|
|
|
544
546
|
unstructured_ingest/v2/processes/connectors/sql/databricks_delta_tables.py,sha256=s_W6wSvyIXZ9mdAxvgSXFeFSze9E7pwIvc38p1hVDLM,8839
|
|
545
547
|
unstructured_ingest/v2/processes/connectors/sql/postgres.py,sha256=BATfX1PQGT2kl8jAbdNKXTojYKJxh3pJV9-h3OBnHGo,5124
|
|
546
548
|
unstructured_ingest/v2/processes/connectors/sql/singlestore.py,sha256=-2E9dsdNhjAiuzeSBytBbAhljOhvQ8kN8wvlUESvLo8,5465
|
|
547
|
-
unstructured_ingest/v2/processes/connectors/sql/snowflake.py,sha256=
|
|
548
|
-
unstructured_ingest/v2/processes/connectors/sql/sql.py,sha256=
|
|
549
|
+
unstructured_ingest/v2/processes/connectors/sql/snowflake.py,sha256=QE-WBqrPVjCgcxR5EdVD9iTHBjgDSSSQgWYvq5N61qU,7746
|
|
550
|
+
unstructured_ingest/v2/processes/connectors/sql/sql.py,sha256=MZPj-o4OdIrcMPmzMk851w21i9Ms0fm7dTiqegp773k,15813
|
|
549
551
|
unstructured_ingest/v2/processes/connectors/sql/sqlite.py,sha256=Q5RAqn5Ccw-pbeKZLkiMn5IVw6EemCMukXzLlS7pDhc,5162
|
|
550
552
|
unstructured_ingest/v2/processes/connectors/weaviate/__init__.py,sha256=NMiwnVWan69KnzVELvaqX34tMhCytIa-C8EDsXVKsEo,856
|
|
551
553
|
unstructured_ingest/v2/processes/connectors/weaviate/cloud.py,sha256=bXtfEYLquR-BszZ5S_lQ4JbETNs9Vozgpfm8x9egAmE,6251
|
|
552
554
|
unstructured_ingest/v2/processes/connectors/weaviate/embedded.py,sha256=S8Zg8StuZT-k7tCg1D5YShO1-vJYYk9-M1bE1fIqx64,3014
|
|
553
555
|
unstructured_ingest/v2/processes/connectors/weaviate/local.py,sha256=LuTBKPseVewsz8VqxRPRLfGEm3BeI9nBZxpy7ZU5tOA,2201
|
|
554
556
|
unstructured_ingest/v2/processes/connectors/weaviate/weaviate.py,sha256=X1yv1H_orDQ-J965EMXhR2XaURqe8vovSi9n1fk85B4,10499
|
|
555
|
-
unstructured_ingest-0.
|
|
556
|
-
unstructured_ingest-0.
|
|
557
|
-
unstructured_ingest-0.
|
|
558
|
-
unstructured_ingest-0.
|
|
559
|
-
unstructured_ingest-0.
|
|
560
|
-
unstructured_ingest-0.
|
|
557
|
+
unstructured_ingest-0.4.0.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
|
|
558
|
+
unstructured_ingest-0.4.0.dist-info/METADATA,sha256=YCJmfdIJGlE9lfszi5ybee8wf0rTrB58YmBakeuZ8ac,7928
|
|
559
|
+
unstructured_ingest-0.4.0.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
|
|
560
|
+
unstructured_ingest-0.4.0.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
|
|
561
|
+
unstructured_ingest-0.4.0.dist-info/top_level.txt,sha256=DMuDMHZRMdeay8v8Kdi855muIv92F0OkutvBCaBEW6M,25
|
|
562
|
+
unstructured_ingest-0.4.0.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
{unstructured_ingest-0.3.15.dist-info → unstructured_ingest-0.4.0.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
|
File without changes
|