unstructured-ingest 0.0.18__tar.gz → 0.0.21__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of unstructured-ingest might be problematic. Click here for more details.
- {unstructured-ingest-0.0.18/unstructured_ingest.egg-info → unstructured-ingest-0.0.21}/PKG-INFO +1 -1
- unstructured-ingest-0.0.21/unstructured_ingest/__version__.py +1 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/astradb.py +2 -2
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/astradb.py +54 -24
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/chunker.py +8 -29
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/astradb.py +26 -19
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/chroma.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/databricks_volumes.py +12 -14
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +1 -6
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/box.py +1 -6
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +1 -6
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +1 -6
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/kdbai.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/local.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/milvus.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/mongodb.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/pinecone.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/sql.py +1 -6
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/weaviate.py +2 -5
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/partitioner.py +9 -55
- unstructured-ingest-0.0.21/unstructured_ingest/v2/unstructured_api.py +87 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21/unstructured_ingest.egg-info}/PKG-INFO +1 -1
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/SOURCES.txt +1 -0
- unstructured-ingest-0.0.18/unstructured_ingest/__version__.py +0 -1
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/LICENSE.md +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/README.md +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/pyproject.toml +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/setup.cfg +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/setup.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_chunking_utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_error.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_logger.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_utils_v2.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/cmd.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/dest.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/src.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cli.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmd_factory.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/airtable.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/azure_cognitive_search.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/biomed.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/chroma.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/clarifai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/confluence.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/delta_table.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/discord.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/elasticsearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/box.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/github.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/gitlab.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/google_drive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/hubspot.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/jira.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/kafka.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/local.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/mongodb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/notion.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/onedrive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/opensearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/outlook.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/pinecone.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/qdrant.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/reddit.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/salesforce.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/sharepoint.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/slack.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/sql.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/vectara.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/weaviate.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/wikipedia.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/common.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/airtable.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/azure_cognitive_search.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/biomed.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/chroma.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/clarifai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/confluence.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/databricks_volumes.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/delta_table.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/discord.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/elasticsearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/azure.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/box.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/dropbox.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/fsspec.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/gcs.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/s3.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/sftp.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/git.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/github.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/gitlab.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/google_drive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/hubspot.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/jira.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/kafka.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/local.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/mongodb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/client.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/connector.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/helpers.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/block.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/code.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/file.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/image.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/table.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/template.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/video.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/date.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/file.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/page.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/parent.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/rich_text.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/user.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/onedrive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/opensearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/outlook.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/pinecone.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/qdrant.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/reddit.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/registry.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/salesforce.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/sharepoint.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/slack.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/sql.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/vectara.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/weaviate.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/wikipedia.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/bedrock.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/huggingface.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/mixedbreadai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/octoai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/openai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/vertexai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/voyageai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/core.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/error.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/ingest_backoff/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/ingest_backoff/_common.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/ingest_backoff/_wrapper.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/logger.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/main.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/copy.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/doc_factory.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/partition.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/permissions.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/pipeline.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/reformat/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/reformat/chunking.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/reformat/embedding.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/source.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/write.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/processor.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/airtable.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/astradb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/base_runner.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/biomed.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/confluence.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/delta_table.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/discord.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/elasticsearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/azure.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/box.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/dropbox.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/fsspec.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/gcs.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/s3.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/sftp.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/github.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/gitlab.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/google_drive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/hubspot.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/jira.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/kafka.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/local.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/mongodb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/notion.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/onedrive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/opensearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/outlook.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/reddit.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/salesforce.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/sharepoint.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/slack.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/wikipedia.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/astradb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/azure_cognitive_search.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/base_writer.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/chroma.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/clarifai.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/databricks_volumes.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/delta_table.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/elasticsearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/azure.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/box.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/s3.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/kafka.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/mongodb.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/opensearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/pinecone.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/qdrant.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/sql.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/vectara.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/weaviate.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/chunking.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/compression.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/data_prep.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/dep_check.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/google_filetype.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/table.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/cmd.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/dest.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/importer.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/src.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/cli.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/cmds.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/utils/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/utils/click.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/utils/model_conversion.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/connector.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/downloader.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/file_data.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/indexer.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/process.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/processor.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/upload_stager.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/uploader.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/logger.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/main.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/otel.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/interfaces.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/otel.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/pipeline.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/download.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/embed.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/filter.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/index.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/partition.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/stage.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/upload.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connector_registry.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/airtable.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/couchbase.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/elasticsearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/opensearch.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/singlestore.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/embedder.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/filter.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/uncompress.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/utils.py +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/entry_points.txt +0 -0
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/requires.txt +276 -276
- {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/top_level.txt +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = "0.0.21" # pragma: no cover
|
{unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/astradb.py
RENAMED
|
@@ -37,11 +37,11 @@ class AstraDBCliConfig(SimpleAstraDBConfig, CliConfig):
|
|
|
37
37
|
"numbers, and underscores.",
|
|
38
38
|
),
|
|
39
39
|
click.Option(
|
|
40
|
-
["--
|
|
40
|
+
["--keyspace"],
|
|
41
41
|
required=False,
|
|
42
42
|
default=None,
|
|
43
43
|
type=str,
|
|
44
|
-
help="The Astra DB connection
|
|
44
|
+
help="The Astra DB connection keyspace.",
|
|
45
45
|
),
|
|
46
46
|
]
|
|
47
47
|
return options
|
{unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/astradb.py
RENAMED
|
@@ -24,7 +24,8 @@ from unstructured_ingest.utils.data_prep import batch_generator, flatten_dict
|
|
|
24
24
|
from unstructured_ingest.utils.dep_check import requires_dependencies
|
|
25
25
|
|
|
26
26
|
if t.TYPE_CHECKING:
|
|
27
|
-
from astrapy
|
|
27
|
+
from astrapy import Collection as AstraDBCollection
|
|
28
|
+
from astrapy import Database as AstraDB
|
|
28
29
|
|
|
29
30
|
NON_INDEXED_FIELDS = ["metadata._node_content", "content"]
|
|
30
31
|
|
|
@@ -39,6 +40,7 @@ class AstraDBAccessConfig(AccessConfig):
|
|
|
39
40
|
class SimpleAstraDBConfig(BaseConnectorConfig):
|
|
40
41
|
access_config: AstraDBAccessConfig
|
|
41
42
|
collection_name: str
|
|
43
|
+
keyspace: t.Optional[str] = None
|
|
42
44
|
namespace: t.Optional[str] = None
|
|
43
45
|
|
|
44
46
|
|
|
@@ -98,22 +100,30 @@ class AstraDBSourceConnector(SourceConnectorCleanupMixin, BaseSourceConnector):
|
|
|
98
100
|
@requires_dependencies(["astrapy"], extras="astradb")
|
|
99
101
|
def astra_db_collection(self) -> "AstraDBCollection":
|
|
100
102
|
if self._astra_db_collection is None:
|
|
101
|
-
from astrapy
|
|
103
|
+
from astrapy import DataAPIClient as AstraDBClient
|
|
102
104
|
|
|
103
|
-
#
|
|
105
|
+
# Choose keyspace or deprecated namespace
|
|
106
|
+
keyspace_param = self.connector_config.keyspace or self.connector_config.namespace
|
|
107
|
+
|
|
108
|
+
# Create a client object to interact with the Astra DB
|
|
104
109
|
# caller_name/version for Astra DB tracking
|
|
105
|
-
|
|
106
|
-
api_endpoint=self.connector_config.access_config.api_endpoint,
|
|
107
|
-
token=self.connector_config.access_config.token,
|
|
108
|
-
namespace=self.connector_config.namespace,
|
|
110
|
+
my_client = AstraDBClient(
|
|
109
111
|
caller_name=integration_name,
|
|
110
112
|
caller_version=integration_version,
|
|
111
113
|
)
|
|
112
114
|
|
|
113
|
-
#
|
|
114
|
-
self.
|
|
115
|
-
|
|
115
|
+
# Get the database object
|
|
116
|
+
self._astra_db = my_client.get_database(
|
|
117
|
+
api_endpoint=self.connector_config.access_config.api_endpoint,
|
|
118
|
+
token=self.connector_config.access_config.token,
|
|
119
|
+
keyspace=keyspace_param,
|
|
116
120
|
)
|
|
121
|
+
|
|
122
|
+
# Create and connect to the newly created collection
|
|
123
|
+
self._astra_db_collection = self._astra_db.get_collection(
|
|
124
|
+
name=self.connector_config.collection_name,
|
|
125
|
+
)
|
|
126
|
+
|
|
117
127
|
return self._astra_db_collection # type: ignore
|
|
118
128
|
|
|
119
129
|
@requires_dependencies(["astrapy"], extras="astradb")
|
|
@@ -132,8 +142,14 @@ class AstraDBSourceConnector(SourceConnectorCleanupMixin, BaseSourceConnector):
|
|
|
132
142
|
@requires_dependencies(["astrapy"], extras="astradb")
|
|
133
143
|
def get_ingest_docs(self): # type: ignore
|
|
134
144
|
# Perform the find operation
|
|
135
|
-
|
|
145
|
+
astra_db_docs_cursor = self.astra_db_collection.find({})
|
|
136
146
|
|
|
147
|
+
# Iterate over the cursor
|
|
148
|
+
astra_db_docs = []
|
|
149
|
+
for result in astra_db_docs_cursor:
|
|
150
|
+
astra_db_docs.append(result)
|
|
151
|
+
|
|
152
|
+
# Create a list of AstraDBIngestDoc objects
|
|
137
153
|
doc_list = []
|
|
138
154
|
for record in astra_db_docs:
|
|
139
155
|
doc = AstraDBIngestDoc(
|
|
@@ -182,30 +198,41 @@ class AstraDBDestinationConnector(BaseDestinationConnector):
|
|
|
182
198
|
@requires_dependencies(["astrapy"], extras="astradb")
|
|
183
199
|
def astra_db_collection(self) -> "AstraDBCollection":
|
|
184
200
|
if self._astra_db_collection is None:
|
|
185
|
-
from astrapy
|
|
201
|
+
from astrapy import DataAPIClient as AstraDBClient
|
|
202
|
+
from astrapy.exceptions import CollectionAlreadyExistsException
|
|
203
|
+
|
|
204
|
+
# Choose keyspace or deprecated namespace
|
|
205
|
+
keyspace_param = self.connector_config.keyspace or self.connector_config.namespace
|
|
186
206
|
|
|
187
207
|
collection_name = self.connector_config.collection_name
|
|
188
208
|
embedding_dimension = self.write_config.embedding_dimension
|
|
189
|
-
|
|
190
|
-
# If the user has requested an indexing policy, pass it to the Astra DB
|
|
191
209
|
requested_indexing_policy = self.write_config.requested_indexing_policy
|
|
192
|
-
options = {"indexing": requested_indexing_policy} if requested_indexing_policy else None
|
|
193
210
|
|
|
211
|
+
# Create a client object to interact with the Astra DB
|
|
194
212
|
# caller_name/version for Astra DB tracking
|
|
195
|
-
|
|
196
|
-
api_endpoint=self.connector_config.access_config.api_endpoint,
|
|
197
|
-
token=self.connector_config.access_config.token,
|
|
198
|
-
namespace=self.connector_config.namespace,
|
|
213
|
+
my_client = AstraDBClient(
|
|
199
214
|
caller_name=integration_name,
|
|
200
215
|
caller_version=integration_version,
|
|
201
216
|
)
|
|
202
217
|
|
|
203
|
-
#
|
|
204
|
-
self.
|
|
205
|
-
|
|
206
|
-
|
|
207
|
-
|
|
218
|
+
# Get the database object
|
|
219
|
+
self._astra_db = my_client.get_database(
|
|
220
|
+
api_endpoint=self.connector_config.access_config.api_endpoint,
|
|
221
|
+
token=self.connector_config.access_config.token,
|
|
222
|
+
keyspace=keyspace_param,
|
|
208
223
|
)
|
|
224
|
+
|
|
225
|
+
# Create and connect to the newly created collection
|
|
226
|
+
try:
|
|
227
|
+
self._astra_db_collection = self._astra_db.create_collection(
|
|
228
|
+
name=collection_name,
|
|
229
|
+
dimension=embedding_dimension,
|
|
230
|
+
indexing=requested_indexing_policy,
|
|
231
|
+
)
|
|
232
|
+
except CollectionAlreadyExistsException as e:
|
|
233
|
+
logger.info(f"{e}", exc_info=True)
|
|
234
|
+
self._astra_db_collection = self._astra_db.get_collection(name=collection_name)
|
|
235
|
+
|
|
209
236
|
return self._astra_db_collection
|
|
210
237
|
|
|
211
238
|
@requires_dependencies(["astrapy"], extras="astradb")
|
|
@@ -224,6 +251,9 @@ class AstraDBDestinationConnector(BaseDestinationConnector):
|
|
|
224
251
|
def write_dict(self, *args, elements_dict: t.List[t.Dict[str, t.Any]], **kwargs) -> None:
|
|
225
252
|
logger.info(f"inserting / updating {len(elements_dict)} documents to Astra DB.")
|
|
226
253
|
|
|
254
|
+
if self._astra_db_collection is None:
|
|
255
|
+
raise DestinationConnectionError("Astra DB collection not available for insertion.")
|
|
256
|
+
|
|
227
257
|
astra_db_batch_size = self.write_config.batch_size
|
|
228
258
|
|
|
229
259
|
for batch in batch_generator(elements_dict, astra_db_batch_size):
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
from abc import ABC
|
|
2
|
-
from dataclasses import dataclass
|
|
2
|
+
from dataclasses import dataclass
|
|
3
3
|
from pathlib import Path
|
|
4
4
|
from typing import Any, Optional
|
|
5
5
|
|
|
@@ -9,6 +9,7 @@ from unstructured_ingest.utils.chunking import assign_and_map_hash_ids
|
|
|
9
9
|
from unstructured_ingest.utils.dep_check import requires_dependencies
|
|
10
10
|
from unstructured_ingest.v2.interfaces.process import BaseProcess
|
|
11
11
|
from unstructured_ingest.v2.logger import logger
|
|
12
|
+
from unstructured_ingest.v2.unstructured_api import call_api
|
|
12
13
|
|
|
13
14
|
CHUNK_MAX_CHARS_DEFAULT: int = 500
|
|
14
15
|
CHUNK_MULTI_PAGE_DEFAULT: bool = True
|
|
@@ -111,35 +112,13 @@ class Chunker(BaseProcess, ABC):
|
|
|
111
112
|
|
|
112
113
|
@requires_dependencies(dependencies=["unstructured_client"], extras="remote")
|
|
113
114
|
async def run_async(self, elements_filepath: Path, **kwargs: Any) -> list[dict]:
|
|
114
|
-
|
|
115
|
-
from unstructured_client.models.operations import PartitionRequest
|
|
116
|
-
from unstructured_client.models.shared import Files, PartitionParameters
|
|
117
|
-
|
|
118
|
-
client = UnstructuredClient(
|
|
119
|
-
api_key_auth=self.config.chunk_api_key.get_secret_value(),
|
|
115
|
+
elements = await call_api(
|
|
120
116
|
server_url=self.config.chunking_endpoint,
|
|
117
|
+
api_key=self.config.chunk_api_key.get_secret_value(),
|
|
118
|
+
filename=elements_filepath,
|
|
119
|
+
api_parameters=self.config.to_chunking_kwargs(),
|
|
121
120
|
)
|
|
122
|
-
|
|
123
|
-
possible_fields = [f.name for f in fields(PartitionParameters)]
|
|
124
|
-
filtered_partition_request = {
|
|
125
|
-
k: v for k, v in partition_request.items() if k in possible_fields
|
|
126
|
-
}
|
|
127
|
-
if len(filtered_partition_request) != len(partition_request):
|
|
128
|
-
logger.debug(
|
|
129
|
-
"Following fields were omitted due to not being "
|
|
130
|
-
"supported by the currently used unstructured client: {}".format(
|
|
131
|
-
", ".join([v for v in partition_request if v not in filtered_partition_request])
|
|
132
|
-
)
|
|
133
|
-
)
|
|
134
|
-
with open(elements_filepath, "rb") as f:
|
|
135
|
-
files = Files(
|
|
136
|
-
content=f.read(),
|
|
137
|
-
file_name=str(elements_filepath.resolve()),
|
|
138
|
-
)
|
|
139
|
-
filtered_partition_request["files"] = files
|
|
140
|
-
partition_params = PartitionParameters(**filtered_partition_request)
|
|
141
|
-
partition_request_obj = PartitionRequest(partition_params)
|
|
142
|
-
resp = client.general.partition(partition_request_obj)
|
|
143
|
-
elements = resp.elements or []
|
|
121
|
+
|
|
144
122
|
elements = assign_and_map_hash_ids(elements=elements)
|
|
123
|
+
|
|
145
124
|
return elements
|
|
@@ -25,7 +25,8 @@ from unstructured_ingest.v2.processes.connector_registry import (
|
|
|
25
25
|
)
|
|
26
26
|
|
|
27
27
|
if TYPE_CHECKING:
|
|
28
|
-
from astrapy
|
|
28
|
+
from astrapy import Collection as AstraDBCollection
|
|
29
|
+
|
|
29
30
|
|
|
30
31
|
CONNECTOR_TYPE = "astradb"
|
|
31
32
|
|
|
@@ -85,7 +86,12 @@ class AstraDBUploaderConfig(UploaderConfig):
|
|
|
85
86
|
embedding_dimension: int = Field(
|
|
86
87
|
default=384, description="The dimensionality of the embeddings"
|
|
87
88
|
)
|
|
88
|
-
|
|
89
|
+
keyspace: Optional[str] = Field(default=None, description="The Astra DB connection keyspace.")
|
|
90
|
+
namespace: Optional[str] = Field(
|
|
91
|
+
default=None,
|
|
92
|
+
description="The Astra DB connection namespace.",
|
|
93
|
+
deprecated="Please use 'keyspace' instead.",
|
|
94
|
+
)
|
|
89
95
|
requested_indexing_policy: Optional[dict[str, Any]] = Field(
|
|
90
96
|
default=None,
|
|
91
97
|
description="The indexing policy to use for the collection.",
|
|
@@ -109,33 +115,34 @@ class AstraDBUploader(Uploader):
|
|
|
109
115
|
|
|
110
116
|
@requires_dependencies(["astrapy"], extras="astradb")
|
|
111
117
|
def get_collection(self) -> "AstraDBCollection":
|
|
112
|
-
from astrapy
|
|
118
|
+
from astrapy import DataAPIClient as AstraDBClient
|
|
113
119
|
|
|
114
|
-
#
|
|
115
|
-
|
|
116
|
-
embedding_dimension = self.upload_config.embedding_dimension
|
|
117
|
-
requested_indexing_policy = self.upload_config.requested_indexing_policy
|
|
120
|
+
# Choose keyspace or deprecated namespace
|
|
121
|
+
keyspace_param = self.upload_config.keyspace or self.upload_config.namespace
|
|
118
122
|
|
|
119
|
-
#
|
|
120
|
-
|
|
123
|
+
# Get the collection_name
|
|
124
|
+
collection_name = self.upload_config.collection_name
|
|
121
125
|
|
|
122
126
|
# Build the Astra DB object.
|
|
123
|
-
# caller_name/version for AstraDB tracking
|
|
124
127
|
access_configs = self.connection_config.access_config.get_secret_value()
|
|
125
|
-
|
|
126
|
-
|
|
127
|
-
|
|
128
|
-
|
|
128
|
+
|
|
129
|
+
# Create a client object to interact with the Astra DB
|
|
130
|
+
# caller_name/version for Astra DB tracking
|
|
131
|
+
my_client = AstraDBClient(
|
|
129
132
|
caller_name=integration_name,
|
|
130
133
|
caller_version=integration_version,
|
|
131
134
|
)
|
|
132
135
|
|
|
133
|
-
#
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
136
|
+
# Get the database object
|
|
137
|
+
astra_db = my_client.get_database(
|
|
138
|
+
api_endpoint=access_configs.api_endpoint,
|
|
139
|
+
token=access_configs.token,
|
|
140
|
+
keyspace=keyspace_param,
|
|
138
141
|
)
|
|
142
|
+
|
|
143
|
+
# Connect to the newly created collection
|
|
144
|
+
astra_db_collection = astra_db.get_collection(name=collection_name)
|
|
145
|
+
|
|
139
146
|
return astra_db_collection
|
|
140
147
|
|
|
141
148
|
def run(self, path: Path, file_data: FileData, **kwargs: Any) -> None:
|
|
@@ -41,13 +41,10 @@ class ChromaAccessConfig(AccessConfig):
|
|
|
41
41
|
)
|
|
42
42
|
|
|
43
43
|
|
|
44
|
-
SecretChromaAccessConfig = Secret[ChromaAccessConfig]
|
|
45
|
-
|
|
46
|
-
|
|
47
44
|
class ChromaConnectionConfig(ConnectionConfig):
|
|
48
45
|
collection_name: str = Field(description="The name of the Chroma collection to write into.")
|
|
49
|
-
access_config:
|
|
50
|
-
default=
|
|
46
|
+
access_config: Secret[ChromaAccessConfig] = Field(
|
|
47
|
+
default=ChromaAccessConfig(), validate_default=True
|
|
51
48
|
)
|
|
52
49
|
path: Optional[str] = Field(
|
|
53
50
|
default=None, description="Location where Chroma is persisted, if not connecting via http."
|
|
@@ -42,8 +42,10 @@ class DatabricksVolumesAccessConfig(AccessConfig):
|
|
|
42
42
|
description="The Databricks password part of basic authentication. "
|
|
43
43
|
"Only possible when Host is *.cloud.databricks.com (AWS).",
|
|
44
44
|
)
|
|
45
|
-
client_id: Optional[str] = Field(default=None)
|
|
46
|
-
client_secret: Optional[str] = Field(
|
|
45
|
+
client_id: Optional[str] = Field(default=None, description="Client ID of the OAuth app.")
|
|
46
|
+
client_secret: Optional[str] = Field(
|
|
47
|
+
default=None, description="Client Secret of the OAuth app."
|
|
48
|
+
)
|
|
47
49
|
token: Optional[str] = Field(
|
|
48
50
|
default=None,
|
|
49
51
|
description="The Databricks personal access token (PAT) (AWS, Azure, and GCP) or "
|
|
@@ -81,14 +83,9 @@ class DatabricksVolumesAccessConfig(AccessConfig):
|
|
|
81
83
|
google_service_account: Optional[str] = None
|
|
82
84
|
|
|
83
85
|
|
|
84
|
-
SecretDatabricksVolumesAccessConfig = Secret[DatabricksVolumesAccessConfig]
|
|
85
|
-
|
|
86
|
-
|
|
87
86
|
class DatabricksVolumesConnectionConfig(ConnectionConfig):
|
|
88
|
-
access_config:
|
|
89
|
-
|
|
90
|
-
secret_value=DatabricksVolumesAccessConfig()
|
|
91
|
-
)
|
|
87
|
+
access_config: Secret[DatabricksVolumesAccessConfig] = Field(
|
|
88
|
+
default=DatabricksVolumesAccessConfig(), validate_default=True
|
|
92
89
|
)
|
|
93
90
|
host: Optional[str] = Field(
|
|
94
91
|
default=None,
|
|
@@ -145,11 +142,12 @@ class DatabricksVolumesUploader(Uploader):
|
|
|
145
142
|
|
|
146
143
|
def run(self, path: Path, file_data: FileData, **kwargs: Any) -> None:
|
|
147
144
|
output_path = os.path.join(self.upload_config.path, path.name)
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
145
|
+
with open(path, "rb") as elements_file:
|
|
146
|
+
self.get_client().files.upload(
|
|
147
|
+
file_path=output_path,
|
|
148
|
+
contents=elements_file,
|
|
149
|
+
overwrite=self.upload_config.overwrite,
|
|
150
|
+
)
|
|
153
151
|
|
|
154
152
|
|
|
155
153
|
databricks_volumes_destination_entry = DestinationRegistryEntry(
|
|
@@ -76,14 +76,9 @@ class AzureAccessConfig(FsspecAccessConfig):
|
|
|
76
76
|
raise ValueError("either connection_string or account_name must be set")
|
|
77
77
|
|
|
78
78
|
|
|
79
|
-
SecretAzureAccessConfig = Secret[AzureAccessConfig]
|
|
80
|
-
|
|
81
|
-
|
|
82
79
|
class AzureConnectionConfig(FsspecConnectionConfig):
|
|
83
80
|
supported_protocols: list[str] = field(default_factory=lambda: ["az"], init=False)
|
|
84
|
-
access_config:
|
|
85
|
-
default_factory=lambda: SecretAzureAccessConfig(secret_value=AzureAccessConfig())
|
|
86
|
-
)
|
|
81
|
+
access_config: Secret[AzureAccessConfig]
|
|
87
82
|
connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
|
|
88
83
|
|
|
89
84
|
def get_access_config(self) -> dict[str, Any]:
|
|
@@ -36,14 +36,9 @@ class BoxAccessConfig(FsspecAccessConfig):
|
|
|
36
36
|
)
|
|
37
37
|
|
|
38
38
|
|
|
39
|
-
SecretBoxAccessConfig = Secret[BoxAccessConfig]
|
|
40
|
-
|
|
41
|
-
|
|
42
39
|
class BoxConnectionConfig(FsspecConnectionConfig):
|
|
43
40
|
supported_protocols: list[str] = field(default_factory=lambda: ["box"], init=False)
|
|
44
|
-
access_config:
|
|
45
|
-
default_factory=lambda: SecretBoxAccessConfig(secret_value=BoxAccessConfig())
|
|
46
|
-
)
|
|
41
|
+
access_config: Secret[BoxAccessConfig] = Field(default=BoxAccessConfig(), validate_default=True)
|
|
47
42
|
connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
|
|
48
43
|
|
|
49
44
|
def get_access_config(self) -> dict[str, Any]:
|
|
@@ -35,13 +35,10 @@ class DropboxAccessConfig(FsspecAccessConfig):
|
|
|
35
35
|
token: Optional[str] = Field(default=None, description="Dropbox access token.")
|
|
36
36
|
|
|
37
37
|
|
|
38
|
-
SecretDropboxAccessConfig = Secret[DropboxAccessConfig]
|
|
39
|
-
|
|
40
|
-
|
|
41
38
|
class DropboxConnectionConfig(FsspecConnectionConfig):
|
|
42
39
|
supported_protocols: list[str] = field(default_factory=lambda: ["dropbox"], init=False)
|
|
43
|
-
access_config:
|
|
44
|
-
|
|
40
|
+
access_config: Secret[DropboxAccessConfig] = Field(
|
|
41
|
+
default=DropboxAccessConfig(), validate_default=True
|
|
45
42
|
)
|
|
46
43
|
connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
|
|
47
44
|
|
|
@@ -86,14 +86,9 @@ class GcsAccessConfig(FsspecAccessConfig):
|
|
|
86
86
|
raise ValueError("Invalid auth token value")
|
|
87
87
|
|
|
88
88
|
|
|
89
|
-
SecretGcsAccessConfig = Secret[GcsAccessConfig]
|
|
90
|
-
|
|
91
|
-
|
|
92
89
|
class GcsConnectionConfig(FsspecConnectionConfig):
|
|
93
90
|
supported_protocols: list[str] = field(default_factory=lambda: ["gs", "gcs"], init=False)
|
|
94
|
-
access_config:
|
|
95
|
-
default_factory=lambda: SecretGcsAccessConfig(secret_value=GcsAccessConfig())
|
|
96
|
-
)
|
|
91
|
+
access_config: Secret[GcsAccessConfig] = Field(default=GcsAccessConfig(), validate_default=True)
|
|
97
92
|
connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
|
|
98
93
|
|
|
99
94
|
|
|
@@ -49,14 +49,9 @@ class S3AccessConfig(FsspecAccessConfig):
|
|
|
49
49
|
)
|
|
50
50
|
|
|
51
51
|
|
|
52
|
-
SecretS3AccessConfig = Secret[S3AccessConfig]
|
|
53
|
-
|
|
54
|
-
|
|
55
52
|
class S3ConnectionConfig(FsspecConnectionConfig):
|
|
56
53
|
supported_protocols: list[str] = field(default_factory=lambda: ["s3", "s3a"], init=False)
|
|
57
|
-
access_config:
|
|
58
|
-
default_factory=lambda: SecretS3AccessConfig(secret_value=S3AccessConfig())
|
|
59
|
-
)
|
|
54
|
+
access_config: Secret[S3AccessConfig] = Field(default=S3AccessConfig(), validate_default=True)
|
|
60
55
|
endpoint_url: Optional[str] = Field(
|
|
61
56
|
default=None,
|
|
62
57
|
description="Use this endpoint_url, if specified. Needed for "
|
|
@@ -39,12 +39,9 @@ class KdbaiAccessConfig(AccessConfig):
|
|
|
39
39
|
)
|
|
40
40
|
|
|
41
41
|
|
|
42
|
-
SecretKdbaiAccessConfig = Secret[KdbaiAccessConfig]
|
|
43
|
-
|
|
44
|
-
|
|
45
42
|
class KdbaiConnectionConfig(ConnectionConfig):
|
|
46
|
-
access_config:
|
|
47
|
-
default=
|
|
43
|
+
access_config: Secret[KdbaiAccessConfig] = Field(
|
|
44
|
+
default=KdbaiAccessConfig(), validate_default=True
|
|
48
45
|
)
|
|
49
46
|
endpoint: str = Field(
|
|
50
47
|
default="http://localhost:8082", description="Endpoint url where KDBAI is hosted."
|
|
@@ -34,12 +34,9 @@ class LocalAccessConfig(AccessConfig):
|
|
|
34
34
|
pass
|
|
35
35
|
|
|
36
36
|
|
|
37
|
-
SecretLocalAccessConfig = Secret[LocalAccessConfig]
|
|
38
|
-
|
|
39
|
-
|
|
40
37
|
class LocalConnectionConfig(ConnectionConfig):
|
|
41
|
-
access_config:
|
|
42
|
-
|
|
38
|
+
access_config: Secret[LocalAccessConfig] = Field(
|
|
39
|
+
default=LocalAccessConfig(), validate_default=True
|
|
43
40
|
)
|
|
44
41
|
|
|
45
42
|
|
|
@@ -36,12 +36,9 @@ class MilvusAccessConfig(AccessConfig):
|
|
|
36
36
|
token: Optional[str] = Field(default=None, description="Milvus access token")
|
|
37
37
|
|
|
38
38
|
|
|
39
|
-
SecretMilvusAccessConfig = Secret[MilvusAccessConfig]
|
|
40
|
-
|
|
41
|
-
|
|
42
39
|
class MilvusConnectionConfig(ConnectionConfig):
|
|
43
|
-
access_config:
|
|
44
|
-
|
|
40
|
+
access_config: Secret[MilvusAccessConfig] = Field(
|
|
41
|
+
default=MilvusAccessConfig(), validate_default=True
|
|
45
42
|
)
|
|
46
43
|
uri: Optional[str] = Field(
|
|
47
44
|
default=None, description="Milvus uri", examples=["http://localhost:19530"]
|
|
@@ -34,12 +34,9 @@ class MongoDBAccessConfig(AccessConfig):
|
|
|
34
34
|
uri: Optional[str] = Field(default=None, description="URI to user when connecting")
|
|
35
35
|
|
|
36
36
|
|
|
37
|
-
SecretMongoDBAccessConfig = Secret[MongoDBAccessConfig]
|
|
38
|
-
|
|
39
|
-
|
|
40
37
|
class MongoDBConnectionConfig(ConnectionConfig):
|
|
41
|
-
access_config:
|
|
42
|
-
|
|
38
|
+
access_config: Secret[MongoDBAccessConfig] = Field(
|
|
39
|
+
default=MongoDBAccessConfig(), validate_default=True
|
|
43
40
|
)
|
|
44
41
|
host: Optional[str] = Field(
|
|
45
42
|
default=None,
|
|
@@ -36,13 +36,10 @@ class PineconeAccessConfig(AccessConfig):
|
|
|
36
36
|
)
|
|
37
37
|
|
|
38
38
|
|
|
39
|
-
SecretPineconeAccessConfig = Secret[PineconeAccessConfig]
|
|
40
|
-
|
|
41
|
-
|
|
42
39
|
class PineconeConnectionConfig(ConnectionConfig):
|
|
43
40
|
index_name: str = Field(description="Name of the index to connect to.")
|
|
44
|
-
access_config:
|
|
45
|
-
|
|
41
|
+
access_config: Secret[PineconeAccessConfig] = Field(
|
|
42
|
+
default=PineconeAccessConfig(), validate_default=True
|
|
46
43
|
)
|
|
47
44
|
|
|
48
45
|
@requires_dependencies(["pinecone"], extras="pinecone")
|
|
@@ -40,9 +40,6 @@ class SQLAccessConfig(AccessConfig):
|
|
|
40
40
|
password: Optional[str] = Field(default=None, description="DB password")
|
|
41
41
|
|
|
42
42
|
|
|
43
|
-
SecreteSQLAccessConfig = Secret[SQLAccessConfig]
|
|
44
|
-
|
|
45
|
-
|
|
46
43
|
class SQLConnectionConfig(ConnectionConfig):
|
|
47
44
|
db_type: Literal["sqlite", "postgresql"] = Field(
|
|
48
45
|
default=SQLITE_DB, description="Type of the database backend"
|
|
@@ -53,9 +50,7 @@ class SQLConnectionConfig(ConnectionConfig):
|
|
|
53
50
|
)
|
|
54
51
|
host: Optional[str] = Field(default=None, description="DB host")
|
|
55
52
|
port: Optional[int] = Field(default=5432, description="DB host connection port")
|
|
56
|
-
access_config:
|
|
57
|
-
default_factory=lambda: SecreteSQLAccessConfig(secret_value=SQLAccessConfig())
|
|
58
|
-
)
|
|
53
|
+
access_config: Secret[SQLAccessConfig] = Field(default=SQLAccessConfig(), validate_default=True)
|
|
59
54
|
connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
|
|
60
55
|
|
|
61
56
|
def __post_init__(self):
|
|
@@ -38,16 +38,13 @@ class WeaviateAccessConfig(AccessConfig):
|
|
|
38
38
|
password: Optional[str] = None
|
|
39
39
|
|
|
40
40
|
|
|
41
|
-
SecretWeaviateAccessConfig = Secret[WeaviateAccessConfig]
|
|
42
|
-
|
|
43
|
-
|
|
44
41
|
class WeaviateConnectionConfig(ConnectionConfig):
|
|
45
42
|
host_url: str = Field(description="Weaviate instance url")
|
|
46
43
|
class_name: str = Field(
|
|
47
44
|
description="Name of the class to push the records into, e.g: Pdf-elements"
|
|
48
45
|
)
|
|
49
|
-
access_config:
|
|
50
|
-
|
|
46
|
+
access_config: Secret[WeaviateAccessConfig] = Field(
|
|
47
|
+
default=WeaviateAccessConfig(), validate_default=True
|
|
51
48
|
)
|
|
52
49
|
username: Optional[str] = None
|
|
53
50
|
anonymous: bool = Field(default=False, description="if set, all auth values will be ignored")
|