unstructured-ingest 0.6.4__py3-none-any.whl → 0.7.1__py3-none-any.whl
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of unstructured-ingest might be problematic. Click here for more details.
- examples/airtable.py +44 -0
- examples/azure_cognitive_search.py +55 -0
- examples/chroma.py +54 -0
- examples/couchbase.py +55 -0
- examples/databricks_volumes_dest.py +55 -0
- examples/databricks_volumes_source.py +53 -0
- examples/delta_table.py +45 -0
- examples/discord_example.py +36 -0
- examples/elasticsearch.py +49 -0
- examples/google_drive.py +45 -0
- examples/kdbai.py +54 -0
- examples/local.py +36 -0
- examples/milvus.py +44 -0
- examples/mongodb.py +53 -0
- examples/opensearch.py +50 -0
- examples/pinecone.py +57 -0
- examples/s3.py +38 -0
- examples/salesforce.py +44 -0
- examples/sharepoint.py +47 -0
- examples/singlestore.py +49 -0
- examples/sql.py +90 -0
- examples/vectara.py +54 -0
- examples/weaviate.py +44 -0
- test/integration/chunkers/test_chunkers.py +1 -1
- test/integration/connectors/conftest.py +1 -1
- test/integration/connectors/databricks/test_volumes_native.py +3 -3
- test/integration/connectors/discord/test_discord.py +1 -1
- test/integration/connectors/duckdb/test_duckdb.py +2 -2
- test/integration/connectors/duckdb/test_motherduck.py +2 -2
- test/integration/connectors/elasticsearch/test_elasticsearch.py +2 -2
- test/integration/connectors/elasticsearch/test_opensearch.py +2 -2
- test/integration/connectors/sql/test_databricks_delta_tables.py +3 -3
- test/integration/connectors/sql/test_postgres.py +2 -2
- test/integration/connectors/sql/test_singlestore.py +2 -2
- test/integration/connectors/sql/test_snowflake.py +2 -2
- test/integration/connectors/sql/test_sqlite.py +2 -2
- test/integration/connectors/sql/test_vastdb.py +1 -1
- test/integration/connectors/test_astradb.py +2 -2
- test/integration/connectors/test_azure_ai_search.py +2 -2
- test/integration/connectors/test_chroma.py +2 -2
- test/integration/connectors/test_confluence.py +1 -1
- test/integration/connectors/test_delta_table.py +2 -2
- test/integration/connectors/test_dropbox.py +2 -2
- test/integration/connectors/test_github.py +1 -1
- test/integration/connectors/test_google_drive.py +2 -2
- test/integration/connectors/test_jira.py +1 -1
- test/integration/connectors/test_lancedb.py +7 -7
- test/integration/connectors/test_milvus.py +2 -2
- test/integration/connectors/test_mongodb.py +2 -2
- test/integration/connectors/test_neo4j.py +7 -7
- test/integration/connectors/test_notion.py +2 -2
- test/integration/connectors/test_onedrive.py +2 -2
- test/integration/connectors/test_pinecone.py +3 -3
- test/integration/connectors/test_qdrant.py +6 -6
- test/integration/connectors/test_redis.py +3 -3
- test/integration/connectors/test_s3.py +3 -3
- test/integration/connectors/test_sharepoint.py +1 -1
- test/integration/connectors/test_vectara.py +4 -4
- test/integration/connectors/test_zendesk.py +2 -2
- test/integration/connectors/utils/validation/destination.py +2 -2
- test/integration/connectors/utils/validation/source.py +2 -2
- test/integration/connectors/weaviate/test_cloud.py +1 -1
- test/integration/connectors/weaviate/test_local.py +2 -2
- test/integration/embedders/test_azure_openai.py +1 -1
- test/integration/embedders/test_bedrock.py +2 -2
- test/integration/embedders/test_huggingface.py +1 -1
- test/integration/embedders/test_mixedbread.py +1 -1
- test/integration/embedders/test_octoai.py +2 -2
- test/integration/embedders/test_openai.py +2 -2
- test/integration/embedders/test_togetherai.py +2 -2
- test/integration/embedders/test_vertexai.py +1 -1
- test/integration/embedders/test_voyageai.py +1 -1
- test/integration/partitioners/test_partitioner.py +2 -2
- test/unit/{v2/chunkers → chunkers}/test_chunkers.py +1 -1
- test/unit/{v2/connectors → connectors}/ibm_watsonx/test_ibm_watsonx_s3.py +6 -6
- test/unit/{v2/connectors → connectors}/motherduck/test_base.py +5 -5
- test/unit/{v2/connectors → connectors}/sql/test_sql.py +4 -4
- test/unit/{v2/connectors → connectors}/test_confluence.py +1 -1
- test/unit/{v2/connectors → connectors}/test_jira.py +1 -1
- test/unit/{v2/embedders → embedders}/test_huggingface.py +1 -1
- test/unit/{v2/embedders → embedders}/test_vertexai.py +1 -1
- test/unit/{v2/partitioners → partitioners}/test_partitioner.py +2 -2
- test/unit/test_html.py +1 -1
- test/unit/{v2/test_interfaces.py → test_interfaces.py} +1 -1
- test/unit/test_utils.py +106 -97
- unstructured_ingest/__version__.py +1 -1
- unstructured_ingest/cli/__init__.py +0 -14
- unstructured_ingest/cli/base/__init__.py +4 -0
- unstructured_ingest/cli/base/cmd.py +259 -9
- unstructured_ingest/cli/base/dest.py +58 -61
- unstructured_ingest/cli/base/src.py +54 -36
- unstructured_ingest/cli/cli.py +4 -17
- unstructured_ingest/{v2/cli → cli}/cmds.py +2 -2
- unstructured_ingest/{v2/cli → cli}/utils/model_conversion.py +6 -6
- unstructured_ingest/{v2/types → data_types}/file_data.py +1 -1
- unstructured_ingest/embed/bedrock.py +3 -3
- unstructured_ingest/embed/octoai.py +3 -3
- unstructured_ingest/embed/openai.py +3 -3
- unstructured_ingest/embed/togetherai.py +4 -4
- unstructured_ingest/embed/vertexai.py +1 -1
- unstructured_ingest/embed/voyageai.py +4 -4
- unstructured_ingest/{v2/interfaces → interfaces}/downloader.py +3 -3
- unstructured_ingest/{v2/interfaces → interfaces}/indexer.py +3 -3
- unstructured_ingest/{v2/interfaces → interfaces}/upload_stager.py +2 -2
- unstructured_ingest/{v2/interfaces → interfaces}/uploader.py +2 -2
- unstructured_ingest/{v2/otel.py → otel.py} +1 -1
- unstructured_ingest/pipeline/__init__.py +0 -22
- unstructured_ingest/pipeline/interfaces.py +179 -238
- unstructured_ingest/{v2/pipeline → pipeline}/otel.py +2 -2
- unstructured_ingest/pipeline/pipeline.py +388 -97
- unstructured_ingest/{v2/pipeline → pipeline}/steps/chunk.py +5 -5
- unstructured_ingest/{v2/pipeline → pipeline}/steps/download.py +5 -5
- unstructured_ingest/{v2/pipeline → pipeline}/steps/embed.py +5 -5
- unstructured_ingest/{v2/pipeline → pipeline}/steps/filter.py +4 -4
- unstructured_ingest/{v2/pipeline → pipeline}/steps/index.py +5 -5
- unstructured_ingest/{v2/pipeline → pipeline}/steps/partition.py +5 -5
- unstructured_ingest/{v2/pipeline → pipeline}/steps/stage.py +5 -5
- unstructured_ingest/{v2/pipeline → pipeline}/steps/uncompress.py +4 -4
- unstructured_ingest/{v2/pipeline → pipeline}/steps/upload.py +5 -5
- unstructured_ingest/{v2/processes → processes}/chunker.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connector_registry.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/__init__.py +11 -11
- unstructured_ingest/{v2/processes → processes}/connectors/airtable.py +4 -4
- unstructured_ingest/{v2/processes → processes}/connectors/astradb.py +15 -15
- unstructured_ingest/{v2/processes → processes}/connectors/azure_ai_search.py +8 -9
- unstructured_ingest/{v2/processes → processes}/connectors/chroma.py +10 -7
- unstructured_ingest/{v2/processes → processes}/connectors/confluence.py +11 -11
- unstructured_ingest/{v2/processes → processes}/connectors/couchbase.py +12 -12
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/volumes.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/volumes_aws.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/volumes_azure.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/volumes_gcp.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/volumes_native.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/databricks/volumes_table.py +8 -9
- unstructured_ingest/{v2/processes → processes}/connectors/delta_table.py +7 -7
- unstructured_ingest/{v2/processes → processes}/connectors/discord.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/duckdb/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/duckdb/base.py +3 -4
- unstructured_ingest/{v2/processes → processes}/connectors/duckdb/duckdb.py +7 -7
- unstructured_ingest/{v2/processes → processes}/connectors/duckdb/motherduck.py +7 -7
- unstructured_ingest/{v2/processes → processes}/connectors/elasticsearch/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/elasticsearch/elasticsearch.py +17 -17
- unstructured_ingest/{v2/processes → processes}/connectors/elasticsearch/opensearch.py +5 -5
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/azure.py +8 -8
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/box.py +8 -8
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/dropbox.py +8 -8
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/fsspec.py +8 -8
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/gcs.py +8 -8
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/s3.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/fsspec/sftp.py +5 -5
- unstructured_ingest/{v2/processes → processes}/connectors/github.py +10 -10
- unstructured_ingest/{v2/processes → processes}/connectors/gitlab.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/google_drive.py +22 -13
- unstructured_ingest/{v2/processes → processes}/connectors/ibm_watsonx/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/ibm_watsonx/ibm_watsonx_s3.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/jira.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/kafka/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/kafka/cloud.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/kafka/kafka.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/kafka/local.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/kdbai.py +11 -7
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/aws.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/azure.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/cloud.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/gcp.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/lancedb.py +6 -6
- unstructured_ingest/{v2/processes → processes}/connectors/lancedb/local.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/local.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/milvus.py +7 -7
- unstructured_ingest/{v2/processes → processes}/connectors/mongodb.py +13 -13
- unstructured_ingest/{v2/processes → processes}/connectors/neo4j.py +7 -7
- unstructured_ingest/{v2/processes → processes}/connectors/notion/client.py +6 -6
- unstructured_ingest/{v2/processes → processes}/connectors/notion/connector.py +15 -15
- unstructured_ingest/{v2/processes → processes}/connectors/notion/helpers.py +4 -4
- unstructured_ingest/{ingest_backoff → processes/connectors/notion/ingest_backoff}/_wrapper.py +5 -1
- unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +24 -0
- unstructured_ingest/{connector → processes/connectors}/notion/types/block.py +4 -4
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/bookmark.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/breadcrumb.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/bulleted_list_item.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/callout.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/child_database.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/child_page.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/code.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/column_list.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/divider.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/embed.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/equation.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/file.py +4 -4
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/heading.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/image.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/link_preview.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/link_to_page.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/numbered_list.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/paragraph.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/pdf.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/quote.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/synced_block.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/table.py +2 -5
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/table_of_contents.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/template.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/todo.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/toggle.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/blocks/unsupported.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/video.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/database.py +6 -6
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/checkbox.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/created_by.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/created_time.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/date.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/email.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/files.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/formula.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/last_edited_by.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/last_edited_time.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/multiselect.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/number.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/people.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/phone_number.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/relation.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/rich_text.py +2 -2
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/rollup.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/select.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/status.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/title.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/database_properties/unique_id.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/url.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/database_properties/verification.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/date.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/file.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/page.py +4 -4
- unstructured_ingest/{connector → processes/connectors}/notion/types/parent.py +1 -1
- unstructured_ingest/{connector → processes/connectors}/notion/types/rich_text.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/notion/types/user.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/onedrive.py +55 -27
- unstructured_ingest/{v2/processes → processes}/connectors/outlook.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/pinecone.py +12 -9
- unstructured_ingest/{v2/processes → processes}/connectors/qdrant/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/qdrant/cloud.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/qdrant/local.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/qdrant/qdrant.py +9 -6
- unstructured_ingest/{v2/processes → processes}/connectors/qdrant/server.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/redisdb.py +6 -6
- unstructured_ingest/{v2/processes → processes}/connectors/salesforce.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/sharepoint.py +8 -8
- unstructured_ingest/{v2/processes → processes}/connectors/slack.py +9 -9
- unstructured_ingest/{v2/processes → processes}/connectors/sql/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/sql/databricks_delta_tables.py +7 -7
- unstructured_ingest/{v2/processes → processes}/connectors/sql/postgres.py +4 -4
- unstructured_ingest/{v2/processes → processes}/connectors/sql/singlestore.py +4 -4
- unstructured_ingest/{v2/processes → processes}/connectors/sql/snowflake.py +6 -6
- unstructured_ingest/{v2/processes → processes}/connectors/sql/sql.py +16 -11
- unstructured_ingest/{v2/processes → processes}/connectors/sql/sqlite.py +4 -4
- unstructured_ingest/{v2/processes → processes}/connectors/sql/vastdb.py +9 -10
- unstructured_ingest/{v2/processes → processes}/connectors/vectara.py +6 -6
- unstructured_ingest/{v2/processes → processes}/connectors/weaviate/__init__.py +1 -1
- unstructured_ingest/{v2/processes → processes}/connectors/weaviate/cloud.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/weaviate/embedded.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/weaviate/local.py +3 -3
- unstructured_ingest/{v2/processes → processes}/connectors/weaviate/weaviate.py +5 -5
- unstructured_ingest/{v2/processes → processes}/connectors/zendesk/client.py +2 -2
- unstructured_ingest/{v2/processes → processes}/connectors/zendesk/zendesk.py +10 -10
- unstructured_ingest/{v2/processes → processes}/embedder.py +1 -1
- unstructured_ingest/{v2/processes → processes}/filter.py +4 -4
- unstructured_ingest/{v2/processes → processes}/partitioner.py +6 -6
- unstructured_ingest/{v2/processes → processes}/uncompress.py +3 -3
- unstructured_ingest/{v2/processes → processes}/utils/blob_storage.py +2 -2
- unstructured_ingest/{v2/unstructured_api.py → unstructured_api.py} +2 -2
- unstructured_ingest/utils/compression.py +1 -48
- unstructured_ingest/utils/data_prep.py +9 -1
- unstructured_ingest/utils/html.py +3 -3
- unstructured_ingest/{v2/utils.py → utils/pydantic_models.py} +0 -9
- unstructured_ingest/utils/string_and_date_utils.py +1 -1
- {unstructured_ingest-0.6.4.dist-info → unstructured_ingest-0.7.1.dist-info}/METADATA +98 -97
- unstructured_ingest-0.7.1.dist-info/RECORD +370 -0
- {unstructured_ingest-0.6.4.dist-info → unstructured_ingest-0.7.1.dist-info}/top_level.txt +1 -0
- test/unit/v2/test_utils.py +0 -82
- unstructured_ingest/cli/cmd_factory.py +0 -12
- unstructured_ingest/cli/cmds/__init__.py +0 -145
- unstructured_ingest/cli/cmds/airtable.py +0 -69
- unstructured_ingest/cli/cmds/astradb.py +0 -99
- unstructured_ingest/cli/cmds/azure_ai_search.py +0 -65
- unstructured_ingest/cli/cmds/biomed.py +0 -52
- unstructured_ingest/cli/cmds/chroma.py +0 -104
- unstructured_ingest/cli/cmds/clarifai.py +0 -71
- unstructured_ingest/cli/cmds/confluence.py +0 -69
- unstructured_ingest/cli/cmds/databricks_volumes.py +0 -163
- unstructured_ingest/cli/cmds/delta_table.py +0 -94
- unstructured_ingest/cli/cmds/discord.py +0 -47
- unstructured_ingest/cli/cmds/elasticsearch.py +0 -133
- unstructured_ingest/cli/cmds/fsspec/azure.py +0 -94
- unstructured_ingest/cli/cmds/fsspec/box.py +0 -48
- unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -51
- unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -15
- unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -71
- unstructured_ingest/cli/cmds/fsspec/s3.py +0 -74
- unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -58
- unstructured_ingest/cli/cmds/github.py +0 -54
- unstructured_ingest/cli/cmds/gitlab.py +0 -54
- unstructured_ingest/cli/cmds/google_drive.py +0 -49
- unstructured_ingest/cli/cmds/hubspot.py +0 -70
- unstructured_ingest/cli/cmds/jira.py +0 -71
- unstructured_ingest/cli/cmds/kafka.py +0 -102
- unstructured_ingest/cli/cmds/local.py +0 -43
- unstructured_ingest/cli/cmds/mongodb.py +0 -72
- unstructured_ingest/cli/cmds/notion.py +0 -48
- unstructured_ingest/cli/cmds/onedrive.py +0 -66
- unstructured_ingest/cli/cmds/opensearch.py +0 -117
- unstructured_ingest/cli/cmds/outlook.py +0 -67
- unstructured_ingest/cli/cmds/pinecone.py +0 -71
- unstructured_ingest/cli/cmds/qdrant.py +0 -124
- unstructured_ingest/cli/cmds/reddit.py +0 -67
- unstructured_ingest/cli/cmds/salesforce.py +0 -58
- unstructured_ingest/cli/cmds/sharepoint.py +0 -66
- unstructured_ingest/cli/cmds/slack.py +0 -56
- unstructured_ingest/cli/cmds/sql.py +0 -66
- unstructured_ingest/cli/cmds/vectara.py +0 -66
- unstructured_ingest/cli/cmds/weaviate.py +0 -98
- unstructured_ingest/cli/cmds/wikipedia.py +0 -40
- unstructured_ingest/cli/common.py +0 -7
- unstructured_ingest/cli/interfaces.py +0 -663
- unstructured_ingest/cli/utils.py +0 -205
- unstructured_ingest/connector/airtable.py +0 -309
- unstructured_ingest/connector/astradb.py +0 -267
- unstructured_ingest/connector/azure_ai_search.py +0 -144
- unstructured_ingest/connector/biomed.py +0 -320
- unstructured_ingest/connector/chroma.py +0 -158
- unstructured_ingest/connector/clarifai.py +0 -122
- unstructured_ingest/connector/confluence.py +0 -285
- unstructured_ingest/connector/databricks_volumes.py +0 -137
- unstructured_ingest/connector/delta_table.py +0 -203
- unstructured_ingest/connector/discord.py +0 -180
- unstructured_ingest/connector/elasticsearch.py +0 -396
- unstructured_ingest/connector/fsspec/azure.py +0 -78
- unstructured_ingest/connector/fsspec/box.py +0 -109
- unstructured_ingest/connector/fsspec/dropbox.py +0 -160
- unstructured_ingest/connector/fsspec/fsspec.py +0 -359
- unstructured_ingest/connector/fsspec/gcs.py +0 -82
- unstructured_ingest/connector/fsspec/s3.py +0 -62
- unstructured_ingest/connector/fsspec/sftp.py +0 -81
- unstructured_ingest/connector/git.py +0 -124
- unstructured_ingest/connector/github.py +0 -174
- unstructured_ingest/connector/gitlab.py +0 -142
- unstructured_ingest/connector/google_drive.py +0 -348
- unstructured_ingest/connector/hubspot.py +0 -278
- unstructured_ingest/connector/jira.py +0 -469
- unstructured_ingest/connector/kafka.py +0 -293
- unstructured_ingest/connector/local.py +0 -139
- unstructured_ingest/connector/mongodb.py +0 -284
- unstructured_ingest/connector/notion/client.py +0 -248
- unstructured_ingest/connector/notion/connector.py +0 -469
- unstructured_ingest/connector/notion/helpers.py +0 -584
- unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -40
- unstructured_ingest/connector/notion/types/blocks/callout.py +0 -94
- unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -23
- unstructured_ingest/connector/notion/types/blocks/code.py +0 -43
- unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -35
- unstructured_ingest/connector/notion/types/blocks/divider.py +0 -22
- unstructured_ingest/connector/notion/types/blocks/heading.py +0 -37
- unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -24
- unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -29
- unstructured_ingest/connector/notion/types/blocks/quote.py +0 -37
- unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -57
- unstructured_ingest/connector/notion/types/blocks/table.py +0 -63
- unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -23
- unstructured_ingest/connector/notion/types/blocks/template.py +0 -30
- unstructured_ingest/connector/notion/types/blocks/todo.py +0 -42
- unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -20
- unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -106
- unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -38
- unstructured_ingest/connector/notion/types/database_properties/date.py +0 -41
- unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -49
- unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -34
- unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -73
- unstructured_ingest/connector/notion/types/database_properties/people.py +0 -40
- unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -36
- unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -67
- unstructured_ingest/connector/notion/types/database_properties/select.py +0 -68
- unstructured_ingest/connector/notion/types/database_properties/status.py +0 -80
- unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -50
- unstructured_ingest/connector/notion/types/date.py +0 -26
- unstructured_ingest/connector/notion/types/file.py +0 -51
- unstructured_ingest/connector/notion/types/user.py +0 -76
- unstructured_ingest/connector/onedrive.py +0 -232
- unstructured_ingest/connector/opensearch.py +0 -218
- unstructured_ingest/connector/outlook.py +0 -285
- unstructured_ingest/connector/pinecone.py +0 -150
- unstructured_ingest/connector/qdrant.py +0 -144
- unstructured_ingest/connector/reddit.py +0 -166
- unstructured_ingest/connector/registry.py +0 -109
- unstructured_ingest/connector/salesforce.py +0 -301
- unstructured_ingest/connector/sharepoint.py +0 -573
- unstructured_ingest/connector/slack.py +0 -224
- unstructured_ingest/connector/sql.py +0 -199
- unstructured_ingest/connector/vectara.py +0 -253
- unstructured_ingest/connector/weaviate.py +0 -190
- unstructured_ingest/connector/wikipedia.py +0 -208
- unstructured_ingest/enhanced_dataclass/__init__.py +0 -4
- unstructured_ingest/enhanced_dataclass/core.py +0 -99
- unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -54
- unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -125
- unstructured_ingest/interfaces.py +0 -852
- unstructured_ingest/pipeline/copy.py +0 -19
- unstructured_ingest/pipeline/doc_factory.py +0 -12
- unstructured_ingest/pipeline/partition.py +0 -60
- unstructured_ingest/pipeline/permissions.py +0 -12
- unstructured_ingest/pipeline/reformat/chunking.py +0 -134
- unstructured_ingest/pipeline/reformat/embedding.py +0 -64
- unstructured_ingest/pipeline/source.py +0 -77
- unstructured_ingest/pipeline/utils.py +0 -6
- unstructured_ingest/pipeline/write.py +0 -18
- unstructured_ingest/processor.py +0 -93
- unstructured_ingest/runner/__init__.py +0 -104
- unstructured_ingest/runner/airtable.py +0 -35
- unstructured_ingest/runner/astradb.py +0 -34
- unstructured_ingest/runner/base_runner.py +0 -89
- unstructured_ingest/runner/biomed.py +0 -45
- unstructured_ingest/runner/confluence.py +0 -35
- unstructured_ingest/runner/delta_table.py +0 -34
- unstructured_ingest/runner/discord.py +0 -35
- unstructured_ingest/runner/elasticsearch.py +0 -40
- unstructured_ingest/runner/fsspec/azure.py +0 -30
- unstructured_ingest/runner/fsspec/box.py +0 -28
- unstructured_ingest/runner/fsspec/dropbox.py +0 -30
- unstructured_ingest/runner/fsspec/fsspec.py +0 -40
- unstructured_ingest/runner/fsspec/gcs.py +0 -28
- unstructured_ingest/runner/fsspec/s3.py +0 -28
- unstructured_ingest/runner/fsspec/sftp.py +0 -28
- unstructured_ingest/runner/github.py +0 -37
- unstructured_ingest/runner/gitlab.py +0 -37
- unstructured_ingest/runner/google_drive.py +0 -35
- unstructured_ingest/runner/hubspot.py +0 -35
- unstructured_ingest/runner/jira.py +0 -35
- unstructured_ingest/runner/kafka.py +0 -34
- unstructured_ingest/runner/local.py +0 -23
- unstructured_ingest/runner/mongodb.py +0 -34
- unstructured_ingest/runner/notion.py +0 -61
- unstructured_ingest/runner/onedrive.py +0 -35
- unstructured_ingest/runner/opensearch.py +0 -40
- unstructured_ingest/runner/outlook.py +0 -33
- unstructured_ingest/runner/reddit.py +0 -35
- unstructured_ingest/runner/salesforce.py +0 -33
- unstructured_ingest/runner/sharepoint.py +0 -35
- unstructured_ingest/runner/slack.py +0 -33
- unstructured_ingest/runner/utils.py +0 -47
- unstructured_ingest/runner/wikipedia.py +0 -35
- unstructured_ingest/runner/writers/__init__.py +0 -48
- unstructured_ingest/runner/writers/astradb.py +0 -22
- unstructured_ingest/runner/writers/azure_ai_search.py +0 -24
- unstructured_ingest/runner/writers/base_writer.py +0 -26
- unstructured_ingest/runner/writers/chroma.py +0 -22
- unstructured_ingest/runner/writers/clarifai.py +0 -19
- unstructured_ingest/runner/writers/databricks_volumes.py +0 -25
- unstructured_ingest/runner/writers/delta_table.py +0 -24
- unstructured_ingest/runner/writers/elasticsearch.py +0 -24
- unstructured_ingest/runner/writers/fsspec/azure.py +0 -24
- unstructured_ingest/runner/writers/fsspec/box.py +0 -21
- unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -21
- unstructured_ingest/runner/writers/fsspec/gcs.py +0 -19
- unstructured_ingest/runner/writers/fsspec/s3.py +0 -21
- unstructured_ingest/runner/writers/kafka.py +0 -21
- unstructured_ingest/runner/writers/mongodb.py +0 -21
- unstructured_ingest/runner/writers/opensearch.py +0 -26
- unstructured_ingest/runner/writers/pinecone.py +0 -21
- unstructured_ingest/runner/writers/qdrant.py +0 -19
- unstructured_ingest/runner/writers/sql.py +0 -22
- unstructured_ingest/runner/writers/vectara.py +0 -22
- unstructured_ingest/runner/writers/weaviate.py +0 -21
- unstructured_ingest/utils/google_filetype.py +0 -9
- unstructured_ingest/v2/__init__.py +0 -1
- unstructured_ingest/v2/cli/__init__.py +0 -0
- unstructured_ingest/v2/cli/base/__init__.py +0 -4
- unstructured_ingest/v2/cli/base/cmd.py +0 -269
- unstructured_ingest/v2/cli/base/dest.py +0 -85
- unstructured_ingest/v2/cli/base/src.py +0 -85
- unstructured_ingest/v2/cli/cli.py +0 -24
- unstructured_ingest/v2/cli/utils/__init__.py +0 -0
- unstructured_ingest/v2/logger.py +0 -126
- unstructured_ingest/v2/main.py +0 -11
- unstructured_ingest/v2/pipeline/__init__.py +0 -0
- unstructured_ingest/v2/pipeline/interfaces.py +0 -211
- unstructured_ingest/v2/pipeline/pipeline.py +0 -408
- unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
- unstructured_ingest/v2/processes/connectors/assets/__init__.py +0 -0
- unstructured_ingest/v2/processes/connectors/assets/databricks_delta_table_schema.sql +0 -10
- unstructured_ingest/v2/processes/connectors/assets/weaviate_collection_config.json +0 -23
- unstructured_ingest/v2/processes/connectors/notion/__init__.py +0 -0
- unstructured_ingest/v2/processes/connectors/notion/interfaces.py +0 -32
- unstructured_ingest/v2/processes/connectors/notion/types/__init__.py +0 -0
- unstructured_ingest/v2/processes/connectors/notion/types/block.py +0 -96
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/__init__.py +0 -63
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/breadcrumb.py +0 -21
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -31
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/child_page.py +0 -23
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/embed.py +0 -36
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/equation.py +0 -23
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/file.py +0 -49
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/image.py +0 -21
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/link_to_page.py +0 -29
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/paragraph.py +0 -31
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/pdf.py +0 -49
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/toggle.py +0 -37
- unstructured_ingest/v2/processes/connectors/notion/types/blocks/video.py +0 -22
- unstructured_ingest/v2/processes/connectors/notion/types/database.py +0 -73
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/created_by.py +0 -35
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/created_time.py +0 -34
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/email.py +0 -36
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/files.py +0 -37
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -34
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/number.py +0 -49
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/rich_text.py +0 -43
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/rollup.py +0 -56
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/title.py +0 -37
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/url.py +0 -37
- unstructured_ingest/v2/processes/connectors/notion/types/database_properties/verification.py +0 -78
- unstructured_ingest/v2/processes/connectors/notion/types/page.py +0 -45
- unstructured_ingest/v2/processes/connectors/notion/types/parent.py +0 -66
- unstructured_ingest/v2/processes/connectors/notion/types/rich_text.py +0 -189
- unstructured_ingest/v2/processes/connectors/zendesk/__init__.py +0 -0
- unstructured_ingest/v2/processes/utils/__init__.py +0 -0
- unstructured_ingest/v2/types/__init__.py +0 -0
- unstructured_ingest-0.6.4.dist-info/RECORD +0 -591
- {test/unit/v2 → examples}/__init__.py +0 -0
- /test/unit/{v2/chunkers → chunkers}/__init__.py +0 -0
- /test/unit/{v2/connectors → connectors}/__init__.py +0 -0
- /test/unit/{v2/connectors → connectors}/ibm_watsonx/__init__.py +0 -0
- /test/unit/{v2/connectors → connectors}/motherduck/__init__.py +0 -0
- /test/unit/{v2/connectors → connectors}/sql/__init__.py +0 -0
- /test/unit/{v2/embedders → embedders}/__init__.py +0 -0
- /test/unit/{v2/embedders → embedders}/test_bedrock.py +0 -0
- /test/unit/{v2/embedders → embedders}/test_mixedbread.py +0 -0
- /test/unit/{v2/embedders → embedders}/test_octoai.py +0 -0
- /test/unit/{v2/embedders → embedders}/test_openai.py +0 -0
- /test/unit/{v2/embedders → embedders}/test_togetherai.py +0 -0
- /test/unit/{v2/embedders → embedders}/test_voyageai.py +0 -0
- /test/unit/{v2/partitioners → partitioners}/__init__.py +0 -0
- /test/unit/{v2/utils → utils}/__init__.py +0 -0
- /test/unit/{v2/utils → utils}/data_generator.py +0 -0
- /unstructured_ingest/{v2/cli → cli}/base/importer.py +0 -0
- /unstructured_ingest/cli/{cmds/fsspec → utils}/__init__.py +0 -0
- /unstructured_ingest/{v2/cli → cli}/utils/click.py +0 -0
- /unstructured_ingest/{connector → data_types}/__init__.py +0 -0
- /unstructured_ingest/{v2/errors.py → errors_v2.py} +0 -0
- /unstructured_ingest/{v2/interfaces → interfaces}/__init__.py +0 -0
- /unstructured_ingest/{v2/interfaces → interfaces}/connector.py +0 -0
- /unstructured_ingest/{v2/interfaces → interfaces}/process.py +0 -0
- /unstructured_ingest/{v2/interfaces → interfaces}/processor.py +0 -0
- /unstructured_ingest/{connector/fsspec → pipeline/steps}/__init__.py +0 -0
- /unstructured_ingest/{v2/processes → processes}/__init__.py +0 -0
- /unstructured_ingest/{connector/notion → processes/connectors/assets}/__init__.py +0 -0
- /unstructured_ingest/{v2/processes → processes}/connectors/fsspec/utils.py +0 -0
- /unstructured_ingest/{connector/notion/types → processes/connectors/notion}/__init__.py +0 -0
- /unstructured_ingest/{ingest_backoff → processes/connectors/notion/ingest_backoff}/__init__.py +0 -0
- /unstructured_ingest/{ingest_backoff → processes/connectors/notion/ingest_backoff}/_common.py +0 -0
- /unstructured_ingest/{connector → processes/connectors}/notion/interfaces.py +0 -0
- /unstructured_ingest/{pipeline/reformat → processes/connectors/notion/types}/__init__.py +0 -0
- /unstructured_ingest/{connector → processes/connectors}/notion/types/blocks/__init__.py +0 -0
- /unstructured_ingest/{v2/processes → processes}/connectors/utils.py +0 -0
- /unstructured_ingest/{runner/fsspec → processes/connectors/zendesk}/__init__.py +0 -0
- /unstructured_ingest/{runner/writers/fsspec → processes/utils}/__init__.py +0 -0
- /unstructured_ingest/{v2 → utils}/constants.py +0 -0
- {unstructured_ingest-0.6.4.dist-info → unstructured_ingest-0.7.1.dist-info}/LICENSE.md +0 -0
- {unstructured_ingest-0.6.4.dist-info → unstructured_ingest-0.7.1.dist-info}/WHEEL +0 -0
- {unstructured_ingest-0.6.4.dist-info → unstructured_ingest-0.7.1.dist-info}/entry_points.txt +0 -0
|
@@ -0,0 +1,370 @@
|
|
|
1
|
+
examples/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
2
|
+
examples/airtable.py,sha256=4n6B8l_fmnlZLdk9SIfYticOTgZGQBjBfktNwFQf9Zc,1831
|
|
3
|
+
examples/azure_cognitive_search.py,sha256=KThZyRQ2HhTndBcGBn1dlr0FARB2PmBBRRnKJU5AuQU,2279
|
|
4
|
+
examples/chroma.py,sha256=fLqcpnbMAlJEe96SCMm17ZGOtcnaDQBGusURhLDwth8,2208
|
|
5
|
+
examples/couchbase.py,sha256=u4fmZb4eBYEcBgWCaWOKSxxxV1v-YpyaGG7J4ept1w0,2261
|
|
6
|
+
examples/databricks_volumes_dest.py,sha256=xoSVgmS4dNKOKGKtin0ojB20mO7vfCJ8FQ_DFIgMW-U,2329
|
|
7
|
+
examples/databricks_volumes_source.py,sha256=DT7PXW6CTOGSH5lzuZMfasjV6vgoG28R68I9Cb98JvQ,2278
|
|
8
|
+
examples/delta_table.py,sha256=0InvWFYZZt6TolYtWlKp9KliOnRxFNubInbwqlBWMIA,1898
|
|
9
|
+
examples/discord_example.py,sha256=ZNzKVxk7hfUF0qZdOLkh7fGItaiIdo6gh7JYhwr2vyQ,1624
|
|
10
|
+
examples/elasticsearch.py,sha256=KQXIYCE44w_CRZQGanlfP9ZY9NZ5gclxKKvtZnd-IRA,2129
|
|
11
|
+
examples/google_drive.py,sha256=iOjkC8iWQ3sqM3TTsL8Ng_yZbm2C5xfws1a9MTZuV7M,1677
|
|
12
|
+
examples/kdbai.py,sha256=W7yT2lnYOPbftqTiSHQNgWVwQC4UXJ8QhkPqSdiG_Co,2225
|
|
13
|
+
examples/local.py,sha256=WuN3SqxoXRlh2xhMZPh4R9EdCNfjQUhurAlGVqGuUF8,1569
|
|
14
|
+
examples/milvus.py,sha256=TKtH1Rxrj3Hr9d1BUx7qEK468Xb0ux7Ak1RukPXSOOo,1877
|
|
15
|
+
examples/mongodb.py,sha256=eP43TY-rjOeWnVk4m5jSSWJSWXcy6xRYFuLWusBZXws,2160
|
|
16
|
+
examples/opensearch.py,sha256=8YmQpvOB9HBQqoC47ht-lX34SpkoaDlezbQOHRG82cw,2103
|
|
17
|
+
examples/pinecone.py,sha256=URXalj5-0eTVnmfzD0icCB1brGklplU4P8l0jrawCjI,2479
|
|
18
|
+
examples/s3.py,sha256=23y_lPUkPo50rDMZC7cc3kBaSOf5pP_xl_7HO0Mb3c8,1742
|
|
19
|
+
examples/salesforce.py,sha256=tiO6hdRI79H_oORPnIf1FvB0IuGTYG2KzZlnqC_J9Cw,1888
|
|
20
|
+
examples/sharepoint.py,sha256=a0h2zU28m6bW5g17b8BDrcsHzdzjSgb--gYV80bRqs0,2067
|
|
21
|
+
examples/singlestore.py,sha256=UAdBOtIcmhyRkZ-pIh7rrY7Yt_Ed8t3puulZ-MhaSfU,2060
|
|
22
|
+
examples/sql.py,sha256=YSmLD7Ri2a8CvBxRJWxPQefqV4kV8kF3W0l3TXu_iyY,2997
|
|
23
|
+
examples/vectara.py,sha256=bWSsMQL3hEEt5CLR9CZFnuplrSAeLj_EiADipRU_Gkw,2247
|
|
24
|
+
examples/weaviate.py,sha256=QUtYJ-y7eYfm69T316-aUm1imQZnoSJ09RGSVQAoTck,1906
|
|
25
|
+
test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
26
|
+
test/integration/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
27
|
+
test/integration/utils.py,sha256=CWqzEGw6TA_ZoP9hRUkW64TWYssooBbufcTRmbJvod8,401
|
|
28
|
+
test/integration/chunkers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
29
|
+
test/integration/chunkers/test_chunkers.py,sha256=MTPVBCBvh54fBqi_53oPkrH9QJtvJeE9YEXDOZ8G0so,1059
|
|
30
|
+
test/integration/connectors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
31
|
+
test/integration/connectors/conftest.py,sha256=3weYhwyXyAVVk8DsLqScDOk-PZwsrHQLs1RdYa1EYqQ,1015
|
|
32
|
+
test/integration/connectors/test_astradb.py,sha256=1hFqd9NI283t6lQZryBJMfJoRfP6PKVHTl_6X3Nk0bM,9925
|
|
33
|
+
test/integration/connectors/test_azure_ai_search.py,sha256=NMSjIbFO1EWqr8U-Owd4qdC3pDROjg7zNAXr5yGSsH4,9699
|
|
34
|
+
test/integration/connectors/test_chroma.py,sha256=_K4CUp9x5O_Uuw1uwDi1R0jIvzcaW0wI8tXfAV1hh7c,4536
|
|
35
|
+
test/integration/connectors/test_confluence.py,sha256=3sAFQxRUrS7xXIQXQBccY0r5kihnP8rc_sAs-44g4Ys,3587
|
|
36
|
+
test/integration/connectors/test_delta_table.py,sha256=-ivYySHKgFRCd6PUIK-fy6yOkku3uj4YhDDEUlqi-tM,6915
|
|
37
|
+
test/integration/connectors/test_dropbox.py,sha256=sW-NOXA0-4xtAUgnSnPGg-OhiIhKviROJPpxUt8y8s8,4939
|
|
38
|
+
test/integration/connectors/test_github.py,sha256=wFWRFhfhTUz3byk2FSe9qVv7xMxcBjHGs1FlhjtnTAQ,1500
|
|
39
|
+
test/integration/connectors/test_google_drive.py,sha256=ceiFoVnaguTsQrLHZk8jv-IZ-i_EP4wenHSX-QKHvTM,10300
|
|
40
|
+
test/integration/connectors/test_jira.py,sha256=0FnxFe42d32EGuArfxxnfINkoYNoCsgJjP7ZU6fePu8,2073
|
|
41
|
+
test/integration/connectors/test_lancedb.py,sha256=E8yFuvQMx68w1s1PXIBP8gUlNuUpCtiGNYd7YnDA6Aw,9213
|
|
42
|
+
test/integration/connectors/test_milvus.py,sha256=_cYmJMocsZuUroalT5uc9rcsHFnTIpJyJjIwK8oDDYc,7177
|
|
43
|
+
test/integration/connectors/test_mongodb.py,sha256=wt5o-7qtMtjGv0IPKlhEnD3-sJjBX8cv1acn1Mcq-TY,12450
|
|
44
|
+
test/integration/connectors/test_neo4j.py,sha256=BSOqRTY4ZV8o6TV1MOmUKQq7DzRFU_z9umjDk-yw-Jg,8450
|
|
45
|
+
test/integration/connectors/test_notion.py,sha256=3OXFcSM-jE1_E_JoGw--pz-cv3dPZvt18scACJiHjwo,5397
|
|
46
|
+
test/integration/connectors/test_onedrive.py,sha256=0SZB818cNsxYZlBJJpuvU1PqsFDxRaOiLfJTRcc9Bv0,5233
|
|
47
|
+
test/integration/connectors/test_pinecone.py,sha256=0XBK9xxZhry6Rnv0s-chIWgtN5d1p8Lx-kEEQMNuAnA,13650
|
|
48
|
+
test/integration/connectors/test_qdrant.py,sha256=z3RThQJKzCafCtfH0ocy_DNDlzmDdu_opQH3mKTn0CE,8031
|
|
49
|
+
test/integration/connectors/test_redis.py,sha256=gUU6Dv616tX9KANiqhkMrPWvmhbV2Gk1pNuIv2MvZG8,5093
|
|
50
|
+
test/integration/connectors/test_s3.py,sha256=Cd9HsPjrSB6xss1DO4YHqSORJJ2pUXNVaAlrlpqjZS8,7477
|
|
51
|
+
test/integration/connectors/test_sharepoint.py,sha256=wq4G6J5ffXhYquUySVd5UUtYWC43RoXgCSY4fdlX2z0,7643
|
|
52
|
+
test/integration/connectors/test_vectara.py,sha256=08GIh6J2QTSuupdDOJ_TiyQrYYK3vamUaEQe3_B5-WY,9278
|
|
53
|
+
test/integration/connectors/test_zendesk.py,sha256=15bl3wy0pLxS2dkBlE11yPOX71k6Vbxo0BEFQK-qcFs,3724
|
|
54
|
+
test/integration/connectors/databricks/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
55
|
+
test/integration/connectors/databricks/test_volumes_native.py,sha256=RbxImt0JPnvl8TAK_rAtIspaFuRmEFzjL9rLqkm6Juk,9563
|
|
56
|
+
test/integration/connectors/discord/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
57
|
+
test/integration/connectors/discord/test_discord.py,sha256=WeB0ST572GvELMlgorRMwRxYIWkleIobXn6ULhjo1rw,3173
|
|
58
|
+
test/integration/connectors/duckdb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
59
|
+
test/integration/connectors/duckdb/conftest.py,sha256=rlBHMJTiJ2a5xbvIxTOyhhcuTBc9DO-yTzD6Kf8X3hY,301
|
|
60
|
+
test/integration/connectors/duckdb/test_duckdb.py,sha256=o3CKTG2T15QyWwPTh7Yyv42eJ39opm7g9b508y1o1m8,2973
|
|
61
|
+
test/integration/connectors/duckdb/test_motherduck.py,sha256=S2EtKVy4HE0ysB3OvdFOUe5O-0w5Bk4Loy2Gyyff8b0,3218
|
|
62
|
+
test/integration/connectors/elasticsearch/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
63
|
+
test/integration/connectors/elasticsearch/conftest.py,sha256=-i4_7MkIxSQENz7nuD2uHuhGU9mZ33vpeTPhHtRpQfs,989
|
|
64
|
+
test/integration/connectors/elasticsearch/test_elasticsearch.py,sha256=NUUL88Z7uWfnEopZ0wkQtWMA94WDZw87v_oCkPShVM4,12076
|
|
65
|
+
test/integration/connectors/elasticsearch/test_opensearch.py,sha256=nV3gHD_tb79KRE8DqfUWpOfzem9LjojACspUHTSI7dw,11454
|
|
66
|
+
test/integration/connectors/sql/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
67
|
+
test/integration/connectors/sql/test_databricks_delta_tables.py,sha256=hYfmT9ud6NqJk1pibaF-1LvNgrfXBGUq0FTHkcIvICE,6145
|
|
68
|
+
test/integration/connectors/sql/test_postgres.py,sha256=b0do75CAxKFEgoODx7mNQqo5vEgZbWHSifMNV_H2IgU,6974
|
|
69
|
+
test/integration/connectors/sql/test_singlestore.py,sha256=uuw_T8EefwMcRD7clzviJxwb45f9k4G2dZIYqbNhM1s,6157
|
|
70
|
+
test/integration/connectors/sql/test_snowflake.py,sha256=dNHR8fk5V1WsvN6P1CesPKCsRbKTuf6zXgjyf7vgueg,7498
|
|
71
|
+
test/integration/connectors/sql/test_sqlite.py,sha256=6By1-XKiGCA5KlR1DHlM6ArU5c_2GjM5mE2RhMoNPg8,5960
|
|
72
|
+
test/integration/connectors/sql/test_vastdb.py,sha256=A0W-kHl1GRf2zHCmTWXOJjV8HPi3xlWvCTKgjebVZUY,1066
|
|
73
|
+
test/integration/connectors/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
74
|
+
test/integration/connectors/utils/constants.py,sha256=JhTk6YNw7JVpkk-Pl8zn2YYkExeL1oE9VBWm_kMYGfo,369
|
|
75
|
+
test/integration/connectors/utils/docker.py,sha256=4g1STiSbYN5qcmDTXyPxVJgwx97O6wk7n-DJ-zgzgag,4971
|
|
76
|
+
test/integration/connectors/utils/docker_compose.py,sha256=GVTB6Cel05c0VQ2n4AwkQQx_cBfz13ZTs1HpbaYipNU,2223
|
|
77
|
+
test/integration/connectors/utils/validation/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
78
|
+
test/integration/connectors/utils/validation/destination.py,sha256=m5RHgZ3_h6HA2SsWbg15rmKhZjzsyKqOtFlUqpy33SI,2746
|
|
79
|
+
test/integration/connectors/utils/validation/equality.py,sha256=R6d_1c-Si5518WJcBcshF_wBRnywnZ0ORQ-NL0xNmGo,2602
|
|
80
|
+
test/integration/connectors/utils/validation/source.py,sha256=WX67a1tYpyUFXvSxxZrTLEkpyVqZiUXhAsJ11RQzcqQ,13701
|
|
81
|
+
test/integration/connectors/utils/validation/utils.py,sha256=xYYvAbqP6_lZyH09_JjB4w2Sf8aQPvDVT5vZTs05ILs,1428
|
|
82
|
+
test/integration/connectors/weaviate/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
83
|
+
test/integration/connectors/weaviate/conftest.py,sha256=6Q6QdrLJmGHowRFSmoVSzup2EX6qASfS2Z5tqlpTm9M,387
|
|
84
|
+
test/integration/connectors/weaviate/test_cloud.py,sha256=1r16tNUSsq8JawfjgeRWtcfw2COYma0b298mBDZU__o,1281
|
|
85
|
+
test/integration/connectors/weaviate/test_local.py,sha256=q8vSpmFeTapSoUSNChIpc6qfyMdcICo28CJSm7L7V-o,5337
|
|
86
|
+
test/integration/embedders/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
87
|
+
test/integration/embedders/conftest.py,sha256=B2W771RbijR7G_GybsCzRyIvOzXqzbKZdRIlNDd5AGY,334
|
|
88
|
+
test/integration/embedders/test_azure_openai.py,sha256=nQle565sZu9N4xjWHBOfiOFGtldOdIK6S1YID00hK78,1787
|
|
89
|
+
test/integration/embedders/test_bedrock.py,sha256=-hy4wPmgBpXrk7OtPbZ8IE0qip6Ht1GptGLpmpqHxiw,3550
|
|
90
|
+
test/integration/embedders/test_huggingface.py,sha256=jNNBpXUA_UpgXXVo_Q2xYGFaknIZJu8eKJ4ifq19eig,986
|
|
91
|
+
test/integration/embedders/test_mixedbread.py,sha256=0Mcq9JU9wAJ_Wz2Enwyz4qGSbivDDqmE6ZJxlZpMuWw,1993
|
|
92
|
+
test/integration/embedders/test_octoai.py,sha256=R6NcBxPL_sVJLGmVTEjsaxfqjnLWxViXwL6vaze666s,2194
|
|
93
|
+
test/integration/embedders/test_openai.py,sha256=iwk56ZK1gllFtatcp6W_PA7x9h2M2ReIg4GXIWXp5qo,2124
|
|
94
|
+
test/integration/embedders/test_togetherai.py,sha256=5PzIdnvjMpjods_rhUqQ2nbVRXgld_F7OGWssnHxa0I,2202
|
|
95
|
+
test/integration/embedders/test_vertexai.py,sha256=xpjauYnRBxOqft0HXEMFk1iRoeQJm7E2eSunZbjj_H4,1827
|
|
96
|
+
test/integration/embedders/test_voyageai.py,sha256=kcuGxhG6kR1XVqmTw7La3MXnIC06CtjOq_n48nkF-eQ,2411
|
|
97
|
+
test/integration/embedders/utils.py,sha256=Sqqg-X31ZV1hojqPQBaZgM2lb2u8cG6s6OnH9JRsFjs,2717
|
|
98
|
+
test/integration/partitioners/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
99
|
+
test/integration/partitioners/test_partitioner.py,sha256=UYQd9x2-66F_FFeulC_2eg3FtjswK0Mt9Hwmg4b_pPs,2784
|
|
100
|
+
test/unit/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
101
|
+
test/unit/test_error.py,sha256=RflmngCdFNKOLXVfLnUdNfY3Mfg3k7DTEzfIl0B-syU,840
|
|
102
|
+
test/unit/test_html.py,sha256=ubsck9pVOnPDFL0P8TZkko_46MIaFLlSNQcsgFDgYoE,4496
|
|
103
|
+
test/unit/test_interfaces.py,sha256=Gv3WMJsw_3xPLy3nI3dIcJuLa2WvKYszSjI_W9XLtVM,787
|
|
104
|
+
test/unit/test_logger.py,sha256=0SKndXE_VRd8XmUHkrj7zuBQHZscXx3ZQllMEOvtF9Y,2380
|
|
105
|
+
test/unit/test_utils.py,sha256=xeSM02zOChSOO3dzDOVAEiQme1rQ8drjnJF93S3BFmk,7247
|
|
106
|
+
test/unit/chunkers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
107
|
+
test/unit/chunkers/test_chunkers.py,sha256=wRxbSj7P1FwRGDyVcARkm8CQSVCBCro3nTe54UoUBzc,1769
|
|
108
|
+
test/unit/connectors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
109
|
+
test/unit/connectors/test_confluence.py,sha256=Hr91nKw6018FEih-vSrVXFk0p0E9bSL1IeZVDxvITJ0,1916
|
|
110
|
+
test/unit/connectors/test_jira.py,sha256=sPRjoBVDmc-o2RWilcjs-VW_jkafIqSXBE9duCELfoA,12110
|
|
111
|
+
test/unit/connectors/ibm_watsonx/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
112
|
+
test/unit/connectors/ibm_watsonx/test_ibm_watsonx_s3.py,sha256=Yj9swJ_phiam-CFBzGnAFCkd8_oqzdA3ZQJQdpV8T1E,14503
|
|
113
|
+
test/unit/connectors/motherduck/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
114
|
+
test/unit/connectors/motherduck/test_base.py,sha256=4SHI3Hx1a28eNE_VDbl8gAssNZRIUNSGPNZgrkzjYWs,2429
|
|
115
|
+
test/unit/connectors/sql/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
116
|
+
test/unit/connectors/sql/test_sql.py,sha256=SfWYDBrR7pHFziKVEe6IAq5E3EQIz99ikQN3LnF1DrY,4622
|
|
117
|
+
test/unit/embed/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
118
|
+
test/unit/embed/test_mixedbreadai.py,sha256=Z9A9jg5eJRF4OgYTgbIzQUI27J16uv2qj2kp_Rv0r9k,1428
|
|
119
|
+
test/unit/embed/test_octoai.py,sha256=CWVrieqJh-N40J9n3nzqQPLOH9T1_mldkpZYRiHKxrg,1055
|
|
120
|
+
test/unit/embed/test_openai.py,sha256=RQ-4QIcRvq0JSBFNit_NRcy61EsOv7xh_TcKJKHwHGM,1186
|
|
121
|
+
test/unit/embed/test_vertexai.py,sha256=k_dK-yR_yx1RAOpmAgfcPo-osRDJP9aRCMCsJmQPxYI,1050
|
|
122
|
+
test/unit/embed/test_voyageai.py,sha256=QWoDZEX8cAIkTgn4NtIyGKzOAu-GmudD4VMujnfi1Gg,983
|
|
123
|
+
test/unit/embedders/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
124
|
+
test/unit/embedders/test_bedrock.py,sha256=HMaweO_v_9Y1SE2m5QImXP73cb26vNTUfc1onTBa1-g,1074
|
|
125
|
+
test/unit/embedders/test_huggingface.py,sha256=BpMC_AMlifjNf4Y61yBNR_8UU3H_x3ut2NnpFuB4kDo,1543
|
|
126
|
+
test/unit/embedders/test_mixedbread.py,sha256=8yT942TVVXC5EkrT_ReZie1In537BaAD6esRjntgxuU,1021
|
|
127
|
+
test/unit/embedders/test_octoai.py,sha256=JMfrFz25QfEh0ieB4bJneZd4XtNcdPOnNsN1Fj7gU-Q,1012
|
|
128
|
+
test/unit/embedders/test_openai.py,sha256=HoEW95289Ijgo3PJ-pEaDOknfdkSjPXTgkXmE6jJomY,1012
|
|
129
|
+
test/unit/embedders/test_togetherai.py,sha256=s24V_geDNZzblU74sSdC_m4Lqlzjp00RMpy56ptfdx0,1009
|
|
130
|
+
test/unit/embedders/test_vertexai.py,sha256=4gLJaV9Nr2k_SgA-EyJ_sDvm8XvyGbn2zTs4F4CXU2g,1142
|
|
131
|
+
test/unit/embedders/test_voyageai.py,sha256=VaWthF64pmxc-fOBbAQsEzMw7tV4t4Nz_H_Cc5tuAYQ,1193
|
|
132
|
+
test/unit/partitioners/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
133
|
+
test/unit/partitioners/test_partitioner.py,sha256=eJoUDbiKtweyU1WYfsY5KqVqoPjbx1MUsyHkbvvTNEk,2275
|
|
134
|
+
test/unit/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
135
|
+
test/unit/utils/data_generator.py,sha256=UoYVNjG4S4wlaA9gceQ82HIpF9_6I1UTHD1_GrQBHp0,973
|
|
136
|
+
unstructured_ingest/__init__.py,sha256=U4S_2y3zgLZVfMenHRaJFBW8yqh2mUBuI291LGQVOJ8,35
|
|
137
|
+
unstructured_ingest/__version__.py,sha256=YP5dlQlaTHZ-KOck8o_UzdjIFae7iENB5d3AMIKlZ3M,42
|
|
138
|
+
unstructured_ingest/error.py,sha256=qDncnJgbf5ils956RcO2CGlAKYDT5OaEM9Clv1JVTNc,1448
|
|
139
|
+
unstructured_ingest/errors_v2.py,sha256=9RuRCi7lbDxCguDz07y5RiHoQiFIOWwOD7xqzJ2B3Yw,436
|
|
140
|
+
unstructured_ingest/logger.py,sha256=S5nSqGcABoQyeicgRnBQFjDScCaTvFVivOCvbo-laL0,4479
|
|
141
|
+
unstructured_ingest/main.py,sha256=82G_7eG4PNhc_xIqj4Y_sFbDV9VI-nwSfsfJQMzovMk,169
|
|
142
|
+
unstructured_ingest/otel.py,sha256=NsUqOolA0gt69eFhZLABjVpcKoM9aus-AbxIKqWqPTc,4127
|
|
143
|
+
unstructured_ingest/unstructured_api.py,sha256=hWUXUhGtyfi2OcDR-BriHJyT4jJywf4zfG1qpSCf9Bo,5002
|
|
144
|
+
unstructured_ingest/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
145
|
+
unstructured_ingest/cli/cli.py,sha256=ZeIE9jP8fe7260nE8v7xYgLdqX9OtkQXAXSGWIkHLcA,645
|
|
146
|
+
unstructured_ingest/cli/cmds.py,sha256=EhDW5UX4V-N8Svjba4w7YWnRYl26__ADwzNXrfFBxM4,483
|
|
147
|
+
unstructured_ingest/cli/base/__init__.py,sha256=zXCa7F4FMqItmzxfUIVmyI-CeGh8X85yF8lRxwX_OYQ,83
|
|
148
|
+
unstructured_ingest/cli/base/cmd.py,sha256=M5twsXAna8yOX250eTDDq-WX1kyqnkuwveEZg8MMxmo,11477
|
|
149
|
+
unstructured_ingest/cli/base/dest.py,sha256=DW3zhdEbXM04Xb7yCqAjxYCei1-gidgANDm7XPI5xXw,3153
|
|
150
|
+
unstructured_ingest/cli/base/importer.py,sha256=nRt0QQ3qpi264-n_mR0l55C2ddM8nowTNzT1jsWaam8,1128
|
|
151
|
+
unstructured_ingest/cli/base/src.py,sha256=IyMWZJ1IB-d7FYAZf5fUUPVeQqk9HHi8psA6Lbh9hDg,2535
|
|
152
|
+
unstructured_ingest/cli/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
153
|
+
unstructured_ingest/cli/utils/click.py,sha256=1_eJgrwS2DFBl1jZPLsj1vgVgR7agFBIEBe4A_n7mH4,7827
|
|
154
|
+
unstructured_ingest/cli/utils/model_conversion.py,sha256=hMjAfOVvO1RXTDsw26mmersdncvddkb_rP9JTEgVVCw,7649
|
|
155
|
+
unstructured_ingest/data_types/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
156
|
+
unstructured_ingest/data_types/file_data.py,sha256=J0RQa7YXhhxiLVzhPbF5Hl2nzSpxLFK9vrP6RTBWlSg,3833
|
|
157
|
+
unstructured_ingest/embed/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
158
|
+
unstructured_ingest/embed/azure_openai.py,sha256=_-I-nwd-wdCiKkSdYBL4UKrTZ2UPWsM_0T69fcObs_I,1707
|
|
159
|
+
unstructured_ingest/embed/bedrock.py,sha256=t58V_QQjWPO62CTuP0aLFMDisPeXpxG2xSFGUhN-JvI,7726
|
|
160
|
+
unstructured_ingest/embed/huggingface.py,sha256=-ZD17O_H_UnK80fqig6y6wNKJckjx0HuAkY5vgPvk8M,2259
|
|
161
|
+
unstructured_ingest/embed/interfaces.py,sha256=SdB3t8eMPB8CbXzOYBpgwjzTvyb4T19L61Sr6Jy3_rw,5099
|
|
162
|
+
unstructured_ingest/embed/mixedbreadai.py,sha256=-Y0J27G9CL1t3ZTIeNjTjRviErSMAzJRf2zgDgMHUmg,4499
|
|
163
|
+
unstructured_ingest/embed/octoai.py,sha256=136UzSuQgV8Nxel2pB8Iv-4AvlFU6RRCa7N64fWFl6o,3855
|
|
164
|
+
unstructured_ingest/embed/openai.py,sha256=hK98QXb_8oN1E-QwNT6JElzYOxG1mvZCFYQW57pjv0E,3372
|
|
165
|
+
unstructured_ingest/embed/togetherai.py,sha256=T0v0_yTovy3sSeLPvk3PJccqcnmqCc_vxYs6pumjK3I,2983
|
|
166
|
+
unstructured_ingest/embed/vertexai.py,sha256=WwCIebqdZTFfMyqhM0nlG3_oeU69A3GuX3Vo5ayng1I,3688
|
|
167
|
+
unstructured_ingest/embed/voyageai.py,sha256=84O49p-vQuQzhNndPIfwCYcCNBoHFIX9QHZvc8m5DdA,4496
|
|
168
|
+
unstructured_ingest/interfaces/__init__.py,sha256=QIkWqjsq9INTa89gPuXlMlQL4s3y5TqLmPkuVuTyXcs,795
|
|
169
|
+
unstructured_ingest/interfaces/connector.py,sha256=qUFFJ3qgDMenTCZMtVRjq1DIwsVak6pxNjQOH2eVkMw,1623
|
|
170
|
+
unstructured_ingest/interfaces/downloader.py,sha256=xX0ZzsFRSzZb7SAeoeQph8sIbVq13DRw-3MYkdADrY0,2918
|
|
171
|
+
unstructured_ingest/interfaces/indexer.py,sha256=c2FwWJEQHfFD6vO-tGfYLpLiIs-TYViLAt8YmHfDbaM,824
|
|
172
|
+
unstructured_ingest/interfaces/process.py,sha256=S3A_9gkwwGC-iQxvnpj3Er6IJAjAT5npzpSgxuFAzUM,449
|
|
173
|
+
unstructured_ingest/interfaces/processor.py,sha256=VX7JqXlbG1plxMK8THWhWINPbTICaaUEk4XUXhnOixY,3303
|
|
174
|
+
unstructured_ingest/interfaces/upload_stager.py,sha256=nsS8VgFX44YIaESneyXQfa-mQUsKzowVdhwLpJjWxGM,3137
|
|
175
|
+
unstructured_ingest/interfaces/uploader.py,sha256=6Ax-Qn7it0yKVdUBun5-lJ3jxISPEq2b2gLXpzJh5Lg,2038
|
|
176
|
+
unstructured_ingest/pipeline/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
177
|
+
unstructured_ingest/pipeline/interfaces.py,sha256=Um2dQoRVppiRRYWkKnvRrYI9HdkV229Tu8_y2HmEaCc,8646
|
|
178
|
+
unstructured_ingest/pipeline/otel.py,sha256=wUVmUPWIk_X3yw0MuI-5QJ2wU2rQgaapinnS98iQBxI,1082
|
|
179
|
+
unstructured_ingest/pipeline/pipeline.py,sha256=2DShnmC5Hn5_YVswKQwejgCr6JT7BixMDgSrOeQGogk,16785
|
|
180
|
+
unstructured_ingest/pipeline/steps/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
181
|
+
unstructured_ingest/pipeline/steps/chunk.py,sha256=LiJMzgB0ZEDnPuYz5IwuK2k2iJoBIcfftp9cVXMOlf0,3179
|
|
182
|
+
unstructured_ingest/pipeline/steps/download.py,sha256=cw8KbZ4CNZ_on4xam-VehNnLvKkUourazvcaUB-ihGY,8205
|
|
183
|
+
unstructured_ingest/pipeline/steps/embed.py,sha256=3DfiHCaEAr1kakPZKnBYLhK1xNaPH0HZCmGmY62R5OY,3157
|
|
184
|
+
unstructured_ingest/pipeline/steps/filter.py,sha256=-bchttmqdNKSORSbqOU8bnhYMlj9XD09INvF7y5MyEk,1199
|
|
185
|
+
unstructured_ingest/pipeline/steps/index.py,sha256=_mfLj-3rF0ym1ZN6D31lwkGvTHrYSfeAUxzztd6SZb8,3564
|
|
186
|
+
unstructured_ingest/pipeline/steps/partition.py,sha256=OA-5DrYn2OdjRyMRVKtt0agm14Sy0bwYeRpta2b3ZrI,3240
|
|
187
|
+
unstructured_ingest/pipeline/steps/stage.py,sha256=oobrvLtZOOPEnXQXMDUnhaaKhheuSp9KvhUXCG1J8jc,2334
|
|
188
|
+
unstructured_ingest/pipeline/steps/uncompress.py,sha256=clyZKwKQLLKbkQDD2q98Aw1UAe3VqUY0n7_KWtGVMSw,1756
|
|
189
|
+
unstructured_ingest/pipeline/steps/upload.py,sha256=4hvh--03jzbGlxO0l1_2D5ec_EaGu04I5bFsxH0MnTg,1986
|
|
190
|
+
unstructured_ingest/processes/__init__.py,sha256=FaHWSCGyc7GWVnAsNEUUj7L8hT8gCVY3_hUE2VzWtUg,462
|
|
191
|
+
unstructured_ingest/processes/chunker.py,sha256=HCZM294_EmA1nnPsGA0OYVN8oPkF-EkskzNmwuWH4iw,5600
|
|
192
|
+
unstructured_ingest/processes/connector_registry.py,sha256=PoNhB-qOxvalaN-ssPWWhZSQ9QDdKMa6KzskCYYebfA,2195
|
|
193
|
+
unstructured_ingest/processes/embedder.py,sha256=ViDf-zpoAadroxdYVzeM_g5sfXdvTu7qbgm-3RUQPNk,7884
|
|
194
|
+
unstructured_ingest/processes/filter.py,sha256=EaNmJkv598ok6JkyJMPGwnNPpmlXXepN-Po_nv_Y_so,2151
|
|
195
|
+
unstructured_ingest/processes/partitioner.py,sha256=BMwSLTVhTYsydZy7S55EQGf-d1G2HXPYovGc4sMhvLk,9911
|
|
196
|
+
unstructured_ingest/processes/uncompress.py,sha256=o9JL3Bza4KPUTmrB39-v_5SuK_fYwhwFAhjQi2Pm8h8,2426
|
|
197
|
+
unstructured_ingest/processes/connectors/__init__.py,sha256=cR4ZH2dpPod7QR6OsgMx8X9kpFcEc1TVfQndUNoKGzI,6812
|
|
198
|
+
unstructured_ingest/processes/connectors/airtable.py,sha256=NcXTGqtBvx83JvCakcczCkj8zkRIYXYBOTs7pL5phzs,8955
|
|
199
|
+
unstructured_ingest/processes/connectors/astradb.py,sha256=illjFV-INZ8iOTNPjvhbK2g1xHuuNM5Gr0Qoh7Xjjsk,18297
|
|
200
|
+
unstructured_ingest/processes/connectors/azure_ai_search.py,sha256=x5kBnC01YQ61Ndovmkft9gq9jPl2o8G_Dbs_butQ7Kk,11528
|
|
201
|
+
unstructured_ingest/processes/connectors/chroma.py,sha256=q5_Fu4xb6_W_NyrPxVa3-jVwZLqVdlBNlR4dFvbd7l0,7235
|
|
202
|
+
unstructured_ingest/processes/connectors/confluence.py,sha256=0yqnJBgawx58rog07jK7keJ6sfZ-UEz3hz0WMGksoOA,12091
|
|
203
|
+
unstructured_ingest/processes/connectors/couchbase.py,sha256=KCHoYDNya9B05NIB5D78zXoizFyfpJRepcYBe1nLSOs,12298
|
|
204
|
+
unstructured_ingest/processes/connectors/delta_table.py,sha256=ZiHiqZf81i_Hxwasde_sba7kDQjmjV5-Jvy-fOTIqLs,7279
|
|
205
|
+
unstructured_ingest/processes/connectors/discord.py,sha256=6yEJ_agfKUqsV43wFsbMkcd8lcLJC0uqbo4izjdZ3rU,5294
|
|
206
|
+
unstructured_ingest/processes/connectors/github.py,sha256=smHCz6jOH1p_hW2S25bYunBBj_pYjz8HTw6wkzaJz_A,7765
|
|
207
|
+
unstructured_ingest/processes/connectors/gitlab.py,sha256=t69yLnBd5NtcLYmluNDbcRU1tXi8zTM75ofEc1k4oAY,10032
|
|
208
|
+
unstructured_ingest/processes/connectors/google_drive.py,sha256=GfxnjBRSY_eZQd1OkkLfD8DCXuwMpmysQs1ZAE6vbD8,20057
|
|
209
|
+
unstructured_ingest/processes/connectors/jira.py,sha256=eG8yTn8ZVEz7rBJ-ha8i_d9hEh6VALN6QJT_vbYvbL0,17142
|
|
210
|
+
unstructured_ingest/processes/connectors/kdbai.py,sha256=EbaBNnFk21LzqtwBOHoDPdwVaIchAYXz7_mf061lTcQ,5119
|
|
211
|
+
unstructured_ingest/processes/connectors/local.py,sha256=LluTLKv4g7FbJb4A6vuSxI9VhzKZuuQUpDS-cVNAQ2g,7426
|
|
212
|
+
unstructured_ingest/processes/connectors/milvus.py,sha256=Jr9cul7By03tGAPFnFBoqncnNWwbhKd-qbmkuqnin8U,8908
|
|
213
|
+
unstructured_ingest/processes/connectors/mongodb.py,sha256=1g_5bfbS6lah3nsOXqLAanR3zNYJ47_Njw_uV-uj3_U,14324
|
|
214
|
+
unstructured_ingest/processes/connectors/neo4j.py,sha256=eAM2XWSLA5caKJmbcd7ctn2TapreIJEXRoHoxT1OZwA,18718
|
|
215
|
+
unstructured_ingest/processes/connectors/onedrive.py,sha256=VBkKlbJgR7uKlKTnjNybAw6ZawLKflDPpy2uVvgWYWw,19296
|
|
216
|
+
unstructured_ingest/processes/connectors/outlook.py,sha256=FfHV9OfajGbj5VQZccqHsSyYJ0f6a4CLGQJi1s9UJjo,9294
|
|
217
|
+
unstructured_ingest/processes/connectors/pinecone.py,sha256=TG-1hVfOsKFepxPfy2MCwEVBEZF4msg8lfNQZBpo35Y,13980
|
|
218
|
+
unstructured_ingest/processes/connectors/redisdb.py,sha256=5LX6KtuNCzqjHqnJPw0zdKLE0iLx7Dk5RN9e_KT-up4,6975
|
|
219
|
+
unstructured_ingest/processes/connectors/salesforce.py,sha256=a2Erx5pXbxKIj--oJWTGk2TeOcdmipuxgleazbD62o4,11664
|
|
220
|
+
unstructured_ingest/processes/connectors/sharepoint.py,sha256=PowaqMzWr-VCW1rnwcAeRhHyE55kJ9J9FCVlrmtzN0E,4827
|
|
221
|
+
unstructured_ingest/processes/connectors/slack.py,sha256=e4ntATdht_olAPsco1DKwlrOkpKLyDznPO1NJmsr0A8,9243
|
|
222
|
+
unstructured_ingest/processes/connectors/utils.py,sha256=TAd0hb1f291N-q7-TUe6JKSCGkhqDyo7Ij8zmliBZUc,2071
|
|
223
|
+
unstructured_ingest/processes/connectors/vectara.py,sha256=frKJkc7ffstQhXD9-HkAGoQAofGkl6AsnKJhGcl8LgA,12294
|
|
224
|
+
unstructured_ingest/processes/connectors/assets/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
225
|
+
unstructured_ingest/processes/connectors/databricks/__init__.py,sha256=RtKAPyNtXh6fzEsOQ08pA0-vC1uMr3KqYG6cqiBoo70,2133
|
|
226
|
+
unstructured_ingest/processes/connectors/databricks/volumes.py,sha256=OWQrne9-5hPzc-kxGa2P53M3DoksDzMDyjLhQyihdCo,8020
|
|
227
|
+
unstructured_ingest/processes/connectors/databricks/volumes_aws.py,sha256=RP9rq2sfysygiqzXj6eX0CXeZpxk65xmrz7HZnWRQWA,2961
|
|
228
|
+
unstructured_ingest/processes/connectors/databricks/volumes_azure.py,sha256=NOHsRbvG4IB-8HWlwvCw2uuJqEwcvz332NC2kSBUAH8,3746
|
|
229
|
+
unstructured_ingest/processes/connectors/databricks/volumes_gcp.py,sha256=89N7YqtW8nHFmiq4_D201Ib-zXTLYU98Ap71goGoNEY,2997
|
|
230
|
+
unstructured_ingest/processes/connectors/databricks/volumes_native.py,sha256=pivySGMmFSsyuB42ARAWAPXFQ7qTQxO3dfEoE23pBNM,3104
|
|
231
|
+
unstructured_ingest/processes/connectors/databricks/volumes_table.py,sha256=ctQSoStHR1P1alhIH84Mpqmw4Wtnt3FsmBG7iH14iPE,8214
|
|
232
|
+
unstructured_ingest/processes/connectors/duckdb/__init__.py,sha256=Dr6BRJJGefJnnp_vn5W5gBd7vrCCXTMLweuDIqTP-fM,558
|
|
233
|
+
unstructured_ingest/processes/connectors/duckdb/base.py,sha256=-8TKht_HCssKM8EBA6rszAB2GdbeGZ25Vbp-Y_gRTfI,2935
|
|
234
|
+
unstructured_ingest/processes/connectors/duckdb/duckdb.py,sha256=-C4gxvy52TFopc7LdIaJeNgBhx5UUH2DRABuyun5W9Y,4429
|
|
235
|
+
unstructured_ingest/processes/connectors/duckdb/motherduck.py,sha256=lxE7vyEj3lD3SdGwgfuMhZKvRPbynscPu9u_xukwM30,4692
|
|
236
|
+
unstructured_ingest/processes/connectors/elasticsearch/__init__.py,sha256=M8mmBWoP6J5R3hxg6BQUMexYlTUxUxdBoIcjUop8yt8,826
|
|
237
|
+
unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py,sha256=iNedi-JVkAvdF15CbKwVRwXJazyST6ha3zcNyyGwVmQ,19003
|
|
238
|
+
unstructured_ingest/processes/connectors/elasticsearch/opensearch.py,sha256=wggHvw8h-X0-3WPNxj9rt2xkrE7Pv7CV0B0KzTMzBB4,6944
|
|
239
|
+
unstructured_ingest/processes/connectors/fsspec/__init__.py,sha256=3HTdw4L4mdN4W8UX0jQbMxBg0ZfITPbEXU7Bwdo1BfI,1843
|
|
240
|
+
unstructured_ingest/processes/connectors/fsspec/azure.py,sha256=31VNiG5YnXfhrFX7QJ2O1ubeWHxbe1sYVIztefbscAQ,7148
|
|
241
|
+
unstructured_ingest/processes/connectors/fsspec/box.py,sha256=1gLS7xR2vbjgKBrQ4ZpI1fKTsJuIDfXuAzx_a4FzxG4,5873
|
|
242
|
+
unstructured_ingest/processes/connectors/fsspec/dropbox.py,sha256=HwwKjQmjM7yFk9Esh_F20xDisRPXGUkFduzaasByRDE,8355
|
|
243
|
+
unstructured_ingest/processes/connectors/fsspec/fsspec.py,sha256=13TJmipcz9mYQT6Qi4WmqUV3veHIhbLZIW_70qY-5tI,14469
|
|
244
|
+
unstructured_ingest/processes/connectors/fsspec/gcs.py,sha256=ouxISCKpZTAj3T6pWGYbASu93wytJjl5WSICvQcrgfE,7172
|
|
245
|
+
unstructured_ingest/processes/connectors/fsspec/s3.py,sha256=6tICE_qECwnWW7ViiF08Ax1y91EkDhfs8Bf-d7udJeA,7125
|
|
246
|
+
unstructured_ingest/processes/connectors/fsspec/sftp.py,sha256=pR_a2SgLjt8ffNkariHrPB1E0HVSTj5h3pt7KxTU3TI,6371
|
|
247
|
+
unstructured_ingest/processes/connectors/fsspec/utils.py,sha256=jec_Qfe2hbfahBuY-u8FnvHuv933AI5HwPFjOL3kEEY,456
|
|
248
|
+
unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py,sha256=kf0UpgdAY2KK1R1FbAB6GEBBAIOeYQ8cZIr3bp660qM,374
|
|
249
|
+
unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py,sha256=vTW12EN3WIYgxtonedamSNuwDPt8sPsbp0ehQ81enf4,11601
|
|
250
|
+
unstructured_ingest/processes/connectors/kafka/__init__.py,sha256=pFN2cWwAStiGTAsQ616GIWKi_hDv0s74ZvNqhJEp1Pc,751
|
|
251
|
+
unstructured_ingest/processes/connectors/kafka/cloud.py,sha256=Ki6iOLoZ86tYWdnLnMWYvb2hUCneKqo4mTJcfXh7YoQ,3432
|
|
252
|
+
unstructured_ingest/processes/connectors/kafka/kafka.py,sha256=7NMvWijfoliyAgnmz8TM8oJt5x7RDzC-ABPdYAm7J3w,10306
|
|
253
|
+
unstructured_ingest/processes/connectors/kafka/local.py,sha256=coYclqRVdiluhvLBnE8ZUj-tI9Rt88fQArFeL2vIh60,2575
|
|
254
|
+
unstructured_ingest/processes/connectors/lancedb/__init__.py,sha256=B_Qc9Ivi1xfNAk7_2TU3M-kkYxJ_Orl90KNWLt1ywaE,1250
|
|
255
|
+
unstructured_ingest/processes/connectors/lancedb/aws.py,sha256=zmnOMho11p30ibbLRlsJBuaCEEms1LftjjSvsyTj5tU,1404
|
|
256
|
+
unstructured_ingest/processes/connectors/lancedb/azure.py,sha256=UTcEjnMad8EgT2rRwG842Vinlyod6uWMhMfj1ULbRb4,1452
|
|
257
|
+
unstructured_ingest/processes/connectors/lancedb/cloud.py,sha256=ykhcCSUaw6VOpH6BKRFJlEIdLS0wZtdjLUi2TaeEzt0,1332
|
|
258
|
+
unstructured_ingest/processes/connectors/lancedb/gcp.py,sha256=4-3ZJ-I47chrVXmizDq_xHCFHBipoxZp8cvOGxVE6c8,1352
|
|
259
|
+
unstructured_ingest/processes/connectors/lancedb/lancedb.py,sha256=qyco2ZPcE-MqEO10UURyycBBOSQ6TJfm-f8A89a2pBk,5825
|
|
260
|
+
unstructured_ingest/processes/connectors/lancedb/local.py,sha256=rhRxoK-h1Q0wdRhUq8Y5y48fbkvvCcIbA4gZvtteHq4,1263
|
|
261
|
+
unstructured_ingest/processes/connectors/notion/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
262
|
+
unstructured_ingest/processes/connectors/notion/client.py,sha256=wmlkbuER2crKjrqYm1dJwrCe8qH9gX-R4yckg5GQ41I,13174
|
|
263
|
+
unstructured_ingest/processes/connectors/notion/connector.py,sha256=6dPNQQNkEaFMbztVe6fkuB29hnCSBpm3gkacoH6VTNA,13310
|
|
264
|
+
unstructured_ingest/processes/connectors/notion/helpers.py,sha256=Z4qjdsdFyrgE0KwE8gDZdZ88LsP_NYQit697Po6w878,16424
|
|
265
|
+
unstructured_ingest/processes/connectors/notion/interfaces.py,sha256=SrTT-9c0nvk0fMqVgudYF647r04AdMKi6wkIkMy7Szw,563
|
|
266
|
+
unstructured_ingest/processes/connectors/notion/ingest_backoff/__init__.py,sha256=cfdIJuZDFcF3w84sTyYqZ8vXnSMfMABXFc100r3g5kU,63
|
|
267
|
+
unstructured_ingest/processes/connectors/notion/ingest_backoff/_common.py,sha256=ey0PN6Hf7aEpQQau710EHlEmQ3hq4YyYzgNLhPzzK58,3724
|
|
268
|
+
unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py,sha256=uZDljTCBIJ-9QNSw_TB2FJUJ37Noi9ev-ipyfGtGcjk,4181
|
|
269
|
+
unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py,sha256=CvNAL5YXPbGpa9ynH0R4c-yUTh-cFSFYtVViY_NV7RA,926
|
|
270
|
+
unstructured_ingest/processes/connectors/notion/types/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
271
|
+
unstructured_ingest/processes/connectors/notion/types/block.py,sha256=pEhy3fFCXSRd3HjRV2k5tT9dcMGNZE4G4Jjg9dPF0iM,3072
|
|
272
|
+
unstructured_ingest/processes/connectors/notion/types/database.py,sha256=4VNhpX06dGKmA-COLLzh-sfdSoxQzdUxl1Sk05_B258,2636
|
|
273
|
+
unstructured_ingest/processes/connectors/notion/types/date.py,sha256=VNLs5nTAIGWKxkFUwE13Yoeo5kVQiI-bxUVhjW9SWhE,753
|
|
274
|
+
unstructured_ingest/processes/connectors/notion/types/file.py,sha256=MpEWi7OE0mpA3efq11HJQJTlaVpMMM8cXVE_Pk0m0kg,1315
|
|
275
|
+
unstructured_ingest/processes/connectors/notion/types/page.py,sha256=0fExZsJHXBzaRLwJAKpZwtnfQf_gZ7KnTIbyIyDYC4Q,1471
|
|
276
|
+
unstructured_ingest/processes/connectors/notion/types/parent.py,sha256=l-EJBKU0HNpDg7p87cATqw0WlUSATD9btyVF7B2A2nI,1706
|
|
277
|
+
unstructured_ingest/processes/connectors/notion/types/rich_text.py,sha256=LPeyFconK_-8Kl3DSLFiCmxwXH3LWthBiYSzj4FAJKY,5483
|
|
278
|
+
unstructured_ingest/processes/connectors/notion/types/user.py,sha256=AKV2ZUcOPe8a98VmyOEaQf-ow6lR5kzudvmTH9BJTKU,1824
|
|
279
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/__init__.py,sha256=mp-jlTLXntT94jdG3koguXTwQ4q_a-ZRR9M_yYew3Jc,1505
|
|
280
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py,sha256=-SDNODMDsp92-YGtKR0ZDAdcWJ7v-YMyrXf2iat-9oU,1191
|
|
281
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py,sha256=uR2EwXyAMCBSj-nG4Vp_biZg4CMNXQt4HVwCUS2K08Q,493
|
|
282
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py,sha256=VyP0l6mNk4-u9vWQOC0Y_lkKhv81b7z74UMcCSiycbo,993
|
|
283
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/callout.py,sha256=MUi8TSn2fL-mfd-yiwOEG5nvjN550YzFAiwSC88UBGA,2619
|
|
284
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py,sha256=0HkAZHFQtRa8rN48JW7x2pJzvJScjCl5yDhmym8UPHc,544
|
|
285
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py,sha256=r4fp_O0NYP4UxUfncJdhOGl7C_spprqzq3etK9tILIE,564
|
|
286
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/code.py,sha256=DkhXFYkNzSswwuGh0it4p-RucTAuQPPxPuyEUj09OkI,1404
|
|
287
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py,sha256=6xGe2rdXFrYIrJVl_j9S-lMVnUiJ_yUS500gcZ6ZQ5s,765
|
|
288
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/divider.py,sha256=olfRUhY2lrrC-M2a2QlFwIq5yuFKLbd2l4pyrvyAyC4,576
|
|
289
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/embed.py,sha256=jraPIVEmHmBzzkCz6u5FPa-k46_EGWgjWvuGY3ysG6o,1113
|
|
290
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/equation.py,sha256=8jlcHwF5nrt_2xVHb_g5xjQ-__Wz2vhXJr-oNwF4BQU,548
|
|
291
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/file.py,sha256=LbrdGg1cbUz9EZk1o97lBPrlijLb_SZS7REhveWgrGo,1725
|
|
292
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/heading.py,sha256=e8RWpxBwI9Ffkg25Hv76mhO_wERlu-EJl7XNk_nWUIY,1157
|
|
293
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/image.py,sha256=D3aQ5IgFs12GRM19ePG7ZXpbDQkcqlToy4fEruAR9XA,658
|
|
294
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py,sha256=AL2MGHVJQa3E1-HqBQtnrowCGvnHMboqWVlV1a-teHY,591
|
|
295
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py,sha256=nH8ETMhlRl5JZ6cSN3Iknlv9DvoCYfO7zTNxw_dlh9s,756
|
|
296
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py,sha256=QzcGKjtz6uAyx6BesBDwE6e8A9heBU0G4Y269gSOpjM,959
|
|
297
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py,sha256=qvc4orjP2XcbaeBWor-a3xAEglLkyb-epknm7SXgU1E,992
|
|
298
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py,sha256=St43RmpefAzDwJKTwz2CdGVm-xeUwHkYgtQtLYQbnw0,1661
|
|
299
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/quote.py,sha256=yl7npmdcO6oFNgTNGVN_Ihvzexv12Xwg1r4NWAOjILQ,1176
|
|
300
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py,sha256=Rc3xyKtnOwovx-O-dzmS9pX0h4-s41YnWmmEz5TYxdU,1333
|
|
301
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/table.py,sha256=eYUlRp4uCwjy_eB0mLh7MGMe1qrr_hnOxXS5RfUM2DQ,1724
|
|
302
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py,sha256=bR5DdecXFz468okM5WOs10DK8_14Dj7OCLSRusMZzsk,534
|
|
303
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/template.py,sha256=bq2Vh2X7ptpofs9OZnATHySZe2DzbOLsNNfpEI70NgM,968
|
|
304
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/todo.py,sha256=Kigaah1060H-YG4MWhKqlsOcBEQs1iYtknZa181jzDk,1386
|
|
305
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py,sha256=6ae_eR3SOfUgTw-XO_F3JRBaczSp8UZfLBFMRMO5NHo,1188
|
|
306
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py,sha256=q_p9XH8sQB8xwFqi9yEl6Fvur3fTLdeVdQCh0gSju58,442
|
|
307
|
+
unstructured_ingest/processes/connectors/notion/types/blocks/video.py,sha256=XK-O7XPs5ejTUWrg2FTLvbOZajs-yDtVhR79HSEcxvo,779
|
|
308
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py,sha256=iUdtLGlHe52daXBWVlGghXcGSxCOCDiFASsuKb4_UAM,3225
|
|
309
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py,sha256=1GiebXsYYoQmM1GZJBrzv9dnM9P9dtQJ-dwbQDo6PdI,1010
|
|
310
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py,sha256=NvOuM_1SVBdn-6acYxKJ1ThMuWJ935aYtaKV1TOBTFQ,949
|
|
311
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py,sha256=HPf6Dp7wWWRQ-j7AGFWMm-wkakuJ4R8_rfz9RPNZuec,834
|
|
312
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/date.py,sha256=5nYyh8S9HzFyZb2bZZttSZj8CE0Q2dc73cA27m-H1k4,1067
|
|
313
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/email.py,sha256=0powD6-ZftD0WSHxjTHMQ388RK-WfWLaYuEJIT19mdM,831
|
|
314
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/files.py,sha256=1-Jnx1YyWptNW3737oOzr7WGItS7aNj68BYaWyBRljo,1020
|
|
315
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py,sha256=LV9d6NRLGu7eIr6wpfnkLxgQug107LGAFC1Z9ooc3xw,1069
|
|
316
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py,sha256=1TMFWA5GIb6pJbYAF_Q2ZPOWNa9y0p8ELk6UzLMZ2FY,926
|
|
317
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py,sha256=MvZgXTBx1uS-vn9vITFCIRPFnV26_rcao1YhBiZu5bU,864
|
|
318
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py,sha256=WnEJyDmEaI39ETopeoXwFp6Iog-rF2TYWG3o-DRv2ic,1917
|
|
319
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/number.py,sha256=LbrTryg5z8Q1dLekxwXi_qCvOwH6n_LD4iVYsVBNGB4,1056
|
|
320
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/people.py,sha256=LXNbhBo53Lf7jM_bLYgarwLao7ymEJjZhJ-U5xMBbLc,1184
|
|
321
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py,sha256=NoIVkd31mvvZYa0DOkE4JibJdhJjIEL8C78jNxcxtVo,909
|
|
322
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py,sha256=e4zQmjtP2w1RNfKDaWu2-AOhwjM_QP_TrjyxAQUnpN4,1528
|
|
323
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py,sha256=EeWvzLx9zYT3crH_eshAOf1L60k5gMqJUqQGiI-is7c,1171
|
|
324
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py,sha256=xyaA2yIvDfe-tu_TXi6ZjCz2jCawFS2DVKvfSr-nxjQ,1277
|
|
325
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/select.py,sha256=wF-V5JKzi4y3i1-eE6kXQWeSbqYo33D1LXdXJIpTkyM,1756
|
|
326
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/status.py,sha256=GneqbmGaBqOecoApH6I4YWf5flvuVk2m5wMJrRw7Nvo,2044
|
|
327
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/title.py,sha256=4Tnfxxx_Nr-Wkwd7urotp1xTGO9itWe8qI3OnfooLrE,1023
|
|
328
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py,sha256=i95msSj2-l3yG8tw02dIChADDEy695MWmNWXJq0jGD4,1173
|
|
329
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/url.py,sha256=azWD7VwkYlI4vFYgsuMvr2618skr4MCtagSTuJ509bg,873
|
|
330
|
+
unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py,sha256=bge_vjWUYh9-CJ_gmVg7ESVLAxHeq_wicp-6vlqNRwQ,2367
|
|
331
|
+
unstructured_ingest/processes/connectors/qdrant/__init__.py,sha256=7WN_3M3qQ0O7pUJSXIKtPqAvKX2tQ_WxClCHbFeqPfc,757
|
|
332
|
+
unstructured_ingest/processes/connectors/qdrant/cloud.py,sha256=H5Plp2xqFheESLertj56o78CL4exyCQhBDE1TGAzcWU,1618
|
|
333
|
+
unstructured_ingest/processes/connectors/qdrant/local.py,sha256=3b43kSVoGMcFWTRiIHMPcctKyVBdsaLi8KXloAwq76o,1582
|
|
334
|
+
unstructured_ingest/processes/connectors/qdrant/qdrant.py,sha256=1Y1-nfKqt4YooqKMqRKVE_ItV0S1v__PTaEhI3vvtOE,5456
|
|
335
|
+
unstructured_ingest/processes/connectors/qdrant/server.py,sha256=biyF4xr6e7CH0loj_OPt02Xrx4DMkkxqYMAsVXuJ5-Q,1607
|
|
336
|
+
unstructured_ingest/processes/connectors/sql/__init__.py,sha256=WNO7jSL1ABw7K5IxLc-eeKWGGJDk7jCp_OTLdTTkZug,2056
|
|
337
|
+
unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py,sha256=9fu-SmBkkrhxF6gC2FFd7tAsPoTswtM3YlMw3fYGjB4,9084
|
|
338
|
+
unstructured_ingest/processes/connectors/sql/postgres.py,sha256=MY_jDMdXj82UsGQDcpMbMDnl7wpNuyFaHh1_QxJtFv4,5115
|
|
339
|
+
unstructured_ingest/processes/connectors/sql/singlestore.py,sha256=162FnOvQ9fERUUQarfiHfTTimLj_5y5MoBl8j0toCtA,5702
|
|
340
|
+
unstructured_ingest/processes/connectors/sql/snowflake.py,sha256=92PZYhAGEwbhMJ-tqwfAqfLH59BTZ3rZZn5az6GhAKw,9367
|
|
341
|
+
unstructured_ingest/processes/connectors/sql/sql.py,sha256=uUPTJYuUDrivRd8Z66NA-JXLXJo4dsYbBwfotxFp2kI,15722
|
|
342
|
+
unstructured_ingest/processes/connectors/sql/sqlite.py,sha256=mpzthGrRjVtGsmm7E_eCZzxuLUtpgxki0lx1y7s8l5I,5310
|
|
343
|
+
unstructured_ingest/processes/connectors/sql/vastdb.py,sha256=vXYQ5it2uK-PjvKduBQa31MI4y6vAD60-gGE3hp6dPc,9605
|
|
344
|
+
unstructured_ingest/processes/connectors/weaviate/__init__.py,sha256=1Vnz8hm_Cf3NkQUTz5ZD4QkbLSVql4UvRoY2j2FnC9k,853
|
|
345
|
+
unstructured_ingest/processes/connectors/weaviate/cloud.py,sha256=tDQ4Vfph1RwADzS0Lk4TSoeT6TZ2gX9DNi78yXkgDw0,6245
|
|
346
|
+
unstructured_ingest/processes/connectors/weaviate/embedded.py,sha256=buizqBd6PSbd9VgRrOj43GZEorBpDFkUIkE6sN9emhw,3008
|
|
347
|
+
unstructured_ingest/processes/connectors/weaviate/local.py,sha256=4fgZsL9dgnWuaSNqVlKROm-S3Ql3naLmKvigLBgUQdw,2195
|
|
348
|
+
unstructured_ingest/processes/connectors/weaviate/weaviate.py,sha256=SqtGcQgejGH0N1R49tGrUtGcTB8mt7sywXmWFTIcpB8,12866
|
|
349
|
+
unstructured_ingest/processes/connectors/zendesk/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
350
|
+
unstructured_ingest/processes/connectors/zendesk/client.py,sha256=GvPIpx4aYdD58-edHgvCFjFao94uR0O5Yf4dT9NCmSk,11952
|
|
351
|
+
unstructured_ingest/processes/connectors/zendesk/zendesk.py,sha256=kBBiSmP4_2Z8mdOzHRXK1vE-i0xvrLLn5E3rRdThxwg,9035
|
|
352
|
+
unstructured_ingest/processes/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
353
|
+
unstructured_ingest/processes/utils/blob_storage.py,sha256=4pY2MMdw7ib_taAshZxFLlhxaRnrrJFndHDDt09qhTM,1013
|
|
354
|
+
unstructured_ingest/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
355
|
+
unstructured_ingest/utils/chunking.py,sha256=9b3sXMA6L8RW5xAkKQbwdtVudGLAcj_sgT6Grh5tyYM,1870
|
|
356
|
+
unstructured_ingest/utils/compression.py,sha256=_BkFREoa0fkJ6z-1lY76HCmy8mLymbPCg55iMUQTd5c,2653
|
|
357
|
+
unstructured_ingest/utils/constants.py,sha256=pDspTYz-nEojHBqrZNfssGEiujmVa02pIWL63PQP9sU,103
|
|
358
|
+
unstructured_ingest/utils/data_prep.py,sha256=s4i_P5VYcOk9O1rsAfSiFpWdxfnc02WfQf5j3iOdiVo,8150
|
|
359
|
+
unstructured_ingest/utils/dep_check.py,sha256=SXXcUna2H0RtxA6j1S2NGkvQa9JP2DujWhmyBa7776Y,2400
|
|
360
|
+
unstructured_ingest/utils/html.py,sha256=0WduP8tI5S3nHFQi6XHNPHgsIC9j3iWwyIayX9gDLiE,6386
|
|
361
|
+
unstructured_ingest/utils/ndjson.py,sha256=nz8VUOPEgAFdhaDOpuveknvCU4x82fVwqE01qAbElH0,1201
|
|
362
|
+
unstructured_ingest/utils/pydantic_models.py,sha256=BT_j15e4rX40wQbt8LUXbqfPhA3rJn1PHTI_G_A_EHY,1720
|
|
363
|
+
unstructured_ingest/utils/string_and_date_utils.py,sha256=QBj8HXZGvDZQSULLOQwJ8tb3r2aYrTBQ71rkiV6gZdI,2519
|
|
364
|
+
unstructured_ingest/utils/table.py,sha256=WZechczgVFvlodUWFcsnCGvBNh1xRm6hr0VbJTPxKAc,3669
|
|
365
|
+
unstructured_ingest-0.7.1.dist-info/LICENSE.md,sha256=SxkKP_62uIAKb9mb1eH7FH4Kn2aYT09fgjKpJt5PyTk,11360
|
|
366
|
+
unstructured_ingest-0.7.1.dist-info/METADATA,sha256=Ex_8EkItZzbGEoRJwR7Fqm_t0aajIZLVdtzwL7XBsQw,15050
|
|
367
|
+
unstructured_ingest-0.7.1.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
|
|
368
|
+
unstructured_ingest-0.7.1.dist-info/entry_points.txt,sha256=gUAAFnjFPnBgThJSEbw0N5ZjxtaKlT1s9e05_arQrNw,70
|
|
369
|
+
unstructured_ingest-0.7.1.dist-info/top_level.txt,sha256=85vUyT6fV2A5eCEM3M3FPRUUI9vZOVK1xVZt7eo1oV8,34
|
|
370
|
+
unstructured_ingest-0.7.1.dist-info/RECORD,,
|
test/unit/v2/test_utils.py
DELETED
|
@@ -1,82 +0,0 @@
|
|
|
1
|
-
import json
|
|
2
|
-
from typing import Any
|
|
3
|
-
|
|
4
|
-
from pydantic import BaseModel, Field, Secret, SecretStr
|
|
5
|
-
from pydantic.types import _SecretBase
|
|
6
|
-
|
|
7
|
-
from unstructured_ingest.v2.utils import serialize_base_model, serialize_base_model_json
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
class MockChildBaseModel(BaseModel):
|
|
11
|
-
child_secret_str: SecretStr
|
|
12
|
-
child_secret_float: Secret[float]
|
|
13
|
-
child_not_secret_dict: dict[str, Any] = Field(default_factory=dict)
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
class MockBaseModel(BaseModel):
|
|
17
|
-
secret_str: SecretStr
|
|
18
|
-
not_secret_bool: bool
|
|
19
|
-
secret_child_base: Secret[MockChildBaseModel]
|
|
20
|
-
not_secret_list: list[int] = Field(default_factory=list)
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
model = MockBaseModel(
|
|
24
|
-
secret_str="secret string",
|
|
25
|
-
not_secret_bool=False,
|
|
26
|
-
secret_child_base=MockChildBaseModel(
|
|
27
|
-
child_secret_str="child secret string",
|
|
28
|
-
child_secret_float=3.14,
|
|
29
|
-
child_not_secret_dict={"key": "value"},
|
|
30
|
-
),
|
|
31
|
-
not_secret_list=[1, 2, 3],
|
|
32
|
-
)
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
def test_serialize_base_model():
|
|
36
|
-
|
|
37
|
-
serialized_dict = model.model_dump()
|
|
38
|
-
assert isinstance(serialized_dict["secret_str"], _SecretBase)
|
|
39
|
-
assert isinstance(serialized_dict["secret_child_base"], _SecretBase)
|
|
40
|
-
|
|
41
|
-
serialized_dict_w_secrets = serialize_base_model(model=model)
|
|
42
|
-
assert not isinstance(serialized_dict_w_secrets["secret_str"], _SecretBase)
|
|
43
|
-
assert not isinstance(serialized_dict_w_secrets["secret_child_base"], _SecretBase)
|
|
44
|
-
|
|
45
|
-
expected_dict = {
|
|
46
|
-
"secret_str": "secret string",
|
|
47
|
-
"not_secret_bool": False,
|
|
48
|
-
"secret_child_base": {
|
|
49
|
-
"child_secret_str": "child secret string",
|
|
50
|
-
"child_secret_float": 3.14,
|
|
51
|
-
"child_not_secret_dict": {"key": "value"},
|
|
52
|
-
},
|
|
53
|
-
"not_secret_list": [1, 2, 3],
|
|
54
|
-
}
|
|
55
|
-
|
|
56
|
-
assert serialized_dict_w_secrets == expected_dict
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
def test_serialize_base_model_json():
|
|
60
|
-
serialized_json = model.model_dump_json()
|
|
61
|
-
serialized_dict = json.loads(serialized_json)
|
|
62
|
-
expected_dict = {
|
|
63
|
-
"secret_str": "**********",
|
|
64
|
-
"not_secret_bool": False,
|
|
65
|
-
"secret_child_base": "**********",
|
|
66
|
-
"not_secret_list": [1, 2, 3],
|
|
67
|
-
}
|
|
68
|
-
assert expected_dict == serialized_dict
|
|
69
|
-
|
|
70
|
-
serialized_json_w_secrets = serialize_base_model_json(model=model)
|
|
71
|
-
serialized_dict_w_secrets = json.loads(serialized_json_w_secrets)
|
|
72
|
-
expected_dict_w_secrets = {
|
|
73
|
-
"secret_str": "secret string",
|
|
74
|
-
"not_secret_bool": False,
|
|
75
|
-
"secret_child_base": {
|
|
76
|
-
"child_secret_str": "child secret string",
|
|
77
|
-
"child_secret_float": 3.14,
|
|
78
|
-
"child_not_secret_dict": {"key": "value"},
|
|
79
|
-
},
|
|
80
|
-
"not_secret_list": [1, 2, 3],
|
|
81
|
-
}
|
|
82
|
-
assert expected_dict_w_secrets == serialized_dict_w_secrets
|
|
@@ -1,12 +0,0 @@
|
|
|
1
|
-
import typing as t
|
|
2
|
-
|
|
3
|
-
from unstructured_ingest.cli.base.src import BaseSrcCmd
|
|
4
|
-
from unstructured_ingest.cli.cmds import base_src_cmd_fns
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
def get_src_cmd_map() -> t.Dict[str, t.Callable[[], BaseSrcCmd]]:
|
|
8
|
-
return {b().cmd_name_key: b for b in base_src_cmd_fns}
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
def get_src_cmd(cmd_name: str) -> t.Callable[[], BaseSrcCmd]:
|
|
12
|
-
return get_src_cmd_map()[cmd_name]
|
|
@@ -1,145 +0,0 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
|
-
import collections
|
|
4
|
-
import typing as t
|
|
5
|
-
|
|
6
|
-
from unstructured_ingest.cli.base.src import BaseSrcCmd
|
|
7
|
-
from unstructured_ingest.cli.cmds.fsspec.sftp import get_base_src_cmd as sftp_base_src_cmd
|
|
8
|
-
|
|
9
|
-
from .airtable import get_base_src_cmd as airtable_base_src_cmd
|
|
10
|
-
from .astradb import get_base_dest_cmd as astradb_base_dest_cmd
|
|
11
|
-
from .astradb import get_base_src_cmd as astradb_base_src_cmd
|
|
12
|
-
from .azure_ai_search import get_base_dest_cmd as azure_ai_search_base_dest_cmd
|
|
13
|
-
from .biomed import get_base_src_cmd as biomed_base_src_cmd
|
|
14
|
-
from .chroma import get_base_dest_cmd as chroma_base_dest_cmd
|
|
15
|
-
from .clarifai import get_base_dest_cmd as clarifai_base_dest_cmd
|
|
16
|
-
from .confluence import get_base_src_cmd as confluence_base_src_cmd
|
|
17
|
-
from .databricks_volumes import get_base_dest_cmd as databricks_volumes_dest_cmd
|
|
18
|
-
from .delta_table import get_base_dest_cmd as delta_table_dest_cmd
|
|
19
|
-
from .delta_table import get_base_src_cmd as delta_table_base_src_cmd
|
|
20
|
-
from .discord import get_base_src_cmd as discord_base_src_cmd
|
|
21
|
-
from .elasticsearch import get_base_dest_cmd as elasticsearch_base_dest_cmd
|
|
22
|
-
from .elasticsearch import get_base_src_cmd as elasticsearch_base_src_cmd
|
|
23
|
-
from .fsspec.azure import get_base_dest_cmd as azure_base_dest_cmd
|
|
24
|
-
from .fsspec.azure import get_base_src_cmd as azure_base_src_cmd
|
|
25
|
-
from .fsspec.box import get_base_dest_cmd as box_base_dest_cmd
|
|
26
|
-
from .fsspec.box import get_base_src_cmd as box_base_src_cmd
|
|
27
|
-
from .fsspec.dropbox import get_base_dest_cmd as dropbox_base_dest_cmd
|
|
28
|
-
from .fsspec.dropbox import get_base_src_cmd as dropbox_base_src_cmd
|
|
29
|
-
from .fsspec.fsspec import get_base_dest_cmd as fsspec_base_dest_cmd
|
|
30
|
-
from .fsspec.fsspec import get_base_src_cmd as fsspec_base_src_cmd
|
|
31
|
-
from .fsspec.gcs import get_base_dest_cmd as gcs_base_dest_cmd
|
|
32
|
-
from .fsspec.gcs import get_base_src_cmd as gcs_base_src_cmd
|
|
33
|
-
from .fsspec.s3 import get_base_dest_cmd as s3_base_dest_cmd
|
|
34
|
-
from .fsspec.s3 import get_base_src_cmd as s3_base_src_cmd
|
|
35
|
-
from .github import get_base_src_cmd as github_base_src_cmd
|
|
36
|
-
from .gitlab import get_base_src_cmd as gitlab_base_src_cmd
|
|
37
|
-
from .google_drive import get_base_src_cmd as google_drive_base_src_cmd
|
|
38
|
-
from .hubspot import get_base_src_cmd as hubspot_base_src_cmd
|
|
39
|
-
from .jira import get_base_src_cmd as jira_base_src_cmd
|
|
40
|
-
from .kafka import get_base_dest_cmd as kafka_base_dest_cmd
|
|
41
|
-
from .kafka import get_base_src_cmd as kafka_base_src_cmd
|
|
42
|
-
from .local import get_base_src_cmd as local_base_src_cmd
|
|
43
|
-
from .mongodb import get_base_dest_cmd as mongo_base_dest_cmd
|
|
44
|
-
from .mongodb import get_base_src_cmd as mongodb_base_src_cmd
|
|
45
|
-
from .notion import get_base_src_cmd as notion_base_src_cmd
|
|
46
|
-
from .onedrive import get_base_src_cmd as onedrive_base_src_cmd
|
|
47
|
-
from .opensearch import get_base_dest_cmd as opensearch_base_dest_cmd
|
|
48
|
-
from .opensearch import get_base_src_cmd as opensearch_base_src_cmd
|
|
49
|
-
from .outlook import get_base_src_cmd as outlook_base_src_cmd
|
|
50
|
-
from .pinecone import get_base_dest_cmd as pinecone_base_dest_cmd
|
|
51
|
-
from .qdrant import get_base_dest_cmd as qdrant_base_dest_cmd
|
|
52
|
-
from .reddit import get_base_src_cmd as reddit_base_src_cmd
|
|
53
|
-
from .salesforce import get_base_src_cmd as salesforce_base_src_cmd
|
|
54
|
-
from .sharepoint import get_base_src_cmd as sharepoint_base_src_cmd
|
|
55
|
-
from .slack import get_base_src_cmd as slack_base_src_cmd
|
|
56
|
-
from .sql import get_base_dest_cmd as sql_base_dest_cmd
|
|
57
|
-
from .vectara import get_base_dest_cmd as vectara_base_dest_cmd
|
|
58
|
-
from .weaviate import get_base_dest_cmd as weaviate_dest_cmd
|
|
59
|
-
from .wikipedia import get_base_src_cmd as wikipedia_base_src_cmd
|
|
60
|
-
|
|
61
|
-
if t.TYPE_CHECKING:
|
|
62
|
-
from unstructured_ingest.cli.base.dest import BaseDestCmd
|
|
63
|
-
|
|
64
|
-
base_src_cmd_fns: t.List[t.Callable[[], BaseSrcCmd]] = [
|
|
65
|
-
airtable_base_src_cmd,
|
|
66
|
-
astradb_base_src_cmd,
|
|
67
|
-
azure_base_src_cmd,
|
|
68
|
-
biomed_base_src_cmd,
|
|
69
|
-
box_base_src_cmd,
|
|
70
|
-
confluence_base_src_cmd,
|
|
71
|
-
delta_table_base_src_cmd,
|
|
72
|
-
discord_base_src_cmd,
|
|
73
|
-
dropbox_base_src_cmd,
|
|
74
|
-
elasticsearch_base_src_cmd,
|
|
75
|
-
fsspec_base_src_cmd,
|
|
76
|
-
gcs_base_src_cmd,
|
|
77
|
-
github_base_src_cmd,
|
|
78
|
-
gitlab_base_src_cmd,
|
|
79
|
-
google_drive_base_src_cmd,
|
|
80
|
-
hubspot_base_src_cmd,
|
|
81
|
-
jira_base_src_cmd,
|
|
82
|
-
kafka_base_src_cmd,
|
|
83
|
-
local_base_src_cmd,
|
|
84
|
-
mongodb_base_src_cmd,
|
|
85
|
-
notion_base_src_cmd,
|
|
86
|
-
onedrive_base_src_cmd,
|
|
87
|
-
opensearch_base_src_cmd,
|
|
88
|
-
outlook_base_src_cmd,
|
|
89
|
-
reddit_base_src_cmd,
|
|
90
|
-
salesforce_base_src_cmd,
|
|
91
|
-
sftp_base_src_cmd,
|
|
92
|
-
sharepoint_base_src_cmd,
|
|
93
|
-
slack_base_src_cmd,
|
|
94
|
-
s3_base_src_cmd,
|
|
95
|
-
wikipedia_base_src_cmd,
|
|
96
|
-
]
|
|
97
|
-
|
|
98
|
-
# Make sure there are not overlapping names
|
|
99
|
-
src_cmd_names = [b().cmd_name for b in base_src_cmd_fns]
|
|
100
|
-
src_duplicates = [item for item, count in collections.Counter(src_cmd_names).items() if count > 1]
|
|
101
|
-
if src_duplicates:
|
|
102
|
-
raise ValueError(
|
|
103
|
-
"multiple base src commands defined with the same names: {}".format(
|
|
104
|
-
", ".join(src_duplicates),
|
|
105
|
-
),
|
|
106
|
-
)
|
|
107
|
-
|
|
108
|
-
base_dest_cmd_fns: t.List[t.Callable[[], "BaseDestCmd"]] = [
|
|
109
|
-
astradb_base_dest_cmd,
|
|
110
|
-
azure_base_dest_cmd,
|
|
111
|
-
box_base_dest_cmd,
|
|
112
|
-
chroma_base_dest_cmd,
|
|
113
|
-
clarifai_base_dest_cmd,
|
|
114
|
-
databricks_volumes_dest_cmd,
|
|
115
|
-
dropbox_base_dest_cmd,
|
|
116
|
-
elasticsearch_base_dest_cmd,
|
|
117
|
-
fsspec_base_dest_cmd,
|
|
118
|
-
gcs_base_dest_cmd,
|
|
119
|
-
kafka_base_dest_cmd,
|
|
120
|
-
s3_base_dest_cmd,
|
|
121
|
-
azure_ai_search_base_dest_cmd,
|
|
122
|
-
delta_table_dest_cmd,
|
|
123
|
-
sql_base_dest_cmd,
|
|
124
|
-
weaviate_dest_cmd,
|
|
125
|
-
mongo_base_dest_cmd,
|
|
126
|
-
pinecone_base_dest_cmd,
|
|
127
|
-
qdrant_base_dest_cmd,
|
|
128
|
-
opensearch_base_dest_cmd,
|
|
129
|
-
vectara_base_dest_cmd,
|
|
130
|
-
]
|
|
131
|
-
|
|
132
|
-
# Make sure there are not overlapping names
|
|
133
|
-
dest_cmd_names = [b().cmd_name for b in base_dest_cmd_fns]
|
|
134
|
-
dest_duplicates = [item for item, count in collections.Counter(dest_cmd_names).items() if count > 1]
|
|
135
|
-
if dest_duplicates:
|
|
136
|
-
raise ValueError(
|
|
137
|
-
"multiple base dest commands defined with the same names: {}".format(
|
|
138
|
-
", ".join(dest_duplicates),
|
|
139
|
-
),
|
|
140
|
-
)
|
|
141
|
-
|
|
142
|
-
__all__ = [
|
|
143
|
-
"base_src_cmd_fns",
|
|
144
|
-
"base_dest_cmd_fns",
|
|
145
|
-
]
|