unstructured-ingest 1.0.1__tar.gz → 1.0.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (238)
  1. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/PKG-INFO +2 -2
  2. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/pyproject.toml +0 -1
  3. unstructured_ingest-1.0.2/unstructured_ingest/__version__.py +1 -0
  4. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/astradb.py +47 -33
  5. unstructured_ingest-1.0.1/unstructured_ingest/__version__.py +0 -1
  6. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/.gitignore +0 -0
  7. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/LICENSE.md +0 -0
  8. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/README.md +0 -0
  9. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/__init__.py +0 -0
  10. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/README.md +0 -0
  11. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/__init__.py +0 -0
  12. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/base/__init__.py +0 -0
  13. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/base/cmd.py +0 -0
  14. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/base/dest.py +0 -0
  15. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/base/importer.py +0 -0
  16. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/base/src.py +0 -0
  17. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/cli.py +0 -0
  18. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/cmds.py +0 -0
  19. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/utils/__init__.py +0 -0
  20. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/utils/click.py +0 -0
  21. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/cli/utils/model_conversion.py +0 -0
  22. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/data_types/__init__.py +0 -0
  23. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/data_types/file_data.py +0 -0
  24. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/__init__.py +0 -0
  25. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/azure_openai.py +0 -0
  26. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/bedrock.py +0 -0
  27. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/huggingface.py +0 -0
  28. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/interfaces.py +0 -0
  29. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  30. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/octoai.py +0 -0
  31. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/openai.py +0 -0
  32. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/togetherai.py +0 -0
  33. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/vertexai.py +0 -0
  34. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/embed/voyageai.py +0 -0
  35. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/error.py +0 -0
  36. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/errors_v2.py +0 -0
  37. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/__init__.py +0 -0
  38. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/connector.py +0 -0
  39. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/downloader.py +0 -0
  40. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/indexer.py +0 -0
  41. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/process.py +0 -0
  42. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/processor.py +0 -0
  43. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/upload_stager.py +0 -0
  44. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/interfaces/uploader.py +0 -0
  45. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/logger.py +0 -0
  46. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/main.py +0 -0
  47. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/otel.py +0 -0
  48. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/__init__.py +0 -0
  49. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/interfaces.py +0 -0
  50. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/otel.py +0 -0
  51. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/pipeline.py +0 -0
  52. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/__init__.py +0 -0
  53. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/chunk.py +0 -0
  54. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/download.py +0 -0
  55. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/embed.py +0 -0
  56. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/filter.py +0 -0
  57. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/index.py +0 -0
  58. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/partition.py +0 -0
  59. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/stage.py +0 -0
  60. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/uncompress.py +0 -0
  61. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/pipeline/steps/upload.py +0 -0
  62. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/__init__.py +0 -0
  63. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/chunker.py +0 -0
  64. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connector_registry.py +0 -0
  65. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/__init__.py +0 -0
  66. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/airtable.py +0 -0
  67. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/assets/__init__.py +0 -0
  68. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql +0 -0
  69. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json +0 -0
  70. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/azure_ai_search.py +0 -0
  71. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/chroma.py +0 -0
  72. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/confluence.py +0 -0
  73. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/couchbase.py +0 -0
  74. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/__init__.py +0 -0
  75. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/volumes.py +0 -0
  76. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/volumes_aws.py +0 -0
  77. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/volumes_azure.py +0 -0
  78. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/volumes_gcp.py +0 -0
  79. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/volumes_native.py +0 -0
  80. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/databricks/volumes_table.py +0 -0
  81. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/delta_table.py +0 -0
  82. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/discord.py +0 -0
  83. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/duckdb/__init__.py +0 -0
  84. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/duckdb/base.py +0 -0
  85. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/duckdb/duckdb.py +0 -0
  86. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/duckdb/motherduck.py +0 -0
  87. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/elasticsearch/__init__.py +0 -0
  88. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py +0 -0
  89. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/elasticsearch/opensearch.py +0 -0
  90. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/__init__.py +0 -0
  91. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/azure.py +0 -0
  92. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/box.py +0 -0
  93. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/dropbox.py +0 -0
  94. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/fsspec.py +0 -0
  95. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/gcs.py +0 -0
  96. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/s3.py +0 -0
  97. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/sftp.py +0 -0
  98. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/fsspec/utils.py +0 -0
  99. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/github.py +0 -0
  100. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/gitlab.py +0 -0
  101. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/google_drive.py +0 -0
  102. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py +0 -0
  103. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +0 -0
  104. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/jira.py +0 -0
  105. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/kafka/__init__.py +0 -0
  106. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/kafka/cloud.py +0 -0
  107. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/kafka/kafka.py +0 -0
  108. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/kafka/local.py +0 -0
  109. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/kdbai.py +0 -0
  110. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/__init__.py +0 -0
  111. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/aws.py +0 -0
  112. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/azure.py +0 -0
  113. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/cloud.py +0 -0
  114. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/gcp.py +0 -0
  115. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/lancedb.py +0 -0
  116. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/lancedb/local.py +0 -0
  117. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/local.py +0 -0
  118. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/milvus.py +0 -0
  119. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/mongodb.py +0 -0
  120. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/neo4j.py +0 -0
  121. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/__init__.py +0 -0
  122. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/client.py +0 -0
  123. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/connector.py +0 -0
  124. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/helpers.py +0 -0
  125. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/__init__.py +0 -0
  126. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_common.py +0 -0
  127. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py +0 -0
  128. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +0 -0
  129. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/interfaces.py +0 -0
  130. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/__init__.py +0 -0
  131. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/block.py +0 -0
  132. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/__init__.py +0 -0
  133. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py +0 -0
  134. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py +0 -0
  135. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -0
  136. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/callout.py +0 -0
  137. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py +0 -0
  138. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py +0 -0
  139. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/code.py +0 -0
  140. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py +0 -0
  141. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/divider.py +0 -0
  142. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/embed.py +0 -0
  143. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/equation.py +0 -0
  144. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/file.py +0 -0
  145. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/heading.py +0 -0
  146. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/image.py +0 -0
  147. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py +0 -0
  148. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py +0 -0
  149. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py +0 -0
  150. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py +0 -0
  151. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py +0 -0
  152. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/quote.py +0 -0
  153. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +0 -0
  154. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/table.py +0 -0
  155. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py +0 -0
  156. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/template.py +0 -0
  157. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/todo.py +0 -0
  158. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py +0 -0
  159. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py +0 -0
  160. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/blocks/video.py +0 -0
  161. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database.py +0 -0
  162. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py +0 -0
  163. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py +0 -0
  164. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py +0 -0
  165. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py +0 -0
  166. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/date.py +0 -0
  167. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/email.py +0 -0
  168. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/files.py +0 -0
  169. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py +0 -0
  170. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -0
  171. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py +0 -0
  172. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py +0 -0
  173. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/number.py +0 -0
  174. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/people.py +0 -0
  175. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py +0 -0
  176. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py +0 -0
  177. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py +0 -0
  178. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py +0 -0
  179. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/select.py +0 -0
  180. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/status.py +0 -0
  181. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/title.py +0 -0
  182. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py +0 -0
  183. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/url.py +0 -0
  184. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py +0 -0
  185. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/date.py +0 -0
  186. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/file.py +0 -0
  187. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/page.py +0 -0
  188. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/parent.py +0 -0
  189. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/rich_text.py +0 -0
  190. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/notion/types/user.py +0 -0
  191. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/onedrive.py +0 -0
  192. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/outlook.py +0 -0
  193. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/pinecone.py +0 -0
  194. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/qdrant/__init__.py +0 -0
  195. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/qdrant/cloud.py +0 -0
  196. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/qdrant/local.py +0 -0
  197. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/qdrant/qdrant.py +0 -0
  198. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/qdrant/server.py +0 -0
  199. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/redisdb.py +0 -0
  200. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/salesforce.py +0 -0
  201. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sharepoint.py +0 -0
  202. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/slack.py +0 -0
  203. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/__init__.py +0 -0
  204. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py +0 -0
  205. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/postgres.py +0 -0
  206. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/singlestore.py +0 -0
  207. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/snowflake.py +0 -0
  208. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/sql.py +0 -0
  209. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/sqlite.py +0 -0
  210. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/sql/vastdb.py +0 -0
  211. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/utils.py +0 -0
  212. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/vectara.py +0 -0
  213. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/weaviate/__init__.py +0 -0
  214. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/weaviate/cloud.py +0 -0
  215. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/weaviate/embedded.py +0 -0
  216. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/weaviate/local.py +0 -0
  217. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/weaviate/weaviate.py +0 -0
  218. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/zendesk/__init__.py +0 -0
  219. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/zendesk/client.py +0 -0
  220. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/connectors/zendesk/zendesk.py +0 -0
  221. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/embedder.py +0 -0
  222. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/filter.py +0 -0
  223. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/partitioner.py +0 -0
  224. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/uncompress.py +0 -0
  225. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/utils/__init__.py +0 -0
  226. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/processes/utils/blob_storage.py +0 -0
  227. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/unstructured_api.py +0 -0
  228. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/__init__.py +0 -0
  229. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/chunking.py +0 -0
  230. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/compression.py +0 -0
  231. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/constants.py +0 -0
  232. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/data_prep.py +0 -0
  233. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/dep_check.py +0 -0
  234. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/html.py +0 -0
  235. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/ndjson.py +0 -0
  236. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/pydantic_models.py +0 -0
  237. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  238. {unstructured_ingest-1.0.1 → unstructured_ingest-1.0.2}/unstructured_ingest/utils/table.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: unstructured_ingest
3
- Version: 1.0.1
3
+ Version: 1.0.2
4
4
  Summary: Local ETL data pipeline to get data RAG ready
5
5
  Author-email: Unstructured Technologies <devops@unstructuredai.io>
6
6
  License-Expression: Apache-2.0
@@ -28,7 +28,7 @@ Provides-Extra: airtable
28
28
  Requires-Dist: pandas; extra == 'airtable'
29
29
  Requires-Dist: pyairtable; extra == 'airtable'
30
30
  Provides-Extra: astradb
31
- Requires-Dist: astrapy; extra == 'astradb'
31
+ Requires-Dist: astrapy>2.0.0; extra == 'astradb'
32
32
  Provides-Extra: azure
33
33
  Requires-Dist: adlfs; extra == 'azure'
34
34
  Requires-Dist: fsspec; extra == 'azure'
@@ -172,7 +172,6 @@ ci = [
172
172
  "lancedb<=0.15.0",
173
173
  # TODO: versions higher than this are missing the macos wheel
174
174
  "pykx==2.5.3",
175
- "astrapy<2.0.0"
176
175
  ]
177
176
 
178
177
  [project.scripts]
@@ -0,0 +1 @@
1
+ __version__ = "1.0.2" # pragma: no cover
@@ -1,5 +1,7 @@
1
+ import asyncio
1
2
  import csv
2
3
  import hashlib
4
+ import os
3
5
  import re
4
6
  from dataclasses import dataclass, field
5
7
  from pathlib import Path
@@ -8,7 +10,6 @@ from typing import TYPE_CHECKING, Any, Generator, Optional
8
10
 
9
11
  from pydantic import BaseModel, Field, Secret
10
12
 
11
- from unstructured_ingest import __name__ as integration_name
12
13
  from unstructured_ingest.__version__ import __version__ as integration_version
13
14
  from unstructured_ingest.data_types.file_data import (
14
15
  BatchFileData,
@@ -83,10 +84,8 @@ class AstraDBConnectionConfig(ConnectionConfig):
83
84
 
84
85
  # Create a client object to interact with the Astra DB
85
86
  # caller_name/version for Astra DB tracking
86
- return AstraDBClient(
87
- caller_name=integration_name,
88
- caller_version=integration_version,
89
- )
87
+ user_agent = os.getenv("UNSTRUCTURED_USER_AGENT", "unstructuredio_oss")
88
+ return AstraDBClient(callers=[(user_agent, integration_version)])
90
89
 
91
90
 
92
91
  def get_astra_db(
@@ -141,7 +140,7 @@ async def get_async_astra_collection(
141
140
  )
142
141
 
143
142
  # Get async collection from AsyncDatabase
144
- async_astra_db_collection = await async_astra_db.get_collection(name=collection_name)
143
+ async_astra_db_collection = async_astra_db.get_collection(name=collection_name)
145
144
  return async_astra_db_collection
146
145
 
147
146
 
@@ -360,13 +359,22 @@ class AstraDBUploader(Uploader):
360
359
  upload_config: AstraDBUploaderConfig
361
360
  connector_type: str = CONNECTOR_TYPE
362
361
 
362
+ def is_async(self) -> bool:
363
+ return True
364
+
363
365
  def init(self, **kwargs: Any) -> None:
364
366
  self.create_destination(**kwargs)
365
367
 
368
+ @requires_dependencies(["astrapy"], extras="astradb")
366
369
  def precheck(self) -> None:
367
370
  try:
368
371
  if self.upload_config.collection_name:
369
- self.get_collection(collection_name=self.upload_config.collection_name).options()
372
+ collection = get_astra_collection(
373
+ connection_config=self.connection_config,
374
+ collection_name=self.upload_config.collection_name,
375
+ keyspace=self.upload_config.keyspace,
376
+ )
377
+ collection.options()
370
378
  else:
371
379
  # check for db connection only if collection name is not provided
372
380
  get_astra_db(
@@ -377,17 +385,7 @@ class AstraDBUploader(Uploader):
377
385
  logger.error(f"Failed to validate connection {e}", exc_info=True)
378
386
  raise DestinationConnectionError(f"failed to validate connection: {e}")
379
387
 
380
- @requires_dependencies(["astrapy"], extras="astradb")
381
- def get_collection(self, collection_name: Optional[str] = None) -> "AstraDBCollection":
382
- return get_astra_collection(
383
- connection_config=self.connection_config,
384
- collection_name=collection_name or self.upload_config.collection_name,
385
- keyspace=self.upload_config.keyspace,
386
- )
387
-
388
388
  def _collection_exists(self, collection_name: str):
389
- from astrapy.exceptions import CollectionNotFoundException
390
-
391
389
  collection = get_astra_collection(
392
390
  connection_config=self.connection_config,
393
391
  collection_name=collection_name,
@@ -397,8 +395,10 @@ class AstraDBUploader(Uploader):
397
395
  try:
398
396
  collection.options()
399
397
  return True
400
- except CollectionNotFoundException:
401
- return False
398
+ except RuntimeError as e:
399
+ if "not found" in str(e):
400
+ return False
401
+ raise DestinationConnectionError(f"failed to check if astra collection exists : {e}")
402
402
  except Exception as e:
403
403
  logger.error(f"failed to check if astra collection exists : {e}")
404
404
  raise DestinationConnectionError(f"failed to check if astra collection exists : {e}")
@@ -422,6 +422,8 @@ class AstraDBUploader(Uploader):
422
422
  self.upload_config.collection_name = collection_name
423
423
 
424
424
  if not self._collection_exists(collection_name):
425
+ from astrapy.info import CollectionDefinition
426
+
425
427
  astra_db = get_astra_db(
426
428
  connection_config=self.connection_config, keyspace=self.upload_config.keyspace
427
429
  )
@@ -429,44 +431,56 @@ class AstraDBUploader(Uploader):
429
431
  f"creating default astra collection '{collection_name}' with dimension "
430
432
  f"{vector_length} and metric {similarity_metric}"
431
433
  )
432
- astra_db.create_collection(
433
- collection_name,
434
- dimension=vector_length,
435
- metric=similarity_metric,
434
+ definition = (
435
+ CollectionDefinition.builder()
436
+ .set_vector_dimension(dimension=vector_length)
437
+ .set_vector_metric(similarity_metric)
438
+ .build()
436
439
  )
440
+ (astra_db.create_collection(collection_name, definition=definition),)
437
441
  return True
438
442
  logger.debug(f"collection with name '{collection_name}' already exists, skipping creation")
439
443
  return False
440
444
 
441
- def delete_by_record_id(self, collection: "AstraDBCollection", file_data: FileData):
445
+ async def delete_by_record_id(self, collection: "AstraDBAsyncCollection", file_data: FileData):
442
446
  logger.debug(
443
447
  f"deleting records from collection {collection.name} "
444
448
  f"with {self.upload_config.record_id_key} "
445
449
  f"set to {file_data.identifier}"
446
450
  )
447
451
  delete_filter = {self.upload_config.record_id_key: {"$eq": file_data.identifier}}
448
- delete_resp = collection.delete_many(filter=delete_filter)
452
+ delete_resp = await collection.delete_many(filter=delete_filter)
449
453
  logger.debug(
450
454
  f"deleted {delete_resp.deleted_count} records from collection {collection.name}"
451
455
  )
452
456
 
453
- def run_data(self, data: list[dict], file_data: FileData, **kwargs: Any) -> None:
457
+ async def run_data(self, data: list[dict], file_data: FileData, **kwargs: Any) -> None:
454
458
  logger.info(
455
459
  f"writing {len(data)} objects to destination "
456
460
  f"collection {self.upload_config.collection_name}"
457
461
  )
458
462
 
459
463
  astra_db_batch_size = self.upload_config.batch_size
460
- collection = self.get_collection()
461
-
462
- self.delete_by_record_id(collection=collection, file_data=file_data)
464
+ async_astra_collection = await get_async_astra_collection(
465
+ connection_config=self.connection_config,
466
+ collection_name=self.upload_config.collection_name,
467
+ keyspace=self.upload_config.keyspace,
468
+ )
463
469
 
464
- for chunk in batch_generator(data, astra_db_batch_size):
465
- collection.insert_many(chunk)
470
+ await self.delete_by_record_id(collection=async_astra_collection, file_data=file_data)
471
+ await asyncio.gather(
472
+ *[
473
+ async_astra_collection.insert_many(chunk)
474
+ for chunk in batch_generator(data, astra_db_batch_size)
475
+ ]
476
+ )
466
477
 
467
- def run(self, path: Path, file_data: FileData, **kwargs: Any) -> None:
478
+ async def run_async(self, path: Path, file_data: FileData, **kwargs: Any) -> None:
468
479
  data = get_json_data(path=path)
469
- self.run_data(data=data, file_data=file_data, **kwargs)
480
+ await self.run_data(data=data, file_data=file_data)
481
+
482
+ def run(self, **kwargs: Any) -> Any:
483
+ raise NotImplementedError("Use astradb run_async instead")
470
484
 
471
485
 
472
486
  astra_db_source_entry = SourceRegistryEntry(
@@ -1 +0,0 @@
1
- __version__ = "1.0.1" # pragma: no cover