unstructured-ingest 0.3.4__tar.gz → 0.3.6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. More details are available via the link on the original page.

Files changed (476):
  1. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/PKG-INFO +19 -19
  2. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_lancedb.py +46 -9
  3. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_pinecone.py +60 -9
  4. unstructured_ingest-0.3.6/unstructured_ingest/__version__.py +1 -0
  5. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/azure_ai_search.py +1 -2
  6. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/elasticsearch/elasticsearch.py +1 -5
  7. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/lancedb.py +12 -2
  8. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/pinecone.py +31 -21
  9. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/weaviate/__init__.py +0 -3
  10. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/weaviate/weaviate.py +0 -10
  11. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest.egg-info/PKG-INFO +19 -19
  12. unstructured_ingest-0.3.4/unstructured_ingest/__version__.py +0 -1
  13. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/LICENSE.md +0 -0
  14. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/README.md +0 -0
  15. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/pyproject.toml +0 -0
  16. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/setup.cfg +0 -0
  17. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/setup.py +0 -0
  18. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/__init__.py +0 -0
  19. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/__init__.py +0 -0
  20. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/chunkers/__init__.py +0 -0
  21. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/chunkers/test_chunkers.py +0 -0
  22. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/__init__.py +0 -0
  23. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/conftest.py +0 -0
  24. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/databricks_tests/__init__.py +0 -0
  25. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/databricks_tests/test_volumes_native.py +0 -0
  26. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/elasticsearch/__init__.py +0 -0
  27. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/elasticsearch/conftest.py +0 -0
  28. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/elasticsearch/test_elasticsearch.py +0 -0
  29. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/elasticsearch/test_opensearch.py +0 -0
  30. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/sql/__init__.py +0 -0
  31. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/sql/test_postgres.py +0 -0
  32. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/sql/test_singlestore.py +0 -0
  33. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/sql/test_snowflake.py +0 -0
  34. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/sql/test_sqlite.py +0 -0
  35. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_astradb.py +0 -0
  36. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_azure_ai_search.py +0 -0
  37. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_confluence.py +0 -0
  38. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_delta_table.py +0 -0
  39. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_kafka.py +0 -0
  40. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_milvus.py +0 -0
  41. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_mongodb.py +0 -0
  42. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_onedrive.py +0 -0
  43. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_qdrant.py +0 -0
  44. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/test_s3.py +0 -0
  45. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/utils/__init__.py +0 -0
  46. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/utils/constants.py +0 -0
  47. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/utils/docker.py +0 -0
  48. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/utils/docker_compose.py +0 -0
  49. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/utils/validation.py +0 -0
  50. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/weaviate/__init__.py +0 -0
  51. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/weaviate/conftest.py +0 -0
  52. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/weaviate/test_cloud.py +0 -0
  53. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/connectors/weaviate/test_local.py +0 -0
  54. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/__init__.py +0 -0
  55. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/conftest.py +0 -0
  56. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_azure_openai.py +0 -0
  57. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_bedrock.py +0 -0
  58. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_huggingface.py +0 -0
  59. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_mixedbread.py +0 -0
  60. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_octoai.py +0 -0
  61. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_openai.py +0 -0
  62. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_togetherai.py +0 -0
  63. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_vertexai.py +0 -0
  64. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/test_voyageai.py +0 -0
  65. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/embedders/utils.py +0 -0
  66. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/partitioners/__init__.py +0 -0
  67. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/partitioners/test_partitioner.py +0 -0
  68. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/integration/utils.py +0 -0
  69. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/__init__.py +0 -0
  70. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/embed/__init__.py +0 -0
  71. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/embed/test_mixedbreadai.py +0 -0
  72. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/embed/test_octoai.py +0 -0
  73. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/embed/test_openai.py +0 -0
  74. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/embed/test_vertexai.py +0 -0
  75. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/embed/test_voyageai.py +0 -0
  76. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/test_chunking_utils.py +0 -0
  77. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/test_error.py +0 -0
  78. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/test_interfaces.py +0 -0
  79. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/test_logger.py +0 -0
  80. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/test_utils.py +0 -0
  81. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/__init__.py +0 -0
  82. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/chunkers/__init__.py +0 -0
  83. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/chunkers/test_chunkers.py +0 -0
  84. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/connectors/__init__.py +0 -0
  85. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/__init__.py +0 -0
  86. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_bedrock.py +0 -0
  87. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_huggingface.py +0 -0
  88. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_mixedbread.py +0 -0
  89. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_octoai.py +0 -0
  90. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_openai.py +0 -0
  91. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_togetherai.py +0 -0
  92. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_vertexai.py +0 -0
  93. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/embedders/test_voyageai.py +0 -0
  94. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/partitioners/__init__.py +0 -0
  95. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/partitioners/test_partitioner.py +0 -0
  96. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/test_interfaces.py +0 -0
  97. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/test_utils.py +0 -0
  98. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/utils/__init__.py +0 -0
  99. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/test/unit/v2/utils/data_generator.py +0 -0
  100. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/__init__.py +0 -0
  101. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/__init__.py +0 -0
  102. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/base/__init__.py +0 -0
  103. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/base/cmd.py +0 -0
  104. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/base/dest.py +0 -0
  105. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/base/src.py +0 -0
  106. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cli.py +0 -0
  107. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmd_factory.py +0 -0
  108. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/__init__.py +0 -0
  109. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/airtable.py +0 -0
  110. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/astradb.py +0 -0
  111. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/azure_ai_search.py +0 -0
  112. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/biomed.py +0 -0
  113. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/chroma.py +0 -0
  114. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/clarifai.py +0 -0
  115. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/confluence.py +0 -0
  116. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -0
  117. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/delta_table.py +0 -0
  118. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/discord.py +0 -0
  119. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/elasticsearch.py +0 -0
  120. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/__init__.py +0 -0
  121. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -0
  122. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/box.py +0 -0
  123. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -0
  124. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -0
  125. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -0
  126. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -0
  127. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -0
  128. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/github.py +0 -0
  129. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/gitlab.py +0 -0
  130. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/google_drive.py +0 -0
  131. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/hubspot.py +0 -0
  132. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/jira.py +0 -0
  133. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/kafka.py +0 -0
  134. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/local.py +0 -0
  135. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/mongodb.py +0 -0
  136. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/notion.py +0 -0
  137. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/onedrive.py +0 -0
  138. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/opensearch.py +0 -0
  139. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/outlook.py +0 -0
  140. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/pinecone.py +0 -0
  141. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/qdrant.py +0 -0
  142. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/reddit.py +0 -0
  143. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/salesforce.py +0 -0
  144. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/sharepoint.py +0 -0
  145. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/slack.py +0 -0
  146. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/sql.py +0 -0
  147. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/vectara.py +0 -0
  148. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/weaviate.py +0 -0
  149. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/cmds/wikipedia.py +0 -0
  150. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/common.py +0 -0
  151. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/interfaces.py +0 -0
  152. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/cli/utils.py +0 -0
  153. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/__init__.py +0 -0
  154. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/airtable.py +0 -0
  155. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/astradb.py +0 -0
  156. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/azure_ai_search.py +0 -0
  157. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/biomed.py +0 -0
  158. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/chroma.py +0 -0
  159. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/clarifai.py +0 -0
  160. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/confluence.py +0 -0
  161. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/databricks_volumes.py +0 -0
  162. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/delta_table.py +0 -0
  163. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/discord.py +0 -0
  164. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/elasticsearch.py +0 -0
  165. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/__init__.py +0 -0
  166. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/azure.py +0 -0
  167. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/box.py +0 -0
  168. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/dropbox.py +0 -0
  169. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/fsspec.py +0 -0
  170. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/gcs.py +0 -0
  171. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/s3.py +0 -0
  172. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/fsspec/sftp.py +0 -0
  173. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/git.py +0 -0
  174. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/github.py +0 -0
  175. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/gitlab.py +0 -0
  176. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/google_drive.py +0 -0
  177. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/hubspot.py +0 -0
  178. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/jira.py +0 -0
  179. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/kafka.py +0 -0
  180. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/local.py +0 -0
  181. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/mongodb.py +0 -0
  182. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/__init__.py +0 -0
  183. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/client.py +0 -0
  184. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/connector.py +0 -0
  185. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/helpers.py +0 -0
  186. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/interfaces.py +0 -0
  187. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/__init__.py +0 -0
  188. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/block.py +0 -0
  189. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/__init__.py +0 -0
  190. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -0
  191. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -0
  192. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -0
  193. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -0
  194. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -0
  195. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -0
  196. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/code.py +0 -0
  197. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -0
  198. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -0
  199. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -0
  200. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -0
  201. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/file.py +0 -0
  202. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -0
  203. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/image.py +0 -0
  204. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -0
  205. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -0
  206. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -0
  207. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -0
  208. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -0
  209. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -0
  210. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -0
  211. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/table.py +0 -0
  212. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -0
  213. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/template.py +0 -0
  214. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -0
  215. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -0
  216. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -0
  217. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/blocks/video.py +0 -0
  218. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database.py +0 -0
  219. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -0
  220. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -0
  221. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -0
  222. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -0
  223. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -0
  224. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -0
  225. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -0
  226. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -0
  227. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -0
  228. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -0
  229. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -0
  230. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -0
  231. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -0
  232. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -0
  233. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -0
  234. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -0
  235. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -0
  236. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -0
  237. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -0
  238. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -0
  239. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -0
  240. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -0
  241. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -0
  242. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/date.py +0 -0
  243. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/file.py +0 -0
  244. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/page.py +0 -0
  245. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/parent.py +0 -0
  246. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/rich_text.py +0 -0
  247. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/notion/types/user.py +0 -0
  248. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/onedrive.py +0 -0
  249. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/opensearch.py +0 -0
  250. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/outlook.py +0 -0
  251. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/pinecone.py +0 -0
  252. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/qdrant.py +0 -0
  253. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/reddit.py +0 -0
  254. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/registry.py +0 -0
  255. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/salesforce.py +0 -0
  256. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/sharepoint.py +0 -0
  257. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/slack.py +0 -0
  258. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/sql.py +0 -0
  259. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/vectara.py +0 -0
  260. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/weaviate.py +0 -0
  261. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/connector/wikipedia.py +0 -0
  262. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/__init__.py +0 -0
  263. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/azure_openai.py +0 -0
  264. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/bedrock.py +0 -0
  265. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/huggingface.py +0 -0
  266. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/interfaces.py +0 -0
  267. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  268. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/octoai.py +0 -0
  269. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/openai.py +0 -0
  270. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/togetherai.py +0 -0
  271. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/vertexai.py +0 -0
  272. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/embed/voyageai.py +0 -0
  273. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/enhanced_dataclass/__init__.py +0 -0
  274. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/enhanced_dataclass/core.py +0 -0
  275. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -0
  276. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -0
  277. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/error.py +0 -0
  278. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/ingest_backoff/__init__.py +0 -0
  279. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/ingest_backoff/_common.py +0 -0
  280. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/ingest_backoff/_wrapper.py +0 -0
  281. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/interfaces.py +0 -0
  282. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/logger.py +0 -0
  283. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/main.py +0 -0
  284. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/__init__.py +0 -0
  285. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/copy.py +0 -0
  286. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/doc_factory.py +0 -0
  287. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/interfaces.py +0 -0
  288. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/partition.py +0 -0
  289. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/permissions.py +0 -0
  290. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/pipeline.py +0 -0
  291. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/reformat/__init__.py +0 -0
  292. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/reformat/chunking.py +0 -0
  293. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/reformat/embedding.py +0 -0
  294. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/source.py +0 -0
  295. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/utils.py +0 -0
  296. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/pipeline/write.py +0 -0
  297. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/processor.py +0 -0
  298. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/__init__.py +0 -0
  299. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/airtable.py +0 -0
  300. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/astradb.py +0 -0
  301. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/base_runner.py +0 -0
  302. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/biomed.py +0 -0
  303. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/confluence.py +0 -0
  304. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/delta_table.py +0 -0
  305. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/discord.py +0 -0
  306. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/elasticsearch.py +0 -0
  307. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/__init__.py +0 -0
  308. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/azure.py +0 -0
  309. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/box.py +0 -0
  310. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/dropbox.py +0 -0
  311. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/fsspec.py +0 -0
  312. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/gcs.py +0 -0
  313. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/s3.py +0 -0
  314. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/fsspec/sftp.py +0 -0
  315. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/github.py +0 -0
  316. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/gitlab.py +0 -0
  317. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/google_drive.py +0 -0
  318. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/hubspot.py +0 -0
  319. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/jira.py +0 -0
  320. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/kafka.py +0 -0
  321. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/local.py +0 -0
  322. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/mongodb.py +0 -0
  323. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/notion.py +0 -0
  324. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/onedrive.py +0 -0
  325. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/opensearch.py +0 -0
  326. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/outlook.py +0 -0
  327. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/reddit.py +0 -0
  328. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/salesforce.py +0 -0
  329. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/sharepoint.py +0 -0
  330. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/slack.py +0 -0
  331. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/utils.py +0 -0
  332. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/wikipedia.py +0 -0
  333. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/__init__.py +0 -0
  334. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/astradb.py +0 -0
  335. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/azure_ai_search.py +0 -0
  336. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/base_writer.py +0 -0
  337. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/chroma.py +0 -0
  338. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/clarifai.py +0 -0
  339. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/databricks_volumes.py +0 -0
  340. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/delta_table.py +0 -0
  341. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/elasticsearch.py +0 -0
  342. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/fsspec/__init__.py +0 -0
  343. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/fsspec/azure.py +0 -0
  344. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/fsspec/box.py +0 -0
  345. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -0
  346. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -0
  347. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/fsspec/s3.py +0 -0
  348. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/kafka.py +0 -0
  349. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/mongodb.py +0 -0
  350. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/opensearch.py +0 -0
  351. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/pinecone.py +0 -0
  352. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/qdrant.py +0 -0
  353. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/sql.py +0 -0
  354. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/vectara.py +0 -0
  355. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/runner/writers/weaviate.py +0 -0
  356. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/__init__.py +0 -0
  357. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/chunking.py +0 -0
  358. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/compression.py +0 -0
  359. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/data_prep.py +0 -0
  360. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/dep_check.py +0 -0
  361. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/google_filetype.py +0 -0
  362. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  363. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/utils/table.py +0 -0
  364. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/__init__.py +0 -0
  365. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/__init__.py +0 -0
  366. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/base/__init__.py +0 -0
  367. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/base/cmd.py +0 -0
  368. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/base/dest.py +0 -0
  369. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/base/importer.py +0 -0
  370. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/base/src.py +0 -0
  371. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/cli.py +0 -0
  372. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/cmds.py +0 -0
  373. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/utils/__init__.py +0 -0
  374. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/utils/click.py +0 -0
  375. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/cli/utils/model_conversion.py +0 -0
  376. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/constants.py +0 -0
  377. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/__init__.py +0 -0
  378. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/connector.py +0 -0
  379. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/downloader.py +0 -0
  380. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/file_data.py +0 -0
  381. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/indexer.py +0 -0
  382. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/process.py +0 -0
  383. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/processor.py +0 -0
  384. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/upload_stager.py +0 -0
  385. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/interfaces/uploader.py +0 -0
  386. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/logger.py +0 -0
  387. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/main.py +0 -0
  388. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/otel.py +0 -0
  389. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/__init__.py +0 -0
  390. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/interfaces.py +0 -0
  391. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/otel.py +0 -0
  392. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/pipeline.py +0 -0
  393. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
  394. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -0
  395. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/download.py +0 -0
  396. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/embed.py +0 -0
  397. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/filter.py +0 -0
  398. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/index.py +0 -0
  399. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/partition.py +0 -0
  400. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/stage.py +0 -0
  401. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -0
  402. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/pipeline/steps/upload.py +0 -0
  403. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/__init__.py +0 -0
  404. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/chunker.py +0 -0
  405. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connector_registry.py +0 -0
  406. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/__init__.py +0 -0
  407. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/airtable.py +0 -0
  408. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/astradb.py +0 -0
  409. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/chroma.py +0 -0
  410. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/confluence.py +0 -0
  411. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/couchbase.py +0 -0
  412. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/databricks/__init__.py +0 -0
  413. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/databricks/volumes.py +0 -0
  414. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/databricks/volumes_aws.py +0 -0
  415. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/databricks/volumes_azure.py +0 -0
  416. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/databricks/volumes_gcp.py +0 -0
  417. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/databricks/volumes_native.py +0 -0
  418. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/delta_table.py +0 -0
  419. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/elasticsearch/__init__.py +0 -0
  420. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/elasticsearch/opensearch.py +0 -0
  421. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -0
  422. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +0 -0
  423. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/box.py +0 -0
  424. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +0 -0
  425. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -0
  426. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +0 -0
  427. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +0 -0
  428. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -0
  429. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/fsspec/utils.py +0 -0
  430. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/gitlab.py +0 -0
  431. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -0
  432. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/kafka/__init__.py +0 -0
  433. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/kafka/cloud.py +0 -0
  434. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/kafka/kafka.py +0 -0
  435. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/kafka/local.py +0 -0
  436. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/kdbai.py +0 -0
  437. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/__init__.py +0 -0
  438. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/aws.py +0 -0
  439. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/azure.py +0 -0
  440. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/cloud.py +0 -0
  441. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/gcp.py +0 -0
  442. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/lancedb/local.py +0 -0
  443. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/local.py +0 -0
  444. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/milvus.py +0 -0
  445. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/mongodb.py +0 -0
  446. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -0
  447. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/outlook.py +0 -0
  448. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/qdrant/__init__.py +0 -0
  449. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/qdrant/cloud.py +0 -0
  450. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/qdrant/local.py +0 -0
  451. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/qdrant/qdrant.py +0 -0
  452. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/qdrant/server.py +0 -0
  453. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -0
  454. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -0
  455. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/slack.py +0 -0
  456. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sql/__init__.py +0 -0
  457. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sql/postgres.py +0 -0
  458. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sql/singlestore.py +0 -0
  459. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sql/snowflake.py +0 -0
  460. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sql/sql.py +0 -0
  461. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/sql/sqlite.py +0 -0
  462. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/utils.py +0 -0
  463. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/weaviate/cloud.py +0 -0
  464. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/weaviate/embedded.py +0 -0
  465. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/connectors/weaviate/local.py +0 -0
  466. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/embedder.py +0 -0
  467. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/filter.py +0 -0
  468. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/partitioner.py +0 -0
  469. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/processes/uncompress.py +0 -0
  470. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/unstructured_api.py +0 -0
  471. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest/v2/utils.py +0 -0
  472. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest.egg-info/SOURCES.txt +0 -0
  473. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  474. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest.egg-info/entry_points.txt +0 -0
  475. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest.egg-info/requires.txt +18 -18
  476. {unstructured_ingest-0.3.4 → unstructured_ingest-0.3.6}/unstructured_ingest.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.3.4
3
+ Version: 0.3.6
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,13 +22,13 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.13
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: pydantic>=2.7
26
- Requires-Dist: click
27
- Requires-Dist: dataclasses_json
28
- Requires-Dist: opentelemetry-sdk
29
25
  Requires-Dist: python-dateutil
30
26
  Requires-Dist: pandas
27
+ Requires-Dist: pydantic>=2.7
28
+ Requires-Dist: opentelemetry-sdk
29
+ Requires-Dist: dataclasses_json
31
30
  Requires-Dist: tqdm
31
+ Requires-Dist: click
32
32
  Provides-Extra: remote
33
33
  Requires-Dist: unstructured-client>=0.26.1; extra == "remote"
34
34
  Provides-Extra: csv
@@ -66,28 +66,28 @@ Requires-Dist: pyairtable; extra == "airtable"
66
66
  Provides-Extra: astradb
67
67
  Requires-Dist: astrapy; extra == "astradb"
68
68
  Provides-Extra: azure
69
- Requires-Dist: fsspec; extra == "azure"
70
69
  Requires-Dist: adlfs; extra == "azure"
70
+ Requires-Dist: fsspec; extra == "azure"
71
71
  Provides-Extra: azure-ai-search
72
72
  Requires-Dist: azure-search-documents; extra == "azure-ai-search"
73
73
  Provides-Extra: biomed
74
74
  Requires-Dist: bs4; extra == "biomed"
75
75
  Requires-Dist: requests; extra == "biomed"
76
76
  Provides-Extra: box
77
- Requires-Dist: fsspec; extra == "box"
78
77
  Requires-Dist: boxfs; extra == "box"
78
+ Requires-Dist: fsspec; extra == "box"
79
79
  Provides-Extra: chroma
80
80
  Requires-Dist: chromadb; extra == "chroma"
81
81
  Provides-Extra: clarifai
82
82
  Requires-Dist: clarifai; extra == "clarifai"
83
83
  Provides-Extra: confluence
84
- Requires-Dist: requests; extra == "confluence"
85
84
  Requires-Dist: atlassian-python-api; extra == "confluence"
85
+ Requires-Dist: requests; extra == "confluence"
86
86
  Provides-Extra: couchbase
87
87
  Requires-Dist: couchbase; extra == "couchbase"
88
88
  Provides-Extra: delta-table
89
- Requires-Dist: boto3; extra == "delta-table"
90
89
  Requires-Dist: deltalake; extra == "delta-table"
90
+ Requires-Dist: boto3; extra == "delta-table"
91
91
  Provides-Extra: discord
92
92
  Requires-Dist: discord-py; extra == "discord"
93
93
  Provides-Extra: dropbox
@@ -96,19 +96,19 @@ Requires-Dist: dropboxdrivefs; extra == "dropbox"
96
96
  Provides-Extra: elasticsearch
97
97
  Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
98
98
  Provides-Extra: gcs
99
- Requires-Dist: fsspec; extra == "gcs"
100
99
  Requires-Dist: gcsfs; extra == "gcs"
101
100
  Requires-Dist: bs4; extra == "gcs"
101
+ Requires-Dist: fsspec; extra == "gcs"
102
102
  Provides-Extra: github
103
- Requires-Dist: pygithub>1.58.0; extra == "github"
104
103
  Requires-Dist: requests; extra == "github"
104
+ Requires-Dist: pygithub>1.58.0; extra == "github"
105
105
  Provides-Extra: gitlab
106
106
  Requires-Dist: python-gitlab; extra == "gitlab"
107
107
  Provides-Extra: google-drive
108
108
  Requires-Dist: google-api-python-client; extra == "google-drive"
109
109
  Provides-Extra: hubspot
110
- Requires-Dist: hubspot-api-client; extra == "hubspot"
111
110
  Requires-Dist: urllib3; extra == "hubspot"
111
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
112
112
  Provides-Extra: jira
113
113
  Requires-Dist: atlassian-python-api; extra == "jira"
114
114
  Provides-Extra: kafka
@@ -122,19 +122,19 @@ Requires-Dist: pymilvus; extra == "milvus"
122
122
  Provides-Extra: mongodb
123
123
  Requires-Dist: pymongo; extra == "mongodb"
124
124
  Provides-Extra: notion
125
- Requires-Dist: notion-client; extra == "notion"
125
+ Requires-Dist: backoff; extra == "notion"
126
126
  Requires-Dist: htmlBuilder; extra == "notion"
127
+ Requires-Dist: notion-client; extra == "notion"
127
128
  Requires-Dist: httpx; extra == "notion"
128
- Requires-Dist: backoff; extra == "notion"
129
129
  Provides-Extra: onedrive
130
- Requires-Dist: msal; extra == "onedrive"
131
130
  Requires-Dist: bs4; extra == "onedrive"
132
131
  Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
132
+ Requires-Dist: msal; extra == "onedrive"
133
133
  Provides-Extra: opensearch
134
134
  Requires-Dist: opensearch-py; extra == "opensearch"
135
135
  Provides-Extra: outlook
136
- Requires-Dist: msal; extra == "outlook"
137
136
  Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
137
+ Requires-Dist: msal; extra == "outlook"
138
138
  Provides-Extra: pinecone
139
139
  Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
140
140
  Provides-Extra: postgres
@@ -144,16 +144,16 @@ Requires-Dist: qdrant-client; extra == "qdrant"
144
144
  Provides-Extra: reddit
145
145
  Requires-Dist: praw; extra == "reddit"
146
146
  Provides-Extra: s3
147
- Requires-Dist: fsspec; extra == "s3"
148
147
  Requires-Dist: s3fs; extra == "s3"
148
+ Requires-Dist: fsspec; extra == "s3"
149
149
  Provides-Extra: sharepoint
150
- Requires-Dist: msal; extra == "sharepoint"
151
150
  Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
151
+ Requires-Dist: msal; extra == "sharepoint"
152
152
  Provides-Extra: salesforce
153
153
  Requires-Dist: simple-salesforce; extra == "salesforce"
154
154
  Provides-Extra: sftp
155
- Requires-Dist: fsspec; extra == "sftp"
156
155
  Requires-Dist: paramiko; extra == "sftp"
156
+ Requires-Dist: fsspec; extra == "sftp"
157
157
  Provides-Extra: slack
158
158
  Requires-Dist: slack_sdk[optional]; extra == "slack"
159
159
  Provides-Extra: snowflake
@@ -12,6 +12,7 @@ from lancedb import AsyncConnection
12
12
  from upath import UPath
13
13
 
14
14
  from test.integration.connectors.utils.constants import DESTINATION_TAG
15
+ from unstructured_ingest.v2.constants import RECORD_ID_LABEL
15
16
  from unstructured_ingest.v2.interfaces.file_data import FileData, SourceIdentifiers
16
17
  from unstructured_ingest.v2.processes.connectors.lancedb.aws import (
17
18
  LanceDBAwsAccessConfig,
@@ -43,7 +44,6 @@ DATABASE_NAME = "database"
43
44
  TABLE_NAME = "elements"
44
45
  DIMENSION = 384
45
46
  NUMBER_EXPECTED_ROWS = 22
46
- NUMBER_EXPECTED_COLUMNS = 10
47
47
  S3_BUCKET = "s3://utic-ingest-test-fixtures/"
48
48
  GS_BUCKET = "gs://utic-test-ingest-fixtures-output/"
49
49
  AZURE_BUCKET = "az://utic-ingest-test-fixtures-output/"
@@ -54,9 +54,9 @@ REQUIRED_ENV_VARS = {
54
54
  "local": (),
55
55
  }
56
56
 
57
-
58
57
  SCHEMA = pa.schema(
59
58
  [
59
+ pa.field(RECORD_ID_LABEL, pa.string()),
60
60
  pa.field("vector", pa.list_(pa.float16(), DIMENSION)),
61
61
  pa.field("text", pa.string(), nullable=True),
62
62
  pa.field("type", pa.string(), nullable=True),
@@ -69,6 +69,7 @@ SCHEMA = pa.schema(
69
69
  pa.field("metadata-page_number", pa.int32(), nullable=True),
70
70
  ]
71
71
  )
72
+ NUMBER_EXPECTED_COLUMNS = len(SCHEMA.names)
72
73
 
73
74
 
74
75
  @pytest_asyncio.fixture
@@ -116,7 +117,7 @@ async def test_lancedb_destination(
116
117
  file_data = FileData(
117
118
  source_identifiers=SourceIdentifiers(fullpath=upload_file.name, filename=upload_file.name),
118
119
  connector_type=CONNECTOR_TYPE,
119
- identifier="mock file data",
120
+ identifier="mock-file-data",
120
121
  )
121
122
  stager = LanceDBUploadStager()
122
123
  uploader = _get_uploader(uri)
@@ -129,17 +130,52 @@ async def test_lancedb_destination(
129
130
 
130
131
  await uploader.run_async(path=staged_file_path, file_data=file_data)
131
132
 
132
- table = await connection.open_table(TABLE_NAME)
133
- table_df: pd.DataFrame = await table.to_pandas()
133
+ # Test upload to empty table
134
+ with await connection.open_table(TABLE_NAME) as table:
135
+ table_df: pd.DataFrame = await table.to_pandas()
134
136
 
135
137
  assert len(table_df) == NUMBER_EXPECTED_ROWS
136
138
  assert len(table_df.columns) == NUMBER_EXPECTED_COLUMNS
137
139
 
140
+ assert table_df[RECORD_ID_LABEL][0] == file_data.identifier
138
141
  assert table_df["element_id"][0] == "2470d8dc42215b3d68413b55bf00fed2"
139
142
  assert table_df["type"][0] == "CompositeElement"
140
143
  assert table_df["metadata-filename"][0] == "DA-1p-with-duplicate-pages.pdf.json"
141
144
  assert table_df["metadata-text_as_html"][0] is None
142
145
 
146
+ # Test upload of the second file, rows should be appended
147
+ file_data.identifier = "mock-file-data-2"
148
+ staged_second_file_path = stager.run(
149
+ elements_filepath=upload_file,
150
+ file_data=file_data,
151
+ output_dir=tmp_path,
152
+ output_filename=f"{upload_file.stem}-2{upload_file.suffix}",
153
+ )
154
+ await uploader.run_async(path=staged_second_file_path, file_data=file_data)
155
+ with await connection.open_table(TABLE_NAME) as table:
156
+ appended_table_df: pd.DataFrame = await table.to_pandas()
157
+ assert len(appended_table_df) == 2 * NUMBER_EXPECTED_ROWS
158
+
159
+ # Test re-upload of the first file, rows should be overwritten, not appended
160
+ await uploader.run_async(path=staged_file_path, file_data=file_data)
161
+ with await connection.open_table(TABLE_NAME) as table:
162
+ overwritten_table_df: pd.DataFrame = await table.to_pandas()
163
+ assert len(overwritten_table_df) == 2 * NUMBER_EXPECTED_ROWS
164
+
165
+
166
+ class TestPrecheck:
167
+ @pytest.mark.tags(CONNECTOR_TYPE, DESTINATION_TAG)
168
+ @pytest.mark.parametrize("connection_with_uri", ["local", "s3", "gcs", "az"], indirect=True)
169
+ def test_succeeds(
170
+ self,
171
+ upload_file: Path,
172
+ connection_with_uri: tuple[AsyncConnection, str],
173
+ tmp_path: Path,
174
+ ) -> None:
175
+ _, uri = connection_with_uri
176
+ uploader = _get_uploader(uri)
177
+ uploader.precheck()
178
+
143
179
 
144
180
  def _get_uri(target: Literal["local", "s3", "gcs", "az"], local_base_path: Path) -> str:
145
181
  if target == "local":
@@ -158,11 +194,12 @@ def _get_uploader(
158
194
  uri: str,
159
195
  ) -> Union[LanceDBAzureUploader, LanceDBAzureUploader, LanceDBAwsUploader, LanceDBGSPUploader]:
160
196
  target = uri.split("://", maxsplit=1)[0] if uri.startswith(("s3", "az", "gs")) else "local"
197
+ upload_config = LanceDBUploaderConfig(table_name=TABLE_NAME)
161
198
  if target == "az":
162
199
  azure_connection_string = os.getenv("AZURE_DEST_CONNECTION_STR")
163
200
  access_config_kwargs = _parse_azure_connection_string(azure_connection_string)
164
201
  return LanceDBAzureUploader(
165
- upload_config=LanceDBUploaderConfig(table_name=TABLE_NAME),
202
+ upload_config=upload_config,
166
203
  connection_config=LanceDBAzureConnectionConfig(
167
204
  access_config=LanceDBAzureAccessConfig(**access_config_kwargs),
168
205
  uri=uri,
@@ -171,7 +208,7 @@ def _get_uploader(
171
208
 
172
209
  elif target == "s3":
173
210
  return LanceDBAwsUploader(
174
- upload_config=LanceDBUploaderConfig(table_name=TABLE_NAME),
211
+ upload_config=upload_config,
175
212
  connection_config=LanceDBAwsConnectionConfig(
176
213
  access_config=LanceDBAwsAccessConfig(
177
214
  aws_access_key_id=os.getenv("S3_INGEST_TEST_ACCESS_KEY"),
@@ -182,7 +219,7 @@ def _get_uploader(
182
219
  )
183
220
  elif target == "gs":
184
221
  return LanceDBGSPUploader(
185
- upload_config=LanceDBUploaderConfig(table_name=TABLE_NAME),
222
+ upload_config=upload_config,
186
223
  connection_config=LanceDBGCSConnectionConfig(
187
224
  access_config=LanceDBGCSAccessConfig(
188
225
  google_service_account_key=os.getenv("GCP_INGEST_SERVICE_KEY")
@@ -192,7 +229,7 @@ def _get_uploader(
192
229
  )
193
230
  else:
194
231
  return LanceDBLocalUploader(
195
- upload_config=LanceDBUploaderConfig(table_name=TABLE_NAME),
232
+ upload_config=upload_config,
196
233
  connection_config=LanceDBLocalConnectionConfig(
197
234
  access_config=LanceDBLocalAccessConfig(),
198
235
  uri=uri,
@@ -1,4 +1,5 @@
1
1
  import json
2
+ import math
2
3
  import os
3
4
  import re
4
5
  import time
@@ -19,6 +20,7 @@ from unstructured_ingest.v2.interfaces import FileData, SourceIdentifiers
19
20
  from unstructured_ingest.v2.logger import logger
20
21
  from unstructured_ingest.v2.processes.connectors.pinecone import (
21
22
  CONNECTOR_TYPE,
23
+ MAX_QUERY_RESULTS,
22
24
  PineconeAccessConfig,
23
25
  PineconeConnectionConfig,
24
26
  PineconeUploader,
@@ -118,7 +120,10 @@ def validate_pinecone_index(
118
120
  f"retry attempt {i}: expected {expected_num_of_vectors} != vector count {vector_count}"
119
121
  )
120
122
  time.sleep(interval)
121
- assert vector_count == expected_num_of_vectors
123
+ assert vector_count == expected_num_of_vectors, (
124
+ f"vector count from index ({vector_count}) doesn't "
125
+ f"match expected number: {expected_num_of_vectors}"
126
+ )
122
127
 
123
128
 
124
129
  @requires_env(API_KEY)
@@ -147,10 +152,7 @@ async def test_pinecone_destination(pinecone_index: str, upload_file: Path, temp
147
152
  uploader = PineconeUploader(connection_config=connection_config, upload_config=upload_config)
148
153
  uploader.precheck()
149
154
 
150
- if uploader.is_async():
151
- await uploader.run_async(path=new_upload_file, file_data=file_data)
152
- else:
153
- uploader.run(path=new_upload_file, file_data=file_data)
155
+ uploader.run(path=new_upload_file, file_data=file_data)
154
156
  with new_upload_file.open() as f:
155
157
  staged_content = json.load(f)
156
158
  expected_num_of_vectors = len(staged_content)
@@ -160,10 +162,59 @@ async def test_pinecone_destination(pinecone_index: str, upload_file: Path, temp
160
162
  )
161
163
 
162
164
  # Rerun uploader and make sure no duplicates exist
163
- if uploader.is_async():
164
- await uploader.run_async(path=new_upload_file, file_data=file_data)
165
- else:
166
- uploader.run(path=new_upload_file, file_data=file_data)
165
+ uploader.run(path=new_upload_file, file_data=file_data)
166
+ logger.info("validating second upload")
167
+ validate_pinecone_index(
168
+ index_name=pinecone_index, expected_num_of_vectors=expected_num_of_vectors
169
+ )
170
+
171
+
172
+ @requires_env(API_KEY)
173
+ @pytest.mark.asyncio
174
+ @pytest.mark.tags(CONNECTOR_TYPE, DESTINATION_TAG)
175
+ @pytest.mark.skip(reason="TODO: get this to work")
176
+ async def test_pinecone_destination_large_index(
177
+ pinecone_index: str, upload_file: Path, temp_dir: Path
178
+ ):
179
+ new_file = temp_dir / "large_file.json"
180
+ with upload_file.open() as f:
181
+ upload_content = json.load(f)
182
+
183
+ min_entries = math.ceil((MAX_QUERY_RESULTS * 2) / len(upload_content))
184
+ new_content = (upload_content * min_entries)[: (2 * MAX_QUERY_RESULTS)]
185
+ print(f"Creating large index content with {len(new_content)} records")
186
+ with new_file.open("w") as f:
187
+ json.dump(new_content, f)
188
+
189
+ expected_num_of_vectors = len(new_content)
190
+ file_data = FileData(
191
+ source_identifiers=SourceIdentifiers(fullpath=new_file.name, filename=new_file.name),
192
+ connector_type=CONNECTOR_TYPE,
193
+ identifier="pinecone_mock_id",
194
+ )
195
+ connection_config = PineconeConnectionConfig(
196
+ index_name=pinecone_index,
197
+ access_config=PineconeAccessConfig(api_key=get_api_key()),
198
+ )
199
+ stager_config = PineconeUploadStagerConfig()
200
+ stager = PineconeUploadStager(upload_stager_config=stager_config)
201
+ new_upload_file = stager.run(
202
+ elements_filepath=new_file,
203
+ output_dir=temp_dir,
204
+ output_filename=new_file.name,
205
+ file_data=file_data,
206
+ )
207
+
208
+ upload_config = PineconeUploaderConfig()
209
+ uploader = PineconeUploader(connection_config=connection_config, upload_config=upload_config)
210
+ uploader.precheck()
211
+
212
+ uploader.run(path=new_upload_file, file_data=file_data)
213
+ validate_pinecone_index(
214
+ index_name=pinecone_index, expected_num_of_vectors=expected_num_of_vectors
215
+ )
216
+ # Rerun uploader and make sure no duplicates exist
217
+ uploader.run(path=new_upload_file, file_data=file_data)
167
218
  logger.info("validating second upload")
168
219
  validate_pinecone_index(
169
220
  index_name=pinecone_index, expected_num_of_vectors=expected_num_of_vectors
@@ -0,0 +1 @@
1
+ __version__ = "0.3.6" # pragma: no cover
@@ -233,8 +233,7 @@ class AzureAISearchUploader(Uploader):
233
233
  raise WriteError(
234
234
  ", ".join(
235
235
  [
236
- f"{error.azure_ai_search_key}: "
237
- f"[{error.status_code}] {error.error_message}"
236
+ f"{error.key}: " f"[{error.status_code}] {error.error_message}"
238
237
  for error in errors
239
238
  ],
240
239
  ),
@@ -142,8 +142,6 @@ class ElasticsearchIndexer(Indexer):
142
142
  def precheck(self) -> None:
143
143
  try:
144
144
  with self.connection_config.get_client() as client:
145
- if not client.ping():
146
- raise SourceConnectionError("cluster not detected")
147
145
  indices = client.indices.get_alias(index="*")
148
146
  if self.index_config.index_name not in indices:
149
147
  raise SourceConnectionError(
@@ -393,11 +391,9 @@ class ElasticsearchUploader(Uploader):
393
391
  def precheck(self) -> None:
394
392
  try:
395
393
  with self.connection_config.get_client() as client:
396
- if not client.ping():
397
- raise DestinationConnectionError("cluster not detected")
398
394
  indices = client.indices.get_alias(index="*")
399
395
  if self.upload_config.index_name not in indices:
400
- raise SourceConnectionError(
396
+ raise DestinationConnectionError(
401
397
  "index {} not found: {}".format(
402
398
  self.upload_config.index_name, ", ".join(indices.keys())
403
399
  )
@@ -15,6 +15,7 @@ from unstructured_ingest.error import DestinationConnectionError
15
15
  from unstructured_ingest.logger import logger
16
16
  from unstructured_ingest.utils.data_prep import flatten_dict
17
17
  from unstructured_ingest.utils.dep_check import requires_dependencies
18
+ from unstructured_ingest.v2.constants import RECORD_ID_LABEL
18
19
  from unstructured_ingest.v2.interfaces.connector import ConnectionConfig
19
20
  from unstructured_ingest.v2.interfaces.file_data import FileData
20
21
  from unstructured_ingest.v2.interfaces.upload_stager import UploadStager, UploadStagerConfig
@@ -84,7 +85,7 @@ class LanceDBUploadStager(UploadStager):
84
85
 
85
86
  df = pd.DataFrame(
86
87
  [
87
- self._conform_element_contents(element_contents)
88
+ self._conform_element_contents(element_contents, file_data)
88
89
  for element_contents in elements_contents
89
90
  ]
90
91
  )
@@ -94,9 +95,10 @@ class LanceDBUploadStager(UploadStager):
94
95
 
95
96
  return output_path
96
97
 
97
- def _conform_element_contents(self, element: dict) -> dict:
98
+ def _conform_element_contents(self, element: dict, file_data: FileData) -> dict:
98
99
  return {
99
100
  "vector": element.pop("embeddings", None),
101
+ RECORD_ID_LABEL: file_data.identifier,
100
102
  **flatten_dict(element, separator="-"),
101
103
  }
102
104
 
@@ -134,6 +136,14 @@ class LanceDBUploader(Uploader):
134
136
  async with self.get_table() as table:
135
137
  schema = await table.schema()
136
138
  df = self._fit_to_schema(df, schema)
139
+ if RECORD_ID_LABEL not in schema.names:
140
+ logger.warning(
141
+ f"Designated table doesn't contain {RECORD_ID_LABEL} column of type"
142
+ " string which is required to support overwriting updates on subsequent"
143
+ " uploads of the same record. New rows will be appended instead."
144
+ )
145
+ else:
146
+ await table.delete(f'{RECORD_ID_LABEL} = "{file_data.identifier}"')
137
147
  await table.add(data=df)
138
148
 
139
149
  def _fit_to_schema(self, df: pd.DataFrame, schema) -> pd.DataFrame:
@@ -31,6 +31,7 @@ CONNECTOR_TYPE = "pinecone"
31
31
  MAX_PAYLOAD_SIZE = 2 * 1024 * 1024 # 2MB
32
32
  MAX_POOL_THREADS = 100
33
33
  MAX_METADATA_BYTES = 40960 # 40KB https://docs.pinecone.io/reference/quotas-and-limits#hard-limits
34
+ MAX_QUERY_RESULTS = 10000
34
35
 
35
36
 
36
37
  class PineconeAccessConfig(AccessConfig):
@@ -84,7 +85,7 @@ ALLOWED_FIELDS = (
84
85
 
85
86
  class PineconeUploadStagerConfig(UploadStagerConfig):
86
87
  metadata_fields: list[str] = Field(
87
- default=str(ALLOWED_FIELDS),
88
+ default=list(ALLOWED_FIELDS),
88
89
  description=(
89
90
  "which metadata from the source element to map to the payload metadata being sent to "
90
91
  "Pinecone."
@@ -137,7 +138,6 @@ class PineconeUploadStager(UploadStager):
137
138
  flatten_lists=True,
138
139
  remove_none=True,
139
140
  )
140
- metadata[RECORD_ID_LABEL] = file_data.identifier
141
141
  metadata_size_bytes = len(json.dumps(metadata).encode())
142
142
  if metadata_size_bytes > MAX_METADATA_BYTES:
143
143
  logger.info(
@@ -146,6 +146,8 @@ class PineconeUploadStager(UploadStager):
146
146
  )
147
147
  metadata = {}
148
148
 
149
+ metadata[RECORD_ID_LABEL] = file_data.identifier
150
+
149
151
  return {
150
152
  "id": str(uuid.uuid4()),
151
153
  "values": embeddings,
@@ -213,6 +215,18 @@ class PineconeUploader(Uploader):
213
215
  f"from pinecone index: {resp}"
214
216
  )
215
217
 
218
+ def delete_by_query(self, index: "PineconeIndex", query_params: dict) -> None:
219
+ while True:
220
+ query_results = index.query(**query_params)
221
+ matches = query_results.get("matches", [])
222
+ if not matches:
223
+ break
224
+ ids = [match["id"] for match in matches]
225
+ delete_params = {"ids": ids}
226
+ if namespace := self.upload_config.namespace:
227
+ delete_params["namespace"] = namespace
228
+ index.delete(**delete_params)
229
+
216
230
  def serverless_delete_by_record_id(self, file_data: FileData) -> None:
217
231
  logger.debug(
218
232
  f"deleting any content with metadata "
@@ -221,29 +235,25 @@ class PineconeUploader(Uploader):
221
235
  )
222
236
  index = self.connection_config.get_index(pool_threads=MAX_POOL_THREADS)
223
237
  index_stats = index.describe_index_stats()
238
+ dimension = index_stats["dimension"]
224
239
  total_vectors = index_stats["total_vector_count"]
225
240
  if total_vectors == 0:
226
241
  return
227
- dimension = index_stats["dimension"]
228
- query_params = {
229
- "filter": {self.upload_config.record_id_key: {"$eq": file_data.identifier}},
230
- "vector": [0] * dimension,
231
- "top_k": total_vectors,
232
- }
233
- if namespace := self.upload_config.namespace:
234
- query_params["namespace"] = namespace
235
- while True:
236
- query_results = index.query(**query_params)
237
- matches = query_results.get("matches", [])
238
- if not matches:
239
- break
240
- ids = [match["id"] for match in matches]
241
- delete_params = {"ids": ids}
242
+ while total_vectors > 0:
243
+ top_k = min(total_vectors, MAX_QUERY_RESULTS)
244
+ query_params = {
245
+ "filter": {self.upload_config.record_id_key: {"$eq": file_data.identifier}},
246
+ "vector": [0] * dimension,
247
+ "top_k": top_k,
248
+ }
242
249
  if namespace := self.upload_config.namespace:
243
- delete_params["namespace"] = namespace
244
- index.delete(**delete_params)
245
- logger.debug(
246
- f"deleted any content with metadata "
250
+ query_params["namespace"] = namespace
251
+ self.delete_by_query(index=index, query_params=query_params)
252
+ index_stats = index.describe_index_stats()
253
+ total_vectors = index_stats["total_vector_count"]
254
+
255
+ logger.info(
256
+ f"deleted {total_vectors} records with metadata "
247
257
  f"{self.upload_config.record_id_key}={file_data.identifier} "
248
258
  f"from pinecone index"
249
259
  )
@@ -10,8 +10,6 @@ from .embedded import CONNECTOR_TYPE as EMBEDDED_WEAVIATE_CONNECTOR_TYPE
10
10
  from .embedded import weaviate_embedded_destination_entry
11
11
  from .local import CONNECTOR_TYPE as LOCAL_WEAVIATE_CONNECTOR_TYPE
12
12
  from .local import weaviate_local_destination_entry
13
- from .weaviate import CONNECTOR_TYPE as WEAVIATE_CONNECTOR_TYPE
14
- from .weaviate import weaviate_destination_entry
15
13
 
16
14
  add_destination_entry(
17
15
  destination_type=LOCAL_WEAVIATE_CONNECTOR_TYPE, entry=weaviate_local_destination_entry
@@ -22,4 +20,3 @@ add_destination_entry(
22
20
  add_destination_entry(
23
21
  destination_type=EMBEDDED_WEAVIATE_CONNECTOR_TYPE, entry=weaviate_embedded_destination_entry
24
22
  )
25
- add_destination_entry(destination_type=WEAVIATE_CONNECTOR_TYPE, entry=weaviate_destination_entry)
@@ -22,7 +22,6 @@ from unstructured_ingest.v2.interfaces import (
22
22
  UploadStagerConfig,
23
23
  )
24
24
  from unstructured_ingest.v2.logger import logger
25
- from unstructured_ingest.v2.processes.connector_registry import DestinationRegistryEntry
26
25
 
27
26
  if TYPE_CHECKING:
28
27
  from weaviate.classes.init import Timeout
@@ -288,12 +287,3 @@ class WeaviateUploader(Uploader, ABC):
288
287
  vector=vector,
289
288
  )
290
289
  self.check_for_errors(client=weaviate_client)
291
-
292
-
293
- weaviate_destination_entry = DestinationRegistryEntry(
294
- connection_config=WeaviateConnectionConfig,
295
- uploader=WeaviateUploader,
296
- uploader_config=WeaviateUploaderConfig,
297
- upload_stager=WeaviateUploadStager,
298
- upload_stager_config=WeaviateUploadStagerConfig,
299
- )