unstructured-ingest 0.7.0__tar.gz → 0.7.2__tar.gz

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (382)
  1. unstructured_ingest-0.7.2/MANIFEST.in +2 -0
  2. {unstructured_ingest-0.7.0/unstructured_ingest.egg-info → unstructured_ingest-0.7.2}/PKG-INFO +24 -23
  3. unstructured_ingest-0.7.2/unstructured_ingest/__version__.py +1 -0
  4. unstructured_ingest-0.7.2/unstructured_ingest/logger.py +39 -0
  5. unstructured_ingest-0.7.2/unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql +10 -0
  6. unstructured_ingest-0.7.2/unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json +23 -0
  7. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/onedrive.py +45 -17
  8. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sharepoint.py +1 -1
  9. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/string_and_date_utils.py +3 -3
  10. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2/unstructured_ingest.egg-info}/PKG-INFO +24 -23
  11. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest.egg-info/SOURCES.txt +2 -1
  12. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest.egg-info/requires.txt +23 -22
  13. unstructured_ingest-0.7.0/MANIFEST.in +0 -2
  14. unstructured_ingest-0.7.0/test/unit/test_logger.py +0 -78
  15. unstructured_ingest-0.7.0/unstructured_ingest/__version__.py +0 -1
  16. unstructured_ingest-0.7.0/unstructured_ingest/logger.py +0 -130
  17. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/LICENSE.md +0 -0
  18. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/README.md +0 -0
  19. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/__init__.py +0 -0
  20. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/airtable.py +0 -0
  21. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/azure_cognitive_search.py +0 -0
  22. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/chroma.py +0 -0
  23. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/couchbase.py +0 -0
  24. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/databricks_volumes_dest.py +0 -0
  25. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/databricks_volumes_source.py +0 -0
  26. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/delta_table.py +0 -0
  27. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/discord_example.py +0 -0
  28. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/elasticsearch.py +0 -0
  29. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/google_drive.py +0 -0
  30. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/kdbai.py +0 -0
  31. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/local.py +0 -0
  32. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/milvus.py +0 -0
  33. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/mongodb.py +0 -0
  34. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/opensearch.py +0 -0
  35. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/pinecone.py +0 -0
  36. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/s3.py +0 -0
  37. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/salesforce.py +0 -0
  38. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/sharepoint.py +0 -0
  39. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/singlestore.py +0 -0
  40. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/sql.py +0 -0
  41. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/vectara.py +0 -0
  42. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/examples/weaviate.py +0 -0
  43. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/pyproject.toml +0 -0
  44. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/setup.cfg +0 -0
  45. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/setup.py +0 -0
  46. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/__init__.py +0 -0
  47. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/__init__.py +0 -0
  48. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/chunkers/__init__.py +0 -0
  49. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/chunkers/test_chunkers.py +0 -0
  50. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/__init__.py +0 -0
  51. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/conftest.py +0 -0
  52. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/databricks/__init__.py +0 -0
  53. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/databricks/test_volumes_native.py +0 -0
  54. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/discord/__init__.py +0 -0
  55. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/discord/test_discord.py +0 -0
  56. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/duckdb/__init__.py +0 -0
  57. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/duckdb/conftest.py +0 -0
  58. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/duckdb/test_duckdb.py +0 -0
  59. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/duckdb/test_motherduck.py +0 -0
  60. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/elasticsearch/__init__.py +0 -0
  61. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/elasticsearch/conftest.py +0 -0
  62. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/elasticsearch/test_elasticsearch.py +0 -0
  63. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/elasticsearch/test_opensearch.py +0 -0
  64. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/__init__.py +0 -0
  65. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/test_databricks_delta_tables.py +0 -0
  66. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/test_postgres.py +0 -0
  67. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/test_singlestore.py +0 -0
  68. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/test_snowflake.py +0 -0
  69. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/test_sqlite.py +0 -0
  70. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/sql/test_vastdb.py +0 -0
  71. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_astradb.py +0 -0
  72. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_azure_ai_search.py +0 -0
  73. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_chroma.py +0 -0
  74. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_confluence.py +0 -0
  75. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_delta_table.py +0 -0
  76. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_dropbox.py +0 -0
  77. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_github.py +0 -0
  78. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_google_drive.py +0 -0
  79. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_jira.py +0 -0
  80. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_lancedb.py +0 -0
  81. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_milvus.py +0 -0
  82. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_mongodb.py +0 -0
  83. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_neo4j.py +0 -0
  84. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_notion.py +0 -0
  85. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_onedrive.py +0 -0
  86. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_pinecone.py +0 -0
  87. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_qdrant.py +0 -0
  88. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_redis.py +0 -0
  89. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_s3.py +0 -0
  90. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_sharepoint.py +0 -0
  91. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_vectara.py +0 -0
  92. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/test_zendesk.py +0 -0
  93. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/__init__.py +0 -0
  94. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/constants.py +0 -0
  95. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/docker.py +0 -0
  96. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/docker_compose.py +0 -0
  97. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/validation/__init__.py +0 -0
  98. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/validation/destination.py +0 -0
  99. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/validation/equality.py +0 -0
  100. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/validation/source.py +0 -0
  101. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/utils/validation/utils.py +0 -0
  102. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/weaviate/__init__.py +0 -0
  103. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/weaviate/conftest.py +0 -0
  104. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/weaviate/test_cloud.py +0 -0
  105. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/connectors/weaviate/test_local.py +0 -0
  106. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/__init__.py +0 -0
  107. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/conftest.py +0 -0
  108. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_azure_openai.py +0 -0
  109. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_bedrock.py +0 -0
  110. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_huggingface.py +0 -0
  111. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_mixedbread.py +0 -0
  112. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_octoai.py +0 -0
  113. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_openai.py +0 -0
  114. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_togetherai.py +0 -0
  115. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_vertexai.py +0 -0
  116. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/test_voyageai.py +0 -0
  117. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/embedders/utils.py +0 -0
  118. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/partitioners/__init__.py +0 -0
  119. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/partitioners/test_partitioner.py +0 -0
  120. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/integration/utils.py +0 -0
  121. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/__init__.py +0 -0
  122. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/chunkers/__init__.py +0 -0
  123. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/chunkers/test_chunkers.py +0 -0
  124. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/__init__.py +0 -0
  125. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/ibm_watsonx/__init__.py +0 -0
  126. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/ibm_watsonx/test_ibm_watsonx_s3.py +0 -0
  127. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/motherduck/__init__.py +0 -0
  128. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/motherduck/test_base.py +0 -0
  129. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/sql/__init__.py +0 -0
  130. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/sql/test_sql.py +0 -0
  131. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/test_confluence.py +0 -0
  132. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/connectors/test_jira.py +0 -0
  133. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embed/__init__.py +0 -0
  134. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embed/test_mixedbreadai.py +0 -0
  135. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embed/test_octoai.py +0 -0
  136. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embed/test_openai.py +0 -0
  137. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embed/test_vertexai.py +0 -0
  138. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embed/test_voyageai.py +0 -0
  139. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/__init__.py +0 -0
  140. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_bedrock.py +0 -0
  141. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_huggingface.py +0 -0
  142. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_mixedbread.py +0 -0
  143. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_octoai.py +0 -0
  144. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_openai.py +0 -0
  145. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_togetherai.py +0 -0
  146. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_vertexai.py +0 -0
  147. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/embedders/test_voyageai.py +0 -0
  148. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/partitioners/__init__.py +0 -0
  149. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/partitioners/test_partitioner.py +0 -0
  150. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/test_error.py +0 -0
  151. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/test_html.py +0 -0
  152. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/test_interfaces.py +0 -0
  153. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/test_utils.py +0 -0
  154. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/utils/__init__.py +0 -0
  155. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/test/unit/utils/data_generator.py +0 -0
  156. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/__init__.py +0 -0
  157. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/__init__.py +0 -0
  158. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/base/__init__.py +0 -0
  159. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/base/cmd.py +0 -0
  160. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/base/dest.py +0 -0
  161. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/base/importer.py +0 -0
  162. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/base/src.py +0 -0
  163. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/cli.py +0 -0
  164. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/cmds.py +0 -0
  165. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/utils/__init__.py +0 -0
  166. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/utils/click.py +0 -0
  167. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/cli/utils/model_conversion.py +0 -0
  168. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/data_types/__init__.py +0 -0
  169. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/data_types/file_data.py +0 -0
  170. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/__init__.py +0 -0
  171. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/azure_openai.py +0 -0
  172. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/bedrock.py +0 -0
  173. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/huggingface.py +0 -0
  174. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/interfaces.py +0 -0
  175. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  176. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/octoai.py +0 -0
  177. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/openai.py +0 -0
  178. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/togetherai.py +0 -0
  179. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/vertexai.py +0 -0
  180. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/embed/voyageai.py +0 -0
  181. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/error.py +0 -0
  182. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/errors_v2.py +0 -0
  183. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/__init__.py +0 -0
  184. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/connector.py +0 -0
  185. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/downloader.py +0 -0
  186. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/indexer.py +0 -0
  187. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/process.py +0 -0
  188. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/processor.py +0 -0
  189. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/upload_stager.py +0 -0
  190. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/interfaces/uploader.py +0 -0
  191. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/main.py +0 -0
  192. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/otel.py +0 -0
  193. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/__init__.py +0 -0
  194. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/interfaces.py +0 -0
  195. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/otel.py +0 -0
  196. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/pipeline.py +0 -0
  197. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/__init__.py +0 -0
  198. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/chunk.py +0 -0
  199. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/download.py +0 -0
  200. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/embed.py +0 -0
  201. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/filter.py +0 -0
  202. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/index.py +0 -0
  203. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/partition.py +0 -0
  204. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/stage.py +0 -0
  205. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/uncompress.py +0 -0
  206. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/pipeline/steps/upload.py +0 -0
  207. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/__init__.py +0 -0
  208. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/chunker.py +0 -0
  209. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connector_registry.py +0 -0
  210. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/__init__.py +0 -0
  211. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/airtable.py +0 -0
  212. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/assets/__init__.py +0 -0
  213. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/astradb.py +0 -0
  214. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/azure_ai_search.py +0 -0
  215. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/chroma.py +0 -0
  216. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/confluence.py +0 -0
  217. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/couchbase.py +0 -0
  218. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/__init__.py +0 -0
  219. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/volumes.py +0 -0
  220. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/volumes_aws.py +0 -0
  221. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/volumes_azure.py +0 -0
  222. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/volumes_gcp.py +0 -0
  223. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/volumes_native.py +0 -0
  224. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/databricks/volumes_table.py +0 -0
  225. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/delta_table.py +0 -0
  226. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/discord.py +0 -0
  227. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/duckdb/__init__.py +0 -0
  228. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/duckdb/base.py +0 -0
  229. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/duckdb/duckdb.py +0 -0
  230. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/duckdb/motherduck.py +0 -0
  231. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/elasticsearch/__init__.py +0 -0
  232. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py +0 -0
  233. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/elasticsearch/opensearch.py +0 -0
  234. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/__init__.py +0 -0
  235. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/azure.py +0 -0
  236. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/box.py +0 -0
  237. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/dropbox.py +0 -0
  238. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/fsspec.py +0 -0
  239. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/gcs.py +0 -0
  240. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/s3.py +0 -0
  241. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/sftp.py +0 -0
  242. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/fsspec/utils.py +0 -0
  243. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/github.py +0 -0
  244. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/gitlab.py +0 -0
  245. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/google_drive.py +0 -0
  246. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py +0 -0
  247. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +0 -0
  248. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/jira.py +0 -0
  249. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/kafka/__init__.py +0 -0
  250. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/kafka/cloud.py +0 -0
  251. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/kafka/kafka.py +0 -0
  252. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/kafka/local.py +0 -0
  253. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/kdbai.py +0 -0
  254. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/__init__.py +0 -0
  255. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/aws.py +0 -0
  256. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/azure.py +0 -0
  257. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/cloud.py +0 -0
  258. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/gcp.py +0 -0
  259. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/lancedb.py +0 -0
  260. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/lancedb/local.py +0 -0
  261. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/local.py +0 -0
  262. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/milvus.py +0 -0
  263. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/mongodb.py +0 -0
  264. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/neo4j.py +0 -0
  265. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/__init__.py +0 -0
  266. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/client.py +0 -0
  267. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/connector.py +0 -0
  268. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/helpers.py +0 -0
  269. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/__init__.py +0 -0
  270. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_common.py +0 -0
  271. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py +0 -0
  272. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +0 -0
  273. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/interfaces.py +0 -0
  274. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/__init__.py +0 -0
  275. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/block.py +0 -0
  276. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/__init__.py +0 -0
  277. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py +0 -0
  278. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py +0 -0
  279. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -0
  280. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/callout.py +0 -0
  281. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py +0 -0
  282. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py +0 -0
  283. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/code.py +0 -0
  284. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py +0 -0
  285. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/divider.py +0 -0
  286. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/embed.py +0 -0
  287. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/equation.py +0 -0
  288. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/file.py +0 -0
  289. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/heading.py +0 -0
  290. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/image.py +0 -0
  291. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py +0 -0
  292. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py +0 -0
  293. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py +0 -0
  294. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py +0 -0
  295. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py +0 -0
  296. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/quote.py +0 -0
  297. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +0 -0
  298. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/table.py +0 -0
  299. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py +0 -0
  300. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/template.py +0 -0
  301. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/todo.py +0 -0
  302. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py +0 -0
  303. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py +0 -0
  304. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/blocks/video.py +0 -0
  305. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database.py +0 -0
  306. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py +0 -0
  307. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py +0 -0
  308. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py +0 -0
  309. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py +0 -0
  310. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/date.py +0 -0
  311. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/email.py +0 -0
  312. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/files.py +0 -0
  313. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py +0 -0
  314. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -0
  315. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py +0 -0
  316. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py +0 -0
  317. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/number.py +0 -0
  318. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/people.py +0 -0
  319. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py +0 -0
  320. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py +0 -0
  321. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py +0 -0
  322. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py +0 -0
  323. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/select.py +0 -0
  324. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/status.py +0 -0
  325. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/title.py +0 -0
  326. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py +0 -0
  327. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/url.py +0 -0
  328. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py +0 -0
  329. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/date.py +0 -0
  330. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/file.py +0 -0
  331. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/page.py +0 -0
  332. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/parent.py +0 -0
  333. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/rich_text.py +0 -0
  334. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/notion/types/user.py +0 -0
  335. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/outlook.py +0 -0
  336. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/pinecone.py +0 -0
  337. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/qdrant/__init__.py +0 -0
  338. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/qdrant/cloud.py +0 -0
  339. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/qdrant/local.py +0 -0
  340. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/qdrant/qdrant.py +0 -0
  341. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/qdrant/server.py +0 -0
  342. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/redisdb.py +0 -0
  343. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/salesforce.py +0 -0
  344. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/slack.py +0 -0
  345. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/__init__.py +0 -0
  346. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py +0 -0
  347. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/postgres.py +0 -0
  348. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/singlestore.py +0 -0
  349. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/snowflake.py +0 -0
  350. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/sql.py +0 -0
  351. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/sqlite.py +0 -0
  352. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/sql/vastdb.py +0 -0
  353. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/utils.py +0 -0
  354. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/vectara.py +0 -0
  355. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/weaviate/__init__.py +0 -0
  356. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/weaviate/cloud.py +0 -0
  357. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/weaviate/embedded.py +0 -0
  358. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/weaviate/local.py +0 -0
  359. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/weaviate/weaviate.py +0 -0
  360. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/zendesk/__init__.py +0 -0
  361. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/zendesk/client.py +0 -0
  362. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/connectors/zendesk/zendesk.py +0 -0
  363. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/embedder.py +0 -0
  364. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/filter.py +0 -0
  365. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/partitioner.py +0 -0
  366. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/uncompress.py +0 -0
  367. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/utils/__init__.py +0 -0
  368. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/processes/utils/blob_storage.py +0 -0
  369. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/unstructured_api.py +0 -0
  370. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/__init__.py +0 -0
  371. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/chunking.py +0 -0
  372. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/compression.py +0 -0
  373. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/constants.py +0 -0
  374. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/data_prep.py +0 -0
  375. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/dep_check.py +0 -0
  376. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/html.py +0 -0
  377. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/ndjson.py +0 -0
  378. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/pydantic_models.py +0 -0
  379. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest/utils/table.py +0 -0
  380. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  381. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest.egg-info/entry_points.txt +0 -0
  382. {unstructured_ingest-0.7.0 → unstructured_ingest-0.7.2}/unstructured_ingest.egg-info/top_level.txt +0 -0
@@ -0,0 +1,2 @@
1
+ # Connector specific assets
2
+ include unstructured_ingest/processes/connectors/assets/*
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: unstructured-ingest
3
- Version: 0.7.0
3
+ Version: 0.7.2
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,12 +22,12 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.14
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
+ Requires-Dist: click
26
+ Requires-Dist: pydantic>=2.7
27
+ Requires-Dist: opentelemetry-sdk
25
28
  Requires-Dist: tqdm
26
29
  Requires-Dist: python-dateutil
27
- Requires-Dist: click
28
30
  Requires-Dist: dataclasses_json
29
- Requires-Dist: opentelemetry-sdk
30
- Requires-Dist: pydantic>=2.7
31
31
  Requires-Dist: numpy
32
32
  Requires-Dist: pandas
33
33
  Provides-Extra: remote
@@ -103,8 +103,8 @@ Requires-Dist: astrapy; extra == "astradb"
103
103
  Requires-Dist: numpy; extra == "astradb"
104
104
  Requires-Dist: pandas; extra == "astradb"
105
105
  Provides-Extra: azure
106
- Requires-Dist: adlfs; extra == "azure"
107
106
  Requires-Dist: fsspec; extra == "azure"
107
+ Requires-Dist: adlfs; extra == "azure"
108
108
  Requires-Dist: numpy; extra == "azure"
109
109
  Requires-Dist: pandas; extra == "azure"
110
110
  Provides-Extra: azure-ai-search
@@ -139,8 +139,8 @@ Requires-Dist: couchbase; extra == "couchbase"
139
139
  Requires-Dist: numpy; extra == "couchbase"
140
140
  Requires-Dist: pandas; extra == "couchbase"
141
141
  Provides-Extra: delta-table
142
- Requires-Dist: boto3; extra == "delta-table"
143
142
  Requires-Dist: deltalake; extra == "delta-table"
143
+ Requires-Dist: boto3; extra == "delta-table"
144
144
  Requires-Dist: numpy; extra == "delta-table"
145
145
  Requires-Dist: pandas; extra == "delta-table"
146
146
  Provides-Extra: discord
@@ -148,8 +148,8 @@ Requires-Dist: discord.py; extra == "discord"
148
148
  Requires-Dist: numpy; extra == "discord"
149
149
  Requires-Dist: pandas; extra == "discord"
150
150
  Provides-Extra: dropbox
151
- Requires-Dist: dropboxdrivefs; extra == "dropbox"
152
151
  Requires-Dist: fsspec; extra == "dropbox"
152
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
153
153
  Requires-Dist: numpy; extra == "dropbox"
154
154
  Requires-Dist: pandas; extra == "dropbox"
155
155
  Provides-Extra: duckdb
@@ -161,9 +161,9 @@ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
161
161
  Requires-Dist: numpy; extra == "elasticsearch"
162
162
  Requires-Dist: pandas; extra == "elasticsearch"
163
163
  Provides-Extra: gcs
164
+ Requires-Dist: fsspec; extra == "gcs"
164
165
  Requires-Dist: bs4; extra == "gcs"
165
166
  Requires-Dist: gcsfs; extra == "gcs"
166
- Requires-Dist: fsspec; extra == "gcs"
167
167
  Requires-Dist: numpy; extra == "gcs"
168
168
  Requires-Dist: pandas; extra == "gcs"
169
169
  Provides-Extra: github
@@ -180,15 +180,15 @@ Requires-Dist: google-api-python-client; extra == "google-drive"
180
180
  Requires-Dist: numpy; extra == "google-drive"
181
181
  Requires-Dist: pandas; extra == "google-drive"
182
182
  Provides-Extra: hubspot
183
- Requires-Dist: hubspot-api-client; extra == "hubspot"
184
183
  Requires-Dist: urllib3; extra == "hubspot"
184
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
185
185
  Requires-Dist: numpy; extra == "hubspot"
186
186
  Requires-Dist: pandas; extra == "hubspot"
187
187
  Provides-Extra: ibm-watsonx-s3
188
188
  Requires-Dist: pyiceberg; extra == "ibm-watsonx-s3"
189
189
  Requires-Dist: tenacity; extra == "ibm-watsonx-s3"
190
- Requires-Dist: httpx; extra == "ibm-watsonx-s3"
191
190
  Requires-Dist: pyarrow; extra == "ibm-watsonx-s3"
191
+ Requires-Dist: httpx; extra == "ibm-watsonx-s3"
192
192
  Requires-Dist: numpy; extra == "ibm-watsonx-s3"
193
193
  Requires-Dist: pandas; extra == "ibm-watsonx-s3"
194
194
  Provides-Extra: jira
@@ -216,22 +216,22 @@ Requires-Dist: pymongo; extra == "mongodb"
216
216
  Requires-Dist: numpy; extra == "mongodb"
217
217
  Requires-Dist: pandas; extra == "mongodb"
218
218
  Provides-Extra: neo4j
219
- Requires-Dist: networkx; extra == "neo4j"
220
219
  Requires-Dist: cymple; extra == "neo4j"
220
+ Requires-Dist: networkx; extra == "neo4j"
221
221
  Requires-Dist: neo4j-rust-ext; extra == "neo4j"
222
222
  Requires-Dist: numpy; extra == "neo4j"
223
223
  Requires-Dist: pandas; extra == "neo4j"
224
224
  Provides-Extra: notion
225
- Requires-Dist: backoff; extra == "notion"
226
- Requires-Dist: htmlBuilder; extra == "notion"
227
225
  Requires-Dist: httpx; extra == "notion"
226
+ Requires-Dist: htmlBuilder; extra == "notion"
227
+ Requires-Dist: backoff; extra == "notion"
228
228
  Requires-Dist: notion-client; extra == "notion"
229
229
  Requires-Dist: numpy; extra == "notion"
230
230
  Requires-Dist: pandas; extra == "notion"
231
231
  Provides-Extra: onedrive
232
- Requires-Dist: bs4; extra == "onedrive"
233
- Requires-Dist: msal; extra == "onedrive"
234
232
  Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
233
+ Requires-Dist: msal; extra == "onedrive"
234
+ Requires-Dist: requests; extra == "onedrive"
235
235
  Requires-Dist: numpy; extra == "onedrive"
236
236
  Requires-Dist: pandas; extra == "onedrive"
237
237
  Provides-Extra: opensearch
@@ -239,8 +239,8 @@ Requires-Dist: opensearch-py; extra == "opensearch"
239
239
  Requires-Dist: numpy; extra == "opensearch"
240
240
  Requires-Dist: pandas; extra == "opensearch"
241
241
  Provides-Extra: outlook
242
- Requires-Dist: msal; extra == "outlook"
243
242
  Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
243
+ Requires-Dist: msal; extra == "outlook"
244
244
  Requires-Dist: numpy; extra == "outlook"
245
245
  Requires-Dist: pandas; extra == "outlook"
246
246
  Provides-Extra: pinecone
@@ -269,8 +269,9 @@ Requires-Dist: s3fs; extra == "s3"
269
269
  Requires-Dist: numpy; extra == "s3"
270
270
  Requires-Dist: pandas; extra == "s3"
271
271
  Provides-Extra: sharepoint
272
- Requires-Dist: msal; extra == "sharepoint"
273
272
  Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
273
+ Requires-Dist: msal; extra == "sharepoint"
274
+ Requires-Dist: requests; extra == "sharepoint"
274
275
  Requires-Dist: numpy; extra == "sharepoint"
275
276
  Requires-Dist: pandas; extra == "sharepoint"
276
277
  Provides-Extra: salesforce
@@ -278,8 +279,8 @@ Requires-Dist: simple-salesforce; extra == "salesforce"
278
279
  Requires-Dist: numpy; extra == "salesforce"
279
280
  Requires-Dist: pandas; extra == "salesforce"
280
281
  Provides-Extra: sftp
281
- Requires-Dist: paramiko; extra == "sftp"
282
282
  Requires-Dist: fsspec; extra == "sftp"
283
+ Requires-Dist: paramiko; extra == "sftp"
283
284
  Requires-Dist: numpy; extra == "sftp"
284
285
  Requires-Dist: pandas; extra == "sftp"
285
286
  Provides-Extra: slack
@@ -287,8 +288,8 @@ Requires-Dist: slack_sdk[optional]; extra == "slack"
287
288
  Requires-Dist: numpy; extra == "slack"
288
289
  Requires-Dist: pandas; extra == "slack"
289
290
  Provides-Extra: snowflake
290
- Requires-Dist: psycopg2-binary; extra == "snowflake"
291
291
  Requires-Dist: snowflake-connector-python; extra == "snowflake"
292
+ Requires-Dist: psycopg2-binary; extra == "snowflake"
292
293
  Requires-Dist: numpy; extra == "snowflake"
293
294
  Requires-Dist: pandas; extra == "snowflake"
294
295
  Provides-Extra: wikipedia
@@ -312,21 +313,21 @@ Requires-Dist: singlestoredb; extra == "singlestore"
312
313
  Requires-Dist: numpy; extra == "singlestore"
313
314
  Requires-Dist: pandas; extra == "singlestore"
314
315
  Provides-Extra: vectara
315
- Requires-Dist: aiofiles; extra == "vectara"
316
316
  Requires-Dist: httpx; extra == "vectara"
317
+ Requires-Dist: aiofiles; extra == "vectara"
317
318
  Requires-Dist: requests; extra == "vectara"
318
319
  Requires-Dist: numpy; extra == "vectara"
319
320
  Requires-Dist: pandas; extra == "vectara"
320
321
  Provides-Extra: vastdb
321
322
  Requires-Dist: ibis; extra == "vastdb"
322
- Requires-Dist: pyarrow; extra == "vastdb"
323
323
  Requires-Dist: vastdb; extra == "vastdb"
324
+ Requires-Dist: pyarrow; extra == "vastdb"
324
325
  Requires-Dist: numpy; extra == "vastdb"
325
326
  Requires-Dist: pandas; extra == "vastdb"
326
327
  Provides-Extra: zendesk
328
+ Requires-Dist: aiofiles; extra == "zendesk"
327
329
  Requires-Dist: bs4; extra == "zendesk"
328
330
  Requires-Dist: httpx; extra == "zendesk"
329
- Requires-Dist: aiofiles; extra == "zendesk"
330
331
  Requires-Dist: numpy; extra == "zendesk"
331
332
  Requires-Dist: pandas; extra == "zendesk"
332
333
  Provides-Extra: embed-huggingface
@@ -356,8 +357,8 @@ Requires-Dist: tiktoken; extra == "openai"
356
357
  Requires-Dist: numpy; extra == "openai"
357
358
  Requires-Dist: pandas; extra == "openai"
358
359
  Provides-Extra: bedrock
359
- Requires-Dist: boto3; extra == "bedrock"
360
360
  Requires-Dist: aioboto3; extra == "bedrock"
361
+ Requires-Dist: boto3; extra == "bedrock"
361
362
  Requires-Dist: numpy; extra == "bedrock"
362
363
  Requires-Dist: pandas; extra == "bedrock"
363
364
  Provides-Extra: togetherai
@@ -0,0 +1 @@
1
+ __version__ = "0.7.2" # pragma: no cover
@@ -0,0 +1,39 @@
1
+ import logging
2
+
3
+ logger = logging.getLogger("unstructured_ingest")
4
+
5
+
6
def remove_root_handlers(logger: logging.Logger) -> None:
    """Detach every handler currently attached to the root logger.

    NOTE(robinson): in some environments such as Google Colab, there is a root
    handler that does not mask secrets, meaning sensitive info such as api keys
    appear in logs. Removing these when they exist prevents this behavior.

    Args:
        logger: Any logger instance; only its ``root`` attribute is used.
    """
    # Iterate over a snapshot: removeHandler() mutates ``root.handlers`` in place,
    # and looping over the live list would skip every other handler.
    for handler in list(logger.root.handlers):
        logger.root.removeHandler(handler)
13
+
14
+
15
def ingest_log_streaming_init(level: int) -> None:
    """Set up stream logging on the module-level ingest logger.

    Builds a named ``StreamHandler`` with the ingest log format, attaches it to
    the module-level ``logger`` unless a handler with that name is already
    present, strips the root logger's handlers, and applies ``level``.

    Args:
        level: Logging level to set on the module-level logger.
    """
    stream_handler = logging.StreamHandler()
    stream_handler.name = "ingest_log_handler"
    stream_handler.setFormatter(
        logging.Formatter("%(asctime)s %(processName)-10s %(levelname)-8s %(message)s")
    )

    # The handler must be attached at most once, so look for its name first.
    already_attached = any(h.name == "ingest_log_handler" for h in logger.handlers)
    if not already_attached:
        logger.addHandler(stream_handler)

    remove_root_handlers(logger)
    logger.setLevel(level)
27
+
28
+
29
def make_default_logger(level: int) -> logging.Logger:
    """Return the ``unstructured_ingest`` logger with the ingest stream handler attached.

    The handler is attached only if no handler named ``ingest_log_handler`` is
    already present, so calling this function repeatedly does not duplicate
    log output. The root logger's handlers are removed as part of the setup.

    Args:
        level: Logging level to set on the returned logger.

    Returns:
        The configured ``unstructured_ingest`` logger.
    """
    logger = logging.getLogger("unstructured_ingest")
    # logging.getLogger() returns the same object for the same name, so without
    # this guard every call would stack another handler and repeat each record.
    if not any(h.name == "ingest_log_handler" for h in logger.handlers):
        handler = logging.StreamHandler()
        handler.name = "ingest_log_handler"
        handler.setFormatter(
            logging.Formatter("%(asctime)s %(processName)-10s %(levelname)-8s %(message)s")
        )
        logger.addHandler(handler)
    logger.setLevel(level)
    remove_root_handlers(logger)
    return logger
@@ -0,0 +1,10 @@
1
+ CREATE TABLE elements (
2
+ id STRING NOT NULL PRIMARY KEY,
3
+ record_id STRING NOT NULL,
4
+ element_id STRING NOT NULL,
5
+ text STRING,
6
+ embeddings ARRAY<FLOAT>,
7
+ type STRING,
8
+ metadata VARIANT
9
+ );
10
+
@@ -0,0 +1,23 @@
1
+ {
2
+ "properties": [
3
+ {
4
+ "dataType": [
5
+ "text"
6
+ ],
7
+ "indexFilterable": true,
8
+ "indexSearchable": true,
9
+ "name": "record_id",
10
+ "tokenization": "word"
11
+ },
12
+ {
13
+ "dataType": [
14
+ "text"
15
+ ],
16
+ "indexFilterable": true,
17
+ "indexSearchable": true,
18
+ "name": "text",
19
+ "tokenization": "word"
20
+ }
21
+ ],
22
+ "vectorizer": "none"
23
+ }
@@ -53,11 +53,14 @@ MAX_BYTES_SIZE = 512_000_000
53
53
 
54
54
  class OnedriveAccessConfig(AccessConfig):
55
55
  client_cred: str = Field(description="Microsoft App client secret")
56
+ password: Optional[str] = Field(description="Service account password", default=None)
56
57
 
57
58
 
58
59
  class OnedriveConnectionConfig(ConnectionConfig):
59
60
  client_id: str = Field(description="Microsoft app client ID")
60
- user_pname: str = Field(description="User principal name, usually is your Azure AD email.")
61
+ user_pname: str = Field(
62
+ description="User principal name or service account, usually your Azure AD email."
63
+ )
61
64
  tenant: str = Field(
62
65
  repr=False, description="ID or domain name associated with your Azure AD instance"
63
66
  )
@@ -74,25 +77,50 @@ class OnedriveConnectionConfig(ConnectionConfig):
74
77
  drive = client.users[self.user_pname].drive
75
78
  return drive
76
79
 
77
- @requires_dependencies(["msal"], extras="onedrive")
80
+ @requires_dependencies(["msal", "requests"], extras="onedrive")
78
81
  def get_token(self):
79
82
  from msal import ConfidentialClientApplication
83
+ from requests import post
84
+
85
+ if self.access_config.get_secret_value().password:
86
+ url = f"https://login.microsoftonline.com/{self.tenant}/oauth2/v2.0/token"
87
+ headers = {"Content-Type": "application/x-www-form-urlencoded"}
88
+ data = {
89
+ "grant_type": "password",
90
+ "username": self.user_pname,
91
+ "password": self.access_config.get_secret_value().password,
92
+ "client_id": self.client_id,
93
+ "client_secret": self.access_config.get_secret_value().client_cred,
94
+ "scope": "https://graph.microsoft.com/.default",
95
+ }
96
+ response = post(url, headers=headers, data=data)
97
+ if response.status_code == 200:
98
+ return response.json()
99
+ else:
100
+ raise SourceConnectionError(
101
+ f"Oauth2 authentication failed with {response.status_code}: {response.text}"
102
+ )
80
103
 
81
- try:
82
- app = ConfidentialClientApplication(
83
- authority=f"{self.authority_url}/{self.tenant}",
84
- client_id=self.client_id,
85
- client_credential=self.access_config.get_secret_value().client_cred,
86
- )
87
- token = app.acquire_token_for_client(scopes=["https://graph.microsoft.com/.default"])
88
- except ValueError as exc:
89
- logger.error("Couldn't set up credentials for OneDrive")
90
- raise exc
91
- if "error" in token:
92
- raise SourceConnectionNetworkError(
93
- "failed to fetch token, {}: {}".format(token["error"], token["error_description"])
94
- )
95
- return token
104
+ else:
105
+ try:
106
+ app = ConfidentialClientApplication(
107
+ authority=f"{self.authority_url}/{self.tenant}",
108
+ client_id=self.client_id,
109
+ client_credential=self.access_config.get_secret_value().client_cred,
110
+ )
111
+ token = app.acquire_token_for_client(
112
+ scopes=["https://graph.microsoft.com/.default"]
113
+ )
114
+ except ValueError as exc:
115
+ logger.error("Couldn't set up credentials.")
116
+ raise exc
117
+ if "error" in token:
118
+ raise SourceConnectionNetworkError(
119
+ "failed to fetch token, {}: {}".format(
120
+ token["error"], token["error_description"]
121
+ )
122
+ )
123
+ return token
96
124
 
97
125
  @requires_dependencies(["office365"], extras="onedrive")
98
126
  def get_client(self) -> "GraphClient":
@@ -100,7 +100,7 @@ class SharepointDownloader(OnedriveDownloader):
100
100
  connector_type: str = CONNECTOR_TYPE
101
101
 
102
102
  @SourceConnectionNetworkError.wrap
103
- @requires_dependencies(["office365"], extras="onedrive")
103
+ @requires_dependencies(["office365"], extras="sharepoint")
104
104
  def _fetch_file(self, file_data: FileData) -> DriveItem:
105
105
  from office365.runtime.client_request_exception import ClientRequestException
106
106
 
@@ -1,14 +1,14 @@
1
1
  import json
2
2
  import re
3
- import typing as t
4
3
  from datetime import datetime
4
+ from typing import Any, Union
5
5
 
6
6
  from dateutil import parser
7
7
 
8
8
  from unstructured_ingest.logger import logger
9
9
 
10
10
 
11
- def json_to_dict(json_string: str) -> t.Union[str, t.Dict[str, t.Any]]:
11
+ def json_to_dict(json_string: str) -> Union[str, dict[str, Any]]:
12
12
  """Helper function attempts to deserialize json string to a dictionary."""
13
13
  try:
14
14
  return json.loads(json_string)
@@ -24,7 +24,7 @@ def json_to_dict(json_string: str) -> t.Union[str, t.Dict[str, t.Any]]:
24
24
  return json_string
25
25
 
26
26
 
27
- def ensure_isoformat_datetime(timestamp: t.Union[datetime, str]) -> str:
27
+ def ensure_isoformat_datetime(timestamp: Union[datetime, str]) -> str:
28
28
  """
29
29
  Ensures that the input value is converted to an ISO format datetime string.
30
30
  Handles both datetime objects and strings.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: unstructured-ingest
3
- Version: 0.7.0
3
+ Version: 0.7.2
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,12 +22,12 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.14
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
+ Requires-Dist: click
26
+ Requires-Dist: pydantic>=2.7
27
+ Requires-Dist: opentelemetry-sdk
25
28
  Requires-Dist: tqdm
26
29
  Requires-Dist: python-dateutil
27
- Requires-Dist: click
28
30
  Requires-Dist: dataclasses_json
29
- Requires-Dist: opentelemetry-sdk
30
- Requires-Dist: pydantic>=2.7
31
31
  Requires-Dist: numpy
32
32
  Requires-Dist: pandas
33
33
  Provides-Extra: remote
@@ -103,8 +103,8 @@ Requires-Dist: astrapy; extra == "astradb"
103
103
  Requires-Dist: numpy; extra == "astradb"
104
104
  Requires-Dist: pandas; extra == "astradb"
105
105
  Provides-Extra: azure
106
- Requires-Dist: adlfs; extra == "azure"
107
106
  Requires-Dist: fsspec; extra == "azure"
107
+ Requires-Dist: adlfs; extra == "azure"
108
108
  Requires-Dist: numpy; extra == "azure"
109
109
  Requires-Dist: pandas; extra == "azure"
110
110
  Provides-Extra: azure-ai-search
@@ -139,8 +139,8 @@ Requires-Dist: couchbase; extra == "couchbase"
139
139
  Requires-Dist: numpy; extra == "couchbase"
140
140
  Requires-Dist: pandas; extra == "couchbase"
141
141
  Provides-Extra: delta-table
142
- Requires-Dist: boto3; extra == "delta-table"
143
142
  Requires-Dist: deltalake; extra == "delta-table"
143
+ Requires-Dist: boto3; extra == "delta-table"
144
144
  Requires-Dist: numpy; extra == "delta-table"
145
145
  Requires-Dist: pandas; extra == "delta-table"
146
146
  Provides-Extra: discord
@@ -148,8 +148,8 @@ Requires-Dist: discord.py; extra == "discord"
148
148
  Requires-Dist: numpy; extra == "discord"
149
149
  Requires-Dist: pandas; extra == "discord"
150
150
  Provides-Extra: dropbox
151
- Requires-Dist: dropboxdrivefs; extra == "dropbox"
152
151
  Requires-Dist: fsspec; extra == "dropbox"
152
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
153
153
  Requires-Dist: numpy; extra == "dropbox"
154
154
  Requires-Dist: pandas; extra == "dropbox"
155
155
  Provides-Extra: duckdb
@@ -161,9 +161,9 @@ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
161
161
  Requires-Dist: numpy; extra == "elasticsearch"
162
162
  Requires-Dist: pandas; extra == "elasticsearch"
163
163
  Provides-Extra: gcs
164
+ Requires-Dist: fsspec; extra == "gcs"
164
165
  Requires-Dist: bs4; extra == "gcs"
165
166
  Requires-Dist: gcsfs; extra == "gcs"
166
- Requires-Dist: fsspec; extra == "gcs"
167
167
  Requires-Dist: numpy; extra == "gcs"
168
168
  Requires-Dist: pandas; extra == "gcs"
169
169
  Provides-Extra: github
@@ -180,15 +180,15 @@ Requires-Dist: google-api-python-client; extra == "google-drive"
180
180
  Requires-Dist: numpy; extra == "google-drive"
181
181
  Requires-Dist: pandas; extra == "google-drive"
182
182
  Provides-Extra: hubspot
183
- Requires-Dist: hubspot-api-client; extra == "hubspot"
184
183
  Requires-Dist: urllib3; extra == "hubspot"
184
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
185
185
  Requires-Dist: numpy; extra == "hubspot"
186
186
  Requires-Dist: pandas; extra == "hubspot"
187
187
  Provides-Extra: ibm-watsonx-s3
188
188
  Requires-Dist: pyiceberg; extra == "ibm-watsonx-s3"
189
189
  Requires-Dist: tenacity; extra == "ibm-watsonx-s3"
190
- Requires-Dist: httpx; extra == "ibm-watsonx-s3"
191
190
  Requires-Dist: pyarrow; extra == "ibm-watsonx-s3"
191
+ Requires-Dist: httpx; extra == "ibm-watsonx-s3"
192
192
  Requires-Dist: numpy; extra == "ibm-watsonx-s3"
193
193
  Requires-Dist: pandas; extra == "ibm-watsonx-s3"
194
194
  Provides-Extra: jira
@@ -216,22 +216,22 @@ Requires-Dist: pymongo; extra == "mongodb"
216
216
  Requires-Dist: numpy; extra == "mongodb"
217
217
  Requires-Dist: pandas; extra == "mongodb"
218
218
  Provides-Extra: neo4j
219
- Requires-Dist: networkx; extra == "neo4j"
220
219
  Requires-Dist: cymple; extra == "neo4j"
220
+ Requires-Dist: networkx; extra == "neo4j"
221
221
  Requires-Dist: neo4j-rust-ext; extra == "neo4j"
222
222
  Requires-Dist: numpy; extra == "neo4j"
223
223
  Requires-Dist: pandas; extra == "neo4j"
224
224
  Provides-Extra: notion
225
- Requires-Dist: backoff; extra == "notion"
226
- Requires-Dist: htmlBuilder; extra == "notion"
227
225
  Requires-Dist: httpx; extra == "notion"
226
+ Requires-Dist: htmlBuilder; extra == "notion"
227
+ Requires-Dist: backoff; extra == "notion"
228
228
  Requires-Dist: notion-client; extra == "notion"
229
229
  Requires-Dist: numpy; extra == "notion"
230
230
  Requires-Dist: pandas; extra == "notion"
231
231
  Provides-Extra: onedrive
232
- Requires-Dist: bs4; extra == "onedrive"
233
- Requires-Dist: msal; extra == "onedrive"
234
232
  Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
233
+ Requires-Dist: msal; extra == "onedrive"
234
+ Requires-Dist: requests; extra == "onedrive"
235
235
  Requires-Dist: numpy; extra == "onedrive"
236
236
  Requires-Dist: pandas; extra == "onedrive"
237
237
  Provides-Extra: opensearch
@@ -239,8 +239,8 @@ Requires-Dist: opensearch-py; extra == "opensearch"
239
239
  Requires-Dist: numpy; extra == "opensearch"
240
240
  Requires-Dist: pandas; extra == "opensearch"
241
241
  Provides-Extra: outlook
242
- Requires-Dist: msal; extra == "outlook"
243
242
  Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
243
+ Requires-Dist: msal; extra == "outlook"
244
244
  Requires-Dist: numpy; extra == "outlook"
245
245
  Requires-Dist: pandas; extra == "outlook"
246
246
  Provides-Extra: pinecone
@@ -269,8 +269,9 @@ Requires-Dist: s3fs; extra == "s3"
269
269
  Requires-Dist: numpy; extra == "s3"
270
270
  Requires-Dist: pandas; extra == "s3"
271
271
  Provides-Extra: sharepoint
272
- Requires-Dist: msal; extra == "sharepoint"
273
272
  Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
273
+ Requires-Dist: msal; extra == "sharepoint"
274
+ Requires-Dist: requests; extra == "sharepoint"
274
275
  Requires-Dist: numpy; extra == "sharepoint"
275
276
  Requires-Dist: pandas; extra == "sharepoint"
276
277
  Provides-Extra: salesforce
@@ -278,8 +279,8 @@ Requires-Dist: simple-salesforce; extra == "salesforce"
278
279
  Requires-Dist: numpy; extra == "salesforce"
279
280
  Requires-Dist: pandas; extra == "salesforce"
280
281
  Provides-Extra: sftp
281
- Requires-Dist: paramiko; extra == "sftp"
282
282
  Requires-Dist: fsspec; extra == "sftp"
283
+ Requires-Dist: paramiko; extra == "sftp"
283
284
  Requires-Dist: numpy; extra == "sftp"
284
285
  Requires-Dist: pandas; extra == "sftp"
285
286
  Provides-Extra: slack
@@ -287,8 +288,8 @@ Requires-Dist: slack_sdk[optional]; extra == "slack"
287
288
  Requires-Dist: numpy; extra == "slack"
288
289
  Requires-Dist: pandas; extra == "slack"
289
290
  Provides-Extra: snowflake
290
- Requires-Dist: psycopg2-binary; extra == "snowflake"
291
291
  Requires-Dist: snowflake-connector-python; extra == "snowflake"
292
+ Requires-Dist: psycopg2-binary; extra == "snowflake"
292
293
  Requires-Dist: numpy; extra == "snowflake"
293
294
  Requires-Dist: pandas; extra == "snowflake"
294
295
  Provides-Extra: wikipedia
@@ -312,21 +313,21 @@ Requires-Dist: singlestoredb; extra == "singlestore"
312
313
  Requires-Dist: numpy; extra == "singlestore"
313
314
  Requires-Dist: pandas; extra == "singlestore"
314
315
  Provides-Extra: vectara
315
- Requires-Dist: aiofiles; extra == "vectara"
316
316
  Requires-Dist: httpx; extra == "vectara"
317
+ Requires-Dist: aiofiles; extra == "vectara"
317
318
  Requires-Dist: requests; extra == "vectara"
318
319
  Requires-Dist: numpy; extra == "vectara"
319
320
  Requires-Dist: pandas; extra == "vectara"
320
321
  Provides-Extra: vastdb
321
322
  Requires-Dist: ibis; extra == "vastdb"
322
- Requires-Dist: pyarrow; extra == "vastdb"
323
323
  Requires-Dist: vastdb; extra == "vastdb"
324
+ Requires-Dist: pyarrow; extra == "vastdb"
324
325
  Requires-Dist: numpy; extra == "vastdb"
325
326
  Requires-Dist: pandas; extra == "vastdb"
326
327
  Provides-Extra: zendesk
328
+ Requires-Dist: aiofiles; extra == "zendesk"
327
329
  Requires-Dist: bs4; extra == "zendesk"
328
330
  Requires-Dist: httpx; extra == "zendesk"
329
- Requires-Dist: aiofiles; extra == "zendesk"
330
331
  Requires-Dist: numpy; extra == "zendesk"
331
332
  Requires-Dist: pandas; extra == "zendesk"
332
333
  Provides-Extra: embed-huggingface
@@ -356,8 +357,8 @@ Requires-Dist: tiktoken; extra == "openai"
356
357
  Requires-Dist: numpy; extra == "openai"
357
358
  Requires-Dist: pandas; extra == "openai"
358
359
  Provides-Extra: bedrock
359
- Requires-Dist: boto3; extra == "bedrock"
360
360
  Requires-Dist: aioboto3; extra == "bedrock"
361
+ Requires-Dist: boto3; extra == "bedrock"
361
362
  Requires-Dist: numpy; extra == "bedrock"
362
363
  Requires-Dist: pandas; extra == "bedrock"
363
364
  Provides-Extra: togetherai
@@ -107,7 +107,6 @@ test/unit/__init__.py
107
107
  test/unit/test_error.py
108
108
  test/unit/test_html.py
109
109
  test/unit/test_interfaces.py
110
- test/unit/test_logger.py
111
110
  test/unit/test_utils.py
112
111
  test/unit/chunkers/__init__.py
113
112
  test/unit/chunkers/test_chunkers.py
@@ -234,6 +233,8 @@ unstructured_ingest/processes/connectors/slack.py
234
233
  unstructured_ingest/processes/connectors/utils.py
235
234
  unstructured_ingest/processes/connectors/vectara.py
236
235
  unstructured_ingest/processes/connectors/assets/__init__.py
236
+ unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql
237
+ unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json
237
238
  unstructured_ingest/processes/connectors/databricks/__init__.py
238
239
  unstructured_ingest/processes/connectors/databricks/volumes.py
239
240
  unstructured_ingest/processes/connectors/databricks/volumes_aws.py