unstructured-ingest 0.0.18__tar.gz → 0.0.21__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (360):
  1. {unstructured-ingest-0.0.18/unstructured_ingest.egg-info → unstructured-ingest-0.0.21}/PKG-INFO +1 -1
  2. unstructured-ingest-0.0.21/unstructured_ingest/__version__.py +1 -0
  3. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/astradb.py +2 -2
  4. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/astradb.py +54 -24
  5. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/chunker.py +8 -29
  6. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/astradb.py +26 -19
  7. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/chroma.py +2 -5
  8. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/databricks_volumes.py +12 -14
  9. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +1 -6
  10. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/box.py +1 -6
  11. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +2 -5
  12. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +1 -6
  13. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +1 -6
  14. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/kdbai.py +2 -5
  15. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/local.py +2 -5
  16. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/milvus.py +2 -5
  17. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/mongodb.py +2 -5
  18. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/pinecone.py +2 -5
  19. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/sql.py +1 -6
  20. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/weaviate.py +2 -5
  21. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/partitioner.py +9 -55
  22. unstructured-ingest-0.0.21/unstructured_ingest/v2/unstructured_api.py +87 -0
  23. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21/unstructured_ingest.egg-info}/PKG-INFO +1 -1
  24. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/SOURCES.txt +1 -0
  25. unstructured-ingest-0.0.18/unstructured_ingest/__version__.py +0 -1
  26. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/LICENSE.md +0 -0
  27. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/README.md +0 -0
  28. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/pyproject.toml +0 -0
  29. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/setup.cfg +0 -0
  30. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/setup.py +0 -0
  31. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_chunking_utils.py +0 -0
  32. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_error.py +0 -0
  33. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_interfaces.py +0 -0
  34. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_logger.py +0 -0
  35. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_utils.py +0 -0
  36. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/test/test_utils_v2.py +0 -0
  37. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/__init__.py +0 -0
  38. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/__init__.py +0 -0
  39. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/__init__.py +0 -0
  40. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/cmd.py +0 -0
  41. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/dest.py +0 -0
  42. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/base/src.py +0 -0
  43. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cli.py +0 -0
  44. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmd_factory.py +0 -0
  45. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/__init__.py +0 -0
  46. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/airtable.py +0 -0
  47. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/azure_cognitive_search.py +0 -0
  48. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/biomed.py +0 -0
  49. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/chroma.py +0 -0
  50. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/clarifai.py +0 -0
  51. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/confluence.py +0 -0
  52. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -0
  53. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/delta_table.py +0 -0
  54. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/discord.py +0 -0
  55. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/elasticsearch.py +0 -0
  56. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/__init__.py +0 -0
  57. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -0
  58. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/box.py +0 -0
  59. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -0
  60. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -0
  61. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -0
  62. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -0
  63. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -0
  64. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/github.py +0 -0
  65. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/gitlab.py +0 -0
  66. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/google_drive.py +0 -0
  67. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/hubspot.py +0 -0
  68. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/jira.py +0 -0
  69. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/kafka.py +0 -0
  70. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/local.py +0 -0
  71. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/mongodb.py +0 -0
  72. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/notion.py +0 -0
  73. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/onedrive.py +0 -0
  74. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/opensearch.py +0 -0
  75. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/outlook.py +0 -0
  76. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/pinecone.py +0 -0
  77. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/qdrant.py +0 -0
  78. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/reddit.py +0 -0
  79. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/salesforce.py +0 -0
  80. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/sharepoint.py +0 -0
  81. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/slack.py +0 -0
  82. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/sql.py +0 -0
  83. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/vectara.py +0 -0
  84. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/weaviate.py +0 -0
  85. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/cmds/wikipedia.py +0 -0
  86. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/common.py +0 -0
  87. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/interfaces.py +0 -0
  88. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/cli/utils.py +0 -0
  89. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/__init__.py +0 -0
  90. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/airtable.py +0 -0
  91. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/azure_cognitive_search.py +0 -0
  92. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/biomed.py +0 -0
  93. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/chroma.py +0 -0
  94. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/clarifai.py +0 -0
  95. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/confluence.py +0 -0
  96. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/databricks_volumes.py +0 -0
  97. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/delta_table.py +0 -0
  98. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/discord.py +0 -0
  99. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/elasticsearch.py +0 -0
  100. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/__init__.py +0 -0
  101. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/azure.py +0 -0
  102. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/box.py +0 -0
  103. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/dropbox.py +0 -0
  104. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/fsspec.py +0 -0
  105. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/gcs.py +0 -0
  106. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/s3.py +0 -0
  107. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/fsspec/sftp.py +0 -0
  108. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/git.py +0 -0
  109. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/github.py +0 -0
  110. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/gitlab.py +0 -0
  111. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/google_drive.py +0 -0
  112. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/hubspot.py +0 -0
  113. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/jira.py +0 -0
  114. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/kafka.py +0 -0
  115. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/local.py +0 -0
  116. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/mongodb.py +0 -0
  117. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/__init__.py +0 -0
  118. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/client.py +0 -0
  119. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/connector.py +0 -0
  120. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/helpers.py +0 -0
  121. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/interfaces.py +0 -0
  122. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/__init__.py +0 -0
  123. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/block.py +0 -0
  124. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/__init__.py +0 -0
  125. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -0
  126. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -0
  127. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -0
  128. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -0
  129. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -0
  130. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -0
  131. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/code.py +0 -0
  132. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -0
  133. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -0
  134. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -0
  135. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -0
  136. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/file.py +0 -0
  137. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -0
  138. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/image.py +0 -0
  139. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -0
  140. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -0
  141. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -0
  142. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -0
  143. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -0
  144. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -0
  145. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -0
  146. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/table.py +0 -0
  147. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -0
  148. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/template.py +0 -0
  149. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -0
  150. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -0
  151. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -0
  152. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/blocks/video.py +0 -0
  153. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database.py +0 -0
  154. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -0
  155. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -0
  156. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -0
  157. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -0
  158. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -0
  159. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -0
  160. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -0
  161. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -0
  162. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -0
  163. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -0
  164. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -0
  165. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -0
  166. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -0
  167. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -0
  168. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -0
  169. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -0
  170. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -0
  171. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -0
  172. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -0
  173. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -0
  174. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -0
  175. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -0
  176. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -0
  177. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/date.py +0 -0
  178. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/file.py +0 -0
  179. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/page.py +0 -0
  180. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/parent.py +0 -0
  181. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/rich_text.py +0 -0
  182. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/notion/types/user.py +0 -0
  183. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/onedrive.py +0 -0
  184. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/opensearch.py +0 -0
  185. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/outlook.py +0 -0
  186. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/pinecone.py +0 -0
  187. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/qdrant.py +0 -0
  188. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/reddit.py +0 -0
  189. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/registry.py +0 -0
  190. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/salesforce.py +0 -0
  191. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/sharepoint.py +0 -0
  192. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/slack.py +0 -0
  193. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/sql.py +0 -0
  194. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/vectara.py +0 -0
  195. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/weaviate.py +0 -0
  196. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/connector/wikipedia.py +0 -0
  197. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/__init__.py +0 -0
  198. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/bedrock.py +0 -0
  199. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/huggingface.py +0 -0
  200. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/interfaces.py +0 -0
  201. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  202. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/octoai.py +0 -0
  203. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/openai.py +0 -0
  204. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/vertexai.py +0 -0
  205. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/embed/voyageai.py +0 -0
  206. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/__init__.py +0 -0
  207. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/core.py +0 -0
  208. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -0
  209. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -0
  210. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/error.py +0 -0
  211. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/ingest_backoff/__init__.py +0 -0
  212. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/ingest_backoff/_common.py +0 -0
  213. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/ingest_backoff/_wrapper.py +0 -0
  214. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/interfaces.py +0 -0
  215. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/logger.py +0 -0
  216. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/main.py +0 -0
  217. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/__init__.py +0 -0
  218. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/copy.py +0 -0
  219. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/doc_factory.py +0 -0
  220. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/interfaces.py +0 -0
  221. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/partition.py +0 -0
  222. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/permissions.py +0 -0
  223. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/pipeline.py +0 -0
  224. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/reformat/__init__.py +0 -0
  225. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/reformat/chunking.py +0 -0
  226. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/reformat/embedding.py +0 -0
  227. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/source.py +0 -0
  228. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/utils.py +0 -0
  229. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/pipeline/write.py +0 -0
  230. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/processor.py +0 -0
  231. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/__init__.py +0 -0
  232. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/airtable.py +0 -0
  233. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/astradb.py +0 -0
  234. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/base_runner.py +0 -0
  235. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/biomed.py +0 -0
  236. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/confluence.py +0 -0
  237. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/delta_table.py +0 -0
  238. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/discord.py +0 -0
  239. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/elasticsearch.py +0 -0
  240. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/__init__.py +0 -0
  241. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/azure.py +0 -0
  242. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/box.py +0 -0
  243. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/dropbox.py +0 -0
  244. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/fsspec.py +0 -0
  245. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/gcs.py +0 -0
  246. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/s3.py +0 -0
  247. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/fsspec/sftp.py +0 -0
  248. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/github.py +0 -0
  249. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/gitlab.py +0 -0
  250. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/google_drive.py +0 -0
  251. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/hubspot.py +0 -0
  252. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/jira.py +0 -0
  253. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/kafka.py +0 -0
  254. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/local.py +0 -0
  255. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/mongodb.py +0 -0
  256. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/notion.py +0 -0
  257. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/onedrive.py +0 -0
  258. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/opensearch.py +0 -0
  259. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/outlook.py +0 -0
  260. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/reddit.py +0 -0
  261. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/salesforce.py +0 -0
  262. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/sharepoint.py +0 -0
  263. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/slack.py +0 -0
  264. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/utils.py +0 -0
  265. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/wikipedia.py +0 -0
  266. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/__init__.py +0 -0
  267. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/astradb.py +0 -0
  268. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/azure_cognitive_search.py +0 -0
  269. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/base_writer.py +0 -0
  270. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/chroma.py +0 -0
  271. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/clarifai.py +0 -0
  272. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/databricks_volumes.py +0 -0
  273. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/delta_table.py +0 -0
  274. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/elasticsearch.py +0 -0
  275. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/__init__.py +0 -0
  276. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/azure.py +0 -0
  277. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/box.py +0 -0
  278. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -0
  279. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -0
  280. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/fsspec/s3.py +0 -0
  281. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/kafka.py +0 -0
  282. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/mongodb.py +0 -0
  283. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/opensearch.py +0 -0
  284. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/pinecone.py +0 -0
  285. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/qdrant.py +0 -0
  286. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/sql.py +0 -0
  287. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/vectara.py +0 -0
  288. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/runner/writers/weaviate.py +0 -0
  289. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/__init__.py +0 -0
  290. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/chunking.py +0 -0
  291. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/compression.py +0 -0
  292. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/data_prep.py +0 -0
  293. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/dep_check.py +0 -0
  294. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/google_filetype.py +0 -0
  295. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  296. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/utils/table.py +0 -0
  297. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/__init__.py +0 -0
  298. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/__init__.py +0 -0
  299. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/__init__.py +0 -0
  300. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/cmd.py +0 -0
  301. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/dest.py +0 -0
  302. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/importer.py +0 -0
  303. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/base/src.py +0 -0
  304. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/cli.py +0 -0
  305. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/cmds.py +0 -0
  306. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/utils/__init__.py +0 -0
  307. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/utils/click.py +0 -0
  308. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/cli/utils/model_conversion.py +0 -0
  309. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/__init__.py +0 -0
  310. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/connector.py +0 -0
  311. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/downloader.py +0 -0
  312. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/file_data.py +0 -0
  313. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/indexer.py +0 -0
  314. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/process.py +0 -0
  315. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/processor.py +0 -0
  316. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/upload_stager.py +0 -0
  317. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/interfaces/uploader.py +0 -0
  318. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/logger.py +0 -0
  319. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/main.py +0 -0
  320. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/otel.py +0 -0
  321. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/__init__.py +0 -0
  322. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/interfaces.py +0 -0
  323. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/otel.py +0 -0
  324. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/pipeline.py +0 -0
  325. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
  326. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -0
  327. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/download.py +0 -0
  328. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/embed.py +0 -0
  329. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/filter.py +0 -0
  330. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/index.py +0 -0
  331. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/partition.py +0 -0
  332. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/stage.py +0 -0
  333. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -0
  334. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/pipeline/steps/upload.py +0 -0
  335. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/__init__.py +0 -0
  336. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connector_registry.py +0 -0
  337. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/__init__.py +0 -0
  338. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/airtable.py +0 -0
  339. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py +0 -0
  340. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/couchbase.py +0 -0
  341. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/elasticsearch.py +0 -0
  342. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -0
  343. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -0
  344. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -0
  345. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/fsspec/utils.py +0 -0
  346. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -0
  347. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -0
  348. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/opensearch.py +0 -0
  349. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -0
  350. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -0
  351. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/singlestore.py +0 -0
  352. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/connectors/utils.py +0 -0
  353. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/embedder.py +0 -0
  354. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/filter.py +0 -0
  355. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/processes/uncompress.py +0 -0
  356. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest/v2/utils.py +0 -0
  357. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  358. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/entry_points.txt +0 -0
  359. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/requires.txt +276 -276
  360. {unstructured-ingest-0.0.18 → unstructured-ingest-0.0.21}/unstructured_ingest.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.18
3
+ Version: 0.0.21
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -0,0 +1 @@
1
+ __version__ = "0.0.21" # pragma: no cover
@@ -37,11 +37,11 @@ class AstraDBCliConfig(SimpleAstraDBConfig, CliConfig):
37
37
  "numbers, and underscores.",
38
38
  ),
39
39
  click.Option(
40
- ["--namespace"],
40
+ ["--keyspace"],
41
41
  required=False,
42
42
  default=None,
43
43
  type=str,
44
- help="The Astra DB connection namespace.",
44
+ help="The Astra DB connection keyspace.",
45
45
  ),
46
46
  ]
47
47
  return options
@@ -24,7 +24,8 @@ from unstructured_ingest.utils.data_prep import batch_generator, flatten_dict
24
24
  from unstructured_ingest.utils.dep_check import requires_dependencies
25
25
 
26
26
  if t.TYPE_CHECKING:
27
- from astrapy.db import AstraDB, AstraDBCollection
27
+ from astrapy import Collection as AstraDBCollection
28
+ from astrapy import Database as AstraDB
28
29
 
29
30
  NON_INDEXED_FIELDS = ["metadata._node_content", "content"]
30
31
 
@@ -39,6 +40,7 @@ class AstraDBAccessConfig(AccessConfig):
39
40
  class SimpleAstraDBConfig(BaseConnectorConfig):
40
41
  access_config: AstraDBAccessConfig
41
42
  collection_name: str
43
+ keyspace: t.Optional[str] = None
42
44
  namespace: t.Optional[str] = None
43
45
 
44
46
 
@@ -98,22 +100,30 @@ class AstraDBSourceConnector(SourceConnectorCleanupMixin, BaseSourceConnector):
98
100
  @requires_dependencies(["astrapy"], extras="astradb")
99
101
  def astra_db_collection(self) -> "AstraDBCollection":
100
102
  if self._astra_db_collection is None:
101
- from astrapy.db import AstraDB
103
+ from astrapy import DataAPIClient as AstraDBClient
102
104
 
103
- # Build the Astra DB object.
105
+ # Choose keyspace or deprecated namespace
106
+ keyspace_param = self.connector_config.keyspace or self.connector_config.namespace
107
+
108
+ # Create a client object to interact with the Astra DB
104
109
  # caller_name/version for Astra DB tracking
105
- self._astra_db = AstraDB(
106
- api_endpoint=self.connector_config.access_config.api_endpoint,
107
- token=self.connector_config.access_config.token,
108
- namespace=self.connector_config.namespace,
110
+ my_client = AstraDBClient(
109
111
  caller_name=integration_name,
110
112
  caller_version=integration_version,
111
113
  )
112
114
 
113
- # Create and connect to the collection
114
- self._astra_db_collection = self._astra_db.collection(
115
- collection_name=self.connector_config.collection_name,
115
+ # Get the database object
116
+ self._astra_db = my_client.get_database(
117
+ api_endpoint=self.connector_config.access_config.api_endpoint,
118
+ token=self.connector_config.access_config.token,
119
+ keyspace=keyspace_param,
116
120
  )
121
+
122
+ # Create and connect to the newly created collection
123
+ self._astra_db_collection = self._astra_db.get_collection(
124
+ name=self.connector_config.collection_name,
125
+ )
126
+
117
127
  return self._astra_db_collection # type: ignore
118
128
 
119
129
  @requires_dependencies(["astrapy"], extras="astradb")
@@ -132,8 +142,14 @@ class AstraDBSourceConnector(SourceConnectorCleanupMixin, BaseSourceConnector):
132
142
  @requires_dependencies(["astrapy"], extras="astradb")
133
143
  def get_ingest_docs(self): # type: ignore
134
144
  # Perform the find operation
135
- astra_db_docs = list(self.astra_db_collection.paginated_find())
145
+ astra_db_docs_cursor = self.astra_db_collection.find({})
136
146
 
147
+ # Iterate over the cursor
148
+ astra_db_docs = []
149
+ for result in astra_db_docs_cursor:
150
+ astra_db_docs.append(result)
151
+
152
+ # Create a list of AstraDBIngestDoc objects
137
153
  doc_list = []
138
154
  for record in astra_db_docs:
139
155
  doc = AstraDBIngestDoc(
@@ -182,30 +198,41 @@ class AstraDBDestinationConnector(BaseDestinationConnector):
182
198
  @requires_dependencies(["astrapy"], extras="astradb")
183
199
  def astra_db_collection(self) -> "AstraDBCollection":
184
200
  if self._astra_db_collection is None:
185
- from astrapy.db import AstraDB
201
+ from astrapy import DataAPIClient as AstraDBClient
202
+ from astrapy.exceptions import CollectionAlreadyExistsException
203
+
204
+ # Choose keyspace or deprecated namespace
205
+ keyspace_param = self.connector_config.keyspace or self.connector_config.namespace
186
206
 
187
207
  collection_name = self.connector_config.collection_name
188
208
  embedding_dimension = self.write_config.embedding_dimension
189
-
190
- # If the user has requested an indexing policy, pass it to the Astra DB
191
209
  requested_indexing_policy = self.write_config.requested_indexing_policy
192
- options = {"indexing": requested_indexing_policy} if requested_indexing_policy else None
193
210
 
211
+ # Create a client object to interact with the Astra DB
194
212
  # caller_name/version for Astra DB tracking
195
- self._astra_db = AstraDB(
196
- api_endpoint=self.connector_config.access_config.api_endpoint,
197
- token=self.connector_config.access_config.token,
198
- namespace=self.connector_config.namespace,
213
+ my_client = AstraDBClient(
199
214
  caller_name=integration_name,
200
215
  caller_version=integration_version,
201
216
  )
202
217
 
203
- # Create and connect to the newly created collection
204
- self._astra_db_collection = self._astra_db.create_collection(
205
- collection_name=collection_name,
206
- dimension=embedding_dimension,
207
- options=options,
218
+ # Get the database object
219
+ self._astra_db = my_client.get_database(
220
+ api_endpoint=self.connector_config.access_config.api_endpoint,
221
+ token=self.connector_config.access_config.token,
222
+ keyspace=keyspace_param,
208
223
  )
224
+
225
+ # Create and connect to the newly created collection
226
+ try:
227
+ self._astra_db_collection = self._astra_db.create_collection(
228
+ name=collection_name,
229
+ dimension=embedding_dimension,
230
+ indexing=requested_indexing_policy,
231
+ )
232
+ except CollectionAlreadyExistsException as e:
233
+ logger.info(f"{e}", exc_info=True)
234
+ self._astra_db_collection = self._astra_db.get_collection(name=collection_name)
235
+
209
236
  return self._astra_db_collection
210
237
 
211
238
  @requires_dependencies(["astrapy"], extras="astradb")
@@ -224,6 +251,9 @@ class AstraDBDestinationConnector(BaseDestinationConnector):
224
251
  def write_dict(self, *args, elements_dict: t.List[t.Dict[str, t.Any]], **kwargs) -> None:
225
252
  logger.info(f"inserting / updating {len(elements_dict)} documents to Astra DB.")
226
253
 
254
+ if self._astra_db_collection is None:
255
+ raise DestinationConnectionError("Astra DB collection not available for insertion.")
256
+
227
257
  astra_db_batch_size = self.write_config.batch_size
228
258
 
229
259
  for batch in batch_generator(elements_dict, astra_db_batch_size):
@@ -1,5 +1,5 @@
1
1
  from abc import ABC
2
- from dataclasses import dataclass, fields
2
+ from dataclasses import dataclass
3
3
  from pathlib import Path
4
4
  from typing import Any, Optional
5
5
 
@@ -9,6 +9,7 @@ from unstructured_ingest.utils.chunking import assign_and_map_hash_ids
9
9
  from unstructured_ingest.utils.dep_check import requires_dependencies
10
10
  from unstructured_ingest.v2.interfaces.process import BaseProcess
11
11
  from unstructured_ingest.v2.logger import logger
12
+ from unstructured_ingest.v2.unstructured_api import call_api
12
13
 
13
14
  CHUNK_MAX_CHARS_DEFAULT: int = 500
14
15
  CHUNK_MULTI_PAGE_DEFAULT: bool = True
@@ -111,35 +112,13 @@ class Chunker(BaseProcess, ABC):
111
112
 
112
113
  @requires_dependencies(dependencies=["unstructured_client"], extras="remote")
113
114
  async def run_async(self, elements_filepath: Path, **kwargs: Any) -> list[dict]:
114
- from unstructured_client import UnstructuredClient
115
- from unstructured_client.models.operations import PartitionRequest
116
- from unstructured_client.models.shared import Files, PartitionParameters
117
-
118
- client = UnstructuredClient(
119
- api_key_auth=self.config.chunk_api_key.get_secret_value(),
115
+ elements = await call_api(
120
116
  server_url=self.config.chunking_endpoint,
117
+ api_key=self.config.chunk_api_key.get_secret_value(),
118
+ filename=elements_filepath,
119
+ api_parameters=self.config.to_chunking_kwargs(),
121
120
  )
122
- partition_request = self.config.to_chunking_kwargs()
123
- possible_fields = [f.name for f in fields(PartitionParameters)]
124
- filtered_partition_request = {
125
- k: v for k, v in partition_request.items() if k in possible_fields
126
- }
127
- if len(filtered_partition_request) != len(partition_request):
128
- logger.debug(
129
- "Following fields were omitted due to not being "
130
- "supported by the currently used unstructured client: {}".format(
131
- ", ".join([v for v in partition_request if v not in filtered_partition_request])
132
- )
133
- )
134
- with open(elements_filepath, "rb") as f:
135
- files = Files(
136
- content=f.read(),
137
- file_name=str(elements_filepath.resolve()),
138
- )
139
- filtered_partition_request["files"] = files
140
- partition_params = PartitionParameters(**filtered_partition_request)
141
- partition_request_obj = PartitionRequest(partition_params)
142
- resp = client.general.partition(partition_request_obj)
143
- elements = resp.elements or []
121
+
144
122
  elements = assign_and_map_hash_ids(elements=elements)
123
+
145
124
  return elements
@@ -25,7 +25,8 @@ from unstructured_ingest.v2.processes.connector_registry import (
25
25
  )
26
26
 
27
27
  if TYPE_CHECKING:
28
- from astrapy.db import AstraDBCollection
28
+ from astrapy import Collection as AstraDBCollection
29
+
29
30
 
30
31
  CONNECTOR_TYPE = "astradb"
31
32
 
@@ -85,7 +86,12 @@ class AstraDBUploaderConfig(UploaderConfig):
85
86
  embedding_dimension: int = Field(
86
87
  default=384, description="The dimensionality of the embeddings"
87
88
  )
88
- namespace: Optional[str] = Field(default=None, description="The Astra DB connection namespace.")
89
+ keyspace: Optional[str] = Field(default=None, description="The Astra DB connection keyspace.")
90
+ namespace: Optional[str] = Field(
91
+ default=None,
92
+ description="The Astra DB connection namespace.",
93
+ deprecated="Please use 'keyspace' instead.",
94
+ )
89
95
  requested_indexing_policy: Optional[dict[str, Any]] = Field(
90
96
  default=None,
91
97
  description="The indexing policy to use for the collection.",
@@ -109,33 +115,34 @@ class AstraDBUploader(Uploader):
109
115
 
110
116
  @requires_dependencies(["astrapy"], extras="astradb")
111
117
  def get_collection(self) -> "AstraDBCollection":
112
- from astrapy.db import AstraDB
118
+ from astrapy import DataAPIClient as AstraDBClient
113
119
 
114
- # Get the collection_name and embedding dimension
115
- collection_name = self.upload_config.collection_name
116
- embedding_dimension = self.upload_config.embedding_dimension
117
- requested_indexing_policy = self.upload_config.requested_indexing_policy
120
+ # Choose keyspace or deprecated namespace
121
+ keyspace_param = self.upload_config.keyspace or self.upload_config.namespace
118
122
 
119
- # If the user has requested an indexing policy, pass it to the Astra DB
120
- options = {"indexing": requested_indexing_policy} if requested_indexing_policy else None
123
+ # Get the collection_name
124
+ collection_name = self.upload_config.collection_name
121
125
 
122
126
  # Build the Astra DB object.
123
- # caller_name/version for AstraDB tracking
124
127
  access_configs = self.connection_config.access_config.get_secret_value()
125
- astra_db = AstraDB(
126
- api_endpoint=access_configs.api_endpoint,
127
- token=access_configs.token,
128
- namespace=self.upload_config.namespace,
128
+
129
+ # Create a client object to interact with the Astra DB
130
+ # caller_name/version for Astra DB tracking
131
+ my_client = AstraDBClient(
129
132
  caller_name=integration_name,
130
133
  caller_version=integration_version,
131
134
  )
132
135
 
133
- # Create and connect to the newly created collection
134
- astra_db_collection = astra_db.create_collection(
135
- collection_name=collection_name,
136
- dimension=embedding_dimension,
137
- options=options,
136
+ # Get the database object
137
+ astra_db = my_client.get_database(
138
+ api_endpoint=access_configs.api_endpoint,
139
+ token=access_configs.token,
140
+ keyspace=keyspace_param,
138
141
  )
142
+
143
+ # Connect to the newly created collection
144
+ astra_db_collection = astra_db.get_collection(name=collection_name)
145
+
139
146
  return astra_db_collection
140
147
 
141
148
  def run(self, path: Path, file_data: FileData, **kwargs: Any) -> None:
@@ -41,13 +41,10 @@ class ChromaAccessConfig(AccessConfig):
41
41
  )
42
42
 
43
43
 
44
- SecretChromaAccessConfig = Secret[ChromaAccessConfig]
45
-
46
-
47
44
  class ChromaConnectionConfig(ConnectionConfig):
48
45
  collection_name: str = Field(description="The name of the Chroma collection to write into.")
49
- access_config: SecretChromaAccessConfig = Field(
50
- default=SecretChromaAccessConfig(secret_value=ChromaAccessConfig())
46
+ access_config: Secret[ChromaAccessConfig] = Field(
47
+ default=ChromaAccessConfig(), validate_default=True
51
48
  )
52
49
  path: Optional[str] = Field(
53
50
  default=None, description="Location where Chroma is persisted, if not connecting via http."
@@ -42,8 +42,10 @@ class DatabricksVolumesAccessConfig(AccessConfig):
42
42
  description="The Databricks password part of basic authentication. "
43
43
  "Only possible when Host is *.cloud.databricks.com (AWS).",
44
44
  )
45
- client_id: Optional[str] = Field(default=None)
46
- client_secret: Optional[str] = Field(default=None)
45
+ client_id: Optional[str] = Field(default=None, description="Client ID of the OAuth app.")
46
+ client_secret: Optional[str] = Field(
47
+ default=None, description="Client Secret of the OAuth app."
48
+ )
47
49
  token: Optional[str] = Field(
48
50
  default=None,
49
51
  description="The Databricks personal access token (PAT) (AWS, Azure, and GCP) or "
@@ -81,14 +83,9 @@ class DatabricksVolumesAccessConfig(AccessConfig):
81
83
  google_service_account: Optional[str] = None
82
84
 
83
85
 
84
- SecretDatabricksVolumesAccessConfig = Secret[DatabricksVolumesAccessConfig]
85
-
86
-
87
86
  class DatabricksVolumesConnectionConfig(ConnectionConfig):
88
- access_config: SecretDatabricksVolumesAccessConfig = Field(
89
- default_factory=lambda: SecretDatabricksVolumesAccessConfig(
90
- secret_value=DatabricksVolumesAccessConfig()
91
- )
87
+ access_config: Secret[DatabricksVolumesAccessConfig] = Field(
88
+ default=DatabricksVolumesAccessConfig(), validate_default=True
92
89
  )
93
90
  host: Optional[str] = Field(
94
91
  default=None,
@@ -145,11 +142,12 @@ class DatabricksVolumesUploader(Uploader):
145
142
 
146
143
  def run(self, path: Path, file_data: FileData, **kwargs: Any) -> None:
147
144
  output_path = os.path.join(self.upload_config.path, path.name)
148
- self.get_client().files.upload(
149
- file_path=output_path,
150
- contents=path,
151
- overwrite=self.upload_config.overwrite,
152
- )
145
+ with open(path, "rb") as elements_file:
146
+ self.get_client().files.upload(
147
+ file_path=output_path,
148
+ contents=elements_file,
149
+ overwrite=self.upload_config.overwrite,
150
+ )
153
151
 
154
152
 
155
153
  databricks_volumes_destination_entry = DestinationRegistryEntry(
@@ -76,14 +76,9 @@ class AzureAccessConfig(FsspecAccessConfig):
76
76
  raise ValueError("either connection_string or account_name must be set")
77
77
 
78
78
 
79
- SecretAzureAccessConfig = Secret[AzureAccessConfig]
80
-
81
-
82
79
  class AzureConnectionConfig(FsspecConnectionConfig):
83
80
  supported_protocols: list[str] = field(default_factory=lambda: ["az"], init=False)
84
- access_config: SecretAzureAccessConfig = Field(
85
- default_factory=lambda: SecretAzureAccessConfig(secret_value=AzureAccessConfig())
86
- )
81
+ access_config: Secret[AzureAccessConfig]
87
82
  connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
88
83
 
89
84
  def get_access_config(self) -> dict[str, Any]:
@@ -36,14 +36,9 @@ class BoxAccessConfig(FsspecAccessConfig):
36
36
  )
37
37
 
38
38
 
39
- SecretBoxAccessConfig = Secret[BoxAccessConfig]
40
-
41
-
42
39
  class BoxConnectionConfig(FsspecConnectionConfig):
43
40
  supported_protocols: list[str] = field(default_factory=lambda: ["box"], init=False)
44
- access_config: SecretBoxAccessConfig = Field(
45
- default_factory=lambda: SecretBoxAccessConfig(secret_value=BoxAccessConfig())
46
- )
41
+ access_config: Secret[BoxAccessConfig] = Field(default=BoxAccessConfig(), validate_default=True)
47
42
  connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
48
43
 
49
44
  def get_access_config(self) -> dict[str, Any]:
@@ -35,13 +35,10 @@ class DropboxAccessConfig(FsspecAccessConfig):
35
35
  token: Optional[str] = Field(default=None, description="Dropbox access token.")
36
36
 
37
37
 
38
- SecretDropboxAccessConfig = Secret[DropboxAccessConfig]
39
-
40
-
41
38
  class DropboxConnectionConfig(FsspecConnectionConfig):
42
39
  supported_protocols: list[str] = field(default_factory=lambda: ["dropbox"], init=False)
43
- access_config: SecretDropboxAccessConfig = Field(
44
- default_factory=lambda: SecretDropboxAccessConfig(secret_value=DropboxAccessConfig())
40
+ access_config: Secret[DropboxAccessConfig] = Field(
41
+ default=DropboxAccessConfig(), validate_default=True
45
42
  )
46
43
  connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
47
44
 
@@ -86,14 +86,9 @@ class GcsAccessConfig(FsspecAccessConfig):
86
86
  raise ValueError("Invalid auth token value")
87
87
 
88
88
 
89
- SecretGcsAccessConfig = Secret[GcsAccessConfig]
90
-
91
-
92
89
  class GcsConnectionConfig(FsspecConnectionConfig):
93
90
  supported_protocols: list[str] = field(default_factory=lambda: ["gs", "gcs"], init=False)
94
- access_config: SecretGcsAccessConfig = Field(
95
- default_factory=lambda: SecretGcsAccessConfig(secret_value=GcsAccessConfig())
96
- )
91
+ access_config: Secret[GcsAccessConfig] = Field(default=GcsAccessConfig(), validate_default=True)
97
92
  connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
98
93
 
99
94
 
@@ -49,14 +49,9 @@ class S3AccessConfig(FsspecAccessConfig):
49
49
  )
50
50
 
51
51
 
52
- SecretS3AccessConfig = Secret[S3AccessConfig]
53
-
54
-
55
52
  class S3ConnectionConfig(FsspecConnectionConfig):
56
53
  supported_protocols: list[str] = field(default_factory=lambda: ["s3", "s3a"], init=False)
57
- access_config: SecretS3AccessConfig = Field(
58
- default_factory=lambda: SecretS3AccessConfig(secret_value=S3AccessConfig())
59
- )
54
+ access_config: Secret[S3AccessConfig] = Field(default=S3AccessConfig(), validate_default=True)
60
55
  endpoint_url: Optional[str] = Field(
61
56
  default=None,
62
57
  description="Use this endpoint_url, if specified. Needed for "
@@ -39,12 +39,9 @@ class KdbaiAccessConfig(AccessConfig):
39
39
  )
40
40
 
41
41
 
42
- SecretKdbaiAccessConfig = Secret[KdbaiAccessConfig]
43
-
44
-
45
42
  class KdbaiConnectionConfig(ConnectionConfig):
46
- access_config: SecretKdbaiAccessConfig = Field(
47
- default=SecretKdbaiAccessConfig(secret_value=KdbaiAccessConfig())
43
+ access_config: Secret[KdbaiAccessConfig] = Field(
44
+ default=KdbaiAccessConfig(), validate_default=True
48
45
  )
49
46
  endpoint: str = Field(
50
47
  default="http://localhost:8082", description="Endpoint url where KDBAI is hosted."
@@ -34,12 +34,9 @@ class LocalAccessConfig(AccessConfig):
34
34
  pass
35
35
 
36
36
 
37
- SecretLocalAccessConfig = Secret[LocalAccessConfig]
38
-
39
-
40
37
  class LocalConnectionConfig(ConnectionConfig):
41
- access_config: SecretLocalAccessConfig = Field(
42
- default_factory=lambda: SecretLocalAccessConfig(secret_value=LocalAccessConfig())
38
+ access_config: Secret[LocalAccessConfig] = Field(
39
+ default=LocalAccessConfig(), validate_default=True
43
40
  )
44
41
 
45
42
 
@@ -36,12 +36,9 @@ class MilvusAccessConfig(AccessConfig):
36
36
  token: Optional[str] = Field(default=None, description="Milvus access token")
37
37
 
38
38
 
39
- SecretMilvusAccessConfig = Secret[MilvusAccessConfig]
40
-
41
-
42
39
  class MilvusConnectionConfig(ConnectionConfig):
43
- access_config: SecretMilvusAccessConfig = Field(
44
- default_factory=lambda: SecretMilvusAccessConfig(secret_value=MilvusAccessConfig())
40
+ access_config: Secret[MilvusAccessConfig] = Field(
41
+ default=MilvusAccessConfig(), validate_default=True
45
42
  )
46
43
  uri: Optional[str] = Field(
47
44
  default=None, description="Milvus uri", examples=["http://localhost:19530"]
@@ -34,12 +34,9 @@ class MongoDBAccessConfig(AccessConfig):
34
34
  uri: Optional[str] = Field(default=None, description="URI to user when connecting")
35
35
 
36
36
 
37
- SecretMongoDBAccessConfig = Secret[MongoDBAccessConfig]
38
-
39
-
40
37
  class MongoDBConnectionConfig(ConnectionConfig):
41
- access_config: SecretMongoDBAccessConfig = Field(
42
- default_factory=lambda: SecretMongoDBAccessConfig(secret_value=MongoDBAccessConfig())
38
+ access_config: Secret[MongoDBAccessConfig] = Field(
39
+ default=MongoDBAccessConfig(), validate_default=True
43
40
  )
44
41
  host: Optional[str] = Field(
45
42
  default=None,
@@ -36,13 +36,10 @@ class PineconeAccessConfig(AccessConfig):
36
36
  )
37
37
 
38
38
 
39
- SecretPineconeAccessConfig = Secret[PineconeAccessConfig]
40
-
41
-
42
39
  class PineconeConnectionConfig(ConnectionConfig):
43
40
  index_name: str = Field(description="Name of the index to connect to.")
44
- access_config: SecretPineconeAccessConfig = Field(
45
- default_factory=lambda: SecretPineconeAccessConfig(secret_value=PineconeAccessConfig())
41
+ access_config: Secret[PineconeAccessConfig] = Field(
42
+ default=PineconeAccessConfig(), validate_default=True
46
43
  )
47
44
 
48
45
  @requires_dependencies(["pinecone"], extras="pinecone")
@@ -40,9 +40,6 @@ class SQLAccessConfig(AccessConfig):
40
40
  password: Optional[str] = Field(default=None, description="DB password")
41
41
 
42
42
 
43
- SecreteSQLAccessConfig = Secret[SQLAccessConfig]
44
-
45
-
46
43
  class SQLConnectionConfig(ConnectionConfig):
47
44
  db_type: Literal["sqlite", "postgresql"] = Field(
48
45
  default=SQLITE_DB, description="Type of the database backend"
@@ -53,9 +50,7 @@ class SQLConnectionConfig(ConnectionConfig):
53
50
  )
54
51
  host: Optional[str] = Field(default=None, description="DB host")
55
52
  port: Optional[int] = Field(default=5432, description="DB host connection port")
56
- access_config: SecreteSQLAccessConfig = Field(
57
- default_factory=lambda: SecreteSQLAccessConfig(secret_value=SQLAccessConfig())
58
- )
53
+ access_config: Secret[SQLAccessConfig] = Field(default=SQLAccessConfig(), validate_default=True)
59
54
  connector_type: str = Field(default=CONNECTOR_TYPE, init=False)
60
55
 
61
56
  def __post_init__(self):
@@ -38,16 +38,13 @@ class WeaviateAccessConfig(AccessConfig):
38
38
  password: Optional[str] = None
39
39
 
40
40
 
41
- SecretWeaviateAccessConfig = Secret[WeaviateAccessConfig]
42
-
43
-
44
41
  class WeaviateConnectionConfig(ConnectionConfig):
45
42
  host_url: str = Field(description="Weaviate instance url")
46
43
  class_name: str = Field(
47
44
  description="Name of the class to push the records into, e.g: Pdf-elements"
48
45
  )
49
- access_config: SecretWeaviateAccessConfig = Field(
50
- default_factory=lambda: SecretWeaviateAccessConfig(secret_value=WeaviateAccessConfig())
46
+ access_config: Secret[WeaviateAccessConfig] = Field(
47
+ default=WeaviateAccessConfig(), validate_default=True
51
48
  )
52
49
  username: Optional[str] = None
53
50
  anonymous: bool = Field(default=False, description="if set, all auth values will be ignored")