unstructured-ingest 0.0.22__tar.gz → 0.0.24__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (361)
  1. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/PKG-INFO +20 -20
  2. unstructured_ingest-0.0.24/unstructured_ingest/__version__.py +1 -0
  3. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/interfaces.py +5 -5
  4. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/vertexai.py +1 -1
  5. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/voyageai.py +2 -2
  6. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/interfaces.py +5 -5
  7. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/utils/model_conversion.py +3 -3
  8. unstructured_ingest-0.0.24/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
  9. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/pinecone.py +32 -21
  10. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/embedder.py +10 -10
  11. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest.egg-info/PKG-INFO +20 -20
  12. unstructured_ingest-0.0.22/unstructured_ingest/__version__.py +0 -1
  13. unstructured_ingest-0.0.22/unstructured_ingest/embed/__init__.py +0 -17
  14. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/LICENSE.md +0 -0
  15. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/README.md +0 -0
  16. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/pyproject.toml +0 -0
  17. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/setup.cfg +0 -0
  18. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/setup.py +0 -0
  19. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/test/test_chunking_utils.py +0 -0
  20. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/test/test_error.py +0 -0
  21. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/test/test_interfaces.py +0 -0
  22. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/test/test_logger.py +0 -0
  23. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/test/test_utils.py +0 -0
  24. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/test/test_utils_v2.py +0 -0
  25. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/__init__.py +0 -0
  26. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/__init__.py +0 -0
  27. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/base/__init__.py +0 -0
  28. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/base/cmd.py +0 -0
  29. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/base/dest.py +0 -0
  30. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/base/src.py +0 -0
  31. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cli.py +0 -0
  32. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmd_factory.py +0 -0
  33. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/__init__.py +0 -0
  34. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/airtable.py +0 -0
  35. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/astradb.py +0 -0
  36. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/azure_cognitive_search.py +0 -0
  37. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/biomed.py +0 -0
  38. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/chroma.py +0 -0
  39. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/clarifai.py +0 -0
  40. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/confluence.py +0 -0
  41. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -0
  42. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/delta_table.py +0 -0
  43. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/discord.py +0 -0
  44. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/elasticsearch.py +0 -0
  45. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/__init__.py +0 -0
  46. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -0
  47. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/box.py +0 -0
  48. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -0
  49. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -0
  50. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -0
  51. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -0
  52. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -0
  53. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/github.py +0 -0
  54. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/gitlab.py +0 -0
  55. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/google_drive.py +0 -0
  56. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/hubspot.py +0 -0
  57. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/jira.py +0 -0
  58. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/kafka.py +0 -0
  59. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/local.py +0 -0
  60. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/mongodb.py +0 -0
  61. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/notion.py +0 -0
  62. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/onedrive.py +0 -0
  63. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/opensearch.py +0 -0
  64. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/outlook.py +0 -0
  65. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/pinecone.py +0 -0
  66. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/qdrant.py +0 -0
  67. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/reddit.py +0 -0
  68. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/salesforce.py +0 -0
  69. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/sharepoint.py +0 -0
  70. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/slack.py +0 -0
  71. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/sql.py +0 -0
  72. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/vectara.py +0 -0
  73. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/weaviate.py +0 -0
  74. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/cmds/wikipedia.py +0 -0
  75. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/common.py +0 -0
  76. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/cli/utils.py +0 -0
  77. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/__init__.py +0 -0
  78. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/airtable.py +0 -0
  79. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/astradb.py +0 -0
  80. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/azure_cognitive_search.py +0 -0
  81. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/biomed.py +0 -0
  82. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/chroma.py +0 -0
  83. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/clarifai.py +0 -0
  84. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/confluence.py +0 -0
  85. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/databricks_volumes.py +0 -0
  86. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/delta_table.py +0 -0
  87. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/discord.py +0 -0
  88. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/elasticsearch.py +0 -0
  89. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/__init__.py +0 -0
  90. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/azure.py +0 -0
  91. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/box.py +0 -0
  92. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/dropbox.py +0 -0
  93. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/fsspec.py +0 -0
  94. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/gcs.py +0 -0
  95. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/s3.py +0 -0
  96. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/fsspec/sftp.py +0 -0
  97. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/git.py +0 -0
  98. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/github.py +0 -0
  99. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/gitlab.py +0 -0
  100. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/google_drive.py +0 -0
  101. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/hubspot.py +0 -0
  102. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/jira.py +0 -0
  103. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/kafka.py +0 -0
  104. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/local.py +0 -0
  105. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/mongodb.py +0 -0
  106. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/__init__.py +0 -0
  107. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/client.py +0 -0
  108. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/connector.py +0 -0
  109. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/helpers.py +0 -0
  110. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/interfaces.py +0 -0
  111. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/__init__.py +0 -0
  112. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/block.py +0 -0
  113. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/__init__.py +0 -0
  114. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -0
  115. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -0
  116. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -0
  117. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -0
  118. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -0
  119. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -0
  120. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/code.py +0 -0
  121. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -0
  122. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -0
  123. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -0
  124. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -0
  125. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/file.py +0 -0
  126. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -0
  127. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/image.py +0 -0
  128. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -0
  129. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -0
  130. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -0
  131. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -0
  132. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -0
  133. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -0
  134. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -0
  135. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/table.py +0 -0
  136. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -0
  137. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/template.py +0 -0
  138. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -0
  139. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -0
  140. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -0
  141. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/blocks/video.py +0 -0
  142. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database.py +0 -0
  143. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -0
  144. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -0
  145. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -0
  146. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -0
  147. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -0
  148. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -0
  149. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -0
  150. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -0
  151. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -0
  152. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -0
  153. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -0
  154. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -0
  155. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -0
  156. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -0
  157. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -0
  158. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -0
  159. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -0
  160. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -0
  161. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -0
  162. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -0
  163. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -0
  164. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -0
  165. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -0
  166. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/date.py +0 -0
  167. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/file.py +0 -0
  168. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/page.py +0 -0
  169. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/parent.py +0 -0
  170. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/rich_text.py +0 -0
  171. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/notion/types/user.py +0 -0
  172. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/onedrive.py +0 -0
  173. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/opensearch.py +0 -0
  174. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/outlook.py +0 -0
  175. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/pinecone.py +0 -0
  176. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/qdrant.py +0 -0
  177. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/reddit.py +0 -0
  178. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/registry.py +0 -0
  179. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/salesforce.py +0 -0
  180. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/sharepoint.py +0 -0
  181. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/slack.py +0 -0
  182. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/sql.py +0 -0
  183. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/vectara.py +0 -0
  184. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/weaviate.py +0 -0
  185. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/connector/wikipedia.py +0 -0
  186. {unstructured_ingest-0.0.22/unstructured_ingest/pipeline/reformat → unstructured_ingest-0.0.24/unstructured_ingest/embed}/__init__.py +0 -0
  187. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/bedrock.py +0 -0
  188. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/huggingface.py +0 -0
  189. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/interfaces.py +0 -0
  190. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  191. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/octoai.py +0 -0
  192. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/embed/openai.py +0 -0
  193. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/enhanced_dataclass/__init__.py +0 -0
  194. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/enhanced_dataclass/core.py +0 -0
  195. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -0
  196. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -0
  197. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/error.py +0 -0
  198. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/ingest_backoff/__init__.py +0 -0
  199. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/ingest_backoff/_common.py +0 -0
  200. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/ingest_backoff/_wrapper.py +0 -0
  201. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/logger.py +0 -0
  202. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/main.py +0 -0
  203. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/__init__.py +0 -0
  204. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/copy.py +0 -0
  205. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/doc_factory.py +0 -0
  206. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/interfaces.py +0 -0
  207. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/partition.py +0 -0
  208. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/permissions.py +0 -0
  209. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/pipeline.py +0 -0
  210. {unstructured_ingest-0.0.22/unstructured_ingest/runner/fsspec → unstructured_ingest-0.0.24/unstructured_ingest/pipeline/reformat}/__init__.py +0 -0
  211. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/reformat/chunking.py +0 -0
  212. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/reformat/embedding.py +0 -0
  213. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/source.py +0 -0
  214. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/utils.py +0 -0
  215. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/pipeline/write.py +0 -0
  216. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/processor.py +0 -0
  217. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/__init__.py +0 -0
  218. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/airtable.py +0 -0
  219. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/astradb.py +0 -0
  220. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/base_runner.py +0 -0
  221. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/biomed.py +0 -0
  222. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/confluence.py +0 -0
  223. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/delta_table.py +0 -0
  224. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/discord.py +0 -0
  225. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/elasticsearch.py +0 -0
  226. {unstructured_ingest-0.0.22/unstructured_ingest/runner/writers → unstructured_ingest-0.0.24/unstructured_ingest/runner}/fsspec/__init__.py +0 -0
  227. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/azure.py +0 -0
  228. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/box.py +0 -0
  229. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/dropbox.py +0 -0
  230. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/fsspec.py +0 -0
  231. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/gcs.py +0 -0
  232. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/s3.py +0 -0
  233. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/fsspec/sftp.py +0 -0
  234. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/github.py +0 -0
  235. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/gitlab.py +0 -0
  236. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/google_drive.py +0 -0
  237. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/hubspot.py +0 -0
  238. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/jira.py +0 -0
  239. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/kafka.py +0 -0
  240. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/local.py +0 -0
  241. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/mongodb.py +0 -0
  242. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/notion.py +0 -0
  243. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/onedrive.py +0 -0
  244. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/opensearch.py +0 -0
  245. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/outlook.py +0 -0
  246. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/reddit.py +0 -0
  247. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/salesforce.py +0 -0
  248. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/sharepoint.py +0 -0
  249. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/slack.py +0 -0
  250. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/utils.py +0 -0
  251. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/wikipedia.py +0 -0
  252. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/__init__.py +0 -0
  253. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/astradb.py +0 -0
  254. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/azure_cognitive_search.py +0 -0
  255. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/base_writer.py +0 -0
  256. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/chroma.py +0 -0
  257. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/clarifai.py +0 -0
  258. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/databricks_volumes.py +0 -0
  259. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/delta_table.py +0 -0
  260. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/elasticsearch.py +0 -0
  261. {unstructured_ingest-0.0.22/unstructured_ingest/utils → unstructured_ingest-0.0.24/unstructured_ingest/runner/writers/fsspec}/__init__.py +0 -0
  262. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/fsspec/azure.py +0 -0
  263. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/fsspec/box.py +0 -0
  264. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -0
  265. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -0
  266. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/fsspec/s3.py +0 -0
  267. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/kafka.py +0 -0
  268. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/mongodb.py +0 -0
  269. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/opensearch.py +0 -0
  270. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/pinecone.py +0 -0
  271. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/qdrant.py +0 -0
  272. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/sql.py +0 -0
  273. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/vectara.py +0 -0
  274. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/runner/writers/weaviate.py +0 -0
  275. {unstructured_ingest-0.0.22/unstructured_ingest/v2/cli → unstructured_ingest-0.0.24/unstructured_ingest/utils}/__init__.py +0 -0
  276. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/chunking.py +0 -0
  277. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/compression.py +0 -0
  278. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/data_prep.py +0 -0
  279. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/dep_check.py +0 -0
  280. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/google_filetype.py +0 -0
  281. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  282. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/utils/table.py +0 -0
  283. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/__init__.py +0 -0
  284. {unstructured_ingest-0.0.22/unstructured_ingest/v2/cli/utils → unstructured_ingest-0.0.24/unstructured_ingest/v2/cli}/__init__.py +0 -0
  285. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/base/__init__.py +0 -0
  286. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/base/cmd.py +0 -0
  287. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/base/dest.py +0 -0
  288. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/base/importer.py +0 -0
  289. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/base/src.py +0 -0
  290. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/cli.py +0 -0
  291. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/cmds.py +0 -0
  292. {unstructured_ingest-0.0.22/unstructured_ingest/v2/pipeline → unstructured_ingest-0.0.24/unstructured_ingest/v2/cli/utils}/__init__.py +0 -0
  293. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/cli/utils/click.py +0 -0
  294. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/__init__.py +0 -0
  295. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/connector.py +0 -0
  296. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/downloader.py +0 -0
  297. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/file_data.py +0 -0
  298. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/indexer.py +0 -0
  299. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/process.py +0 -0
  300. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/processor.py +0 -0
  301. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/upload_stager.py +0 -0
  302. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/interfaces/uploader.py +0 -0
  303. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/logger.py +0 -0
  304. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/main.py +0 -0
  305. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/otel.py +0 -0
  306. {unstructured_ingest-0.0.22/unstructured_ingest/v2/pipeline/steps → unstructured_ingest-0.0.24/unstructured_ingest/v2/pipeline}/__init__.py +0 -0
  307. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/interfaces.py +0 -0
  308. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/otel.py +0 -0
  309. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/pipeline.py +0 -0
  310. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -0
  311. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/download.py +0 -0
  312. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/embed.py +0 -0
  313. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/filter.py +0 -0
  314. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/index.py +0 -0
  315. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/partition.py +0 -0
  316. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/stage.py +0 -0
  317. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -0
  318. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/pipeline/steps/upload.py +0 -0
  319. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/__init__.py +0 -0
  320. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/chunker.py +0 -0
  321. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connector_registry.py +0 -0
  322. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/__init__.py +0 -0
  323. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/airtable.py +0 -0
  324. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/astradb.py +0 -0
  325. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py +0 -0
  326. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/chroma.py +0 -0
  327. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/couchbase.py +0 -0
  328. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/databricks_volumes.py +0 -0
  329. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/elasticsearch.py +0 -0
  330. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -0
  331. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +0 -0
  332. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/box.py +0 -0
  333. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +0 -0
  334. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -0
  335. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +0 -0
  336. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +0 -0
  337. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -0
  338. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/fsspec/utils.py +0 -0
  339. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -0
  340. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/kdbai.py +0 -0
  341. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/local.py +0 -0
  342. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/milvus.py +0 -0
  343. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/mongodb.py +0 -0
  344. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -0
  345. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/opensearch.py +0 -0
  346. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -0
  347. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -0
  348. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/singlestore.py +0 -0
  349. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/sql.py +0 -0
  350. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/utils.py +0 -0
  351. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/connectors/weaviate.py +0 -0
  352. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/filter.py +0 -0
  353. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/partitioner.py +0 -0
  354. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/processes/uncompress.py +0 -0
  355. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/unstructured_api.py +0 -0
  356. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest/v2/utils.py +0 -0
  357. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest.egg-info/SOURCES.txt +0 -0
  358. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  359. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest.egg-info/entry_points.txt +0 -0
  360. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest.egg-info/requires.txt +19 -19
  361. {unstructured_ingest-0.0.22 → unstructured_ingest-0.0.24}/unstructured_ingest.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.22
3
+ Version: 0.0.24
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,13 +22,13 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.13
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: pandas
26
- Requires-Dist: pydantic>=2.7
27
- Requires-Dist: click
28
- Requires-Dist: opentelemetry-sdk
29
25
  Requires-Dist: dataclasses_json
30
26
  Requires-Dist: tqdm
27
+ Requires-Dist: pydantic>=2.7
28
+ Requires-Dist: click
29
+ Requires-Dist: pandas
31
30
  Requires-Dist: python-dateutil
31
+ Requires-Dist: opentelemetry-sdk
32
32
  Provides-Extra: remote
33
33
  Requires-Dist: unstructured-client>=0.25.8; extra == "remote"
34
34
  Provides-Extra: csv
@@ -66,23 +66,23 @@ Requires-Dist: pyairtable; extra == "airtable"
66
66
  Provides-Extra: astradb
67
67
  Requires-Dist: astrapy; extra == "astradb"
68
68
  Provides-Extra: azure
69
- Requires-Dist: adlfs; extra == "azure"
70
69
  Requires-Dist: fsspec; extra == "azure"
70
+ Requires-Dist: adlfs; extra == "azure"
71
71
  Provides-Extra: azure-cognitive-search
72
72
  Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
73
73
  Provides-Extra: biomed
74
- Requires-Dist: requests; extra == "biomed"
75
74
  Requires-Dist: bs4; extra == "biomed"
75
+ Requires-Dist: requests; extra == "biomed"
76
76
  Provides-Extra: box
77
- Requires-Dist: fsspec; extra == "box"
78
77
  Requires-Dist: boxfs; extra == "box"
78
+ Requires-Dist: fsspec; extra == "box"
79
79
  Provides-Extra: chroma
80
80
  Requires-Dist: chromadb; extra == "chroma"
81
81
  Provides-Extra: clarifai
82
82
  Requires-Dist: clarifai; extra == "clarifai"
83
83
  Provides-Extra: confluence
84
- Requires-Dist: requests; extra == "confluence"
85
84
  Requires-Dist: atlassian-python-api; extra == "confluence"
85
+ Requires-Dist: requests; extra == "confluence"
86
86
  Provides-Extra: couchbase
87
87
  Requires-Dist: couchbase; extra == "couchbase"
88
88
  Provides-Extra: delta-table
@@ -96,12 +96,12 @@ Requires-Dist: dropboxdrivefs; extra == "dropbox"
96
96
  Provides-Extra: elasticsearch
97
97
  Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
98
98
  Provides-Extra: gcs
99
+ Requires-Dist: bs4; extra == "gcs"
99
100
  Requires-Dist: gcsfs; extra == "gcs"
100
101
  Requires-Dist: fsspec; extra == "gcs"
101
- Requires-Dist: bs4; extra == "gcs"
102
102
  Provides-Extra: github
103
- Requires-Dist: requests; extra == "github"
104
103
  Requires-Dist: pygithub>1.58.0; extra == "github"
104
+ Requires-Dist: requests; extra == "github"
105
105
  Provides-Extra: gitlab
106
106
  Requires-Dist: python-gitlab; extra == "gitlab"
107
107
  Provides-Extra: google-drive
@@ -120,19 +120,19 @@ Requires-Dist: pymilvus; extra == "milvus"
120
120
  Provides-Extra: mongodb
121
121
  Requires-Dist: pymongo; extra == "mongodb"
122
122
  Provides-Extra: notion
123
+ Requires-Dist: notion-client; extra == "notion"
123
124
  Requires-Dist: httpx; extra == "notion"
124
125
  Requires-Dist: htmlBuilder; extra == "notion"
125
- Requires-Dist: notion-client; extra == "notion"
126
126
  Requires-Dist: backoff; extra == "notion"
127
127
  Provides-Extra: onedrive
128
- Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
129
- Requires-Dist: msal; extra == "onedrive"
130
128
  Requires-Dist: bs4; extra == "onedrive"
129
+ Requires-Dist: msal; extra == "onedrive"
130
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
131
131
  Provides-Extra: opensearch
132
132
  Requires-Dist: opensearch-py; extra == "opensearch"
133
133
  Provides-Extra: outlook
134
- Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
135
134
  Requires-Dist: msal; extra == "outlook"
135
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
136
136
  Provides-Extra: pinecone
137
137
  Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
138
138
  Provides-Extra: postgres
@@ -142,16 +142,16 @@ Requires-Dist: qdrant-client; extra == "qdrant"
142
142
  Provides-Extra: reddit
143
143
  Requires-Dist: praw; extra == "reddit"
144
144
  Provides-Extra: s3
145
- Requires-Dist: s3fs; extra == "s3"
146
145
  Requires-Dist: fsspec; extra == "s3"
146
+ Requires-Dist: s3fs; extra == "s3"
147
147
  Provides-Extra: sharepoint
148
- Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
149
148
  Requires-Dist: msal; extra == "sharepoint"
149
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
150
150
  Provides-Extra: salesforce
151
151
  Requires-Dist: simple-salesforce; extra == "salesforce"
152
152
  Provides-Extra: sftp
153
- Requires-Dist: paramiko; extra == "sftp"
154
153
  Requires-Dist: fsspec; extra == "sftp"
154
+ Requires-Dist: paramiko; extra == "sftp"
155
155
  Provides-Extra: slack
156
156
  Requires-Dist: slack_sdk; extra == "slack"
157
157
  Provides-Extra: wikipedia
@@ -167,8 +167,8 @@ Requires-Dist: requests; extra == "vectara"
167
167
  Provides-Extra: embed-huggingface
168
168
  Requires-Dist: sentence-transformers; extra == "embed-huggingface"
169
169
  Provides-Extra: embed-octoai
170
- Requires-Dist: tiktoken; extra == "embed-octoai"
171
170
  Requires-Dist: openai; extra == "embed-octoai"
171
+ Requires-Dist: tiktoken; extra == "embed-octoai"
172
172
  Provides-Extra: embed-vertexai
173
173
  Requires-Dist: vertexai; extra == "embed-vertexai"
174
174
  Provides-Extra: embed-voyageai
@@ -176,8 +176,8 @@ Requires-Dist: voyageai; extra == "embed-voyageai"
176
176
  Provides-Extra: embed-mixedbreadai
177
177
  Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
178
178
  Provides-Extra: openai
179
- Requires-Dist: tiktoken; extra == "openai"
180
179
  Requires-Dist: openai; extra == "openai"
180
+ Requires-Dist: tiktoken; extra == "openai"
181
181
  Provides-Extra: bedrock
182
182
  Requires-Dist: boto3; extra == "bedrock"
183
183
 
@@ -0,0 +1 @@
1
+ __version__ = "0.0.24" # pragma: no cover
@@ -415,11 +415,11 @@ class CliEmbeddingConfig(EmbeddingConfig, CliMixin):
415
415
  @staticmethod
416
416
  def get_cli_options() -> t.List[click.Option]:
417
417
  embed_providers = [
418
- "langchain-openai",
419
- "langchain-huggingface",
420
- "langchain-aws-bedrock",
421
- "langchain-vertexai",
422
- "langchain-voyageai",
418
+ "openai",
419
+ "huggingface",
420
+ "aws-bedrock",
421
+ "vertexai",
422
+ "voyageai",
423
423
  "octoai",
424
424
  ]
425
425
  options = [
@@ -45,7 +45,7 @@ class VertexAIEmbeddingConfig(EmbeddingConfig):
45
45
  extras="embed-vertexai",
46
46
  )
47
47
  def get_client(self) -> "TextEmbeddingModel":
48
- """Creates a Langchain VertexAI python client to embed elements."""
48
+ """Creates a VertexAI python client to embed elements."""
49
49
  from vertexai.language_models import TextEmbeddingModel
50
50
 
51
51
  self.register_application_credentials()
@@ -20,11 +20,11 @@ class VoyageAIEmbeddingConfig(EmbeddingConfig):
20
20
  timeout_in_seconds: Optional[int] = None
21
21
 
22
22
  @requires_dependencies(
23
- ["langchain", "langchain_voyageai"],
23
+ ["voyageai"],
24
24
  extras="embed-voyageai",
25
25
  )
26
26
  def get_client(self) -> "VoyageAIClient":
27
- """Creates a Langchain VoyageAI python client to embed elements."""
27
+ """Creates a VoyageAI python client to embed elements."""
28
28
  from voyageai import Client as VoyageAIClient
29
29
 
30
30
  client = VoyageAIClient(
@@ -204,14 +204,14 @@ class EmbeddingConfig(BaseConfig):
204
204
  if self.model_name:
205
205
  kwargs["model_name"] = self.model_name
206
206
  # TODO make this more dynamic to map to encoder configs
207
- if self.provider == "langchain-openai":
207
+ if self.provider == "openai":
208
208
  from unstructured_ingest.embed.openai import (
209
209
  OpenAIEmbeddingConfig,
210
210
  OpenAIEmbeddingEncoder,
211
211
  )
212
212
 
213
213
  return OpenAIEmbeddingEncoder(config=OpenAIEmbeddingConfig(**kwargs))
214
- elif self.provider == "langchain-huggingface":
214
+ elif self.provider == "huggingface":
215
215
  from unstructured_ingest.embed.huggingface import (
216
216
  HuggingFaceEmbeddingConfig,
217
217
  HuggingFaceEmbeddingEncoder,
@@ -225,7 +225,7 @@ class EmbeddingConfig(BaseConfig):
225
225
  )
226
226
 
227
227
  return OctoAIEmbeddingEncoder(config=OctoAiEmbeddingConfig(**kwargs))
228
- elif self.provider == "langchain-aws-bedrock":
228
+ elif self.provider == "aws-bedrock":
229
229
  from unstructured_ingest.embed.bedrock import (
230
230
  BedrockEmbeddingConfig,
231
231
  BedrockEmbeddingEncoder,
@@ -238,14 +238,14 @@ class EmbeddingConfig(BaseConfig):
238
238
  region_name=self.aws_region,
239
239
  )
240
240
  )
241
- elif self.provider == "langchain-vertexai":
241
+ elif self.provider == "vertexai":
242
242
  from unstructured_ingest.embed.vertexai import (
243
243
  VertexAIEmbeddingConfig,
244
244
  VertexAIEmbeddingEncoder,
245
245
  )
246
246
 
247
247
  return VertexAIEmbeddingEncoder(config=VertexAIEmbeddingConfig(**kwargs))
248
- elif self.provider == "langchain-voyageai":
248
+ elif self.provider == "voyageai":
249
249
  from unstructured_ingest.embed.voyageai import (
250
250
  VoyageAIEmbeddingConfig,
251
251
  VoyageAIEmbeddingEncoder,
@@ -155,14 +155,14 @@ def _get_type_from_field(field: FieldInfo) -> click.ParamType:
155
155
 
156
156
  def get_option_from_field(option_name: str, field_info: FieldInfo) -> Option:
157
157
  param_decls = [option_name]
158
- help = field_info.description or ""
158
+ help_text = field_info.description or ""
159
159
  if examples := field_info.examples:
160
- help += f" [Examples: {', '.join(examples)}]"
160
+ help_text += f" [Examples: {', '.join(examples)}]"
161
161
  option_kwargs = {
162
162
  "type": _get_type_from_field(field_info),
163
163
  "default": get_default_value_from_field(field_info),
164
164
  "required": field_info.is_required(),
165
- "help": help,
165
+ "help": str(help_text),
166
166
  "is_flag": is_boolean_flag(field_info),
167
167
  "show_default": field_info.default is not PydanticUndefined,
168
168
  }
@@ -58,20 +58,6 @@ class PineconeConnectionConfig(ConnectionConfig):
58
58
  return index
59
59
 
60
60
 
61
- class PineconeUploadStagerConfig(UploadStagerConfig):
62
- pass
63
-
64
-
65
- class PineconeUploaderConfig(UploaderConfig):
66
- batch_size: Optional[int] = Field(
67
- default=None,
68
- description="Optional number of records per batch. Will otherwise limit by size.",
69
- )
70
- pool_threads: Optional[int] = Field(
71
- default=1, description="Optional limit on number of threads to use for upload"
72
- )
73
-
74
-
75
61
  ALLOWED_FIELDS = (
76
62
  "element_id",
77
63
  "text",
@@ -86,31 +72,56 @@ ALLOWED_FIELDS = (
86
72
  "is_continuation",
87
73
  "link_urls",
88
74
  "link_texts",
75
+ "text_as_html",
89
76
  )
90
77
 
91
78
 
79
+ class PineconeUploadStagerConfig(UploadStagerConfig):
80
+ metadata_fields: list[str] = Field(
81
+ default=str(ALLOWED_FIELDS),
82
+ description=(
83
+ "which metadata from the source element to map to the payload metadata being sent to "
84
+ "Pinecone."
85
+ ),
86
+ )
87
+
88
+
89
+ class PineconeUploaderConfig(UploaderConfig):
90
+ batch_size: Optional[int] = Field(
91
+ default=None,
92
+ description="Optional number of records per batch. Will otherwise limit by size.",
93
+ )
94
+ pool_threads: Optional[int] = Field(
95
+ default=1, description="Optional limit on number of threads to use for upload"
96
+ )
97
+
98
+
92
99
  @dataclass
93
100
  class PineconeUploadStager(UploadStager):
94
101
  upload_stager_config: PineconeUploadStagerConfig = field(
95
102
  default_factory=lambda: PineconeUploadStagerConfig()
96
103
  )
97
104
 
98
- @staticmethod
99
- def conform_dict(element_dict: dict) -> dict:
105
+ def conform_dict(self, element_dict: dict) -> dict:
100
106
  embeddings = element_dict.pop("embeddings", None)
101
107
  metadata: dict[str, Any] = element_dict.pop("metadata", {})
102
108
  data_source = metadata.pop("data_source", {})
103
109
  coordinates = metadata.pop("coordinates", {})
104
-
105
- element_dict.update(metadata)
106
- element_dict.update(data_source)
107
- element_dict.update(coordinates)
110
+ pinecone_metadata = {}
111
+ for possible_meta in [element_dict, metadata, data_source, coordinates]:
112
+ pinecone_metadata.update(
113
+ {
114
+ k: v
115
+ for k, v in possible_meta.items()
116
+ if k in self.upload_stager_config.metadata_fields
117
+ }
118
+ )
108
119
 
109
120
  return {
110
121
  "id": str(uuid.uuid4()),
111
122
  "values": embeddings,
112
123
  "metadata": flatten_dict(
113
- {k: v for k, v in element_dict.items() if k in ALLOWED_FIELDS},
124
+ pinecone_metadata,
114
125
  separator="-",
115
126
  flatten_lists=True,
116
127
  remove_none=True,
@@ -15,11 +15,11 @@ if TYPE_CHECKING:
15
15
  class EmbedderConfig(BaseModel):
16
16
  embedding_provider: Optional[
17
17
  Literal[
18
- "langchain-openai",
19
- "langchain-huggingface",
20
- "langchain-aws-bedrock",
21
- "langchain-vertexai",
22
- "langchain-voyageai",
18
+ "openai",
19
+ "huggingface",
20
+ "aws-bedrock",
21
+ "vertexai",
22
+ "voyageai",
23
23
  "octoai",
24
24
  "mixedbread-ai",
25
25
  ]
@@ -114,22 +114,22 @@ class EmbedderConfig(BaseModel):
114
114
  if self.embedding_model_name:
115
115
  kwargs["model_name"] = self.embedding_model_name
116
116
  # TODO make this more dynamic to map to encoder configs
117
- if self.embedding_provider == "langchain-openai":
117
+ if self.embedding_provider == "openai":
118
118
  return self.get_openai_embedder(embedding_kwargs=kwargs)
119
119
 
120
- if self.embedding_provider == "langchain-huggingface":
120
+ if self.embedding_provider == "huggingface":
121
121
  return self.get_huggingface_embedder(embedding_kwargs=kwargs)
122
122
 
123
123
  if self.embedding_provider == "octoai":
124
124
  return self.get_octoai_embedder(embedding_kwargs=kwargs)
125
125
 
126
- if self.embedding_provider == "langchain-aws-bedrock":
126
+ if self.embedding_provider == "aws-bedrock":
127
127
  return self.get_bedrock_embedder()
128
128
 
129
- if self.embedding_provider == "langchain-vertexai":
129
+ if self.embedding_provider == "vertexai":
130
130
  return self.get_vertexai_embedder(embedding_kwargs=kwargs)
131
131
 
132
- if self.embedding_provider == "langchain-voyageai":
132
+ if self.embedding_provider == "voyageai":
133
133
  return self.get_voyageai_embedder(embedding_kwargs=kwargs)
134
134
  if self.embedding_provider == "mixedbread-ai":
135
135
  return self.get_mixedbread_embedder(embedding_kwargs=kwargs)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.22
3
+ Version: 0.0.24
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -22,13 +22,13 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
22
  Requires-Python: >=3.9.0,<3.13
23
23
  Description-Content-Type: text/markdown
24
24
  License-File: LICENSE.md
25
- Requires-Dist: pandas
26
- Requires-Dist: pydantic>=2.7
27
- Requires-Dist: click
28
- Requires-Dist: opentelemetry-sdk
29
25
  Requires-Dist: dataclasses_json
30
26
  Requires-Dist: tqdm
27
+ Requires-Dist: pydantic>=2.7
28
+ Requires-Dist: click
29
+ Requires-Dist: pandas
31
30
  Requires-Dist: python-dateutil
31
+ Requires-Dist: opentelemetry-sdk
32
32
  Provides-Extra: remote
33
33
  Requires-Dist: unstructured-client>=0.25.8; extra == "remote"
34
34
  Provides-Extra: csv
@@ -66,23 +66,23 @@ Requires-Dist: pyairtable; extra == "airtable"
66
66
  Provides-Extra: astradb
67
67
  Requires-Dist: astrapy; extra == "astradb"
68
68
  Provides-Extra: azure
69
- Requires-Dist: adlfs; extra == "azure"
70
69
  Requires-Dist: fsspec; extra == "azure"
70
+ Requires-Dist: adlfs; extra == "azure"
71
71
  Provides-Extra: azure-cognitive-search
72
72
  Requires-Dist: azure-search-documents; extra == "azure-cognitive-search"
73
73
  Provides-Extra: biomed
74
- Requires-Dist: requests; extra == "biomed"
75
74
  Requires-Dist: bs4; extra == "biomed"
75
+ Requires-Dist: requests; extra == "biomed"
76
76
  Provides-Extra: box
77
- Requires-Dist: fsspec; extra == "box"
78
77
  Requires-Dist: boxfs; extra == "box"
78
+ Requires-Dist: fsspec; extra == "box"
79
79
  Provides-Extra: chroma
80
80
  Requires-Dist: chromadb; extra == "chroma"
81
81
  Provides-Extra: clarifai
82
82
  Requires-Dist: clarifai; extra == "clarifai"
83
83
  Provides-Extra: confluence
84
- Requires-Dist: requests; extra == "confluence"
85
84
  Requires-Dist: atlassian-python-api; extra == "confluence"
85
+ Requires-Dist: requests; extra == "confluence"
86
86
  Provides-Extra: couchbase
87
87
  Requires-Dist: couchbase; extra == "couchbase"
88
88
  Provides-Extra: delta-table
@@ -96,12 +96,12 @@ Requires-Dist: dropboxdrivefs; extra == "dropbox"
96
96
  Provides-Extra: elasticsearch
97
97
  Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
98
98
  Provides-Extra: gcs
99
+ Requires-Dist: bs4; extra == "gcs"
99
100
  Requires-Dist: gcsfs; extra == "gcs"
100
101
  Requires-Dist: fsspec; extra == "gcs"
101
- Requires-Dist: bs4; extra == "gcs"
102
102
  Provides-Extra: github
103
- Requires-Dist: requests; extra == "github"
104
103
  Requires-Dist: pygithub>1.58.0; extra == "github"
104
+ Requires-Dist: requests; extra == "github"
105
105
  Provides-Extra: gitlab
106
106
  Requires-Dist: python-gitlab; extra == "gitlab"
107
107
  Provides-Extra: google-drive
@@ -120,19 +120,19 @@ Requires-Dist: pymilvus; extra == "milvus"
120
120
  Provides-Extra: mongodb
121
121
  Requires-Dist: pymongo; extra == "mongodb"
122
122
  Provides-Extra: notion
123
+ Requires-Dist: notion-client; extra == "notion"
123
124
  Requires-Dist: httpx; extra == "notion"
124
125
  Requires-Dist: htmlBuilder; extra == "notion"
125
- Requires-Dist: notion-client; extra == "notion"
126
126
  Requires-Dist: backoff; extra == "notion"
127
127
  Provides-Extra: onedrive
128
- Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
129
- Requires-Dist: msal; extra == "onedrive"
130
128
  Requires-Dist: bs4; extra == "onedrive"
129
+ Requires-Dist: msal; extra == "onedrive"
130
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
131
131
  Provides-Extra: opensearch
132
132
  Requires-Dist: opensearch-py; extra == "opensearch"
133
133
  Provides-Extra: outlook
134
- Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
135
134
  Requires-Dist: msal; extra == "outlook"
135
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
136
136
  Provides-Extra: pinecone
137
137
  Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
138
138
  Provides-Extra: postgres
@@ -142,16 +142,16 @@ Requires-Dist: qdrant-client; extra == "qdrant"
142
142
  Provides-Extra: reddit
143
143
  Requires-Dist: praw; extra == "reddit"
144
144
  Provides-Extra: s3
145
- Requires-Dist: s3fs; extra == "s3"
146
145
  Requires-Dist: fsspec; extra == "s3"
146
+ Requires-Dist: s3fs; extra == "s3"
147
147
  Provides-Extra: sharepoint
148
- Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
149
148
  Requires-Dist: msal; extra == "sharepoint"
149
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
150
150
  Provides-Extra: salesforce
151
151
  Requires-Dist: simple-salesforce; extra == "salesforce"
152
152
  Provides-Extra: sftp
153
- Requires-Dist: paramiko; extra == "sftp"
154
153
  Requires-Dist: fsspec; extra == "sftp"
154
+ Requires-Dist: paramiko; extra == "sftp"
155
155
  Provides-Extra: slack
156
156
  Requires-Dist: slack_sdk; extra == "slack"
157
157
  Provides-Extra: wikipedia
@@ -167,8 +167,8 @@ Requires-Dist: requests; extra == "vectara"
167
167
  Provides-Extra: embed-huggingface
168
168
  Requires-Dist: sentence-transformers; extra == "embed-huggingface"
169
169
  Provides-Extra: embed-octoai
170
- Requires-Dist: tiktoken; extra == "embed-octoai"
171
170
  Requires-Dist: openai; extra == "embed-octoai"
171
+ Requires-Dist: tiktoken; extra == "embed-octoai"
172
172
  Provides-Extra: embed-vertexai
173
173
  Requires-Dist: vertexai; extra == "embed-vertexai"
174
174
  Provides-Extra: embed-voyageai
@@ -176,8 +176,8 @@ Requires-Dist: voyageai; extra == "embed-voyageai"
176
176
  Provides-Extra: embed-mixedbreadai
177
177
  Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
178
178
  Provides-Extra: openai
179
- Requires-Dist: tiktoken; extra == "openai"
180
179
  Requires-Dist: openai; extra == "openai"
180
+ Requires-Dist: tiktoken; extra == "openai"
181
181
  Provides-Extra: bedrock
182
182
  Requires-Dist: boto3; extra == "bedrock"
183
183
 
@@ -1 +0,0 @@
1
- __version__ = "0.0.22" # pragma: no cover
@@ -1,17 +0,0 @@
1
- from unstructured_ingest.embed.bedrock import BedrockEmbeddingEncoder
2
- from unstructured_ingest.embed.huggingface import HuggingFaceEmbeddingEncoder
3
- from unstructured_ingest.embed.mixedbreadai import MixedbreadAIEmbeddingEncoder
4
- from unstructured_ingest.embed.octoai import OctoAIEmbeddingEncoder
5
- from unstructured_ingest.embed.openai import OpenAIEmbeddingEncoder
6
- from unstructured_ingest.embed.vertexai import VertexAIEmbeddingEncoder
7
- from unstructured_ingest.embed.voyageai import VoyageAIEmbeddingEncoder
8
-
9
- EMBEDDING_PROVIDER_TO_CLASS_MAP = {
10
- "langchain-openai": OpenAIEmbeddingEncoder,
11
- "langchain-huggingface": HuggingFaceEmbeddingEncoder,
12
- "langchain-aws-bedrock": BedrockEmbeddingEncoder,
13
- "langchain-vertexai": VertexAIEmbeddingEncoder,
14
- "langchain-voyageai": VoyageAIEmbeddingEncoder,
15
- "mixedbread-ai": MixedbreadAIEmbeddingEncoder,
16
- "octoai": OctoAIEmbeddingEncoder,
17
- }