unstructured-ingest 0.0.0__tar.gz → 0.0.1__tar.gz

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (369)
  1. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/PKG-INFO +2 -1
  2. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/setup.py +1 -0
  3. unstructured-ingest-0.0.1/unstructured_ingest/__version__.py +1 -0
  4. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/helpers.py +1 -1
  5. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/logger.py +2 -2
  6. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/__init__.py +2 -0
  7. unstructured-ingest-0.0.1/unstructured_ingest/v2/cli/cmds/milvus.py +72 -0
  8. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/logger.py +1 -1
  9. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/interfaces.py +4 -0
  10. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/__init__.py +4 -2
  11. unstructured-ingest-0.0.1/unstructured_ingest/v2/processes/connectors/milvus.py +200 -0
  12. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/pinecone.py +4 -4
  13. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest.egg-info/PKG-INFO +2 -1
  14. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest.egg-info/SOURCES.txt +2 -0
  15. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest.egg-info/requires.txt +15 -12
  16. unstructured-ingest-0.0.0/unstructured_ingest/__version__.py +0 -1
  17. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/README.md +0 -0
  18. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/pyproject.toml +0 -0
  19. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/setup.cfg +0 -0
  20. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/test/test_error.py +0 -0
  21. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/test/test_interfaces.py +0 -0
  22. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/test/test_logger.py +0 -0
  23. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/test/test_utils.py +0 -0
  24. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/__init__.py +0 -0
  25. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/__init__.py +0 -0
  26. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/base/__init__.py +0 -0
  27. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/base/cmd.py +0 -0
  28. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/base/dest.py +0 -0
  29. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/base/src.py +0 -0
  30. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cli.py +0 -0
  31. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmd_factory.py +0 -0
  32. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/__init__.py +0 -0
  33. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/airtable.py +0 -0
  34. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/astra.py +0 -0
  35. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/azure_cognitive_search.py +0 -0
  36. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/biomed.py +0 -0
  37. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/chroma.py +0 -0
  38. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/clarifai.py +0 -0
  39. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/confluence.py +0 -0
  40. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -0
  41. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/delta_table.py +0 -0
  42. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/discord.py +0 -0
  43. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/elasticsearch.py +0 -0
  44. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/__init__.py +0 -0
  45. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -0
  46. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/box.py +0 -0
  47. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -0
  48. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -0
  49. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -0
  50. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -0
  51. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -0
  52. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/github.py +0 -0
  53. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/gitlab.py +0 -0
  54. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/google_drive.py +0 -0
  55. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/hubspot.py +0 -0
  56. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/jira.py +0 -0
  57. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/kafka.py +0 -0
  58. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/local.py +0 -0
  59. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/mongodb.py +0 -0
  60. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/notion.py +0 -0
  61. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/onedrive.py +0 -0
  62. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/opensearch.py +0 -0
  63. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/outlook.py +0 -0
  64. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/pinecone.py +0 -0
  65. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/qdrant.py +0 -0
  66. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/reddit.py +0 -0
  67. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/salesforce.py +0 -0
  68. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/sharepoint.py +0 -0
  69. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/slack.py +0 -0
  70. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/sql.py +0 -0
  71. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/vectara.py +0 -0
  72. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/weaviate.py +0 -0
  73. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/cmds/wikipedia.py +0 -0
  74. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/common.py +0 -0
  75. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/interfaces.py +0 -0
  76. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/cli/utils.py +0 -0
  77. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/__init__.py +0 -0
  78. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/airtable.py +0 -0
  79. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/astra.py +0 -0
  80. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/azure_cognitive_search.py +0 -0
  81. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/biomed.py +0 -0
  82. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/chroma.py +0 -0
  83. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/clarifai.py +0 -0
  84. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/confluence.py +0 -0
  85. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/databricks_volumes.py +0 -0
  86. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/delta_table.py +0 -0
  87. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/discord.py +0 -0
  88. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/elasticsearch.py +0 -0
  89. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/__init__.py +0 -0
  90. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/azure.py +0 -0
  91. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/box.py +0 -0
  92. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/dropbox.py +0 -0
  93. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/fsspec.py +0 -0
  94. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/gcs.py +0 -0
  95. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/s3.py +0 -0
  96. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/fsspec/sftp.py +0 -0
  97. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/git.py +0 -0
  98. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/github.py +0 -0
  99. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/gitlab.py +0 -0
  100. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/google_drive.py +0 -0
  101. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/hubspot.py +0 -0
  102. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/jira.py +0 -0
  103. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/kafka.py +0 -0
  104. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/local.py +0 -0
  105. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/mongodb.py +0 -0
  106. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/__init__.py +0 -0
  107. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/client.py +0 -0
  108. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/connector.py +0 -0
  109. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/interfaces.py +0 -0
  110. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/__init__.py +0 -0
  111. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/block.py +0 -0
  112. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/__init__.py +0 -0
  113. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -0
  114. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -0
  115. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -0
  116. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -0
  117. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -0
  118. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -0
  119. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/code.py +0 -0
  120. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -0
  121. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -0
  122. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -0
  123. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -0
  124. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/file.py +0 -0
  125. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -0
  126. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/image.py +0 -0
  127. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -0
  128. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -0
  129. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -0
  130. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -0
  131. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -0
  132. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -0
  133. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -0
  134. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/table.py +0 -0
  135. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -0
  136. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/template.py +0 -0
  137. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -0
  138. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -0
  139. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -0
  140. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/blocks/video.py +0 -0
  141. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database.py +0 -0
  142. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -0
  143. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -0
  144. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -0
  145. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -0
  146. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -0
  147. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -0
  148. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -0
  149. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -0
  150. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -0
  151. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -0
  152. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -0
  153. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -0
  154. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -0
  155. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -0
  156. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -0
  157. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -0
  158. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -0
  159. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -0
  160. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -0
  161. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -0
  162. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -0
  163. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -0
  164. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -0
  165. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/date.py +0 -0
  166. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/file.py +0 -0
  167. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/page.py +0 -0
  168. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/parent.py +0 -0
  169. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/rich_text.py +0 -0
  170. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/notion/types/user.py +0 -0
  171. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/onedrive.py +0 -0
  172. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/opensearch.py +0 -0
  173. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/outlook.py +0 -0
  174. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/pinecone.py +0 -0
  175. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/qdrant.py +0 -0
  176. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/reddit.py +0 -0
  177. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/registry.py +0 -0
  178. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/salesforce.py +0 -0
  179. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/sharepoint.py +0 -0
  180. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/slack.py +0 -0
  181. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/sql.py +0 -0
  182. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/vectara.py +0 -0
  183. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/weaviate.py +0 -0
  184. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/connector/wikipedia.py +0 -0
  185. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/enhanced_dataclass/__init__.py +0 -0
  186. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/enhanced_dataclass/core.py +0 -0
  187. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -0
  188. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -0
  189. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/error.py +0 -0
  190. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/evaluate.py +0 -0
  191. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/ingest_backoff/__init__.py +0 -0
  192. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/ingest_backoff/_common.py +0 -0
  193. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/ingest_backoff/_wrapper.py +0 -0
  194. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/interfaces.py +0 -0
  195. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/main.py +0 -0
  196. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/__init__.py +0 -0
  197. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/copy.py +0 -0
  198. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/doc_factory.py +0 -0
  199. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/interfaces.py +0 -0
  200. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/partition.py +0 -0
  201. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/permissions.py +0 -0
  202. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/pipeline.py +0 -0
  203. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/reformat/__init__.py +0 -0
  204. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/reformat/chunking.py +0 -0
  205. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/reformat/embedding.py +0 -0
  206. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/source.py +0 -0
  207. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/utils.py +0 -0
  208. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/pipeline/write.py +0 -0
  209. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/processor.py +0 -0
  210. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/__init__.py +0 -0
  211. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/airtable.py +0 -0
  212. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/astra.py +0 -0
  213. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/base_runner.py +0 -0
  214. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/biomed.py +0 -0
  215. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/confluence.py +0 -0
  216. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/delta_table.py +0 -0
  217. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/discord.py +0 -0
  218. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/elasticsearch.py +0 -0
  219. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/__init__.py +0 -0
  220. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/azure.py +0 -0
  221. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/box.py +0 -0
  222. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/dropbox.py +0 -0
  223. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/fsspec.py +0 -0
  224. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/gcs.py +0 -0
  225. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/s3.py +0 -0
  226. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/fsspec/sftp.py +0 -0
  227. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/github.py +0 -0
  228. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/gitlab.py +0 -0
  229. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/google_drive.py +0 -0
  230. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/hubspot.py +0 -0
  231. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/jira.py +0 -0
  232. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/kafka.py +0 -0
  233. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/local.py +0 -0
  234. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/mongodb.py +0 -0
  235. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/notion.py +0 -0
  236. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/onedrive.py +0 -0
  237. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/opensearch.py +0 -0
  238. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/outlook.py +0 -0
  239. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/reddit.py +0 -0
  240. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/salesforce.py +0 -0
  241. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/sharepoint.py +0 -0
  242. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/slack.py +0 -0
  243. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/utils.py +0 -0
  244. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/wikipedia.py +0 -0
  245. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/__init__.py +0 -0
  246. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/astra.py +0 -0
  247. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/azure_cognitive_search.py +0 -0
  248. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/base_writer.py +0 -0
  249. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/chroma.py +0 -0
  250. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/clarifai.py +0 -0
  251. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/databricks_volumes.py +0 -0
  252. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/delta_table.py +0 -0
  253. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/elasticsearch.py +0 -0
  254. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/fsspec/__init__.py +0 -0
  255. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/fsspec/azure.py +0 -0
  256. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/fsspec/box.py +0 -0
  257. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -0
  258. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -0
  259. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/fsspec/s3.py +0 -0
  260. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/kafka.py +0 -0
  261. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/mongodb.py +0 -0
  262. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/opensearch.py +0 -0
  263. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/pinecone.py +0 -0
  264. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/qdrant.py +0 -0
  265. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/sql.py +0 -0
  266. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/vectara.py +0 -0
  267. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/runner/writers/weaviate.py +0 -0
  268. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/utils/__init__.py +0 -0
  269. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/utils/compression.py +0 -0
  270. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/utils/data_prep.py +0 -0
  271. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/utils/dep_check.py +0 -0
  272. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  273. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/utils/table.py +0 -0
  274. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/__init__.py +0 -0
  275. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/__init__.py +0 -0
  276. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/base/__init__.py +0 -0
  277. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/base/cmd.py +0 -0
  278. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/base/dest.py +0 -0
  279. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/base/importer.py +0 -0
  280. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/base/src.py +0 -0
  281. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cli.py +0 -0
  282. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/astra.py +0 -0
  283. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/azure_cognitive_search.py +0 -0
  284. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/chroma.py +0 -0
  285. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/databricks_volumes.py +0 -0
  286. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/elasticsearch.py +0 -0
  287. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/__init__.py +0 -0
  288. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/azure.py +0 -0
  289. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/box.py +0 -0
  290. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/dropbox.py +0 -0
  291. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/fsspec.py +0 -0
  292. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/gcs.py +0 -0
  293. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/s3.py +0 -0
  294. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/fsspec/sftp.py +0 -0
  295. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/google_drive.py +0 -0
  296. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/local.py +0 -0
  297. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/mongodb.py +0 -0
  298. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/onedrive.py +0 -0
  299. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/opensearch.py +0 -0
  300. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/pinecone.py +0 -0
  301. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/salesforce.py +0 -0
  302. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/sharepoint.py +0 -0
  303. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/singlestore.py +0 -0
  304. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/sql.py +0 -0
  305. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/cmds/weaviate.py +0 -0
  306. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/configs/__init__.py +0 -0
  307. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/configs/chunk.py +0 -0
  308. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/configs/embed.py +0 -0
  309. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/configs/partition.py +0 -0
  310. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/configs/processor.py +0 -0
  311. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/interfaces.py +0 -0
  312. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/cli/utils.py +0 -0
  313. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/example.py +0 -0
  314. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/__init__.py +0 -0
  315. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/connector.py +0 -0
  316. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/downloader.py +0 -0
  317. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/file_data.py +0 -0
  318. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/indexer.py +0 -0
  319. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/process.py +0 -0
  320. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/processor.py +0 -0
  321. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/upload_stager.py +0 -0
  322. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/interfaces/uploader.py +0 -0
  323. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/main.py +0 -0
  324. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/__init__.py +0 -0
  325. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/pipeline.py +0 -0
  326. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
  327. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -0
  328. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/download.py +0 -0
  329. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/embed.py +0 -0
  330. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/index.py +0 -0
  331. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/partition.py +0 -0
  332. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/stage.py +0 -0
  333. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -0
  334. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/steps/upload.py +0 -0
  335. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/pipeline/utils.py +0 -0
  336. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/__init__.py +0 -0
  337. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/chunker.py +0 -0
  338. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connector_registry.py +0 -0
  339. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/astra.py +0 -0
  340. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py +0 -0
  341. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/chroma.py +0 -0
  342. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/databricks_volumes.py +0 -0
  343. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/elasticsearch.py +0 -0
  344. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -0
  345. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +0 -0
  346. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/box.py +0 -0
  347. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +0 -0
  348. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -0
  349. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +0 -0
  350. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +0 -0
  351. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -0
  352. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/fsspec/utils.py +0 -0
  353. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -0
  354. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/local.py +0 -0
  355. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/mongodb.py +0 -0
  356. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -0
  357. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/opensearch.py +0 -0
  358. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -0
  359. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -0
  360. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/singlestore.py +0 -0
  361. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/sql.py +0 -0
  362. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/utils.py +0 -0
  363. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/connectors/weaviate.py +0 -0
  364. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/embedder.py +0 -0
  365. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/partitioner.py +0 -0
  366. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest/v2/processes/uncompress.py +0 -0
  367. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  368. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest.egg-info/entry_points.txt +0 -0
  369. {unstructured-ingest-0.0.0 → unstructured-ingest-0.0.1}/unstructured_ingest.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.0
3
+ Version: 0.0.1
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -56,6 +56,7 @@ Provides-Extra: google-drive
56
56
  Provides-Extra: hubspot
57
57
  Provides-Extra: jira
58
58
  Provides-Extra: kafka
59
+ Provides-Extra: milvus
59
60
  Provides-Extra: mongodb
60
61
  Provides-Extra: notion
61
62
  Provides-Extra: onedrive
@@ -102,6 +102,7 @@ connectors_reqs = {
102
102
  "hubspot": load_requirements("requirements/connectors/hubspot.in"),
103
103
  "jira": load_requirements("requirements/connectors/jira.in"),
104
104
  "kafka": load_requirements("requirements/connectors/kafka.in"),
105
+ "milvus": load_requirements("requirements/connectors/milvus.in"),
105
106
  "mongodb": load_requirements("requirements/connectors/mongodb.in"),
106
107
  "notion": load_requirements("requirements/connectors/notion.in"),
107
108
  "onedrive": load_requirements("requirements/connectors/onedrive.in"),
@@ -0,0 +1 @@
1
+ __version__ = "0.0.1" # pragma: no cover
@@ -5,7 +5,6 @@ from typing import List, Optional, Tuple
5
5
  from urllib.parse import urlparse
6
6
  from uuid import UUID
7
7
 
8
- import unstructured.ingest.connector.notion.types.blocks as notion_blocks
9
8
  from htmlBuilder.attributes import Style, Type
10
9
  from htmlBuilder.tags import (
11
10
  Body,
@@ -23,6 +22,7 @@ from htmlBuilder.tags import (
23
22
  )
24
23
  from notion_client.errors import APIResponseError
25
24
 
25
+ import unstructured_ingest.connector.notion.types.blocks as notion_blocks
26
26
  from unstructured_ingest.connector.notion.client import Client
27
27
  from unstructured_ingest.connector.notion.interfaces import BlockBase
28
28
  from unstructured_ingest.connector.notion.types.block import Block
@@ -3,7 +3,7 @@ import json
3
3
  import logging
4
4
  import typing as t
5
5
 
6
- logger = logging.getLogger("unstructured.ingest")
6
+ logger = logging.getLogger("unstructured_ingest")
7
7
 
8
8
 
9
9
  def default_is_data_sensitive(k: str, v: t.Any) -> bool:
@@ -119,7 +119,7 @@ def ingest_log_streaming_init(level: int) -> None:
119
119
 
120
120
  def make_default_logger(level: int) -> logging.Logger:
121
121
  """Return a custom logger."""
122
- logger = logging.getLogger("unstructured.ingest")
122
+ logger = logging.getLogger("unstructured_ingest")
123
123
  handler = logging.StreamHandler()
124
124
  handler.name = "ingest_log_handler"
125
125
  formatter = SensitiveFormatter("%(asctime)s %(processName)-10s %(levelname)-8s %(message)s")
@@ -15,6 +15,7 @@ from .fsspec.s3 import s3_dest_cmd, s3_src_cmd
15
15
  from .fsspec.sftp import sftp_dest_cmd, sftp_src_cmd
16
16
  from .google_drive import google_drive_src_cmd
17
17
  from .local import local_dest_cmd, local_src_cmd
18
+ from .milvus import milvus_dest_cmd
18
19
  from .mongodb import mongodb_dest_cmd
19
20
  from .onedrive import onedrive_drive_src_cmd
20
21
  from .opensearch import opensearch_dest_cmd, opensearch_src_cmd
@@ -60,6 +61,7 @@ dest_cmds = [
60
61
  elasticsearch_dest_cmd,
61
62
  gcs_dest_cmd,
62
63
  local_dest_cmd,
64
+ milvus_dest_cmd,
63
65
  opensearch_dest_cmd,
64
66
  pinecone_dest_cmd,
65
67
  s3_dest_cmd,
@@ -0,0 +1,72 @@
1
+ from dataclasses import dataclass
2
+
3
+ import click
4
+
5
+ from unstructured_ingest.v2.cli.base import DestCmd
6
+ from unstructured_ingest.v2.cli.interfaces import CliConfig
7
+ from unstructured_ingest.v2.processes.connectors.milvus import CONNECTOR_TYPE
8
+
9
+
10
+ @dataclass
11
+ class MilvusCliConnectionConfig(CliConfig):
12
+ @staticmethod
13
+ def get_cli_options() -> list[click.Option]:
14
+ options = [
15
+ click.Option(
16
+ ["--uri"],
17
+ required=False,
18
+ type=str,
19
+ default=None,
20
+ help="Milvus uri, eg 'http://localhost:19530",
21
+ ),
22
+ click.Option(
23
+ ["--user"],
24
+ required=False,
25
+ type=str,
26
+ default=None,
27
+ help="Milvus user",
28
+ ),
29
+ click.Option(
30
+ ["--password"],
31
+ required=False,
32
+ type=str,
33
+ default=None,
34
+ help="Milvus password",
35
+ ),
36
+ click.Option(
37
+ ["--db-name"],
38
+ required=False,
39
+ type=str,
40
+ default=None,
41
+ help="Milvus database name",
42
+ ),
43
+ ]
44
+ return options
45
+
46
+
47
+ @dataclass
48
+ class MilvusCliUploaderConfig(CliConfig):
49
+ @staticmethod
50
+ def get_cli_options() -> list[click.Option]:
51
+ options = [
52
+ click.Option(
53
+ ["--collection-name"],
54
+ required=True,
55
+ type=str,
56
+ help="Milvus collections to write to",
57
+ ),
58
+ click.Option(
59
+ ["--num-of-processes"],
60
+ type=click.IntRange(min=1),
61
+ default=4,
62
+ help="number of processes to use when writing to support parallel writes",
63
+ ),
64
+ ]
65
+ return options
66
+
67
+
68
+ milvus_dest_cmd = DestCmd(
69
+ cmd_name=CONNECTOR_TYPE,
70
+ connection_config=MilvusCliConnectionConfig,
71
+ uploader_config=MilvusCliUploaderConfig,
72
+ )
@@ -5,7 +5,7 @@ from logging import Formatter, Logger, StreamHandler, getLevelName, getLogger
5
5
  from typing import Any, Callable
6
6
 
7
7
  log_level = os.getenv("INGEST_LOG_LEVEL", "INFO")
8
- LOGGER_NAME = "unstructured.ingest.v2"
8
+ LOGGER_NAME = "unstructured_ingest.v2"
9
9
 
10
10
 
11
11
  def default_is_data_sensitive(k: str, v: Any) -> bool:
@@ -146,6 +146,8 @@ class PipelineStep(ABC):
146
146
  logger.error(f"Exception raised while running {self.identifier}", exc_info=e)
147
147
  if "file_data_path" in kwargs:
148
148
  self.context.status[kwargs["file_data_path"]] = {self.identifier: str(e)}
149
+ else:
150
+ self.context.status[self.identifier] = {"step_error": str(e)}
149
151
  if self.context.raise_on_error:
150
152
  raise e
151
153
  return None
@@ -158,6 +160,8 @@ class PipelineStep(ABC):
158
160
  logger.error(f"Exception raised while running {self.identifier}", exc_info=e)
159
161
  if "file_data_path" in kwargs:
160
162
  self.context.status[kwargs["file_data_path"]] = {self.identifier: str(e)}
163
+ else:
164
+ self.context.status[self.identifier] = {"step_error": str(e)}
161
165
  if self.context.raise_on_error:
162
166
  raise e
163
167
  return None
@@ -1,7 +1,6 @@
1
1
  from __future__ import annotations
2
2
 
3
- import unstructured.ingest.v2.processes.connectors.fsspec # noqa: F401
4
-
3
+ import unstructured_ingest.v2.processes.connectors.fsspec # noqa: F401
5
4
  from unstructured_ingest.v2.processes.connector_registry import (
6
5
  add_destination_entry,
7
6
  add_source_entry,
@@ -19,6 +18,8 @@ from .google_drive import CONNECTOR_TYPE as GOOGLE_DRIVE_CONNECTOR_TYPE
19
18
  from .google_drive import google_drive_source_entry
20
19
  from .local import CONNECTOR_TYPE as LOCAL_CONNECTOR_TYPE
21
20
  from .local import local_destination_entry, local_source_entry
21
+ from .milvus import CONNECTOR_TYPE as MILVUS_CONNECTOR_TYPE
22
+ from .milvus import milvus_destination_entry
22
23
  from .mongodb import CONNECTOR_TYPE as MONGODB_CONNECTOR_TYPE
23
24
  from .mongodb import mongodb_destination_entry
24
25
  from .onedrive import CONNECTOR_TYPE as ONEDRIVE_CONNECTOR_TYPE
@@ -75,3 +76,4 @@ add_source_entry(source_type=SHAREPOINT_CONNECTOR_TYPE, entry=sharepoint_source_
75
76
  add_destination_entry(
76
77
  destination_type=SINGLESTORE_CONNECTOR_TYPE, entry=singlestore_destination_entry
77
78
  )
79
+ add_destination_entry(destination_type=MILVUS_CONNECTOR_TYPE, entry=milvus_destination_entry)
@@ -0,0 +1,200 @@
1
+ import json
2
+ import multiprocessing as mp
3
+ from dataclasses import dataclass, field
4
+ from pathlib import Path
5
+ from typing import TYPE_CHECKING, Any, Optional, Union
6
+
7
+ import pandas as pd
8
+ from dateutil import parser
9
+
10
+ from unstructured_ingest.enhanced_dataclass import enhanced_field
11
+ from unstructured_ingest.error import WriteError
12
+ from unstructured_ingest.utils.data_prep import flatten_dict
13
+ from unstructured_ingest.utils.dep_check import requires_dependencies
14
+ from unstructured_ingest.v2.interfaces import (
15
+ AccessConfig,
16
+ ConnectionConfig,
17
+ FileData,
18
+ UploadContent,
19
+ Uploader,
20
+ UploaderConfig,
21
+ UploadStager,
22
+ UploadStagerConfig,
23
+ )
24
+ from unstructured_ingest.v2.logger import logger
25
+ from unstructured_ingest.v2.processes.connector_registry import (
26
+ DestinationRegistryEntry,
27
+ )
28
+
29
+ if TYPE_CHECKING:
30
+ from pymilvus import MilvusClient
31
+
32
+ CONNECTOR_TYPE = "milvus"
33
+
34
+
35
+ @dataclass
36
+ class MilvusAccessConfig(AccessConfig):
37
+ password: Optional[str] = None
38
+ token: Optional[str] = None
39
+
40
+
41
+ @dataclass
42
+ class MilvusConnectionConfig(ConnectionConfig):
43
+ access_config: MilvusAccessConfig = enhanced_field(
44
+ sensitive=True, default_factory=lambda: MilvusAccessConfig()
45
+ )
46
+ uri: Optional[str] = None
47
+ user: Optional[str] = None
48
+ db_name: Optional[str] = None
49
+
50
+ def get_connection_kwargs(self) -> dict[str, Any]:
51
+ access_config_dict = self.access_config.to_dict()
52
+ connection_config_dict = self.to_dict()
53
+ connection_config_dict.pop("access_config", None)
54
+ connection_config_dict.update(access_config_dict)
55
+ # Drop any that were not set explicitly
56
+ connection_config_dict = {k: v for k, v in connection_config_dict.items() if v is not None}
57
+ return connection_config_dict
58
+
59
+ @requires_dependencies(["pymilvus"], extras="milvus")
60
+ def get_client(self) -> "MilvusClient":
61
+ from pymilvus import MilvusClient
62
+
63
+ return MilvusClient(**self.get_connection_kwargs())
64
+
65
+
66
+ @dataclass
67
+ class MilvusUploadStagerConfig(UploadStagerConfig):
68
+ pass
69
+
70
+
71
+ @dataclass
72
+ class MilvusUploadStager(UploadStager):
73
+ upload_stager_config: MilvusUploadStagerConfig = field(
74
+ default_factory=lambda: MilvusUploadStagerConfig()
75
+ )
76
+
77
+ @staticmethod
78
+ def parse_date_string(date_string: str) -> float:
79
+ try:
80
+ timestamp = float(date_string)
81
+ return timestamp
82
+ except ValueError:
83
+ pass
84
+ return parser.parse(date_string).timestamp()
85
+
86
+ @classmethod
87
+ def conform_dict(cls, data: dict) -> None:
88
+ datetime_columns = [
89
+ "data_source_date_created",
90
+ "data_source_date_modified",
91
+ "data_source_date_processed",
92
+ "last_modified",
93
+ ]
94
+
95
+ json_dumps_fields = ["languages", "data_source_permissions_data"]
96
+
97
+ # TODO: milvus sdk doesn't seem to support defaults via the schema yet,
98
+ # remove once that gets updated
99
+ defaults = {"is_continuation": False}
100
+
101
+ if metadata := data.pop("metadata", None):
102
+ data.update(flatten_dict(metadata, keys_to_omit=["data_source_record_locator"]))
103
+ for datetime_column in datetime_columns:
104
+ if datetime_column in data:
105
+ data[datetime_column] = cls.parse_date_string(data[datetime_column])
106
+ for json_dumps_field in json_dumps_fields:
107
+ if json_dumps_field in data:
108
+ data[json_dumps_field] = json.dumps(data[json_dumps_field])
109
+ for default in defaults:
110
+ if default not in data:
111
+ data[default] = defaults[default]
112
+
113
+ def run(
114
+ self,
115
+ elements_filepath: Path,
116
+ file_data: FileData,
117
+ output_dir: Path,
118
+ output_filename: str,
119
+ **kwargs: Any,
120
+ ) -> Path:
121
+ with open(elements_filepath) as elements_file:
122
+ elements_contents: list[dict[str, Any]] = json.load(elements_file)
123
+ for element in elements_contents:
124
+ self.conform_dict(data=element)
125
+
126
+ output_path = Path(output_dir) / Path(f"{output_filename}.json")
127
+ output_path.parent.mkdir(parents=True, exist_ok=True)
128
+ with output_path.open("w") as output_file:
129
+ json.dump(elements_contents, output_file, indent=2)
130
+ return output_path
131
+
132
+
133
+ @dataclass
134
+ class MilvusUploaderConfig(UploaderConfig):
135
+ collection_name: str
136
+ num_of_processes: int = 4
137
+
138
+
139
+ @dataclass
140
+ class MilvusUploader(Uploader):
141
+ connection_config: MilvusConnectionConfig
142
+ upload_config: MilvusUploaderConfig
143
+ connector_type: str = CONNECTOR_TYPE
144
+
145
+ def upload(self, content: UploadContent) -> None:
146
+ file_extension = content.path.suffix
147
+ if file_extension == ".json":
148
+ self.upload_json(content=content)
149
+ elif file_extension == ".csv":
150
+ self.upload_csv(content=content)
151
+ else:
152
+ raise ValueError(f"Unsupported file extension: {file_extension}")
153
+
154
+ @requires_dependencies(["pymilvus"], extras="milvus")
155
+ def insert_results(self, data: Union[dict, list[dict]]):
156
+ from pymilvus import MilvusException
157
+
158
+ logger.debug(
159
+ f"uploading {len(data)} entries to {self.connection_config.db_name} "
160
+ f"db in collection {self.upload_config.collection_name}"
161
+ )
162
+ client = self.connection_config.get_client()
163
+
164
+ try:
165
+ res = client.insert(collection_name=self.upload_config.collection_name, data=data)
166
+ except MilvusException as milvus_exception:
167
+ raise WriteError("failed to upload records to milvus") from milvus_exception
168
+ if "err_count" in res and isinstance(res["err_count"], int) and res["err_count"] > 0:
169
+ err_count = res["err_count"]
170
+ raise WriteError(f"failed to upload {err_count} docs")
171
+
172
+ def upload_csv(self, content: UploadContent) -> None:
173
+ df = pd.read_csv(content.path)
174
+ data = df.to_dict(orient="records")
175
+ self.insert_results(data=data)
176
+
177
+ def upload_json(self, content: UploadContent) -> None:
178
+ with content.path.open("r") as file:
179
+ data: list[dict] = json.load(file)
180
+ self.insert_results(data=data)
181
+
182
+ def run(self, contents: list[UploadContent], **kwargs: Any) -> None:
183
+ if self.upload_config.num_of_processes == 1:
184
+ for content in contents:
185
+ self.upload(content=content)
186
+
187
+ else:
188
+ with mp.Pool(
189
+ processes=self.upload_config.num_of_processes,
190
+ ) as pool:
191
+ pool.map(self.upload, contents)
192
+
193
+
194
+ milvus_destination_entry = DestinationRegistryEntry(
195
+ connection_config=MilvusConnectionConfig,
196
+ uploader=MilvusUploader,
197
+ uploader_config=MilvusUploaderConfig,
198
+ upload_stager=MilvusUploadStager,
199
+ upload_stager_config=MilvusUploadStagerConfig,
200
+ )
@@ -5,10 +5,6 @@ from dataclasses import dataclass, field
5
5
  from pathlib import Path
6
6
  from typing import TYPE_CHECKING, Any, Optional
7
7
 
8
- from unstructured.ingest.v2.logger import logger
9
- from unstructured.ingest.v2.processes.connector_registry import (
10
- DestinationRegistryEntry,
11
- )
12
8
  from unstructured.staging.base import flatten_dict
13
9
  from unstructured.utils import requires_dependencies
14
10
 
@@ -24,6 +20,10 @@ from unstructured_ingest.v2.interfaces import (
24
20
  UploadStager,
25
21
  UploadStagerConfig,
26
22
  )
23
+ from unstructured_ingest.v2.logger import logger
24
+ from unstructured_ingest.v2.processes.connector_registry import (
25
+ DestinationRegistryEntry,
26
+ )
27
27
 
28
28
  if TYPE_CHECKING:
29
29
  from pinecone import Index as PineconeIndex
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.0
3
+ Version: 0.0.1
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -56,6 +56,7 @@ Provides-Extra: google-drive
56
56
  Provides-Extra: hubspot
57
57
  Provides-Extra: jira
58
58
  Provides-Extra: kafka
59
+ Provides-Extra: milvus
59
60
  Provides-Extra: mongodb
60
61
  Provides-Extra: notion
61
62
  Provides-Extra: onedrive
@@ -286,6 +286,7 @@ unstructured_ingest/v2/cli/cmds/databricks_volumes.py
286
286
  unstructured_ingest/v2/cli/cmds/elasticsearch.py
287
287
  unstructured_ingest/v2/cli/cmds/google_drive.py
288
288
  unstructured_ingest/v2/cli/cmds/local.py
289
+ unstructured_ingest/v2/cli/cmds/milvus.py
289
290
  unstructured_ingest/v2/cli/cmds/mongodb.py
290
291
  unstructured_ingest/v2/cli/cmds/onedrive.py
291
292
  unstructured_ingest/v2/cli/cmds/opensearch.py
@@ -344,6 +345,7 @@ unstructured_ingest/v2/processes/connectors/databricks_volumes.py
344
345
  unstructured_ingest/v2/processes/connectors/elasticsearch.py
345
346
  unstructured_ingest/v2/processes/connectors/google_drive.py
346
347
  unstructured_ingest/v2/processes/connectors/local.py
348
+ unstructured_ingest/v2/processes/connectors/milvus.py
347
349
  unstructured_ingest/v2/processes/connectors/mongodb.py
348
350
  unstructured_ingest/v2/processes/connectors/onedrive.py
349
351
  unstructured_ingest/v2/processes/connectors/opensearch.py
@@ -1,5 +1,5 @@
1
- pandas
2
1
  python-dateutil
2
+ pandas
3
3
  unstructured
4
4
 
5
5
  [airtable]
@@ -16,8 +16,8 @@ fsspec
16
16
  azure-search-documents
17
17
 
18
18
  [bedrock]
19
- langchain-community
20
19
  boto3
20
+ langchain-community
21
21
 
22
22
  [biomed]
23
23
  bs4
@@ -27,8 +27,8 @@ fsspec
27
27
  boxfs
28
28
 
29
29
  [chroma]
30
- typer<=0.9.0
31
30
  chromadb
31
+ typer<=0.9.0
32
32
  importlib-metadata>=7.1.0
33
33
 
34
34
  [clarifai]
@@ -64,29 +64,29 @@ fsspec
64
64
  elasticsearch[async]
65
65
 
66
66
  [embed-huggingface]
67
- huggingface
68
- langchain-community
69
67
  sentence_transformers
68
+ langchain-community
69
+ huggingface
70
70
 
71
71
  [embed-octoai]
72
- tiktoken
73
72
  openai
73
+ tiktoken
74
74
 
75
75
  [embed-vertexai]
76
- langchain-community
77
76
  langchain
77
+ langchain-community
78
78
  langchain-google-vertexai
79
79
 
80
80
  [embed-voyageai]
81
- langchain-voyageai
82
81
  langchain
82
+ langchain-voyageai
83
83
 
84
84
  [epub]
85
85
  unstructured[epub]
86
86
 
87
87
  [gcs]
88
- gcsfs
89
88
  fsspec
89
+ gcsfs
90
90
  bs4
91
91
 
92
92
  [github]
@@ -111,6 +111,9 @@ confluent-kafka
111
111
  [md]
112
112
  unstructured[md]
113
113
 
114
+ [milvus]
115
+ pymilvus
116
+
114
117
  [mongodb]
115
118
  pymongo
116
119
 
@@ -125,14 +128,14 @@ htmlBuilder
125
128
  unstructured[odt]
126
129
 
127
130
  [onedrive]
131
+ bs4
128
132
  msal
129
133
  Office365-REST-Python-Client
130
- bs4
131
134
 
132
135
  [openai]
136
+ openai
133
137
  langchain-community
134
138
  tiktoken
135
- openai
136
139
 
137
140
  [opensearch]
138
141
  opensearch-py
@@ -172,8 +175,8 @@ unstructured[rst]
172
175
  unstructured[rtf]
173
176
 
174
177
  [s3]
175
- s3fs
176
178
  fsspec
179
+ s3fs
177
180
 
178
181
  [salesforce]
179
182
  simple-salesforce
@@ -1 +0,0 @@
1
- __version__ = "0.0.0" # pragma: no cover