unstructured-ingest 0.6.4__tar.gz → 0.7.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (877)
  1. unstructured_ingest-0.7.1/PKG-INFO +383 -0
  2. unstructured_ingest-0.7.1/examples/airtable.py +44 -0
  3. unstructured_ingest-0.7.1/examples/azure_cognitive_search.py +55 -0
  4. unstructured_ingest-0.7.1/examples/chroma.py +54 -0
  5. unstructured_ingest-0.7.1/examples/couchbase.py +55 -0
  6. unstructured_ingest-0.7.1/examples/databricks_volumes_dest.py +55 -0
  7. unstructured_ingest-0.7.1/examples/databricks_volumes_source.py +53 -0
  8. unstructured_ingest-0.7.1/examples/delta_table.py +45 -0
  9. unstructured_ingest-0.7.1/examples/discord_example.py +36 -0
  10. unstructured_ingest-0.7.1/examples/elasticsearch.py +49 -0
  11. unstructured_ingest-0.7.1/examples/google_drive.py +45 -0
  12. unstructured_ingest-0.7.1/examples/kdbai.py +54 -0
  13. unstructured_ingest-0.7.1/examples/local.py +36 -0
  14. unstructured_ingest-0.7.1/examples/milvus.py +44 -0
  15. unstructured_ingest-0.7.1/examples/mongodb.py +53 -0
  16. unstructured_ingest-0.7.1/examples/opensearch.py +50 -0
  17. unstructured_ingest-0.7.1/examples/pinecone.py +57 -0
  18. unstructured_ingest-0.7.1/examples/s3.py +38 -0
  19. unstructured_ingest-0.7.1/examples/salesforce.py +44 -0
  20. unstructured_ingest-0.7.1/examples/sharepoint.py +47 -0
  21. unstructured_ingest-0.7.1/examples/singlestore.py +49 -0
  22. unstructured_ingest-0.7.1/examples/sql.py +90 -0
  23. unstructured_ingest-0.7.1/examples/vectara.py +54 -0
  24. unstructured_ingest-0.7.1/examples/weaviate.py +44 -0
  25. unstructured_ingest-0.7.1/test/integration/chunkers/test_chunkers.py +31 -0
  26. unstructured_ingest-0.7.1/test/integration/connectors/conftest.py +38 -0
  27. unstructured_ingest-0.7.1/test/integration/connectors/databricks/test_volumes_native.py +273 -0
  28. unstructured_ingest-0.7.1/test/integration/connectors/discord/test_discord.py +90 -0
  29. unstructured_ingest-0.7.1/test/integration/connectors/duckdb/test_duckdb.py +90 -0
  30. unstructured_ingest-0.7.1/test/integration/connectors/duckdb/test_motherduck.py +95 -0
  31. unstructured_ingest-0.7.1/test/integration/connectors/elasticsearch/test_elasticsearch.py +331 -0
  32. unstructured_ingest-0.7.1/test/integration/connectors/elasticsearch/test_opensearch.py +326 -0
  33. unstructured_ingest-0.7.1/test/integration/connectors/sql/test_databricks_delta_tables.py +170 -0
  34. unstructured_ingest-0.7.1/test/integration/connectors/sql/test_postgres.py +201 -0
  35. unstructured_ingest-0.7.1/test/integration/connectors/sql/test_singlestore.py +182 -0
  36. unstructured_ingest-0.7.1/test/integration/connectors/sql/test_snowflake.py +244 -0
  37. unstructured_ingest-0.7.1/test/integration/connectors/sql/test_sqlite.py +168 -0
  38. unstructured_ingest-0.7.1/test/integration/connectors/sql/test_vastdb.py +34 -0
  39. unstructured_ingest-0.7.1/test/integration/connectors/test_astradb.py +287 -0
  40. unstructured_ingest-0.7.1/test/integration/connectors/test_azure_ai_search.py +254 -0
  41. unstructured_ingest-0.7.1/test/integration/connectors/test_chroma.py +136 -0
  42. unstructured_ingest-0.7.1/test/integration/connectors/test_confluence.py +111 -0
  43. unstructured_ingest-0.7.1/test/integration/connectors/test_delta_table.py +183 -0
  44. unstructured_ingest-0.7.1/test/integration/connectors/test_dropbox.py +151 -0
  45. unstructured_ingest-0.7.1/test/integration/connectors/test_github.py +49 -0
  46. unstructured_ingest-0.7.1/test/integration/connectors/test_google_drive.py +257 -0
  47. unstructured_ingest-0.7.1/test/integration/connectors/test_jira.py +67 -0
  48. unstructured_ingest-0.7.1/test/integration/connectors/test_lancedb.py +247 -0
  49. unstructured_ingest-0.7.1/test/integration/connectors/test_milvus.py +208 -0
  50. unstructured_ingest-0.7.1/test/integration/connectors/test_mongodb.py +335 -0
  51. unstructured_ingest-0.7.1/test/integration/connectors/test_neo4j.py +244 -0
  52. unstructured_ingest-0.7.1/test/integration/connectors/test_notion.py +152 -0
  53. unstructured_ingest-0.7.1/test/integration/connectors/test_onedrive.py +163 -0
  54. unstructured_ingest-0.7.1/test/integration/connectors/test_pinecone.py +387 -0
  55. unstructured_ingest-0.7.1/test/integration/connectors/test_qdrant.py +216 -0
  56. unstructured_ingest-0.7.1/test/integration/connectors/test_redis.py +143 -0
  57. unstructured_ingest-0.7.1/test/integration/connectors/test_s3.py +184 -0
  58. unstructured_ingest-0.7.1/test/integration/connectors/test_sharepoint.py +222 -0
  59. unstructured_ingest-0.7.1/test/integration/connectors/test_vectara.py +282 -0
  60. unstructured_ingest-0.7.1/test/integration/connectors/test_zendesk.py +120 -0
  61. unstructured_ingest-0.7.1/test/integration/connectors/utils/validation/destination.py +77 -0
  62. unstructured_ingest-0.7.1/test/integration/connectors/utils/validation/source.py +331 -0
  63. unstructured_ingest-0.7.1/test/integration/connectors/weaviate/test_cloud.py +39 -0
  64. unstructured_ingest-0.7.1/test/integration/connectors/weaviate/test_local.py +152 -0
  65. unstructured_ingest-0.7.1/test/integration/embedders/test_azure_openai.py +57 -0
  66. unstructured_ingest-0.7.1/test/integration/embedders/test_bedrock.py +103 -0
  67. unstructured_ingest-0.7.1/test/integration/embedders/test_huggingface.py +24 -0
  68. unstructured_ingest-0.7.1/test/integration/embedders/test_mixedbread.py +71 -0
  69. unstructured_ingest-0.7.1/test/integration/embedders/test_octoai.py +75 -0
  70. unstructured_ingest-0.7.1/test/integration/embedders/test_openai.py +74 -0
  71. unstructured_ingest-0.7.1/test/integration/embedders/test_togetherai.py +71 -0
  72. unstructured_ingest-0.7.1/test/integration/embedders/test_vertexai.py +63 -0
  73. unstructured_ingest-0.7.1/test/integration/embedders/test_voyageai.py +79 -0
  74. unstructured_ingest-0.7.1/test/integration/partitioners/test_partitioner.py +76 -0
  75. unstructured_ingest-0.7.1/test/unit/chunkers/test_chunkers.py +49 -0
  76. unstructured_ingest-0.7.1/test/unit/connectors/ibm_watsonx/test_ibm_watsonx_s3.py +459 -0
  77. unstructured_ingest-0.7.1/test/unit/connectors/motherduck/test_base.py +73 -0
  78. unstructured_ingest-0.7.1/test/unit/connectors/sql/test_sql.py +152 -0
  79. unstructured_ingest-0.7.1/test/unit/connectors/test_confluence.py +71 -0
  80. unstructured_ingest-0.7.1/test/unit/connectors/test_jira.py +401 -0
  81. unstructured_ingest-0.7.1/test/unit/embedders/test_huggingface.py +48 -0
  82. unstructured_ingest-0.7.1/test/unit/embedders/test_vertexai.py +37 -0
  83. unstructured_ingest-0.7.1/test/unit/partitioners/test_partitioner.py +63 -0
  84. unstructured_ingest-0.7.1/test/unit/test_html.py +112 -0
  85. unstructured_ingest-0.7.1/test/unit/test_interfaces.py +26 -0
  86. unstructured_ingest-0.7.1/test/unit/test_utils.py +220 -0
  87. unstructured_ingest-0.7.1/unstructured_ingest/__version__.py +1 -0
  88. unstructured_ingest-0.7.1/unstructured_ingest/cli/base/cmd.py +269 -0
  89. unstructured_ingest-0.7.1/unstructured_ingest/cli/base/dest.py +84 -0
  90. unstructured_ingest-0.7.1/unstructured_ingest/cli/base/src.py +75 -0
  91. unstructured_ingest-0.7.1/unstructured_ingest/cli/cli.py +24 -0
  92. unstructured_ingest-0.7.1/unstructured_ingest/cli/cmds.py +14 -0
  93. unstructured_ingest-0.7.1/unstructured_ingest/cli/utils/model_conversion.py +222 -0
  94. unstructured_ingest-0.7.1/unstructured_ingest/data_types/file_data.py +116 -0
  95. unstructured_ingest-0.7.1/unstructured_ingest/embed/bedrock.py +210 -0
  96. unstructured_ingest-0.7.1/unstructured_ingest/embed/octoai.py +112 -0
  97. unstructured_ingest-0.7.1/unstructured_ingest/embed/openai.py +99 -0
  98. unstructured_ingest-0.7.1/unstructured_ingest/embed/togetherai.py +84 -0
  99. unstructured_ingest-0.7.1/unstructured_ingest/embed/vertexai.py +109 -0
  100. unstructured_ingest-0.7.1/unstructured_ingest/embed/voyageai.py +127 -0
  101. unstructured_ingest-0.7.1/unstructured_ingest/interfaces/downloader.py +88 -0
  102. unstructured_ingest-0.7.1/unstructured_ingest/interfaces/indexer.py +29 -0
  103. unstructured_ingest-0.7.1/unstructured_ingest/interfaces/upload_stager.py +89 -0
  104. unstructured_ingest-0.7.1/unstructured_ingest/interfaces/uploader.py +67 -0
  105. unstructured_ingest-0.7.1/unstructured_ingest/otel.py +111 -0
  106. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/interfaces.py +211 -0
  107. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/otel.py +32 -0
  108. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/pipeline.py +408 -0
  109. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/chunk.py +78 -0
  110. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/download.py +206 -0
  111. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/embed.py +77 -0
  112. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/filter.py +35 -0
  113. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/index.py +86 -0
  114. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/partition.py +77 -0
  115. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/stage.py +65 -0
  116. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/uncompress.py +50 -0
  117. unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps/upload.py +58 -0
  118. unstructured_ingest-0.7.1/unstructured_ingest/processes/chunker.py +127 -0
  119. unstructured_ingest-0.7.1/unstructured_ingest/processes/connector_registry.py +69 -0
  120. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/__init__.py +129 -0
  121. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/airtable.py +234 -0
  122. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/astradb.py +486 -0
  123. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/azure_ai_search.py +275 -0
  124. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/chroma.py +193 -0
  125. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/confluence.py +309 -0
  126. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/couchbase.py +336 -0
  127. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/__init__.py +58 -0
  128. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/volumes.py +219 -0
  129. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/volumes_aws.py +93 -0
  130. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/volumes_azure.py +108 -0
  131. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/volumes_gcp.py +91 -0
  132. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/volumes_native.py +92 -0
  133. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/databricks/volumes_table.py +187 -0
  134. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/delta_table.py +195 -0
  135. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/discord.py +160 -0
  136. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/duckdb/__init__.py +15 -0
  137. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/duckdb/base.py +103 -0
  138. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/duckdb/duckdb.py +130 -0
  139. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/duckdb/motherduck.py +130 -0
  140. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/elasticsearch/__init__.py +19 -0
  141. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py +478 -0
  142. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/elasticsearch/opensearch.py +201 -0
  143. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/__init__.py +37 -0
  144. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/azure.py +203 -0
  145. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/box.py +176 -0
  146. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/dropbox.py +237 -0
  147. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/fsspec.py +366 -0
  148. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/gcs.py +203 -0
  149. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/s3.py +200 -0
  150. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/fsspec/sftp.py +177 -0
  151. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/github.py +221 -0
  152. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/gitlab.py +270 -0
  153. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/google_drive.py +490 -0
  154. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py +10 -0
  155. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +301 -0
  156. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/jira.py +455 -0
  157. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/kafka/__init__.py +17 -0
  158. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/kafka/cloud.py +121 -0
  159. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/kafka/kafka.py +275 -0
  160. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/kafka/local.py +103 -0
  161. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/kdbai.py +155 -0
  162. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/__init__.py +30 -0
  163. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/aws.py +43 -0
  164. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/azure.py +43 -0
  165. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/cloud.py +42 -0
  166. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/gcp.py +44 -0
  167. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/lancedb.py +181 -0
  168. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/lancedb/local.py +44 -0
  169. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/local.py +226 -0
  170. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/milvus.py +225 -0
  171. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/mongodb.py +363 -0
  172. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/neo4j.py +499 -0
  173. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/client.py +349 -0
  174. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/connector.py +348 -0
  175. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/helpers.py +448 -0
  176. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py +126 -0
  177. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +24 -0
  178. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/block.py +96 -0
  179. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py +40 -0
  180. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py +21 -0
  181. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py +31 -0
  182. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/callout.py +94 -0
  183. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py +23 -0
  184. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py +23 -0
  185. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/code.py +43 -0
  186. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py +35 -0
  187. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/divider.py +22 -0
  188. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/embed.py +36 -0
  189. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/equation.py +23 -0
  190. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/file.py +49 -0
  191. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/heading.py +37 -0
  192. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/image.py +21 -0
  193. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py +24 -0
  194. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py +29 -0
  195. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py +29 -0
  196. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py +31 -0
  197. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py +49 -0
  198. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/quote.py +37 -0
  199. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +57 -0
  200. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/table.py +60 -0
  201. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py +23 -0
  202. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/template.py +30 -0
  203. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/todo.py +42 -0
  204. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py +37 -0
  205. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py +20 -0
  206. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/blocks/video.py +22 -0
  207. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database.py +73 -0
  208. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py +106 -0
  209. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py +38 -0
  210. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py +35 -0
  211. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py +34 -0
  212. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/date.py +41 -0
  213. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/email.py +36 -0
  214. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/files.py +37 -0
  215. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py +49 -0
  216. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py +34 -0
  217. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py +34 -0
  218. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py +73 -0
  219. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/number.py +49 -0
  220. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/people.py +41 -0
  221. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py +36 -0
  222. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py +67 -0
  223. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py +43 -0
  224. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py +56 -0
  225. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/select.py +69 -0
  226. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/status.py +81 -0
  227. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/title.py +37 -0
  228. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py +50 -0
  229. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/url.py +37 -0
  230. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py +78 -0
  231. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/date.py +29 -0
  232. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/file.py +54 -0
  233. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/page.py +45 -0
  234. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/parent.py +66 -0
  235. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/rich_text.py +189 -0
  236. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types/user.py +79 -0
  237. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/onedrive.py +467 -0
  238. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/outlook.py +242 -0
  239. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/pinecone.py +373 -0
  240. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/qdrant/__init__.py +16 -0
  241. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/qdrant/cloud.py +59 -0
  242. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/qdrant/local.py +58 -0
  243. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/qdrant/qdrant.py +163 -0
  244. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/qdrant/server.py +60 -0
  245. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/redisdb.py +183 -0
  246. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/salesforce.py +305 -0
  247. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sharepoint.py +134 -0
  248. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/slack.py +248 -0
  249. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/__init__.py +37 -0
  250. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py +222 -0
  251. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/postgres.py +162 -0
  252. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/singlestore.py +171 -0
  253. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/snowflake.py +264 -0
  254. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/sql.py +440 -0
  255. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/sqlite.py +173 -0
  256. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/sql/vastdb.py +259 -0
  257. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/vectara.py +350 -0
  258. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/weaviate/__init__.py +22 -0
  259. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/weaviate/cloud.py +165 -0
  260. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/weaviate/embedded.py +90 -0
  261. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/weaviate/local.py +73 -0
  262. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/weaviate/weaviate.py +317 -0
  263. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/zendesk/client.py +308 -0
  264. unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/zendesk/zendesk.py +236 -0
  265. unstructured_ingest-0.7.1/unstructured_ingest/processes/embedder.py +199 -0
  266. unstructured_ingest-0.7.1/unstructured_ingest/processes/filter.py +60 -0
  267. unstructured_ingest-0.7.1/unstructured_ingest/processes/partitioner.py +229 -0
  268. unstructured_ingest-0.7.1/unstructured_ingest/processes/uncompress.py +61 -0
  269. unstructured_ingest-0.7.1/unstructured_ingest/processes/utils/blob_storage.py +32 -0
  270. unstructured_ingest-0.7.1/unstructured_ingest/unstructured_api.py +135 -0
  271. unstructured_ingest-0.7.1/unstructured_ingest/utils/compression.py +71 -0
  272. unstructured_ingest-0.7.1/unstructured_ingest/utils/data_prep.py +240 -0
  273. unstructured_ingest-0.7.1/unstructured_ingest/utils/html.py +160 -0
  274. unstructured_ingest-0.7.1/unstructured_ingest/utils/pydantic_models.py +52 -0
  275. unstructured_ingest-0.7.1/unstructured_ingest/utils/string_and_date_utils.py +74 -0
  276. unstructured_ingest-0.7.1/unstructured_ingest.egg-info/PKG-INFO +383 -0
  277. unstructured_ingest-0.7.1/unstructured_ingest.egg-info/SOURCES.txt +376 -0
  278. unstructured_ingest-0.7.1/unstructured_ingest.egg-info/requires.txt +418 -0
  279. unstructured_ingest-0.7.1/unstructured_ingest.egg-info/top_level.txt +3 -0
  280. unstructured_ingest-0.6.4/PKG-INFO +0 -382
  281. unstructured_ingest-0.6.4/test/integration/chunkers/test_chunkers.py +0 -31
  282. unstructured_ingest-0.6.4/test/integration/connectors/conftest.py +0 -38
  283. unstructured_ingest-0.6.4/test/integration/connectors/databricks/test_volumes_native.py +0 -273
  284. unstructured_ingest-0.6.4/test/integration/connectors/discord/test_discord.py +0 -90
  285. unstructured_ingest-0.6.4/test/integration/connectors/duckdb/test_duckdb.py +0 -90
  286. unstructured_ingest-0.6.4/test/integration/connectors/duckdb/test_motherduck.py +0 -95
  287. unstructured_ingest-0.6.4/test/integration/connectors/elasticsearch/test_elasticsearch.py +0 -331
  288. unstructured_ingest-0.6.4/test/integration/connectors/elasticsearch/test_opensearch.py +0 -326
  289. unstructured_ingest-0.6.4/test/integration/connectors/sql/test_databricks_delta_tables.py +0 -170
  290. unstructured_ingest-0.6.4/test/integration/connectors/sql/test_postgres.py +0 -201
  291. unstructured_ingest-0.6.4/test/integration/connectors/sql/test_singlestore.py +0 -182
  292. unstructured_ingest-0.6.4/test/integration/connectors/sql/test_snowflake.py +0 -244
  293. unstructured_ingest-0.6.4/test/integration/connectors/sql/test_sqlite.py +0 -168
  294. unstructured_ingest-0.6.4/test/integration/connectors/sql/test_vastdb.py +0 -34
  295. unstructured_ingest-0.6.4/test/integration/connectors/test_astradb.py +0 -287
  296. unstructured_ingest-0.6.4/test/integration/connectors/test_azure_ai_search.py +0 -254
  297. unstructured_ingest-0.6.4/test/integration/connectors/test_chroma.py +0 -136
  298. unstructured_ingest-0.6.4/test/integration/connectors/test_confluence.py +0 -111
  299. unstructured_ingest-0.6.4/test/integration/connectors/test_delta_table.py +0 -183
  300. unstructured_ingest-0.6.4/test/integration/connectors/test_dropbox.py +0 -151
  301. unstructured_ingest-0.6.4/test/integration/connectors/test_github.py +0 -49
  302. unstructured_ingest-0.6.4/test/integration/connectors/test_google_drive.py +0 -257
  303. unstructured_ingest-0.6.4/test/integration/connectors/test_jira.py +0 -67
  304. unstructured_ingest-0.6.4/test/integration/connectors/test_lancedb.py +0 -247
  305. unstructured_ingest-0.6.4/test/integration/connectors/test_milvus.py +0 -208
  306. unstructured_ingest-0.6.4/test/integration/connectors/test_mongodb.py +0 -335
  307. unstructured_ingest-0.6.4/test/integration/connectors/test_neo4j.py +0 -244
  308. unstructured_ingest-0.6.4/test/integration/connectors/test_notion.py +0 -152
  309. unstructured_ingest-0.6.4/test/integration/connectors/test_onedrive.py +0 -163
  310. unstructured_ingest-0.6.4/test/integration/connectors/test_pinecone.py +0 -387
  311. unstructured_ingest-0.6.4/test/integration/connectors/test_qdrant.py +0 -216
  312. unstructured_ingest-0.6.4/test/integration/connectors/test_redis.py +0 -143
  313. unstructured_ingest-0.6.4/test/integration/connectors/test_s3.py +0 -184
  314. unstructured_ingest-0.6.4/test/integration/connectors/test_sharepoint.py +0 -222
  315. unstructured_ingest-0.6.4/test/integration/connectors/test_vectara.py +0 -282
  316. unstructured_ingest-0.6.4/test/integration/connectors/test_zendesk.py +0 -120
  317. unstructured_ingest-0.6.4/test/integration/connectors/utils/validation/destination.py +0 -77
  318. unstructured_ingest-0.6.4/test/integration/connectors/utils/validation/source.py +0 -331
  319. unstructured_ingest-0.6.4/test/integration/connectors/weaviate/test_cloud.py +0 -39
  320. unstructured_ingest-0.6.4/test/integration/connectors/weaviate/test_local.py +0 -152
  321. unstructured_ingest-0.6.4/test/integration/embedders/test_azure_openai.py +0 -57
  322. unstructured_ingest-0.6.4/test/integration/embedders/test_bedrock.py +0 -103
  323. unstructured_ingest-0.6.4/test/integration/embedders/test_huggingface.py +0 -24
  324. unstructured_ingest-0.6.4/test/integration/embedders/test_mixedbread.py +0 -71
  325. unstructured_ingest-0.6.4/test/integration/embedders/test_octoai.py +0 -75
  326. unstructured_ingest-0.6.4/test/integration/embedders/test_openai.py +0 -74
  327. unstructured_ingest-0.6.4/test/integration/embedders/test_togetherai.py +0 -71
  328. unstructured_ingest-0.6.4/test/integration/embedders/test_vertexai.py +0 -63
  329. unstructured_ingest-0.6.4/test/integration/embedders/test_voyageai.py +0 -79
  330. unstructured_ingest-0.6.4/test/integration/partitioners/test_partitioner.py +0 -76
  331. unstructured_ingest-0.6.4/test/unit/test_html.py +0 -112
  332. unstructured_ingest-0.6.4/test/unit/test_utils.py +0 -211
  333. unstructured_ingest-0.6.4/test/unit/v2/chunkers/test_chunkers.py +0 -49
  334. unstructured_ingest-0.6.4/test/unit/v2/connectors/ibm_watsonx/test_ibm_watsonx_s3.py +0 -459
  335. unstructured_ingest-0.6.4/test/unit/v2/connectors/motherduck/test_base.py +0 -73
  336. unstructured_ingest-0.6.4/test/unit/v2/connectors/sql/test_sql.py +0 -152
  337. unstructured_ingest-0.6.4/test/unit/v2/connectors/test_confluence.py +0 -71
  338. unstructured_ingest-0.6.4/test/unit/v2/connectors/test_jira.py +0 -401
  339. unstructured_ingest-0.6.4/test/unit/v2/embedders/test_huggingface.py +0 -48
  340. unstructured_ingest-0.6.4/test/unit/v2/embedders/test_vertexai.py +0 -37
  341. unstructured_ingest-0.6.4/test/unit/v2/partitioners/test_partitioner.py +0 -63
  342. unstructured_ingest-0.6.4/test/unit/v2/test_interfaces.py +0 -26
  343. unstructured_ingest-0.6.4/test/unit/v2/test_utils.py +0 -82
  344. unstructured_ingest-0.6.4/unstructured_ingest/__version__.py +0 -1
  345. unstructured_ingest-0.6.4/unstructured_ingest/cli/__init__.py +0 -14
  346. unstructured_ingest-0.6.4/unstructured_ingest/cli/base/cmd.py +0 -19
  347. unstructured_ingest-0.6.4/unstructured_ingest/cli/base/dest.py +0 -87
  348. unstructured_ingest-0.6.4/unstructured_ingest/cli/base/src.py +0 -57
  349. unstructured_ingest-0.6.4/unstructured_ingest/cli/cli.py +0 -37
  350. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmd_factory.py +0 -12
  351. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/__init__.py +0 -145
  352. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/airtable.py +0 -69
  353. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/astradb.py +0 -99
  354. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/azure_ai_search.py +0 -65
  355. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/biomed.py +0 -52
  356. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/chroma.py +0 -104
  357. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/clarifai.py +0 -71
  358. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/confluence.py +0 -69
  359. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -163
  360. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/delta_table.py +0 -94
  361. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/discord.py +0 -47
  362. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/elasticsearch.py +0 -133
  363. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -94
  364. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/box.py +0 -48
  365. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -51
  366. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -15
  367. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -71
  368. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -74
  369. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -58
  370. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/github.py +0 -54
  371. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/gitlab.py +0 -54
  372. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/google_drive.py +0 -49
  373. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/hubspot.py +0 -70
  374. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/jira.py +0 -71
  375. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/kafka.py +0 -102
  376. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/local.py +0 -43
  377. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/mongodb.py +0 -72
  378. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/notion.py +0 -48
  379. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/onedrive.py +0 -66
  380. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/opensearch.py +0 -117
  381. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/outlook.py +0 -67
  382. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/pinecone.py +0 -71
  383. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/qdrant.py +0 -124
  384. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/reddit.py +0 -67
  385. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/salesforce.py +0 -58
  386. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/sharepoint.py +0 -66
  387. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/slack.py +0 -56
  388. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/sql.py +0 -66
  389. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/vectara.py +0 -66
  390. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/weaviate.py +0 -98
  391. unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/wikipedia.py +0 -40
  392. unstructured_ingest-0.6.4/unstructured_ingest/cli/common.py +0 -7
  393. unstructured_ingest-0.6.4/unstructured_ingest/cli/interfaces.py +0 -663
  394. unstructured_ingest-0.6.4/unstructured_ingest/cli/utils.py +0 -205
  395. unstructured_ingest-0.6.4/unstructured_ingest/connector/airtable.py +0 -309
  396. unstructured_ingest-0.6.4/unstructured_ingest/connector/astradb.py +0 -267
  397. unstructured_ingest-0.6.4/unstructured_ingest/connector/azure_ai_search.py +0 -144
  398. unstructured_ingest-0.6.4/unstructured_ingest/connector/biomed.py +0 -320
  399. unstructured_ingest-0.6.4/unstructured_ingest/connector/chroma.py +0 -158
  400. unstructured_ingest-0.6.4/unstructured_ingest/connector/clarifai.py +0 -122
  401. unstructured_ingest-0.6.4/unstructured_ingest/connector/confluence.py +0 -285
  402. unstructured_ingest-0.6.4/unstructured_ingest/connector/databricks_volumes.py +0 -137
  403. unstructured_ingest-0.6.4/unstructured_ingest/connector/delta_table.py +0 -203
  404. unstructured_ingest-0.6.4/unstructured_ingest/connector/discord.py +0 -180
  405. unstructured_ingest-0.6.4/unstructured_ingest/connector/elasticsearch.py +0 -396
  406. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/azure.py +0 -78
  407. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/box.py +0 -109
  408. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/dropbox.py +0 -160
  409. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/fsspec.py +0 -359
  410. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/gcs.py +0 -82
  411. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/s3.py +0 -62
  412. unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec/sftp.py +0 -81
  413. unstructured_ingest-0.6.4/unstructured_ingest/connector/git.py +0 -124
  414. unstructured_ingest-0.6.4/unstructured_ingest/connector/github.py +0 -174
  415. unstructured_ingest-0.6.4/unstructured_ingest/connector/gitlab.py +0 -142
  416. unstructured_ingest-0.6.4/unstructured_ingest/connector/google_drive.py +0 -348
  417. unstructured_ingest-0.6.4/unstructured_ingest/connector/hubspot.py +0 -278
  418. unstructured_ingest-0.6.4/unstructured_ingest/connector/jira.py +0 -469
  419. unstructured_ingest-0.6.4/unstructured_ingest/connector/kafka.py +0 -293
  420. unstructured_ingest-0.6.4/unstructured_ingest/connector/local.py +0 -139
  421. unstructured_ingest-0.6.4/unstructured_ingest/connector/mongodb.py +0 -284
  422. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/client.py +0 -248
  423. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/connector.py +0 -469
  424. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/helpers.py +0 -584
  425. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/block.py +0 -96
  426. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -40
  427. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -21
  428. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -31
  429. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -94
  430. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -23
  431. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -23
  432. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/code.py +0 -43
  433. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -35
  434. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -22
  435. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -36
  436. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -23
  437. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/file.py +0 -49
  438. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -37
  439. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/image.py +0 -21
  440. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -24
  441. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -29
  442. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -29
  443. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -31
  444. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -49
  445. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -37
  446. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -57
  447. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/table.py +0 -63
  448. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -23
  449. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/template.py +0 -30
  450. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -42
  451. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -37
  452. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -20
  453. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/blocks/video.py +0 -22
  454. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database.py +0 -73
  455. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -106
  456. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -38
  457. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -35
  458. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -34
  459. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -41
  460. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -36
  461. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -37
  462. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -49
  463. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -34
  464. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -34
  465. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -73
  466. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -49
  467. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -40
  468. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -36
  469. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -67
  470. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -43
  471. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -56
  472. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -68
  473. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -80
  474. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -37
  475. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -50
  476. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -37
  477. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -78
  478. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/date.py +0 -26
  479. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/file.py +0 -51
  480. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/page.py +0 -45
  481. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/parent.py +0 -66
  482. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/rich_text.py +0 -189
  483. unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types/user.py +0 -76
  484. unstructured_ingest-0.6.4/unstructured_ingest/connector/onedrive.py +0 -232
  485. unstructured_ingest-0.6.4/unstructured_ingest/connector/opensearch.py +0 -218
  486. unstructured_ingest-0.6.4/unstructured_ingest/connector/outlook.py +0 -285
  487. unstructured_ingest-0.6.4/unstructured_ingest/connector/pinecone.py +0 -150
  488. unstructured_ingest-0.6.4/unstructured_ingest/connector/qdrant.py +0 -144
  489. unstructured_ingest-0.6.4/unstructured_ingest/connector/reddit.py +0 -166
  490. unstructured_ingest-0.6.4/unstructured_ingest/connector/registry.py +0 -109
  491. unstructured_ingest-0.6.4/unstructured_ingest/connector/salesforce.py +0 -301
  492. unstructured_ingest-0.6.4/unstructured_ingest/connector/sharepoint.py +0 -573
  493. unstructured_ingest-0.6.4/unstructured_ingest/connector/slack.py +0 -224
  494. unstructured_ingest-0.6.4/unstructured_ingest/connector/sql.py +0 -199
  495. unstructured_ingest-0.6.4/unstructured_ingest/connector/vectara.py +0 -253
  496. unstructured_ingest-0.6.4/unstructured_ingest/connector/weaviate.py +0 -190
  497. unstructured_ingest-0.6.4/unstructured_ingest/connector/wikipedia.py +0 -208
  498. unstructured_ingest-0.6.4/unstructured_ingest/embed/bedrock.py +0 -210
  499. unstructured_ingest-0.6.4/unstructured_ingest/embed/octoai.py +0 -112
  500. unstructured_ingest-0.6.4/unstructured_ingest/embed/openai.py +0 -99
  501. unstructured_ingest-0.6.4/unstructured_ingest/embed/togetherai.py +0 -84
  502. unstructured_ingest-0.6.4/unstructured_ingest/embed/vertexai.py +0 -109
  503. unstructured_ingest-0.6.4/unstructured_ingest/embed/voyageai.py +0 -127
  504. unstructured_ingest-0.6.4/unstructured_ingest/enhanced_dataclass/__init__.py +0 -4
  505. unstructured_ingest-0.6.4/unstructured_ingest/enhanced_dataclass/core.py +0 -99
  506. unstructured_ingest-0.6.4/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -54
  507. unstructured_ingest-0.6.4/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -125
  508. unstructured_ingest-0.6.4/unstructured_ingest/ingest_backoff/_wrapper.py +0 -122
  509. unstructured_ingest-0.6.4/unstructured_ingest/interfaces.py +0 -852
  510. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/__init__.py +0 -22
  511. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/copy.py +0 -19
  512. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/doc_factory.py +0 -12
  513. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/interfaces.py +0 -270
  514. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/partition.py +0 -60
  515. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/permissions.py +0 -12
  516. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/pipeline.py +0 -117
  517. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/reformat/chunking.py +0 -134
  518. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/reformat/embedding.py +0 -64
  519. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/source.py +0 -77
  520. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/utils.py +0 -6
  521. unstructured_ingest-0.6.4/unstructured_ingest/pipeline/write.py +0 -18
  522. unstructured_ingest-0.6.4/unstructured_ingest/processor.py +0 -93
  523. unstructured_ingest-0.6.4/unstructured_ingest/runner/__init__.py +0 -104
  524. unstructured_ingest-0.6.4/unstructured_ingest/runner/airtable.py +0 -35
  525. unstructured_ingest-0.6.4/unstructured_ingest/runner/astradb.py +0 -34
  526. unstructured_ingest-0.6.4/unstructured_ingest/runner/base_runner.py +0 -89
  527. unstructured_ingest-0.6.4/unstructured_ingest/runner/biomed.py +0 -45
  528. unstructured_ingest-0.6.4/unstructured_ingest/runner/confluence.py +0 -35
  529. unstructured_ingest-0.6.4/unstructured_ingest/runner/delta_table.py +0 -34
  530. unstructured_ingest-0.6.4/unstructured_ingest/runner/discord.py +0 -35
  531. unstructured_ingest-0.6.4/unstructured_ingest/runner/elasticsearch.py +0 -40
  532. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/azure.py +0 -30
  533. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/box.py +0 -28
  534. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/dropbox.py +0 -30
  535. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/fsspec.py +0 -40
  536. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/gcs.py +0 -28
  537. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/s3.py +0 -28
  538. unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec/sftp.py +0 -28
  539. unstructured_ingest-0.6.4/unstructured_ingest/runner/github.py +0 -37
  540. unstructured_ingest-0.6.4/unstructured_ingest/runner/gitlab.py +0 -37
  541. unstructured_ingest-0.6.4/unstructured_ingest/runner/google_drive.py +0 -35
  542. unstructured_ingest-0.6.4/unstructured_ingest/runner/hubspot.py +0 -35
  543. unstructured_ingest-0.6.4/unstructured_ingest/runner/jira.py +0 -35
  544. unstructured_ingest-0.6.4/unstructured_ingest/runner/kafka.py +0 -34
  545. unstructured_ingest-0.6.4/unstructured_ingest/runner/local.py +0 -23
  546. unstructured_ingest-0.6.4/unstructured_ingest/runner/mongodb.py +0 -34
  547. unstructured_ingest-0.6.4/unstructured_ingest/runner/notion.py +0 -61
  548. unstructured_ingest-0.6.4/unstructured_ingest/runner/onedrive.py +0 -35
  549. unstructured_ingest-0.6.4/unstructured_ingest/runner/opensearch.py +0 -40
  550. unstructured_ingest-0.6.4/unstructured_ingest/runner/outlook.py +0 -33
  551. unstructured_ingest-0.6.4/unstructured_ingest/runner/reddit.py +0 -35
  552. unstructured_ingest-0.6.4/unstructured_ingest/runner/salesforce.py +0 -33
  553. unstructured_ingest-0.6.4/unstructured_ingest/runner/sharepoint.py +0 -35
  554. unstructured_ingest-0.6.4/unstructured_ingest/runner/slack.py +0 -33
  555. unstructured_ingest-0.6.4/unstructured_ingest/runner/utils.py +0 -47
  556. unstructured_ingest-0.6.4/unstructured_ingest/runner/wikipedia.py +0 -35
  557. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/__init__.py +0 -48
  558. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/astradb.py +0 -22
  559. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/azure_ai_search.py +0 -24
  560. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/base_writer.py +0 -26
  561. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/chroma.py +0 -22
  562. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/clarifai.py +0 -19
  563. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/databricks_volumes.py +0 -25
  564. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/delta_table.py +0 -24
  565. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/elasticsearch.py +0 -24
  566. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/fsspec/azure.py +0 -24
  567. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/fsspec/box.py +0 -21
  568. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -21
  569. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -19
  570. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/fsspec/s3.py +0 -21
  571. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/kafka.py +0 -21
  572. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/mongodb.py +0 -21
  573. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/opensearch.py +0 -26
  574. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/pinecone.py +0 -21
  575. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/qdrant.py +0 -19
  576. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/sql.py +0 -22
  577. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/vectara.py +0 -22
  578. unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/weaviate.py +0 -21
  579. unstructured_ingest-0.6.4/unstructured_ingest/utils/compression.py +0 -118
  580. unstructured_ingest-0.6.4/unstructured_ingest/utils/data_prep.py +0 -232
  581. unstructured_ingest-0.6.4/unstructured_ingest/utils/google_filetype.py +0 -9
  582. unstructured_ingest-0.6.4/unstructured_ingest/utils/html.py +0 -160
  583. unstructured_ingest-0.6.4/unstructured_ingest/utils/string_and_date_utils.py +0 -74
  584. unstructured_ingest-0.6.4/unstructured_ingest/v2/__init__.py +0 -1
  585. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/base/cmd.py +0 -269
  586. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/base/dest.py +0 -85
  587. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/base/src.py +0 -85
  588. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/cli.py +0 -24
  589. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/cmds.py +0 -14
  590. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/utils/__init__.py +0 -0
  591. unstructured_ingest-0.6.4/unstructured_ingest/v2/cli/utils/model_conversion.py +0 -222
  592. unstructured_ingest-0.6.4/unstructured_ingest/v2/interfaces/downloader.py +0 -88
  593. unstructured_ingest-0.6.4/unstructured_ingest/v2/interfaces/indexer.py +0 -29
  594. unstructured_ingest-0.6.4/unstructured_ingest/v2/interfaces/upload_stager.py +0 -89
  595. unstructured_ingest-0.6.4/unstructured_ingest/v2/interfaces/uploader.py +0 -67
  596. unstructured_ingest-0.6.4/unstructured_ingest/v2/logger.py +0 -126
  597. unstructured_ingest-0.6.4/unstructured_ingest/v2/main.py +0 -11
  598. unstructured_ingest-0.6.4/unstructured_ingest/v2/otel.py +0 -111
  599. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/__init__.py +0 -0
  600. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/interfaces.py +0 -211
  601. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/otel.py +0 -32
  602. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/pipeline.py +0 -408
  603. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
  604. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -78
  605. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/download.py +0 -206
  606. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/embed.py +0 -77
  607. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/filter.py +0 -35
  608. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/index.py +0 -86
  609. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/partition.py +0 -77
  610. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/stage.py +0 -65
  611. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -50
  612. unstructured_ingest-0.6.4/unstructured_ingest/v2/pipeline/steps/upload.py +0 -58
  613. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/chunker.py +0 -127
  614. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connector_registry.py +0 -69
  615. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/__init__.py +0 -129
  616. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/airtable.py +0 -234
  617. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/assets/__init__.py +0 -0
  618. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/assets/databricks_delta_table_schema.sql +0 -10
  619. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/assets/weaviate_collection_config.json +0 -23
  620. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/astradb.py +0 -486
  621. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/azure_ai_search.py +0 -276
  622. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/chroma.py +0 -190
  623. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/confluence.py +0 -309
  624. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/couchbase.py +0 -336
  625. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/__init__.py +0 -58
  626. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/volumes.py +0 -219
  627. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/volumes_aws.py +0 -93
  628. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/volumes_azure.py +0 -108
  629. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/volumes_gcp.py +0 -91
  630. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/volumes_native.py +0 -92
  631. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/databricks/volumes_table.py +0 -188
  632. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/delta_table.py +0 -195
  633. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/discord.py +0 -160
  634. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/duckdb/__init__.py +0 -15
  635. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/duckdb/base.py +0 -104
  636. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/duckdb/duckdb.py +0 -130
  637. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/duckdb/motherduck.py +0 -130
  638. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/elasticsearch/__init__.py +0 -19
  639. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/elasticsearch/elasticsearch.py +0 -478
  640. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/elasticsearch/opensearch.py +0 -201
  641. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -37
  642. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +0 -203
  643. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/box.py +0 -176
  644. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +0 -237
  645. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -366
  646. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +0 -203
  647. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +0 -200
  648. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -177
  649. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/github.py +0 -221
  650. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/gitlab.py +0 -270
  651. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -481
  652. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/ibm_watsonx/__init__.py +0 -10
  653. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +0 -301
  654. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/jira.py +0 -455
  655. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/kafka/__init__.py +0 -17
  656. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/kafka/cloud.py +0 -121
  657. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/kafka/kafka.py +0 -275
  658. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/kafka/local.py +0 -103
  659. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/kdbai.py +0 -151
  660. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/__init__.py +0 -30
  661. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/aws.py +0 -43
  662. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/azure.py +0 -43
  663. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/cloud.py +0 -42
  664. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/gcp.py +0 -44
  665. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/lancedb.py +0 -181
  666. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/lancedb/local.py +0 -44
  667. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/local.py +0 -226
  668. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/milvus.py +0 -225
  669. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/mongodb.py +0 -363
  670. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/neo4j.py +0 -499
  671. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/__init__.py +0 -0
  672. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/client.py +0 -349
  673. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/connector.py +0 -348
  674. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/helpers.py +0 -448
  675. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/interfaces.py +0 -32
  676. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/__init__.py +0 -0
  677. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/block.py +0 -96
  678. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/__init__.py +0 -63
  679. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/bookmark.py +0 -40
  680. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/breadcrumb.py +0 -21
  681. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -31
  682. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/callout.py +0 -94
  683. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/child_database.py +0 -23
  684. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/child_page.py +0 -23
  685. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/code.py +0 -43
  686. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/column_list.py +0 -35
  687. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/divider.py +0 -22
  688. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/embed.py +0 -36
  689. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/equation.py +0 -23
  690. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/file.py +0 -49
  691. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/heading.py +0 -37
  692. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/image.py +0 -21
  693. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/link_preview.py +0 -24
  694. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/link_to_page.py +0 -29
  695. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/numbered_list.py +0 -29
  696. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/paragraph.py +0 -31
  697. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/pdf.py +0 -49
  698. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/quote.py +0 -37
  699. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/synced_block.py +0 -57
  700. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/table.py +0 -63
  701. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/table_of_contents.py +0 -23
  702. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/template.py +0 -30
  703. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/todo.py +0 -42
  704. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/toggle.py +0 -37
  705. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/unsupported.py +0 -20
  706. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/blocks/video.py +0 -22
  707. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database.py +0 -73
  708. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/__init__.py +0 -106
  709. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/checkbox.py +0 -38
  710. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/created_by.py +0 -35
  711. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/created_time.py +0 -34
  712. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/date.py +0 -41
  713. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/email.py +0 -36
  714. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/files.py +0 -37
  715. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/formula.py +0 -49
  716. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -34
  717. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/last_edited_time.py +0 -34
  718. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/multiselect.py +0 -73
  719. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/number.py +0 -49
  720. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/people.py +0 -41
  721. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/phone_number.py +0 -36
  722. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/relation.py +0 -67
  723. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/rich_text.py +0 -43
  724. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/rollup.py +0 -56
  725. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/select.py +0 -69
  726. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/status.py +0 -81
  727. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/title.py +0 -37
  728. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/unique_id.py +0 -50
  729. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/url.py +0 -37
  730. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/database_properties/verification.py +0 -78
  731. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/date.py +0 -29
  732. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/file.py +0 -54
  733. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/page.py +0 -45
  734. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/parent.py +0 -66
  735. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/rich_text.py +0 -189
  736. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/notion/types/user.py +0 -79
  737. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -439
  738. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/outlook.py +0 -242
  739. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/pinecone.py +0 -370
  740. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/qdrant/__init__.py +0 -16
  741. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/qdrant/cloud.py +0 -59
  742. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/qdrant/local.py +0 -58
  743. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/qdrant/qdrant.py +0 -160
  744. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/qdrant/server.py +0 -60
  745. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/redisdb.py +0 -183
  746. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -305
  747. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -134
  748. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/slack.py +0 -248
  749. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/__init__.py +0 -37
  750. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/databricks_delta_tables.py +0 -222
  751. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/postgres.py +0 -162
  752. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/singlestore.py +0 -171
  753. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/snowflake.py +0 -264
  754. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/sql.py +0 -435
  755. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/sqlite.py +0 -173
  756. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/sql/vastdb.py +0 -260
  757. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/vectara.py +0 -350
  758. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/weaviate/__init__.py +0 -22
  759. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/weaviate/cloud.py +0 -165
  760. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/weaviate/embedded.py +0 -90
  761. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/weaviate/local.py +0 -73
  762. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/weaviate/weaviate.py +0 -317
  763. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/zendesk/__init__.py +0 -0
  764. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/zendesk/client.py +0 -308
  765. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/connectors/zendesk/zendesk.py +0 -236
  766. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/embedder.py +0 -199
  767. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/filter.py +0 -60
  768. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/partitioner.py +0 -229
  769. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/uncompress.py +0 -61
  770. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/utils/__init__.py +0 -0
  771. unstructured_ingest-0.6.4/unstructured_ingest/v2/processes/utils/blob_storage.py +0 -32
  772. unstructured_ingest-0.6.4/unstructured_ingest/v2/types/__init__.py +0 -0
  773. unstructured_ingest-0.6.4/unstructured_ingest/v2/types/file_data.py +0 -116
  774. unstructured_ingest-0.6.4/unstructured_ingest/v2/unstructured_api.py +0 -135
  775. unstructured_ingest-0.6.4/unstructured_ingest/v2/utils.py +0 -61
  776. unstructured_ingest-0.6.4/unstructured_ingest.egg-info/PKG-INFO +0 -382
  777. unstructured_ingest-0.6.4/unstructured_ingest.egg-info/SOURCES.txt +0 -597
  778. unstructured_ingest-0.6.4/unstructured_ingest.egg-info/requires.txt +0 -417
  779. unstructured_ingest-0.6.4/unstructured_ingest.egg-info/top_level.txt +0 -2
  780. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/LICENSE.md +0 -0
  781. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/MANIFEST.in +0 -0
  782. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/README.md +0 -0
  783. {unstructured_ingest-0.6.4/test → unstructured_ingest-0.7.1/examples}/__init__.py +0 -0
  784. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/pyproject.toml +0 -0
  785. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/setup.cfg +0 -0
  786. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/setup.py +0 -0
  787. {unstructured_ingest-0.6.4/test/integration → unstructured_ingest-0.7.1/test}/__init__.py +0 -0
  788. {unstructured_ingest-0.6.4/test/integration/chunkers → unstructured_ingest-0.7.1/test/integration}/__init__.py +0 -0
  789. {unstructured_ingest-0.6.4/test/integration/connectors → unstructured_ingest-0.7.1/test/integration/chunkers}/__init__.py +0 -0
  790. {unstructured_ingest-0.6.4/test/integration/connectors/databricks → unstructured_ingest-0.7.1/test/integration/connectors}/__init__.py +0 -0
  791. {unstructured_ingest-0.6.4/test/integration/connectors/discord → unstructured_ingest-0.7.1/test/integration/connectors/databricks}/__init__.py +0 -0
  792. {unstructured_ingest-0.6.4/test/integration/connectors/duckdb → unstructured_ingest-0.7.1/test/integration/connectors/discord}/__init__.py +0 -0
  793. {unstructured_ingest-0.6.4/test/integration/connectors/elasticsearch → unstructured_ingest-0.7.1/test/integration/connectors/duckdb}/__init__.py +0 -0
  794. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/duckdb/conftest.py +0 -0
  795. {unstructured_ingest-0.6.4/test/integration/connectors/sql → unstructured_ingest-0.7.1/test/integration/connectors/elasticsearch}/__init__.py +0 -0
  796. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/elasticsearch/conftest.py +0 -0
  797. {unstructured_ingest-0.6.4/test/integration/connectors/utils → unstructured_ingest-0.7.1/test/integration/connectors/sql}/__init__.py +0 -0
  798. {unstructured_ingest-0.6.4/test/integration/connectors/utils/validation → unstructured_ingest-0.7.1/test/integration/connectors/utils}/__init__.py +0 -0
  799. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/utils/constants.py +0 -0
  800. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/utils/docker.py +0 -0
  801. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/utils/docker_compose.py +0 -0
  802. {unstructured_ingest-0.6.4/test/integration/connectors/weaviate → unstructured_ingest-0.7.1/test/integration/connectors/utils/validation}/__init__.py +0 -0
  803. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/utils/validation/equality.py +0 -0
  804. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/utils/validation/utils.py +0 -0
  805. {unstructured_ingest-0.6.4/test/integration/embedders → unstructured_ingest-0.7.1/test/integration/connectors/weaviate}/__init__.py +0 -0
  806. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/connectors/weaviate/conftest.py +0 -0
  807. {unstructured_ingest-0.6.4/test/integration/partitioners → unstructured_ingest-0.7.1/test/integration/embedders}/__init__.py +0 -0
  808. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/embedders/conftest.py +0 -0
  809. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/embedders/utils.py +0 -0
  810. {unstructured_ingest-0.6.4/test/unit → unstructured_ingest-0.7.1/test/integration/partitioners}/__init__.py +0 -0
  811. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/integration/utils.py +0 -0
  812. {unstructured_ingest-0.6.4/test/unit/embed → unstructured_ingest-0.7.1/test/unit}/__init__.py +0 -0
  813. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit/chunkers}/__init__.py +0 -0
  814. {unstructured_ingest-0.6.4/test/unit/v2/chunkers → unstructured_ingest-0.7.1/test/unit/connectors}/__init__.py +0 -0
  815. {unstructured_ingest-0.6.4/test/unit/v2/connectors → unstructured_ingest-0.7.1/test/unit/connectors/ibm_watsonx}/__init__.py +0 -0
  816. {unstructured_ingest-0.6.4/test/unit/v2/connectors/ibm_watsonx → unstructured_ingest-0.7.1/test/unit/connectors/motherduck}/__init__.py +0 -0
  817. {unstructured_ingest-0.6.4/test/unit/v2/connectors/motherduck → unstructured_ingest-0.7.1/test/unit/connectors/sql}/__init__.py +0 -0
  818. {unstructured_ingest-0.6.4/test/unit/v2/connectors/sql → unstructured_ingest-0.7.1/test/unit/embed}/__init__.py +0 -0
  819. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/embed/test_mixedbreadai.py +0 -0
  820. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/embed/test_octoai.py +0 -0
  821. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/embed/test_openai.py +0 -0
  822. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/embed/test_vertexai.py +0 -0
  823. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/embed/test_voyageai.py +0 -0
  824. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/__init__.py +0 -0
  825. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/test_bedrock.py +0 -0
  826. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/test_mixedbread.py +0 -0
  827. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/test_octoai.py +0 -0
  828. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/test_openai.py +0 -0
  829. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/test_togetherai.py +0 -0
  830. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/embedders/test_voyageai.py +0 -0
  831. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/partitioners/__init__.py +0 -0
  832. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/test_error.py +0 -0
  833. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/test/unit/test_logger.py +0 -0
  834. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/utils/__init__.py +0 -0
  835. {unstructured_ingest-0.6.4/test/unit/v2 → unstructured_ingest-0.7.1/test/unit}/utils/data_generator.py +0 -0
  836. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/__init__.py +0 -0
  837. {unstructured_ingest-0.6.4/unstructured_ingest/cli/base → unstructured_ingest-0.7.1/unstructured_ingest/cli}/__init__.py +0 -0
  838. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/cli/base/__init__.py +0 -0
  839. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/cli/base/importer.py +0 -0
  840. {unstructured_ingest-0.6.4/unstructured_ingest/cli/cmds/fsspec → unstructured_ingest-0.7.1/unstructured_ingest/cli/utils}/__init__.py +0 -0
  841. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/cli/utils/click.py +0 -0
  842. {unstructured_ingest-0.6.4/unstructured_ingest/connector → unstructured_ingest-0.7.1/unstructured_ingest/data_types}/__init__.py +0 -0
  843. {unstructured_ingest-0.6.4/unstructured_ingest/connector/fsspec → unstructured_ingest-0.7.1/unstructured_ingest/embed}/__init__.py +0 -0
  844. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/embed/azure_openai.py +0 -0
  845. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/embed/huggingface.py +0 -0
  846. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/embed/interfaces.py +0 -0
  847. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  848. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/error.py +0 -0
  849. /unstructured_ingest-0.6.4/unstructured_ingest/v2/errors.py → /unstructured_ingest-0.7.1/unstructured_ingest/errors_v2.py +0 -0
  850. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/interfaces/__init__.py +0 -0
  851. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/interfaces/connector.py +0 -0
  852. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/interfaces/process.py +0 -0
  853. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/interfaces/processor.py +0 -0
  854. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/logger.py +0 -0
  855. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/main.py +0 -0
  856. {unstructured_ingest-0.6.4/unstructured_ingest/connector/notion → unstructured_ingest-0.7.1/unstructured_ingest/pipeline}/__init__.py +0 -0
  857. {unstructured_ingest-0.6.4/unstructured_ingest/connector/notion/types → unstructured_ingest-0.7.1/unstructured_ingest/pipeline/steps}/__init__.py +0 -0
  858. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/processes/__init__.py +0 -0
  859. {unstructured_ingest-0.6.4/unstructured_ingest/embed → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/assets}/__init__.py +0 -0
  860. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/processes/connectors/fsspec/utils.py +0 -0
  861. {unstructured_ingest-0.6.4/unstructured_ingest/pipeline/reformat → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion}/__init__.py +0 -0
  862. {unstructured_ingest-0.6.4/unstructured_ingest → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion}/ingest_backoff/__init__.py +0 -0
  863. {unstructured_ingest-0.6.4/unstructured_ingest → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion}/ingest_backoff/_common.py +0 -0
  864. {unstructured_ingest-0.6.4/unstructured_ingest/connector → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors}/notion/interfaces.py +0 -0
  865. {unstructured_ingest-0.6.4/unstructured_ingest/runner/fsspec → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/notion/types}/__init__.py +0 -0
  866. {unstructured_ingest-0.6.4/unstructured_ingest/connector → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors}/notion/types/blocks/__init__.py +0 -0
  867. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest}/processes/connectors/utils.py +0 -0
  868. {unstructured_ingest-0.6.4/unstructured_ingest/runner/writers/fsspec → unstructured_ingest-0.7.1/unstructured_ingest/processes/connectors/zendesk}/__init__.py +0 -0
  869. {unstructured_ingest-0.6.4/unstructured_ingest → unstructured_ingest-0.7.1/unstructured_ingest/processes}/utils/__init__.py +0 -0
  870. {unstructured_ingest-0.6.4/unstructured_ingest/v2/cli → unstructured_ingest-0.7.1/unstructured_ingest/utils}/__init__.py +0 -0
  871. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/utils/chunking.py +0 -0
  872. {unstructured_ingest-0.6.4/unstructured_ingest/v2 → unstructured_ingest-0.7.1/unstructured_ingest/utils}/constants.py +0 -0
  873. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/utils/dep_check.py +0 -0
  874. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/utils/ndjson.py +0 -0
  875. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest/utils/table.py +0 -0
  876. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  877. {unstructured_ingest-0.6.4 → unstructured_ingest-0.7.1}/unstructured_ingest.egg-info/entry_points.txt +0 -0
@@ -0,0 +1,383 @@
1
+ Metadata-Version: 2.2
2
+ Name: unstructured-ingest
3
+ Version: 0.7.1
4
+ Summary: A library that prepares raw documents for downstream ML tasks.
5
+ Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
+ Author: Unstructured Technologies
7
+ Author-email: devops@unstructuredai.io
8
+ License: Apache-2.0
9
+ Keywords: NLP PDF HTML CV XML parsing preprocessing
10
+ Classifier: Development Status :: 4 - Beta
11
+ Classifier: Intended Audience :: Developers
12
+ Classifier: Intended Audience :: Education
13
+ Classifier: Intended Audience :: Science/Research
14
+ Classifier: License :: OSI Approved :: Apache Software License
15
+ Classifier: Operating System :: OS Independent
16
+ Classifier: Programming Language :: Python :: 3
17
+ Classifier: Programming Language :: Python :: 3.9
18
+ Classifier: Programming Language :: Python :: 3.10
19
+ Classifier: Programming Language :: Python :: 3.11
20
+ Classifier: Programming Language :: Python :: 3.12
21
+ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
22
+ Requires-Python: >=3.9.0,<3.14
23
+ Description-Content-Type: text/markdown
24
+ License-File: LICENSE.md
25
+ Requires-Dist: pydantic>=2.7
26
+ Requires-Dist: opentelemetry-sdk
27
+ Requires-Dist: click
28
+ Requires-Dist: dataclasses_json
29
+ Requires-Dist: python-dateutil
30
+ Requires-Dist: tqdm
31
+ Requires-Dist: pandas
32
+ Requires-Dist: numpy
33
+ Provides-Extra: remote
34
+ Requires-Dist: unstructured-client>=0.30.0; extra == "remote"
35
+ Requires-Dist: pandas; extra == "remote"
36
+ Requires-Dist: numpy; extra == "remote"
37
+ Provides-Extra: csv
38
+ Requires-Dist: unstructured[tsv]; extra == "csv"
39
+ Requires-Dist: pandas; extra == "csv"
40
+ Requires-Dist: numpy; extra == "csv"
41
+ Provides-Extra: doc
42
+ Requires-Dist: unstructured[docx]; extra == "doc"
43
+ Requires-Dist: pandas; extra == "doc"
44
+ Requires-Dist: numpy; extra == "doc"
45
+ Provides-Extra: docx
46
+ Requires-Dist: unstructured[docx]; extra == "docx"
47
+ Requires-Dist: pandas; extra == "docx"
48
+ Requires-Dist: numpy; extra == "docx"
49
+ Provides-Extra: epub
50
+ Requires-Dist: unstructured[epub]; extra == "epub"
51
+ Requires-Dist: pandas; extra == "epub"
52
+ Requires-Dist: numpy; extra == "epub"
53
+ Provides-Extra: md
54
+ Requires-Dist: unstructured[md]; extra == "md"
55
+ Requires-Dist: pandas; extra == "md"
56
+ Requires-Dist: numpy; extra == "md"
57
+ Provides-Extra: msg
58
+ Requires-Dist: unstructured[msg]; extra == "msg"
59
+ Requires-Dist: pandas; extra == "msg"
60
+ Requires-Dist: numpy; extra == "msg"
61
+ Provides-Extra: odt
62
+ Requires-Dist: unstructured[odt]; extra == "odt"
63
+ Requires-Dist: pandas; extra == "odt"
64
+ Requires-Dist: numpy; extra == "odt"
65
+ Provides-Extra: org
66
+ Requires-Dist: unstructured[org]; extra == "org"
67
+ Requires-Dist: pandas; extra == "org"
68
+ Requires-Dist: numpy; extra == "org"
69
+ Provides-Extra: pdf
70
+ Requires-Dist: unstructured[pdf]; extra == "pdf"
71
+ Requires-Dist: pandas; extra == "pdf"
72
+ Requires-Dist: numpy; extra == "pdf"
73
+ Provides-Extra: ppt
74
+ Requires-Dist: unstructured[pptx]; extra == "ppt"
75
+ Requires-Dist: pandas; extra == "ppt"
76
+ Requires-Dist: numpy; extra == "ppt"
77
+ Provides-Extra: pptx
78
+ Requires-Dist: unstructured[pptx]; extra == "pptx"
79
+ Requires-Dist: pandas; extra == "pptx"
80
+ Requires-Dist: numpy; extra == "pptx"
81
+ Provides-Extra: rtf
82
+ Requires-Dist: unstructured[rtf]; extra == "rtf"
83
+ Requires-Dist: pandas; extra == "rtf"
84
+ Requires-Dist: numpy; extra == "rtf"
85
+ Provides-Extra: rst
86
+ Requires-Dist: unstructured[rst]; extra == "rst"
87
+ Requires-Dist: pandas; extra == "rst"
88
+ Requires-Dist: numpy; extra == "rst"
89
+ Provides-Extra: tsv
90
+ Requires-Dist: unstructured[tsv]; extra == "tsv"
91
+ Requires-Dist: pandas; extra == "tsv"
92
+ Requires-Dist: numpy; extra == "tsv"
93
+ Provides-Extra: xlsx
94
+ Requires-Dist: unstructured[xlsx]; extra == "xlsx"
95
+ Requires-Dist: pandas; extra == "xlsx"
96
+ Requires-Dist: numpy; extra == "xlsx"
97
+ Provides-Extra: airtable
98
+ Requires-Dist: pyairtable; extra == "airtable"
99
+ Requires-Dist: pandas; extra == "airtable"
100
+ Requires-Dist: numpy; extra == "airtable"
101
+ Provides-Extra: astradb
102
+ Requires-Dist: astrapy; extra == "astradb"
103
+ Requires-Dist: pandas; extra == "astradb"
104
+ Requires-Dist: numpy; extra == "astradb"
105
+ Provides-Extra: azure
106
+ Requires-Dist: fsspec; extra == "azure"
107
+ Requires-Dist: adlfs; extra == "azure"
108
+ Requires-Dist: pandas; extra == "azure"
109
+ Requires-Dist: numpy; extra == "azure"
110
+ Provides-Extra: azure-ai-search
111
+ Requires-Dist: azure-search-documents; extra == "azure-ai-search"
112
+ Requires-Dist: pandas; extra == "azure-ai-search"
113
+ Requires-Dist: numpy; extra == "azure-ai-search"
114
+ Provides-Extra: biomed
115
+ Requires-Dist: requests; extra == "biomed"
116
+ Requires-Dist: bs4; extra == "biomed"
117
+ Requires-Dist: pandas; extra == "biomed"
118
+ Requires-Dist: numpy; extra == "biomed"
119
+ Provides-Extra: box
120
+ Requires-Dist: fsspec; extra == "box"
121
+ Requires-Dist: boxfs; extra == "box"
122
+ Requires-Dist: pandas; extra == "box"
123
+ Requires-Dist: numpy; extra == "box"
124
+ Provides-Extra: chroma
125
+ Requires-Dist: chromadb; extra == "chroma"
126
+ Requires-Dist: pandas; extra == "chroma"
127
+ Requires-Dist: numpy; extra == "chroma"
128
+ Provides-Extra: clarifai
129
+ Requires-Dist: clarifai; extra == "clarifai"
130
+ Requires-Dist: pandas; extra == "clarifai"
131
+ Requires-Dist: numpy; extra == "clarifai"
132
+ Provides-Extra: confluence
133
+ Requires-Dist: requests; extra == "confluence"
134
+ Requires-Dist: atlassian-python-api; extra == "confluence"
135
+ Requires-Dist: pandas; extra == "confluence"
136
+ Requires-Dist: numpy; extra == "confluence"
137
+ Provides-Extra: couchbase
138
+ Requires-Dist: couchbase; extra == "couchbase"
139
+ Requires-Dist: pandas; extra == "couchbase"
140
+ Requires-Dist: numpy; extra == "couchbase"
141
+ Provides-Extra: delta-table
142
+ Requires-Dist: boto3; extra == "delta-table"
143
+ Requires-Dist: deltalake; extra == "delta-table"
144
+ Requires-Dist: pandas; extra == "delta-table"
145
+ Requires-Dist: numpy; extra == "delta-table"
146
+ Provides-Extra: discord
147
+ Requires-Dist: discord.py; extra == "discord"
148
+ Requires-Dist: pandas; extra == "discord"
149
+ Requires-Dist: numpy; extra == "discord"
150
+ Provides-Extra: dropbox
151
+ Requires-Dist: fsspec; extra == "dropbox"
152
+ Requires-Dist: dropboxdrivefs; extra == "dropbox"
153
+ Requires-Dist: pandas; extra == "dropbox"
154
+ Requires-Dist: numpy; extra == "dropbox"
155
+ Provides-Extra: duckdb
156
+ Requires-Dist: duckdb; extra == "duckdb"
157
+ Requires-Dist: pandas; extra == "duckdb"
158
+ Requires-Dist: numpy; extra == "duckdb"
159
+ Provides-Extra: elasticsearch
160
+ Requires-Dist: elasticsearch[async]; extra == "elasticsearch"
161
+ Requires-Dist: pandas; extra == "elasticsearch"
162
+ Requires-Dist: numpy; extra == "elasticsearch"
163
+ Provides-Extra: gcs
164
+ Requires-Dist: fsspec; extra == "gcs"
165
+ Requires-Dist: bs4; extra == "gcs"
166
+ Requires-Dist: gcsfs; extra == "gcs"
167
+ Requires-Dist: pandas; extra == "gcs"
168
+ Requires-Dist: numpy; extra == "gcs"
169
+ Provides-Extra: github
170
+ Requires-Dist: requests; extra == "github"
171
+ Requires-Dist: pygithub>1.58.0; extra == "github"
172
+ Requires-Dist: pandas; extra == "github"
173
+ Requires-Dist: numpy; extra == "github"
174
+ Provides-Extra: gitlab
175
+ Requires-Dist: python-gitlab; extra == "gitlab"
176
+ Requires-Dist: pandas; extra == "gitlab"
177
+ Requires-Dist: numpy; extra == "gitlab"
178
+ Provides-Extra: google-drive
179
+ Requires-Dist: google-api-python-client; extra == "google-drive"
180
+ Requires-Dist: pandas; extra == "google-drive"
181
+ Requires-Dist: numpy; extra == "google-drive"
182
+ Provides-Extra: hubspot
183
+ Requires-Dist: urllib3; extra == "hubspot"
184
+ Requires-Dist: hubspot-api-client; extra == "hubspot"
185
+ Requires-Dist: pandas; extra == "hubspot"
186
+ Requires-Dist: numpy; extra == "hubspot"
187
+ Provides-Extra: ibm-watsonx-s3
188
+ Requires-Dist: pyiceberg; extra == "ibm-watsonx-s3"
189
+ Requires-Dist: pyarrow; extra == "ibm-watsonx-s3"
190
+ Requires-Dist: httpx; extra == "ibm-watsonx-s3"
191
+ Requires-Dist: tenacity; extra == "ibm-watsonx-s3"
192
+ Requires-Dist: pandas; extra == "ibm-watsonx-s3"
193
+ Requires-Dist: numpy; extra == "ibm-watsonx-s3"
194
+ Provides-Extra: jira
195
+ Requires-Dist: atlassian-python-api; extra == "jira"
196
+ Requires-Dist: pandas; extra == "jira"
197
+ Requires-Dist: numpy; extra == "jira"
198
+ Provides-Extra: kafka
199
+ Requires-Dist: confluent-kafka; extra == "kafka"
200
+ Requires-Dist: pandas; extra == "kafka"
201
+ Requires-Dist: numpy; extra == "kafka"
202
+ Provides-Extra: kdbai
203
+ Requires-Dist: kdbai-client>=1.4.0; extra == "kdbai"
204
+ Requires-Dist: pandas; extra == "kdbai"
205
+ Requires-Dist: numpy; extra == "kdbai"
206
+ Provides-Extra: lancedb
207
+ Requires-Dist: lancedb; extra == "lancedb"
208
+ Requires-Dist: pandas; extra == "lancedb"
209
+ Requires-Dist: numpy; extra == "lancedb"
210
+ Provides-Extra: milvus
211
+ Requires-Dist: pymilvus; extra == "milvus"
212
+ Requires-Dist: pandas; extra == "milvus"
213
+ Requires-Dist: numpy; extra == "milvus"
214
+ Provides-Extra: mongodb
215
+ Requires-Dist: pymongo; extra == "mongodb"
216
+ Requires-Dist: pandas; extra == "mongodb"
217
+ Requires-Dist: numpy; extra == "mongodb"
218
+ Provides-Extra: neo4j
219
+ Requires-Dist: networkx; extra == "neo4j"
220
+ Requires-Dist: neo4j-rust-ext; extra == "neo4j"
221
+ Requires-Dist: cymple; extra == "neo4j"
222
+ Requires-Dist: pandas; extra == "neo4j"
223
+ Requires-Dist: numpy; extra == "neo4j"
224
+ Provides-Extra: notion
225
+ Requires-Dist: backoff; extra == "notion"
226
+ Requires-Dist: httpx; extra == "notion"
227
+ Requires-Dist: notion-client; extra == "notion"
228
+ Requires-Dist: htmlBuilder; extra == "notion"
229
+ Requires-Dist: pandas; extra == "notion"
230
+ Requires-Dist: numpy; extra == "notion"
231
+ Provides-Extra: onedrive
232
+ Requires-Dist: Office365-REST-Python-Client; extra == "onedrive"
233
+ Requires-Dist: requests; extra == "onedrive"
234
+ Requires-Dist: msal; extra == "onedrive"
235
+ Requires-Dist: pandas; extra == "onedrive"
236
+ Requires-Dist: numpy; extra == "onedrive"
237
+ Provides-Extra: opensearch
238
+ Requires-Dist: opensearch-py; extra == "opensearch"
239
+ Requires-Dist: pandas; extra == "opensearch"
240
+ Requires-Dist: numpy; extra == "opensearch"
241
+ Provides-Extra: outlook
242
+ Requires-Dist: Office365-REST-Python-Client; extra == "outlook"
243
+ Requires-Dist: msal; extra == "outlook"
244
+ Requires-Dist: pandas; extra == "outlook"
245
+ Requires-Dist: numpy; extra == "outlook"
246
+ Provides-Extra: pinecone
247
+ Requires-Dist: pinecone-client>=3.7.1; extra == "pinecone"
248
+ Requires-Dist: pandas; extra == "pinecone"
249
+ Requires-Dist: numpy; extra == "pinecone"
250
+ Provides-Extra: postgres
251
+ Requires-Dist: psycopg2-binary; extra == "postgres"
252
+ Requires-Dist: pandas; extra == "postgres"
253
+ Requires-Dist: numpy; extra == "postgres"
254
+ Provides-Extra: qdrant
255
+ Requires-Dist: qdrant-client; extra == "qdrant"
256
+ Requires-Dist: pandas; extra == "qdrant"
257
+ Requires-Dist: numpy; extra == "qdrant"
258
+ Provides-Extra: reddit
259
+ Requires-Dist: praw; extra == "reddit"
260
+ Requires-Dist: pandas; extra == "reddit"
261
+ Requires-Dist: numpy; extra == "reddit"
262
+ Provides-Extra: redis
263
+ Requires-Dist: redis; extra == "redis"
264
+ Requires-Dist: pandas; extra == "redis"
265
+ Requires-Dist: numpy; extra == "redis"
266
+ Provides-Extra: s3
267
+ Requires-Dist: fsspec; extra == "s3"
268
+ Requires-Dist: s3fs; extra == "s3"
269
+ Requires-Dist: pandas; extra == "s3"
270
+ Requires-Dist: numpy; extra == "s3"
271
+ Provides-Extra: sharepoint
272
+ Requires-Dist: Office365-REST-Python-Client; extra == "sharepoint"
273
+ Requires-Dist: requests; extra == "sharepoint"
274
+ Requires-Dist: msal; extra == "sharepoint"
275
+ Requires-Dist: pandas; extra == "sharepoint"
276
+ Requires-Dist: numpy; extra == "sharepoint"
277
+ Provides-Extra: salesforce
278
+ Requires-Dist: simple-salesforce; extra == "salesforce"
279
+ Requires-Dist: pandas; extra == "salesforce"
280
+ Requires-Dist: numpy; extra == "salesforce"
281
+ Provides-Extra: sftp
282
+ Requires-Dist: fsspec; extra == "sftp"
283
+ Requires-Dist: paramiko; extra == "sftp"
284
+ Requires-Dist: pandas; extra == "sftp"
285
+ Requires-Dist: numpy; extra == "sftp"
286
+ Provides-Extra: slack
287
+ Requires-Dist: slack_sdk[optional]; extra == "slack"
288
+ Requires-Dist: pandas; extra == "slack"
289
+ Requires-Dist: numpy; extra == "slack"
290
+ Provides-Extra: snowflake
291
+ Requires-Dist: snowflake-connector-python; extra == "snowflake"
292
+ Requires-Dist: psycopg2-binary; extra == "snowflake"
293
+ Requires-Dist: pandas; extra == "snowflake"
294
+ Requires-Dist: numpy; extra == "snowflake"
295
+ Provides-Extra: wikipedia
296
+ Requires-Dist: wikipedia; extra == "wikipedia"
297
+ Requires-Dist: pandas; extra == "wikipedia"
298
+ Requires-Dist: numpy; extra == "wikipedia"
299
+ Provides-Extra: weaviate
300
+ Requires-Dist: weaviate-client; extra == "weaviate"
301
+ Requires-Dist: pandas; extra == "weaviate"
302
+ Requires-Dist: numpy; extra == "weaviate"
303
+ Provides-Extra: databricks-volumes
304
+ Requires-Dist: databricks-sdk; extra == "databricks-volumes"
305
+ Requires-Dist: pandas; extra == "databricks-volumes"
306
+ Requires-Dist: numpy; extra == "databricks-volumes"
307
+ Provides-Extra: databricks-delta-tables
308
+ Requires-Dist: databricks-sql-connector; extra == "databricks-delta-tables"
309
+ Requires-Dist: pandas; extra == "databricks-delta-tables"
310
+ Requires-Dist: numpy; extra == "databricks-delta-tables"
311
+ Provides-Extra: singlestore
312
+ Requires-Dist: singlestoredb; extra == "singlestore"
313
+ Requires-Dist: pandas; extra == "singlestore"
314
+ Requires-Dist: numpy; extra == "singlestore"
315
+ Provides-Extra: vectara
316
+ Requires-Dist: requests; extra == "vectara"
317
+ Requires-Dist: httpx; extra == "vectara"
318
+ Requires-Dist: aiofiles; extra == "vectara"
319
+ Requires-Dist: pandas; extra == "vectara"
320
+ Requires-Dist: numpy; extra == "vectara"
321
+ Provides-Extra: vastdb
322
+ Requires-Dist: pyarrow; extra == "vastdb"
323
+ Requires-Dist: vastdb; extra == "vastdb"
324
+ Requires-Dist: ibis; extra == "vastdb"
325
+ Requires-Dist: pandas; extra == "vastdb"
326
+ Requires-Dist: numpy; extra == "vastdb"
327
+ Provides-Extra: zendesk
328
+ Requires-Dist: httpx; extra == "zendesk"
329
+ Requires-Dist: bs4; extra == "zendesk"
330
+ Requires-Dist: aiofiles; extra == "zendesk"
331
+ Requires-Dist: pandas; extra == "zendesk"
332
+ Requires-Dist: numpy; extra == "zendesk"
333
+ Provides-Extra: embed-huggingface
334
+ Requires-Dist: sentence-transformers; extra == "embed-huggingface"
335
+ Requires-Dist: pandas; extra == "embed-huggingface"
336
+ Requires-Dist: numpy; extra == "embed-huggingface"
337
+ Provides-Extra: embed-octoai
338
+ Requires-Dist: tiktoken; extra == "embed-octoai"
339
+ Requires-Dist: openai; extra == "embed-octoai"
340
+ Requires-Dist: pandas; extra == "embed-octoai"
341
+ Requires-Dist: numpy; extra == "embed-octoai"
342
+ Provides-Extra: embed-vertexai
343
+ Requires-Dist: vertexai; extra == "embed-vertexai"
344
+ Requires-Dist: pandas; extra == "embed-vertexai"
345
+ Requires-Dist: numpy; extra == "embed-vertexai"
346
+ Provides-Extra: embed-voyageai
347
+ Requires-Dist: voyageai; extra == "embed-voyageai"
348
+ Requires-Dist: pandas; extra == "embed-voyageai"
349
+ Requires-Dist: numpy; extra == "embed-voyageai"
350
+ Provides-Extra: embed-mixedbreadai
351
+ Requires-Dist: mixedbread-ai; extra == "embed-mixedbreadai"
352
+ Requires-Dist: pandas; extra == "embed-mixedbreadai"
353
+ Requires-Dist: numpy; extra == "embed-mixedbreadai"
354
+ Provides-Extra: openai
355
+ Requires-Dist: tiktoken; extra == "openai"
356
+ Requires-Dist: openai; extra == "openai"
357
+ Requires-Dist: pandas; extra == "openai"
358
+ Requires-Dist: numpy; extra == "openai"
359
+ Provides-Extra: bedrock
360
+ Requires-Dist: boto3; extra == "bedrock"
361
+ Requires-Dist: aioboto3; extra == "bedrock"
362
+ Requires-Dist: pandas; extra == "bedrock"
363
+ Requires-Dist: numpy; extra == "bedrock"
364
+ Provides-Extra: togetherai
365
+ Requires-Dist: together; extra == "togetherai"
366
+ Requires-Dist: pandas; extra == "togetherai"
367
+ Requires-Dist: numpy; extra == "togetherai"
368
+ Dynamic: author
369
+ Dynamic: author-email
370
+ Dynamic: classifier
371
+ Dynamic: description
372
+ Dynamic: description-content-type
373
+ Dynamic: home-page
374
+ Dynamic: keywords
375
+ Dynamic: license
376
+ Dynamic: provides-extra
377
+ Dynamic: requires-dist
378
+ Dynamic: requires-python
379
+ Dynamic: summary
380
+
381
+ # Unstructured Ingest
382
+
383
+ For details, see the [Unstructured Ingest overview](https://docs.unstructured.io/ingestion/overview) in the Unstructured documentation.
@@ -0,0 +1,44 @@
1
+ import os
2
+ from pathlib import Path
3
+
4
+ from unstructured_ingest.interfaces import ProcessorConfig
5
+ from unstructured_ingest.logger import logger
6
+ from unstructured_ingest.pipeline.pipeline import Pipeline
7
+ from unstructured_ingest.processes.chunker import ChunkerConfig
8
+ from unstructured_ingest.processes.connectors.airtable import (
9
+ CONNECTOR_TYPE,
10
+ AirtableAccessConfig,
11
+ AirtableConnectionConfig,
12
+ AirtableDownloaderConfig,
13
+ AirtableIndexerConfig,
14
+ )
15
+ from unstructured_ingest.processes.connectors.local import (
16
+ LocalUploaderConfig,
17
+ )
18
+ from unstructured_ingest.processes.embedder import EmbedderConfig
19
+ from unstructured_ingest.processes.partitioner import PartitionerConfig
20
+
21
+ base_path = Path(__file__).parent.parent.parent.parent
22
+ docs_path = base_path / "example-docs"
23
+ work_dir = base_path / "tmp_ingest" / CONNECTOR_TYPE
24
+ output_path = work_dir / "output"
25
+ download_path = work_dir / "download"
26
+
27
+ if __name__ == "__main__":
28
+ logger.info(f"writing all content in: {work_dir.resolve()}")
29
+ Pipeline.from_configs(
30
+ context=ProcessorConfig(work_dir=str(work_dir.resolve()), verbose=True),
31
+ indexer_config=AirtableIndexerConfig(
32
+ list_of_paths=["app5YQxSfp220fWtm", "appJ43QmP8I17zu88"]
33
+ ),
34
+ downloader_config=AirtableDownloaderConfig(download_dir=download_path),
35
+ source_connection_config=AirtableConnectionConfig(
36
+ access_config=AirtableAccessConfig(
37
+ personal_access_token=os.getenv("AIRTABLE_PERSONAL_ACCESS_TOKEN")
38
+ )
39
+ ),
40
+ partitioner_config=PartitionerConfig(strategy="fast"),
41
+ chunker_config=ChunkerConfig(chunking_strategy="by_title"),
42
+ embedder_config=EmbedderConfig(embedding_provider="huggingface"),
43
+ uploader_config=LocalUploaderConfig(output_dir=str(output_path.resolve())),
44
+ ).run()
@@ -0,0 +1,55 @@
1
+ import os
2
+ from pathlib import Path
3
+
4
+ from unstructured_ingest.interfaces import ProcessorConfig
5
+ from unstructured_ingest.logger import logger
6
+ from unstructured_ingest.pipeline.pipeline import Pipeline
7
+ from unstructured_ingest.processes.chunker import ChunkerConfig
8
+ from unstructured_ingest.processes.connectors.azure_ai_search import (
9
+ CONNECTOR_TYPE,
10
+ AzureAISearchAccessConfig,
11
+ AzureAISearchConnectionConfig,
12
+ AzureAISearchUploaderConfig,
13
+ AzureAISearchUploadStagerConfig,
14
+ )
15
+ from unstructured_ingest.processes.connectors.local import (
16
+ LocalConnectionConfig,
17
+ LocalDownloaderConfig,
18
+ LocalIndexerConfig,
19
+ )
20
+ from unstructured_ingest.processes.embedder import EmbedderConfig
21
+ from unstructured_ingest.processes.partitioner import PartitionerConfig
22
+
23
+ base_path = Path(__file__).parent.parent.parent.parent
24
+ docs_path = base_path / "example-docs"
25
+ work_dir = base_path / "tmp_ingest" / CONNECTOR_TYPE
26
+ output_path = work_dir / "output"
27
+ download_path = work_dir / "download"
28
+
29
+ if __name__ == "__main__":
30
+ logger.info(f"writing all content in: {work_dir.resolve()}")
31
+ index_name = "ingest-test-destination"
32
+ Pipeline.from_configs(
33
+ context=ProcessorConfig(work_dir=str(work_dir.resolve())),
34
+ indexer_config=LocalIndexerConfig(
35
+ input_path=str(docs_path.resolve()) + "/book-war-and-peace-1p.txt"
36
+ ),
37
+ downloader_config=LocalDownloaderConfig(download_dir=download_path),
38
+ source_connection_config=LocalConnectionConfig(),
39
+ partitioner_config=PartitionerConfig(strategy="fast"),
40
+ chunker_config=ChunkerConfig(
41
+ chunking_strategy="by_title", chunk_include_orig_elements=False
42
+ ),
43
+ embedder_config=EmbedderConfig(
44
+ embedding_provider="openai", embedding_api_key=os.getenv("OPENAI_API_KEY")
45
+ ),
46
+ destination_connection_config=AzureAISearchConnectionConfig(
47
+ access_config=AzureAISearchAccessConfig(
48
+ azure_ai_search_key=os.getenv("AZURE_SEARCH_API_KEY")
49
+ ),
50
+ index=os.getenv("AZURE_SEARCH_INDEX"),
51
+ endpoint=os.getenv("AZURE_SEARCH_ENDPOINT"),
52
+ ),
53
+ uploader_config=AzureAISearchUploaderConfig(batch_size=10),
54
+ stager_config=AzureAISearchUploadStagerConfig(),
55
+ ).run()
@@ -0,0 +1,54 @@
1
+ import random
2
+ from pathlib import Path
3
+
4
+ from unstructured_ingest.interfaces import ProcessorConfig
5
+ from unstructured_ingest.logger import logger
6
+ from unstructured_ingest.pipeline.pipeline import Pipeline
7
+ from unstructured_ingest.processes.chunker import ChunkerConfig
8
+ from unstructured_ingest.processes.connectors.chroma import (
9
+ CONNECTOR_TYPE,
10
+ ChromaAccessConfig,
11
+ ChromaConnectionConfig,
12
+ ChromaUploaderConfig,
13
+ ChromaUploadStagerConfig,
14
+ )
15
+ from unstructured_ingest.processes.connectors.local import (
16
+ LocalConnectionConfig,
17
+ LocalDownloaderConfig,
18
+ LocalIndexerConfig,
19
+ )
20
+ from unstructured_ingest.processes.embedder import EmbedderConfig
21
+ from unstructured_ingest.processes.partitioner import PartitionerConfig
22
+
23
+ base_path = Path(__file__).parent.parent.parent.parent
24
+ docs_path = base_path / "example-docs"
25
+ work_dir = base_path / "tmp_ingest" / CONNECTOR_TYPE
26
+ output_path = work_dir / "output"
27
+ download_path = work_dir / "download"
28
+
29
+ if __name__ == "__main__":
30
+ logger.info(f"writing all content in: {work_dir.resolve()}")
31
+ Pipeline.from_configs(
32
+ context=ProcessorConfig(work_dir=str(work_dir.resolve())),
33
+ indexer_config=LocalIndexerConfig(input_path=docs_path.resolve() / "multisimple"),
34
+ downloader_config=LocalDownloaderConfig(download_dir=download_path),
35
+ source_connection_config=LocalConnectionConfig(),
36
+ partitioner_config=PartitionerConfig(strategy="fast"),
37
+ chunker_config=ChunkerConfig(
38
+ chunking_strategy="by_title",
39
+ chunk_include_orig_elements=False,
40
+ chunk_max_characters=1500,
41
+ chunk_multipage_sections=True,
42
+ ),
43
+ embedder_config=EmbedderConfig(embedding_provider="huggingface"),
44
+ destination_connection_config=ChromaConnectionConfig(
45
+ access_config=ChromaAccessConfig(settings=None, headers=None),
46
+ host="localhost",
47
+ port=8047,
48
+ collection_name=f"test-collection-{random.randint(1000, 9999)}",
49
+ tenant="default_tenant",
50
+ database="default_database",
51
+ ),
52
+ stager_config=ChromaUploadStagerConfig(),
53
+ uploader_config=ChromaUploaderConfig(batch_size=10),
54
+ ).run()
@@ -0,0 +1,55 @@
1
+ from pathlib import Path
2
+
3
+ from unstructured_ingest.interfaces import ProcessorConfig
4
+ from unstructured_ingest.logger import logger
5
+ from unstructured_ingest.pipeline.pipeline import Pipeline
6
+ from unstructured_ingest.processes.chunker import ChunkerConfig
7
+ from unstructured_ingest.processes.connectors.couchbase import (
8
+ CONNECTOR_TYPE,
9
+ CouchbaseAccessConfig,
10
+ CouchbaseConnectionConfig,
11
+ CouchbaseUploaderConfig,
12
+ CouchbaseUploadStagerConfig,
13
+ )
14
+ from unstructured_ingest.processes.connectors.local import (
15
+ LocalConnectionConfig,
16
+ LocalDownloaderConfig,
17
+ LocalIndexerConfig,
18
+ )
19
+ from unstructured_ingest.processes.embedder import EmbedderConfig
20
+ from unstructured_ingest.processes.partitioner import PartitionerConfig
21
+
22
+ base_path = Path(__file__).parent.parent.parent.parent
23
+ docs_path = base_path / "example-docs"
24
+ work_dir = base_path / "tmp_ingest" / CONNECTOR_TYPE
25
+ output_path = work_dir / "output"
26
+ download_path = work_dir / "download"
27
+
28
+ if __name__ == "__main__":
29
+ logger.info(f"writing all content in: {work_dir.resolve()}")
30
+ Pipeline.from_configs(
31
+ context=ProcessorConfig(work_dir=str(work_dir.resolve())),
32
+ indexer_config=LocalIndexerConfig(input_path=str(docs_path.resolve()) + "/multisimple/"),
33
+ downloader_config=LocalDownloaderConfig(download_dir=download_path),
34
+ source_connection_config=LocalConnectionConfig(),
35
+ partitioner_config=PartitionerConfig(strategy="fast"),
36
+ chunker_config=ChunkerConfig(
37
+ chunking_strategy="by_title",
38
+ chunk_include_orig_elements=False,
39
+ chunk_max_characters=1500,
40
+ chunk_multipage_sections=True,
41
+ ),
42
+ embedder_config=EmbedderConfig(embedding_provider="huggingface"),
43
+ destination_connection_config=CouchbaseConnectionConfig(
44
+ access_config=CouchbaseAccessConfig(
45
+ connection_string="couchbase://localhost",
46
+ username="Administrator",
47
+ password="password",
48
+ ),
49
+ bucket="example_bucket",
50
+ scope="example_scope",
51
+ collection="example_collection",
52
+ ),
53
+ stager_config=CouchbaseUploadStagerConfig(),
54
+ uploader_config=CouchbaseUploaderConfig(batch_size=10),
55
+ ).run()
@@ -0,0 +1,55 @@
1
+ import os
2
+ from pathlib import Path
3
+
4
+ from unstructured_ingest.interfaces import ProcessorConfig
5
+ from unstructured_ingest.logger import logger
6
+ from unstructured_ingest.pipeline.pipeline import Pipeline
7
+ from unstructured_ingest.processes.chunker import ChunkerConfig
8
+ from unstructured_ingest.processes.connectors.databricks.volumes_native import (
9
+ CONNECTOR_TYPE,
10
+ DatabricksNativeVolumesAccessConfig,
11
+ DatabricksNativeVolumesConnectionConfig,
12
+ DatabricksNativeVolumesUploaderConfig,
13
+ )
14
+ from unstructured_ingest.processes.connectors.local import (
15
+ LocalConnectionConfig,
16
+ LocalDownloaderConfig,
17
+ LocalIndexerConfig,
18
+ )
19
+ from unstructured_ingest.processes.partitioner import PartitionerConfig
20
+
21
+ base_path = Path(__file__).parent.parent.parent.parent
22
+ docs_path = base_path / "example-docs"
23
+ work_dir = base_path / "tmp_ingest" / CONNECTOR_TYPE
24
+ output_path = work_dir / "output"
25
+ download_path = work_dir / "download"
26
+
27
+ if __name__ == "__main__":
28
+ logger.info(f"writing all content in: {work_dir.resolve()}")
29
+ Pipeline.from_configs(
30
+ context=ProcessorConfig(work_dir=str(work_dir.resolve())),
31
+ indexer_config=LocalIndexerConfig(input_path=str(docs_path.resolve()) + "/fake-text.txt"),
32
+ downloader_config=LocalDownloaderConfig(download_dir=download_path),
33
+ source_connection_config=LocalConnectionConfig(),
34
+ partitioner_config=PartitionerConfig(strategy="fast"),
35
+ chunker_config=ChunkerConfig(
36
+ chunking_strategy="basic",
37
+ ),
38
+ embedder_config=None,
39
+ destination_connection_config=DatabricksNativeVolumesConnectionConfig(
40
+ access_config=DatabricksNativeVolumesAccessConfig(
41
+ client_id=os.environ["DATABRICKS_CLIENT_ID"],
42
+ client_secret=os.environ["DATABRICKS_CLIENT_SECRET"],
43
+ ),
44
+ host=os.environ["DATABRICKS_HOST"],
45
+ catalog=os.environ["DATABRICKS_CATALOG"],
46
+ volume=os.environ["DATABRICKS_VOLUME"],
47
+ volume_path=os.environ["DATABRICKS_VOLUME_PATH"],
48
+ ),
49
+ uploader_config=DatabricksNativeVolumesUploaderConfig(
50
+ overwrite=True,
51
+ catalog=os.environ["DATABRICKS_CATALOG"],
52
+ volume=os.environ["DATABRICKS_VOLUME"],
53
+ volume_path=os.environ["DATABRICKS_VOLUME_PATH"],
54
+ ),
55
+ ).run()