unstructured-ingest 0.0.11__tar.gz → 0.0.13__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (350)
  1. {unstructured-ingest-0.0.11/unstructured_ingest.egg-info → unstructured-ingest-0.0.13}/PKG-INFO +1 -1
  2. unstructured-ingest-0.0.13/unstructured_ingest/__version__.py +1 -0
  3. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/data_prep.py +7 -2
  4. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/pinecone.py +40 -21
  5. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/uncompress.py +2 -2
  6. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13/unstructured_ingest.egg-info}/PKG-INFO +1 -1
  7. unstructured-ingest-0.0.11/unstructured_ingest/__version__.py +0 -1
  8. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/LICENSE.md +0 -0
  9. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/README.md +0 -0
  10. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/pyproject.toml +0 -0
  11. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/setup.cfg +0 -0
  12. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/setup.py +0 -0
  13. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/test/test_chunking_utils.py +0 -0
  14. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/test/test_error.py +0 -0
  15. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/test/test_interfaces.py +0 -0
  16. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/test/test_logger.py +0 -0
  17. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/test/test_utils.py +0 -0
  18. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/test/test_utils_v2.py +0 -0
  19. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/__init__.py +0 -0
  20. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/__init__.py +0 -0
  21. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/base/__init__.py +0 -0
  22. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/base/cmd.py +0 -0
  23. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/base/dest.py +0 -0
  24. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/base/src.py +0 -0
  25. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cli.py +0 -0
  26. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmd_factory.py +0 -0
  27. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/__init__.py +0 -0
  28. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/airtable.py +0 -0
  29. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/astradb.py +0 -0
  30. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/azure_cognitive_search.py +0 -0
  31. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/biomed.py +0 -0
  32. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/chroma.py +0 -0
  33. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/clarifai.py +0 -0
  34. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/confluence.py +0 -0
  35. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/databricks_volumes.py +0 -0
  36. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/delta_table.py +0 -0
  37. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/discord.py +0 -0
  38. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/elasticsearch.py +0 -0
  39. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/__init__.py +0 -0
  40. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/azure.py +0 -0
  41. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/box.py +0 -0
  42. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/dropbox.py +0 -0
  43. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/fsspec.py +0 -0
  44. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/gcs.py +0 -0
  45. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/s3.py +0 -0
  46. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/fsspec/sftp.py +0 -0
  47. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/github.py +0 -0
  48. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/gitlab.py +0 -0
  49. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/google_drive.py +0 -0
  50. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/hubspot.py +0 -0
  51. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/jira.py +0 -0
  52. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/kafka.py +0 -0
  53. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/local.py +0 -0
  54. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/mongodb.py +0 -0
  55. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/notion.py +0 -0
  56. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/onedrive.py +0 -0
  57. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/opensearch.py +0 -0
  58. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/outlook.py +0 -0
  59. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/pinecone.py +0 -0
  60. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/qdrant.py +0 -0
  61. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/reddit.py +0 -0
  62. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/salesforce.py +0 -0
  63. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/sharepoint.py +0 -0
  64. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/slack.py +0 -0
  65. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/sql.py +0 -0
  66. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/vectara.py +0 -0
  67. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/weaviate.py +0 -0
  68. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/cmds/wikipedia.py +0 -0
  69. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/common.py +0 -0
  70. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/interfaces.py +0 -0
  71. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/cli/utils.py +0 -0
  72. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/__init__.py +0 -0
  73. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/airtable.py +0 -0
  74. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/astradb.py +0 -0
  75. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/azure_cognitive_search.py +0 -0
  76. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/biomed.py +0 -0
  77. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/chroma.py +0 -0
  78. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/clarifai.py +0 -0
  79. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/confluence.py +0 -0
  80. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/databricks_volumes.py +0 -0
  81. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/delta_table.py +0 -0
  82. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/discord.py +0 -0
  83. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/elasticsearch.py +0 -0
  84. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/__init__.py +0 -0
  85. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/azure.py +0 -0
  86. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/box.py +0 -0
  87. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/dropbox.py +0 -0
  88. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/fsspec.py +0 -0
  89. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/gcs.py +0 -0
  90. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/s3.py +0 -0
  91. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/fsspec/sftp.py +0 -0
  92. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/git.py +0 -0
  93. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/github.py +0 -0
  94. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/gitlab.py +0 -0
  95. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/google_drive.py +0 -0
  96. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/hubspot.py +0 -0
  97. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/jira.py +0 -0
  98. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/kafka.py +0 -0
  99. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/local.py +0 -0
  100. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/mongodb.py +0 -0
  101. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/__init__.py +0 -0
  102. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/client.py +0 -0
  103. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/connector.py +0 -0
  104. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/helpers.py +0 -0
  105. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/interfaces.py +0 -0
  106. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/__init__.py +0 -0
  107. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/block.py +0 -0
  108. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/__init__.py +0 -0
  109. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/bookmark.py +0 -0
  110. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/breadcrumb.py +0 -0
  111. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/bulleted_list_item.py +0 -0
  112. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/callout.py +0 -0
  113. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/child_database.py +0 -0
  114. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/child_page.py +0 -0
  115. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/code.py +0 -0
  116. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/column_list.py +0 -0
  117. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/divider.py +0 -0
  118. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/embed.py +0 -0
  119. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/equation.py +0 -0
  120. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/file.py +0 -0
  121. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/heading.py +0 -0
  122. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/image.py +0 -0
  123. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/link_preview.py +0 -0
  124. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/link_to_page.py +0 -0
  125. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/numbered_list.py +0 -0
  126. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/paragraph.py +0 -0
  127. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/pdf.py +0 -0
  128. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/quote.py +0 -0
  129. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/synced_block.py +0 -0
  130. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/table.py +0 -0
  131. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/table_of_contents.py +0 -0
  132. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/template.py +0 -0
  133. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/todo.py +0 -0
  134. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/toggle.py +0 -0
  135. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/unsupported.py +0 -0
  136. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/blocks/video.py +0 -0
  137. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database.py +0 -0
  138. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/__init__.py +0 -0
  139. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/checkbox.py +0 -0
  140. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/created_by.py +0 -0
  141. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/created_time.py +0 -0
  142. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/date.py +0 -0
  143. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/email.py +0 -0
  144. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/files.py +0 -0
  145. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/formula.py +0 -0
  146. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/last_edited_by.py +0 -0
  147. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/last_edited_time.py +0 -0
  148. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/multiselect.py +0 -0
  149. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/number.py +0 -0
  150. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/people.py +0 -0
  151. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/phone_number.py +0 -0
  152. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/relation.py +0 -0
  153. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/rich_text.py +0 -0
  154. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/rollup.py +0 -0
  155. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/select.py +0 -0
  156. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/status.py +0 -0
  157. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/title.py +0 -0
  158. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/unique_id.py +0 -0
  159. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/url.py +0 -0
  160. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/database_properties/verification.py +0 -0
  161. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/date.py +0 -0
  162. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/file.py +0 -0
  163. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/page.py +0 -0
  164. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/parent.py +0 -0
  165. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/rich_text.py +0 -0
  166. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/notion/types/user.py +0 -0
  167. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/onedrive.py +0 -0
  168. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/opensearch.py +0 -0
  169. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/outlook.py +0 -0
  170. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/pinecone.py +0 -0
  171. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/qdrant.py +0 -0
  172. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/reddit.py +0 -0
  173. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/registry.py +0 -0
  174. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/salesforce.py +0 -0
  175. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/sharepoint.py +0 -0
  176. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/slack.py +0 -0
  177. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/sql.py +0 -0
  178. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/vectara.py +0 -0
  179. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/weaviate.py +0 -0
  180. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/connector/wikipedia.py +0 -0
  181. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/enhanced_dataclass/__init__.py +0 -0
  182. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/enhanced_dataclass/core.py +0 -0
  183. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/enhanced_dataclass/dataclasses.py +0 -0
  184. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/enhanced_dataclass/json_mixin.py +0 -0
  185. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/error.py +0 -0
  186. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/evaluate.py +0 -0
  187. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/ingest_backoff/__init__.py +0 -0
  188. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/ingest_backoff/_common.py +0 -0
  189. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/ingest_backoff/_wrapper.py +0 -0
  190. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/interfaces.py +0 -0
  191. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/logger.py +0 -0
  192. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/main.py +0 -0
  193. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/__init__.py +0 -0
  194. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/copy.py +0 -0
  195. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/doc_factory.py +0 -0
  196. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/interfaces.py +0 -0
  197. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/partition.py +0 -0
  198. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/permissions.py +0 -0
  199. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/pipeline.py +0 -0
  200. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/reformat/__init__.py +0 -0
  201. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/reformat/chunking.py +0 -0
  202. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/reformat/embedding.py +0 -0
  203. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/source.py +0 -0
  204. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/utils.py +0 -0
  205. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/pipeline/write.py +0 -0
  206. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/processor.py +0 -0
  207. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/__init__.py +0 -0
  208. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/airtable.py +0 -0
  209. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/astradb.py +0 -0
  210. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/base_runner.py +0 -0
  211. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/biomed.py +0 -0
  212. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/confluence.py +0 -0
  213. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/delta_table.py +0 -0
  214. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/discord.py +0 -0
  215. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/elasticsearch.py +0 -0
  216. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/__init__.py +0 -0
  217. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/azure.py +0 -0
  218. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/box.py +0 -0
  219. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/dropbox.py +0 -0
  220. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/fsspec.py +0 -0
  221. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/gcs.py +0 -0
  222. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/s3.py +0 -0
  223. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/fsspec/sftp.py +0 -0
  224. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/github.py +0 -0
  225. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/gitlab.py +0 -0
  226. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/google_drive.py +0 -0
  227. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/hubspot.py +0 -0
  228. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/jira.py +0 -0
  229. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/kafka.py +0 -0
  230. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/local.py +0 -0
  231. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/mongodb.py +0 -0
  232. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/notion.py +0 -0
  233. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/onedrive.py +0 -0
  234. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/opensearch.py +0 -0
  235. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/outlook.py +0 -0
  236. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/reddit.py +0 -0
  237. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/salesforce.py +0 -0
  238. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/sharepoint.py +0 -0
  239. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/slack.py +0 -0
  240. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/utils.py +0 -0
  241. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/wikipedia.py +0 -0
  242. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/__init__.py +0 -0
  243. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/astradb.py +0 -0
  244. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/azure_cognitive_search.py +0 -0
  245. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/base_writer.py +0 -0
  246. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/chroma.py +0 -0
  247. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/clarifai.py +0 -0
  248. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/databricks_volumes.py +0 -0
  249. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/delta_table.py +0 -0
  250. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/elasticsearch.py +0 -0
  251. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/fsspec/__init__.py +0 -0
  252. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/fsspec/azure.py +0 -0
  253. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/fsspec/box.py +0 -0
  254. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/fsspec/dropbox.py +0 -0
  255. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/fsspec/gcs.py +0 -0
  256. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/fsspec/s3.py +0 -0
  257. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/kafka.py +0 -0
  258. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/mongodb.py +0 -0
  259. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/opensearch.py +0 -0
  260. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/pinecone.py +0 -0
  261. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/qdrant.py +0 -0
  262. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/sql.py +0 -0
  263. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/vectara.py +0 -0
  264. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/runner/writers/weaviate.py +0 -0
  265. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/__init__.py +0 -0
  266. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/chunking.py +0 -0
  267. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/compression.py +0 -0
  268. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/dep_check.py +0 -0
  269. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/google_filetype.py +0 -0
  270. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  271. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/utils/table.py +0 -0
  272. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/__init__.py +0 -0
  273. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/__init__.py +0 -0
  274. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/base/__init__.py +0 -0
  275. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/base/cmd.py +0 -0
  276. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/base/dest.py +0 -0
  277. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/base/importer.py +0 -0
  278. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/base/src.py +0 -0
  279. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/cli.py +0 -0
  280. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/cmds.py +0 -0
  281. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/utils/__init__.py +0 -0
  282. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/utils/click.py +0 -0
  283. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/cli/utils/model_conversion.py +0 -0
  284. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/__init__.py +0 -0
  285. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/connector.py +0 -0
  286. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/downloader.py +0 -0
  287. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/file_data.py +0 -0
  288. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/indexer.py +0 -0
  289. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/process.py +0 -0
  290. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/processor.py +0 -0
  291. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/upload_stager.py +0 -0
  292. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/interfaces/uploader.py +0 -0
  293. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/logger.py +0 -0
  294. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/main.py +0 -0
  295. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/otel.py +0 -0
  296. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/__init__.py +0 -0
  297. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/interfaces.py +0 -0
  298. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/otel.py +0 -0
  299. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/pipeline.py +0 -0
  300. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/__init__.py +0 -0
  301. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/chunk.py +0 -0
  302. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/download.py +0 -0
  303. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/embed.py +0 -0
  304. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/filter.py +0 -0
  305. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/index.py +0 -0
  306. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/partition.py +0 -0
  307. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/stage.py +0 -0
  308. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/uncompress.py +0 -0
  309. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/pipeline/steps/upload.py +0 -0
  310. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/__init__.py +0 -0
  311. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/chunker.py +0 -0
  312. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connector_registry.py +0 -0
  313. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/__init__.py +0 -0
  314. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/astradb.py +0 -0
  315. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/azure_cognitive_search.py +0 -0
  316. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/chroma.py +0 -0
  317. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/couchbase.py +0 -0
  318. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/databricks_volumes.py +0 -0
  319. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/elasticsearch.py +0 -0
  320. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/__init__.py +0 -0
  321. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/azure.py +0 -0
  322. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/box.py +0 -0
  323. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/dropbox.py +0 -0
  324. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/fsspec.py +0 -0
  325. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/gcs.py +0 -0
  326. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/s3.py +0 -0
  327. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/sftp.py +0 -0
  328. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/fsspec/utils.py +0 -0
  329. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/google_drive.py +0 -0
  330. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/kdbai.py +0 -0
  331. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/local.py +0 -0
  332. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/milvus.py +0 -0
  333. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/mongodb.py +0 -0
  334. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/onedrive.py +0 -0
  335. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/opensearch.py +0 -0
  336. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/salesforce.py +0 -0
  337. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/sharepoint.py +0 -0
  338. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/singlestore.py +0 -0
  339. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/sql.py +0 -0
  340. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/utils.py +0 -0
  341. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/connectors/weaviate.py +0 -0
  342. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/embedder.py +0 -0
  343. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/filter.py +0 -0
  344. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/processes/partitioner.py +0 -0
  345. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest/v2/utils.py +0 -0
  346. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest.egg-info/SOURCES.txt +0 -0
  347. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest.egg-info/dependency_links.txt +0 -0
  348. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest.egg-info/entry_points.txt +0 -0
  349. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest.egg-info/requires.txt +365 -365
  350. {unstructured-ingest-0.0.11 → unstructured-ingest-0.0.13}/unstructured_ingest.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.11
3
+ Version: 0.0.13
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -0,0 +1 @@
1
+ __version__ = "0.0.13" # pragma: no cover
@@ -15,14 +15,19 @@ def batch_generator(iterable, batch_size=100):
15
15
  chunk = tuple(itertools.islice(it, batch_size))
16
16
 
17
17
 
18
- def generator_batching_wbytes(iterable, batch_size_limit_bytes=15_000_000):
18
+ def generator_batching_wbytes(
19
+ iterable, batch_size_limit_bytes=15_000_000, max_batch_size: int = 1000
20
+ ):
19
21
  """A helper function to break an iterable into chunks of specified bytes."""
20
22
  current_batch, current_batch_size = [], 0
21
23
 
22
24
  for item in iterable:
23
25
  item_size_bytes = len(json.dumps(item).encode("utf-8"))
24
26
 
25
- if current_batch_size + item_size_bytes <= batch_size_limit_bytes:
27
+ if (
28
+ current_batch_size + item_size_bytes <= batch_size_limit_bytes
29
+ or len(current_batch) == 0 # prevent infinite yielding of empty batch
30
+ ) and len(current_batch) < max_batch_size:
26
31
  current_batch.append(item)
27
32
  current_batch_size += item_size_bytes
28
33
  else:
@@ -7,7 +7,7 @@ from typing import TYPE_CHECKING, Any, Optional
7
7
  from pydantic import Field, Secret
8
8
 
9
9
  from unstructured_ingest.error import DestinationConnectionError
10
- from unstructured_ingest.utils.data_prep import batch_generator, flatten_dict
10
+ from unstructured_ingest.utils.data_prep import flatten_dict, generator_batching_wbytes
11
11
  from unstructured_ingest.utils.dep_check import requires_dependencies
12
12
  from unstructured_ingest.v2.interfaces import (
13
13
  AccessConfig,
@@ -19,15 +19,14 @@ from unstructured_ingest.v2.interfaces import (
19
19
  UploadStagerConfig,
20
20
  )
21
21
  from unstructured_ingest.v2.logger import logger
22
- from unstructured_ingest.v2.processes.connector_registry import (
23
- DestinationRegistryEntry,
24
- )
22
+ from unstructured_ingest.v2.processes.connector_registry import DestinationRegistryEntry
25
23
 
26
24
  if TYPE_CHECKING:
27
25
  from pinecone import Index as PineconeIndex
28
26
 
29
27
 
30
28
  CONNECTOR_TYPE = "pinecone"
29
+ MAX_PAYLOAD_SIZE = 2 * 1024 * 1024 # 2MB
31
30
 
32
31
 
33
32
  class PineconeAccessConfig(AccessConfig):
@@ -69,6 +68,23 @@ class PineconeUploaderConfig(UploaderConfig):
69
68
  batch_size: int = Field(default=100, description="Number of records per batch")
70
69
 
71
70
 
71
+ ALLOWED_FIELDS = (
72
+ "element_id",
73
+ "text",
74
+ "parent_id",
75
+ "category_depth",
76
+ "emphasized_text_tags",
77
+ "emphasized_text_contents",
78
+ "coordinates",
79
+ "last_modified",
80
+ "page_number",
81
+ "filename",
82
+ "is_continuation",
83
+ "link_urls",
84
+ "link_texts",
85
+ )
86
+
87
+
72
88
  @dataclass
73
89
  class PineconeUploadStager(UploadStager):
74
90
  upload_stager_config: PineconeUploadStagerConfig = field(
@@ -77,22 +93,24 @@ class PineconeUploadStager(UploadStager):
77
93
 
78
94
  @staticmethod
79
95
  def conform_dict(element_dict: dict) -> dict:
80
- # While flatten_dict enables indexing on various fields,
81
- # element_serialized enables easily reloading the element object to memory.
82
- # element_serialized is formed without text/embeddings to avoid data bloating.
96
+ embeddings = element_dict.pop("embeddings", None)
97
+ metadata: dict[str, Any] = element_dict.pop("metadata", {})
98
+ data_source = metadata.pop("data_source", {})
99
+ coordinates = metadata.pop("coordinates", {})
100
+
101
+ element_dict.update(metadata)
102
+ element_dict.update(data_source)
103
+ element_dict.update(coordinates)
104
+
83
105
  return {
84
106
  "id": str(uuid.uuid4()),
85
- "values": element_dict.pop("embeddings", None),
86
- "metadata": {
87
- "text": element_dict.pop("text", None),
88
- "element_serialized": json.dumps(element_dict),
89
- **flatten_dict(
90
- element_dict,
91
- separator="-",
92
- flatten_lists=True,
93
- remove_none=True,
94
- ),
95
- },
107
+ "values": embeddings,
108
+ "metadata": flatten_dict(
109
+ {k: v for k, v in element_dict.items() if k in ALLOWED_FIELDS},
110
+ separator="-",
111
+ flatten_lists=True,
112
+ remove_none=True,
113
+ ),
96
114
  }
97
115
 
98
116
  def run(
@@ -150,9 +168,10 @@ class PineconeUploader(Uploader):
150
168
  f" with batch size {self.upload_config.batch_size}"
151
169
  )
152
170
 
153
- pinecone_batch_size = self.upload_config.batch_size
154
- for pinecone_batch in batch_generator(elements_dict, pinecone_batch_size):
155
- self.upsert_batch(batch=pinecone_batch)
171
+ for batch in generator_batching_wbytes(
172
+ elements_dict, MAX_PAYLOAD_SIZE - 100, self.upload_config.batch_size
173
+ ):
174
+ self.upsert_batch(batch=batch)
156
175
 
157
176
 
158
177
  pinecone_destination_entry = DestinationRegistryEntry(
@@ -43,11 +43,11 @@ class Uncompressor(BaseProcess, ABC):
43
43
  new_rel_download_path = str(f).replace(str(Path(local_filepath.parent)), "")[1:]
44
44
  new_file_data.source_identifiers = SourceIdentifiers(
45
45
  filename=f.name,
46
- fullpath=file_data.source_identifiers.fullpath.replace(
46
+ fullpath=str(file_data.source_identifiers.fullpath).replace(
47
47
  file_data.source_identifiers.filename, new_rel_download_path
48
48
  ),
49
49
  rel_path=(
50
- file_data.source_identifiers.rel_path.replace(
50
+ str(file_data.source_identifiers.rel_path).replace(
51
51
  file_data.source_identifiers.filename, new_rel_download_path
52
52
  )
53
53
  if file_data.source_identifiers.rel_path
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: unstructured-ingest
3
- Version: 0.0.11
3
+ Version: 0.0.13
4
4
  Summary: A library that prepares raw documents for downstream ML tasks.
5
5
  Home-page: https://github.com/Unstructured-IO/unstructured-ingest
6
6
  Author: Unstructured Technologies
@@ -1 +0,0 @@
1
- __version__ = "0.0.11" # pragma: no cover