unstructured-ingest 1.1.2__tar.gz → 1.2.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (243)
  1. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/PKG-INFO +2 -3
  2. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/pyproject.toml +1 -10
  3. unstructured_ingest-1.2.0/unstructured_ingest/__version__.py +1 -0
  4. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/otel.py +10 -8
  5. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py +6 -19
  6. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/fsspec.py +1 -1
  7. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/filesystem.py +4 -4
  8. unstructured_ingest-1.1.2/unstructured_ingest/__version__.py +0 -1
  9. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/.gitignore +0 -0
  10. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/LICENSE.md +0 -0
  11. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/README.md +0 -0
  12. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/__init__.py +0 -0
  13. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/README.md +0 -0
  14. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/__init__.py +0 -0
  15. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/base/__init__.py +0 -0
  16. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/base/cmd.py +0 -0
  17. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/base/dest.py +0 -0
  18. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/base/importer.py +0 -0
  19. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/base/src.py +0 -0
  20. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/cli.py +0 -0
  21. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/cmds.py +0 -0
  22. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/utils/__init__.py +0 -0
  23. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/utils/click.py +0 -0
  24. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/cli/utils/model_conversion.py +0 -0
  25. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/data_types/__init__.py +0 -0
  26. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/data_types/entities.py +0 -0
  27. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/data_types/file_data.py +0 -0
  28. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/__init__.py +0 -0
  29. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/azure_openai.py +0 -0
  30. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/bedrock.py +0 -0
  31. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/huggingface.py +0 -0
  32. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/interfaces.py +0 -0
  33. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  34. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/octoai.py +0 -0
  35. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/openai.py +0 -0
  36. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/togetherai.py +0 -0
  37. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/vertexai.py +0 -0
  38. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/embed/voyageai.py +0 -0
  39. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/error.py +0 -0
  40. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/errors_v2.py +0 -0
  41. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/__init__.py +0 -0
  42. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/connector.py +0 -0
  43. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/downloader.py +0 -0
  44. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/indexer.py +0 -0
  45. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/process.py +0 -0
  46. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/processor.py +0 -0
  47. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/upload_stager.py +0 -0
  48. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/interfaces/uploader.py +0 -0
  49. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/logger.py +0 -0
  50. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/main.py +0 -0
  51. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/__init__.py +0 -0
  52. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/interfaces.py +0 -0
  53. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/otel.py +0 -0
  54. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/pipeline.py +0 -0
  55. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/__init__.py +0 -0
  56. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/chunk.py +0 -0
  57. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/download.py +0 -0
  58. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/embed.py +0 -0
  59. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/filter.py +0 -0
  60. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/index.py +0 -0
  61. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/partition.py +0 -0
  62. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/stage.py +0 -0
  63. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/uncompress.py +0 -0
  64. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/pipeline/steps/upload.py +0 -0
  65. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/__init__.py +0 -0
  66. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/chunker.py +0 -0
  67. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connector_registry.py +0 -0
  68. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/__init__.py +0 -0
  69. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/airtable.py +0 -0
  70. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/assets/__init__.py +0 -0
  71. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql +0 -0
  72. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json +0 -0
  73. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/astradb.py +0 -0
  74. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/azure_ai_search.py +0 -0
  75. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/chroma.py +0 -0
  76. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/confluence.py +0 -0
  77. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/couchbase.py +0 -0
  78. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/__init__.py +0 -0
  79. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/volumes.py +0 -0
  80. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/volumes_aws.py +0 -0
  81. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/volumes_azure.py +0 -0
  82. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/volumes_gcp.py +0 -0
  83. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/volumes_native.py +0 -0
  84. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/databricks/volumes_table.py +0 -0
  85. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/delta_table.py +0 -0
  86. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/discord.py +0 -0
  87. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/duckdb/__init__.py +0 -0
  88. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/duckdb/base.py +0 -0
  89. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/duckdb/duckdb.py +0 -0
  90. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/duckdb/motherduck.py +0 -0
  91. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/elasticsearch/__init__.py +0 -0
  92. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/elasticsearch/opensearch.py +0 -0
  93. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/__init__.py +0 -0
  94. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/azure.py +0 -0
  95. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/box.py +0 -0
  96. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/dropbox.py +0 -0
  97. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/gcs.py +0 -0
  98. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/s3.py +0 -0
  99. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/sftp.py +0 -0
  100. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/fsspec/utils.py +0 -0
  101. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/github.py +0 -0
  102. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/gitlab.py +0 -0
  103. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/google_drive.py +0 -0
  104. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py +0 -0
  105. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +0 -0
  106. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/jira.py +0 -0
  107. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/kafka/__init__.py +0 -0
  108. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/kafka/cloud.py +0 -0
  109. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/kafka/kafka.py +0 -0
  110. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/kafka/local.py +0 -0
  111. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/kdbai.py +0 -0
  112. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/__init__.py +0 -0
  113. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/aws.py +0 -0
  114. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/azure.py +0 -0
  115. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/cloud.py +0 -0
  116. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/gcp.py +0 -0
  117. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/lancedb.py +0 -0
  118. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/lancedb/local.py +0 -0
  119. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/local.py +0 -0
  120. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/milvus.py +0 -0
  121. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/mongodb.py +0 -0
  122. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/neo4j.py +0 -0
  123. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/__init__.py +0 -0
  124. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/client.py +0 -0
  125. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/connector.py +0 -0
  126. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/helpers.py +0 -0
  127. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/ingest_backoff/__init__.py +0 -0
  128. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_common.py +0 -0
  129. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py +0 -0
  130. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +0 -0
  131. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/interfaces.py +0 -0
  132. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/__init__.py +0 -0
  133. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/block.py +0 -0
  134. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/__init__.py +0 -0
  135. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py +0 -0
  136. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py +0 -0
  137. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -0
  138. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/callout.py +0 -0
  139. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py +0 -0
  140. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py +0 -0
  141. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/code.py +0 -0
  142. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py +0 -0
  143. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/divider.py +0 -0
  144. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/embed.py +0 -0
  145. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/equation.py +0 -0
  146. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/file.py +0 -0
  147. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/heading.py +0 -0
  148. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/image.py +0 -0
  149. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py +0 -0
  150. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py +0 -0
  151. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py +0 -0
  152. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py +0 -0
  153. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py +0 -0
  154. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/quote.py +0 -0
  155. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +0 -0
  156. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/table.py +0 -0
  157. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py +0 -0
  158. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/template.py +0 -0
  159. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/todo.py +0 -0
  160. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py +0 -0
  161. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py +0 -0
  162. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/blocks/video.py +0 -0
  163. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database.py +0 -0
  164. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py +0 -0
  165. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py +0 -0
  166. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py +0 -0
  167. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py +0 -0
  168. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/date.py +0 -0
  169. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/email.py +0 -0
  170. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/files.py +0 -0
  171. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py +0 -0
  172. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -0
  173. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py +0 -0
  174. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py +0 -0
  175. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/number.py +0 -0
  176. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/people.py +0 -0
  177. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py +0 -0
  178. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py +0 -0
  179. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py +0 -0
  180. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py +0 -0
  181. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/select.py +0 -0
  182. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/status.py +0 -0
  183. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/title.py +0 -0
  184. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py +0 -0
  185. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/url.py +0 -0
  186. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py +0 -0
  187. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/date.py +0 -0
  188. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/file.py +0 -0
  189. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/page.py +0 -0
  190. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/parent.py +0 -0
  191. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/rich_text.py +0 -0
  192. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/notion/types/user.py +0 -0
  193. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/onedrive.py +0 -0
  194. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/outlook.py +0 -0
  195. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/pinecone.py +0 -0
  196. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/qdrant/__init__.py +0 -0
  197. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/qdrant/cloud.py +0 -0
  198. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/qdrant/local.py +0 -0
  199. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/qdrant/qdrant.py +0 -0
  200. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/qdrant/server.py +0 -0
  201. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/redisdb.py +0 -0
  202. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/salesforce.py +0 -0
  203. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sharepoint.py +0 -0
  204. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/slack.py +0 -0
  205. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/__init__.py +0 -0
  206. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py +0 -0
  207. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/postgres.py +0 -0
  208. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/singlestore.py +0 -0
  209. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/snowflake.py +0 -0
  210. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/sql.py +0 -0
  211. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/sqlite.py +0 -0
  212. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/sql/vastdb.py +0 -0
  213. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/utils.py +0 -0
  214. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/vectara.py +0 -0
  215. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/weaviate/__init__.py +0 -0
  216. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/weaviate/cloud.py +0 -0
  217. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/weaviate/embedded.py +0 -0
  218. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/weaviate/local.py +0 -0
  219. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/weaviate/weaviate.py +0 -0
  220. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/zendesk/__init__.py +0 -0
  221. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/zendesk/client.py +0 -0
  222. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/connectors/zendesk/zendesk.py +0 -0
  223. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/embedder.py +0 -0
  224. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/filter.py +0 -0
  225. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/partitioner.py +0 -0
  226. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/uncompress.py +0 -0
  227. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/utils/__init__.py +0 -0
  228. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/utils/blob_storage.py +0 -0
  229. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/utils/logging/connector.py +0 -0
  230. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/processes/utils/logging/sanitizer.py +0 -0
  231. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/unstructured_api.py +0 -0
  232. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/__init__.py +0 -0
  233. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/chunking.py +0 -0
  234. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/compression.py +0 -0
  235. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/constants.py +0 -0
  236. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/data_prep.py +0 -0
  237. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/dep_check.py +0 -0
  238. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/html.py +0 -0
  239. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/ndjson.py +0 -0
  240. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/pydantic_models.py +0 -0
  241. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  242. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/table.py +0 -0
  243. {unstructured_ingest-1.1.2 → unstructured_ingest-1.2.0}/unstructured_ingest/utils/tls.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: unstructured_ingest
3
- Version: 1.1.2
3
+ Version: 1.2.0
4
4
  Summary: Local ETL data pipeline to get data RAG ready
5
5
  Author-email: Unstructured Technologies <devops@unstructuredai.io>
6
6
  License-Expression: Apache-2.0
@@ -12,12 +12,11 @@ Classifier: Intended Audience :: Science/Research
12
12
  Classifier: License :: OSI Approved :: Apache Software License
13
13
  Classifier: Operating System :: OS Independent
14
14
  Classifier: Programming Language :: Python :: 3
15
- Classifier: Programming Language :: Python :: 3.9
16
15
  Classifier: Programming Language :: Python :: 3.10
17
16
  Classifier: Programming Language :: Python :: 3.11
18
17
  Classifier: Programming Language :: Python :: 3.12
19
18
  Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
20
- Requires-Python: <3.13,>=3.9
19
+ Requires-Python: <3.13,>=3.10
21
20
  Requires-Dist: certifi>=2025.7.14
22
21
  Requires-Dist: click
23
22
  Requires-Dist: opentelemetry-sdk
@@ -1,7 +1,7 @@
1
1
  [project]
2
2
  name = "unstructured_ingest"
3
3
  description = "Local ETL data pipeline to get data RAG ready"
4
- requires-python = ">=3.9, <3.13"
4
+ requires-python = ">=3.10, <3.13"
5
5
  authors = [{name = "Unstructured Technologies", email = "devops@unstructuredai.io"}]
6
6
  classifiers = [
7
7
  "Development Status :: 4 - Beta",
@@ -11,7 +11,6 @@ classifiers = [
11
11
  "License :: OSI Approved :: Apache Software License",
12
12
  "Operating System :: OS Independent",
13
13
  "Programming Language :: Python :: 3",
14
- "Programming Language :: Python :: 3.9",
15
14
  "Programming Language :: Python :: 3.10",
16
15
  "Programming Language :: Python :: 3.11",
17
16
  "Programming Language :: Python :: 3.12",
@@ -147,21 +146,13 @@ test = [
147
146
  ]
148
147
  # Add constraints needed for CI
149
148
  ci = [
150
- # consistency with local-inference-pin
151
- "protobuf<4.24",
152
149
  "grpcio>=1.65.5",
153
150
  # TODO: Pinned in transformers package, remove when that gets updated
154
151
  "tokenizers>=0.19,<0.20",
155
- # TODO: Constaint due to boto, with python before 3.10 not requiring openssl 1.1.1, remove when that gets
156
- # updated or we drop support for 3.9
157
- "urllib3<1.27",
158
152
  # TODO: Constriant due to aiobotocore, remove when that gets updates:
159
153
  "botocore<1.34.132",
160
154
  # TODO: Constriant due to both 8.5.0 and 8.4.0 being installed during pip-compile
161
155
  "importlib-metadata>=8.5.0",
162
- # TODO: Constraint due to boto, with python before 3.10 not requiring openssl 1.1.1, remove when that gets
163
- # updated or we drop support for 3.9
164
- "urllib3<1.27",
165
156
  "unstructured-client>= 0.25.8",
166
157
  "fsspec==2024.5.0",
167
158
  # python 3.12 support
@@ -0,0 +1 @@
1
+ __version__ = "1.2.0" # pragma: no cover
@@ -32,21 +32,23 @@ class LogSpanExporter(ConsoleSpanExporter):
32
32
  self.log_out(self.formatter(span))
33
33
  return SpanExportResult.SUCCESS
34
34
 
35
+
35
36
  def get_log_out() -> Callable:
36
37
  level_names_mapping = {
37
- 'CRITICAL': logging.CRITICAL,
38
- 'FATAL': logging.FATAL,
39
- 'ERROR': logging.ERROR,
40
- 'WARN': logging.WARNING,
41
- 'WARNING': logging.WARNING,
42
- 'INFO': logging.INFO,
43
- 'DEBUG': logging.DEBUG,
44
- 'NOTSET': logging.NOTSET,
38
+ "CRITICAL": logging.CRITICAL,
39
+ "FATAL": logging.FATAL,
40
+ "ERROR": logging.ERROR,
41
+ "WARN": logging.WARNING,
42
+ "WARNING": logging.WARNING,
43
+ "INFO": logging.INFO,
44
+ "DEBUG": logging.DEBUG,
45
+ "NOTSET": logging.NOTSET,
45
46
  }
46
47
  log_level = os.getenv("OTEL_LOG_LEVEL", "DEBUG").upper()
47
48
  log_level_int = level_names_mapping.get(log_level, logging.DEBUG)
48
49
  return lambda message: logger.log(log_level_int, message)
49
50
 
51
+
50
52
  @dataclass
51
53
  class OtelHandler:
52
54
  otel_endpoint: Optional[str] = None
@@ -19,7 +19,6 @@ from unstructured_ingest.error import (
19
19
  DestinationConnectionError,
20
20
  SourceConnectionError,
21
21
  SourceConnectionNetworkError,
22
- WriteError,
23
22
  )
24
23
  from unstructured_ingest.interfaces import (
25
24
  AccessConfig,
@@ -336,6 +335,8 @@ class ElasticsearchUploadStager(UploadStager):
336
335
 
337
336
  def conform_dict(self, element_dict: dict, file_data: FileData) -> dict:
338
337
  data = element_dict.copy()
338
+ # when _op_type is not specified, it defaults to "index":
339
+ # Overwrites if exists, creates if not.
339
340
  resp = {
340
341
  "_index": self.upload_stager_config.index_name,
341
342
  "_id": get_enhanced_element_id(element_dict=data, file_data=file_data),
@@ -397,23 +398,6 @@ class ElasticsearchUploader(Uploader):
397
398
 
398
399
  return parallel_bulk
399
400
 
400
- def delete_by_record_id(self, client, file_data: FileData) -> None:
401
- logger.debug(
402
- f"deleting any content with metadata {RECORD_ID_LABEL}={file_data.identifier} "
403
- f"from {self.upload_config.index_name} index"
404
- )
405
- delete_resp = client.delete_by_query(
406
- index=self.upload_config.index_name,
407
- body={"query": {"match": {self.upload_config.record_id_key: file_data.identifier}}},
408
- )
409
- logger.info(
410
- "deleted {} records from index {}".format(
411
- delete_resp["deleted"], self.upload_config.index_name
412
- )
413
- )
414
- if failures := delete_resp.get("failures"):
415
- raise WriteError(f"failed to delete records: {failures}")
416
-
417
401
  @requires_dependencies(["elasticsearch"], extras="elasticsearch")
418
402
  def run_data(self, data: list[dict], file_data: FileData, **kwargs: Any) -> None: # noqa: E501
419
403
  from elasticsearch.helpers.errors import BulkIndexError
@@ -429,7 +413,6 @@ class ElasticsearchUploader(Uploader):
429
413
  )
430
414
 
431
415
  with self.connection_config.get_client() as client:
432
- self.delete_by_record_id(client=client, file_data=file_data)
433
416
  if not client.indices.exists(index=self.upload_config.index_name):
434
417
  logger.warning(
435
418
  f"{(self.__class__.__name__).replace('Uploader', '')} index does not exist: "
@@ -446,6 +429,10 @@ class ElasticsearchUploader(Uploader):
446
429
  thread_count=self.upload_config.num_threads,
447
430
  )
448
431
  collections.deque(iterator, maxlen=0)
432
+ logger.info(
433
+ f"uploaded batch of {len(batch)} elements to index "
434
+ f"{self.upload_config.index_name}"
435
+ )
449
436
  except BulkIndexError as e:
450
437
  sanitized_errors = [
451
438
  self._sanitize_bulk_index_error(error) for error in e.errors
@@ -385,7 +385,7 @@ class FsspecUploader(Uploader):
385
385
 
386
386
  def __post_init__(self):
387
387
  super().__post_init__()
388
- # TODO once python3.9 no longer supported and kw_only is allowed in dataclasses, remove:
388
+ # TODO: Consider using `kw_only` instead
389
389
  if not self.upload_config:
390
390
  raise TypeError(
391
391
  f"{self.__class__.__name__}.__init__() "
@@ -11,12 +11,12 @@ from pathlib import Path
11
11
  def mkdir_concurrent_safe(path: Path) -> None:
12
12
  """
13
13
  Create directory safely in concurrent environments, handling race conditions.
14
-
14
+
15
15
  This addresses the issue where Path.mkdir(parents=True, exist_ok=True) can still
16
- raise FileExistsError when multiple processes attempt to create overlapping
16
+ raise FileExistsError when multiple processes attempt to create overlapping
17
17
  directory structures simultaneously. In this codebase, this occurs when multiple
18
18
  files are being downloaded in parallel and archive extraction is happening in parallel.
19
-
19
+
20
20
  Related: https://github.com/python/cpython/pull/112966/files
21
21
  Python core team used the same approach to fix zipfile race conditions.
22
22
  """
@@ -24,4 +24,4 @@ def mkdir_concurrent_safe(path: Path) -> None:
24
24
  path.mkdir(parents=True, exist_ok=True)
25
25
  except FileExistsError:
26
26
  if not (path.exists() and path.is_dir()):
27
- raise
27
+ raise
@@ -1 +0,0 @@
1
- __version__ = "1.1.2" # pragma: no cover