unstructured-ingest 1.0.35__tar.gz → 1.0.37__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (240)
  1. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/PKG-INFO +1 -1
  2. unstructured_ingest-1.0.37/unstructured_ingest/__version__.py +1 -0
  3. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/fsspec.py +3 -4
  4. unstructured_ingest-1.0.37/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +110 -0
  5. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sharepoint.py +32 -4
  6. unstructured_ingest-1.0.35/unstructured_ingest/__version__.py +0 -1
  7. unstructured_ingest-1.0.35/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +0 -57
  8. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/.gitignore +0 -0
  9. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/LICENSE.md +0 -0
  10. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/README.md +0 -0
  11. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/pyproject.toml +0 -0
  12. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/__init__.py +0 -0
  13. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/README.md +0 -0
  14. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/__init__.py +0 -0
  15. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/base/__init__.py +0 -0
  16. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/base/cmd.py +0 -0
  17. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/base/dest.py +0 -0
  18. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/base/importer.py +0 -0
  19. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/base/src.py +0 -0
  20. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/cli.py +0 -0
  21. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/cmds.py +0 -0
  22. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/utils/__init__.py +0 -0
  23. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/utils/click.py +0 -0
  24. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/cli/utils/model_conversion.py +0 -0
  25. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/data_types/__init__.py +0 -0
  26. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/data_types/entities.py +0 -0
  27. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/data_types/file_data.py +0 -0
  28. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/__init__.py +0 -0
  29. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/azure_openai.py +0 -0
  30. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/bedrock.py +0 -0
  31. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/huggingface.py +0 -0
  32. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/interfaces.py +0 -0
  33. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  34. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/octoai.py +0 -0
  35. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/openai.py +0 -0
  36. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/togetherai.py +0 -0
  37. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/vertexai.py +0 -0
  38. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/embed/voyageai.py +0 -0
  39. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/error.py +0 -0
  40. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/errors_v2.py +0 -0
  41. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/__init__.py +0 -0
  42. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/connector.py +0 -0
  43. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/downloader.py +0 -0
  44. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/indexer.py +0 -0
  45. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/process.py +0 -0
  46. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/processor.py +0 -0
  47. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/upload_stager.py +0 -0
  48. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/interfaces/uploader.py +0 -0
  49. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/logger.py +0 -0
  50. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/main.py +0 -0
  51. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/otel.py +0 -0
  52. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/__init__.py +0 -0
  53. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/interfaces.py +0 -0
  54. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/otel.py +0 -0
  55. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/pipeline.py +0 -0
  56. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/__init__.py +0 -0
  57. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/chunk.py +0 -0
  58. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/download.py +0 -0
  59. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/embed.py +0 -0
  60. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/filter.py +0 -0
  61. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/index.py +0 -0
  62. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/partition.py +0 -0
  63. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/stage.py +0 -0
  64. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/uncompress.py +0 -0
  65. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/pipeline/steps/upload.py +0 -0
  66. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/__init__.py +0 -0
  67. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/chunker.py +0 -0
  68. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connector_registry.py +0 -0
  69. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/__init__.py +0 -0
  70. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/airtable.py +0 -0
  71. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/assets/__init__.py +0 -0
  72. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql +0 -0
  73. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json +0 -0
  74. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/astradb.py +0 -0
  75. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/azure_ai_search.py +0 -0
  76. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/chroma.py +0 -0
  77. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/confluence.py +0 -0
  78. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/couchbase.py +0 -0
  79. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/__init__.py +0 -0
  80. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/volumes.py +0 -0
  81. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/volumes_aws.py +0 -0
  82. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/volumes_azure.py +0 -0
  83. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/volumes_gcp.py +0 -0
  84. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/volumes_native.py +0 -0
  85. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/databricks/volumes_table.py +0 -0
  86. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/delta_table.py +0 -0
  87. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/discord.py +0 -0
  88. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/duckdb/__init__.py +0 -0
  89. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/duckdb/base.py +0 -0
  90. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/duckdb/duckdb.py +0 -0
  91. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/duckdb/motherduck.py +0 -0
  92. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/elasticsearch/__init__.py +0 -0
  93. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py +0 -0
  94. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/elasticsearch/opensearch.py +0 -0
  95. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/__init__.py +0 -0
  96. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/azure.py +0 -0
  97. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/box.py +0 -0
  98. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/dropbox.py +0 -0
  99. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/gcs.py +0 -0
  100. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/s3.py +0 -0
  101. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/sftp.py +0 -0
  102. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/fsspec/utils.py +0 -0
  103. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/github.py +0 -0
  104. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/gitlab.py +0 -0
  105. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/google_drive.py +0 -0
  106. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py +0 -0
  107. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +0 -0
  108. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/jira.py +0 -0
  109. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/kafka/__init__.py +0 -0
  110. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/kafka/cloud.py +0 -0
  111. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/kafka/kafka.py +0 -0
  112. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/kafka/local.py +0 -0
  113. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/kdbai.py +0 -0
  114. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/__init__.py +0 -0
  115. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/aws.py +0 -0
  116. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/azure.py +0 -0
  117. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/cloud.py +0 -0
  118. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/gcp.py +0 -0
  119. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/lancedb.py +0 -0
  120. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/lancedb/local.py +0 -0
  121. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/local.py +0 -0
  122. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/milvus.py +0 -0
  123. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/mongodb.py +0 -0
  124. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/neo4j.py +0 -0
  125. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/__init__.py +0 -0
  126. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/client.py +0 -0
  127. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/connector.py +0 -0
  128. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/helpers.py +0 -0
  129. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/ingest_backoff/__init__.py +0 -0
  130. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_common.py +0 -0
  131. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py +0 -0
  132. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +0 -0
  133. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/interfaces.py +0 -0
  134. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/__init__.py +0 -0
  135. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/block.py +0 -0
  136. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/__init__.py +0 -0
  137. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py +0 -0
  138. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py +0 -0
  139. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -0
  140. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/callout.py +0 -0
  141. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py +0 -0
  142. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py +0 -0
  143. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/code.py +0 -0
  144. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py +0 -0
  145. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/divider.py +0 -0
  146. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/embed.py +0 -0
  147. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/equation.py +0 -0
  148. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/file.py +0 -0
  149. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/heading.py +0 -0
  150. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/image.py +0 -0
  151. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py +0 -0
  152. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py +0 -0
  153. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py +0 -0
  154. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py +0 -0
  155. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py +0 -0
  156. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/quote.py +0 -0
  157. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/table.py +0 -0
  158. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py +0 -0
  159. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/template.py +0 -0
  160. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/todo.py +0 -0
  161. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py +0 -0
  162. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py +0 -0
  163. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/blocks/video.py +0 -0
  164. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database.py +0 -0
  165. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py +0 -0
  166. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py +0 -0
  167. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py +0 -0
  168. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py +0 -0
  169. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/date.py +0 -0
  170. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/email.py +0 -0
  171. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/files.py +0 -0
  172. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py +0 -0
  173. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -0
  174. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py +0 -0
  175. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py +0 -0
  176. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/number.py +0 -0
  177. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/people.py +0 -0
  178. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py +0 -0
  179. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py +0 -0
  180. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py +0 -0
  181. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py +0 -0
  182. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/select.py +0 -0
  183. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/status.py +0 -0
  184. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/title.py +0 -0
  185. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py +0 -0
  186. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/url.py +0 -0
  187. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py +0 -0
  188. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/date.py +0 -0
  189. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/file.py +0 -0
  190. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/page.py +0 -0
  191. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/parent.py +0 -0
  192. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/rich_text.py +0 -0
  193. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/notion/types/user.py +0 -0
  194. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/onedrive.py +0 -0
  195. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/outlook.py +0 -0
  196. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/pinecone.py +0 -0
  197. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/qdrant/__init__.py +0 -0
  198. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/qdrant/cloud.py +0 -0
  199. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/qdrant/local.py +0 -0
  200. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/qdrant/qdrant.py +0 -0
  201. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/qdrant/server.py +0 -0
  202. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/redisdb.py +0 -0
  203. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/salesforce.py +0 -0
  204. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/slack.py +0 -0
  205. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/__init__.py +0 -0
  206. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py +0 -0
  207. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/postgres.py +0 -0
  208. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/singlestore.py +0 -0
  209. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/snowflake.py +0 -0
  210. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/sql.py +0 -0
  211. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/sqlite.py +0 -0
  212. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/sql/vastdb.py +0 -0
  213. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/utils.py +0 -0
  214. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/vectara.py +0 -0
  215. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/weaviate/__init__.py +0 -0
  216. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/weaviate/cloud.py +0 -0
  217. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/weaviate/embedded.py +0 -0
  218. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/weaviate/local.py +0 -0
  219. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/weaviate/weaviate.py +0 -0
  220. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/zendesk/__init__.py +0 -0
  221. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/zendesk/client.py +0 -0
  222. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/connectors/zendesk/zendesk.py +0 -0
  223. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/embedder.py +0 -0
  224. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/filter.py +0 -0
  225. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/partitioner.py +0 -0
  226. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/uncompress.py +0 -0
  227. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/utils/__init__.py +0 -0
  228. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/processes/utils/blob_storage.py +0 -0
  229. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/unstructured_api.py +0 -0
  230. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/__init__.py +0 -0
  231. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/chunking.py +0 -0
  232. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/compression.py +0 -0
  233. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/constants.py +0 -0
  234. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/data_prep.py +0 -0
  235. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/dep_check.py +0 -0
  236. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/html.py +0 -0
  237. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/ndjson.py +0 -0
  238. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/pydantic_models.py +0 -0
  239. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  240. {unstructured_ingest-1.0.35 → unstructured_ingest-1.0.37}/unstructured_ingest/utils/table.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: unstructured_ingest
3
- Version: 1.0.35
3
+ Version: 1.0.37
4
4
  Summary: Local ETL data pipeline to get data RAG ready
5
5
  Author-email: Unstructured Technologies <devops@unstructuredai.io>
6
6
  License-Expression: Apache-2.0
@@ -0,0 +1 @@
1
+ __version__ = "1.0.37" # pragma: no cover
@@ -343,10 +343,9 @@ class FsspecUploader(Uploader):
343
343
  raise self.wrap_error(e=e)
344
344
 
345
345
  def get_upload_path(self, file_data: FileData) -> Path:
346
- upload_path = (
347
- Path(self.upload_config.path_without_protocol)
348
- / file_data.source_identifiers.relative_path.lstrip("/")
349
- )
346
+ upload_path = Path(
347
+ self.upload_config.path_without_protocol
348
+ ) / file_data.source_identifiers.relative_path.lstrip("/")
350
349
  updated_upload_path = upload_path.parent / f"{upload_path.name}.json"
351
350
  return updated_upload_path
352
351
 
@@ -0,0 +1,110 @@
1
+ # https://developers.notion.com/reference/block#synced-block
2
+ from dataclasses import dataclass, field
3
+ from typing import List, Optional
4
+
5
+ from htmlBuilder.tags import HtmlTag
6
+
7
+ from unstructured_ingest.processes.connectors.notion.interfaces import BlockBase
8
+
9
+
10
+ @dataclass
11
+ class OriginalSyncedBlock(BlockBase):
12
+ synced_from: Optional[str] = None
13
+ children: List[dict] = field(default_factory=list)
14
+
15
+ @staticmethod
16
+ def can_have_children() -> bool:
17
+ return True
18
+
19
+ @classmethod
20
+ def from_dict(cls, data: dict):
21
+ """Create OriginalSyncedBlock from dictionary data.
22
+
23
+ Original blocks contain children content.
24
+ """
25
+ if "children" not in data:
26
+ raise ValueError(f"OriginalSyncedBlock data missing 'children': {data}")
27
+ return cls(children=data["children"])
28
+
29
+ def get_html(self) -> Optional[HtmlTag]:
30
+ return None
31
+
32
+
33
+ @dataclass
34
+ class DuplicateSyncedBlock(BlockBase):
35
+ type: str
36
+ block_id: str
37
+
38
+ @staticmethod
39
+ def can_have_children() -> bool:
40
+ """Check if duplicate synced blocks can have children.
41
+
42
+ Duplicate blocks themselves don't have children directly fetched here,
43
+ but they represent content that does, so Notion API might report has_children=True
44
+ on the parent block object. The actual children are fetched from the original block.
45
+ """
46
+ return True
47
+
48
+ @classmethod
49
+ def from_dict(cls, data: dict):
50
+ """Create DuplicateSyncedBlock from dictionary data.
51
+
52
+ Duplicate blocks contain a 'synced_from' reference.
53
+ """
54
+ synced_from_data = data.get("synced_from")
55
+ if not synced_from_data or not isinstance(synced_from_data, dict):
56
+ raise ValueError(f"Invalid data structure for DuplicateSyncedBlock: {data}")
57
+ # Ensure required keys are present in the nested dictionary
58
+ if "type" not in synced_from_data or "block_id" not in synced_from_data:
59
+ raise ValueError(
60
+ f"Missing 'type' or 'block_id' in synced_from data: {synced_from_data}"
61
+ )
62
+ return cls(type=synced_from_data["type"], block_id=synced_from_data["block_id"])
63
+
64
+ def get_html(self) -> Optional[HtmlTag]:
65
+ """Get HTML representation of the duplicate synced block.
66
+
67
+ HTML representation might need fetching the original block's content,
68
+ which is outside the scope of this simple data class.
69
+ """
70
+ return None
71
+
72
+
73
+ class SyncBlock(BlockBase):
74
+ @staticmethod
75
+ def can_have_children() -> bool:
76
+ """Check if synced blocks can have children.
77
+
78
+ Synced blocks (both original and duplicate) can conceptually have children.
79
+ """
80
+ return True
81
+
82
+ @classmethod
83
+ def from_dict(cls, data: dict):
84
+ """Create appropriate SyncedBlock subclass from dictionary data.
85
+
86
+ Determine if it's a duplicate (has 'synced_from') or original (has 'children').
87
+ """
88
+ if data.get("synced_from") is not None:
89
+ # It's a duplicate block containing a reference
90
+ return DuplicateSyncedBlock.from_dict(data)
91
+ elif "children" in data:
92
+ # It's an original block containing children
93
+ return OriginalSyncedBlock.from_dict(data)
94
+ else:
95
+ # Handle cases where neither 'synced_from' nor 'children' are present.
96
+ # Notion API might return this for an empty original synced block.
97
+ # Let's treat it as an empty OriginalSyncedBlock.
98
+ # If this assumption is wrong, errors might occur later.
99
+ # Consider logging a warning here if strictness is needed.
100
+ return OriginalSyncedBlock(children=[])
101
+
102
+
103
+ def get_html(self) -> Optional[HtmlTag]:
104
+ """Get HTML representation of the synced block.
105
+
106
+ The specific instance returned by from_dict (Original or Duplicate)
107
+ will handle its own get_html logic.
108
+ This method on the base SyncBlock might not be directly called.
109
+ """
110
+ return None
@@ -29,6 +29,7 @@ from unstructured_ingest.utils.dep_check import requires_dependencies
29
29
 
30
30
  if TYPE_CHECKING:
31
31
  from office365.onedrive.driveitems.driveItem import DriveItem
32
+ from office365.onedrive.sites.site import Site
32
33
 
33
34
  CONNECTOR_TYPE = "sharepoint"
34
35
  LEGACY_DEFAULT_PATH = "Shared Documents"
@@ -51,6 +52,33 @@ class SharepointConnectionConfig(OnedriveConnectionConfig):
51
52
  https://[tenant]-admin.sharepoint.com.\
52
53
  This requires the app to be registered at a tenant level"
53
54
  )
55
+ library: Optional[str] = Field(
56
+ default=None,
57
+ description="Sharepoint library name. If not provided, the default \
58
+ drive will be used.",
59
+ )
60
+
61
+ def _get_drive_item(self, client_site: Site) -> DriveItem:
62
+ """Helper method to get the drive item for the specified library or default drive."""
63
+ site_drive_item = None
64
+ if self.library:
65
+ for drive in client_site.drives.get().execute_query():
66
+ if drive.name == self.library:
67
+ logger.info(f"Found the requested library: {self.library}")
68
+ site_drive_item = drive.get().execute_query().root
69
+ break
70
+
71
+ # If no specific library was found or requested, use the default drive
72
+ if not site_drive_item:
73
+ if self.library:
74
+ logger.warning(
75
+ f"Library '{self.library}' not found in site '{self.site}'. "
76
+ "Using the default drive instead."
77
+ )
78
+
79
+ site_drive_item = client_site.drive.get().execute_query().root
80
+
81
+ return site_drive_item
54
82
 
55
83
 
56
84
  class SharepointIndexerConfig(OnedriveIndexerConfig):
@@ -76,8 +104,8 @@ class SharepointIndexer(OnedriveIndexer):
76
104
 
77
105
  client = await asyncio.to_thread(self.connection_config.get_client)
78
106
  try:
79
- site = client.sites.get_by_url(self.connection_config.site).get().execute_query()
80
- site_drive_item = site.drive.get().execute_query().root
107
+ client_site = client.sites.get_by_url(self.connection_config.site).get().execute_query()
108
+ site_drive_item = self.connection_config._get_drive_item(client_site)
81
109
  except ClientRequestException:
82
110
  logger.info("Site not found")
83
111
 
@@ -118,8 +146,8 @@ class SharepointDownloader(OnedriveDownloader):
118
146
  client = self.connection_config.get_client()
119
147
 
120
148
  try:
121
- site = client.sites.get_by_url(self.connection_config.site).get().execute_query()
122
- site_drive_item = site.drive.get().execute_query().root
149
+ client_site = client.sites.get_by_url(self.connection_config.site).get().execute_query()
150
+ site_drive_item = self.connection_config._get_drive_item(client_site)
123
151
  except ClientRequestException:
124
152
  logger.info("Site not found")
125
153
  file = site_drive_item.get_by_path(server_relative_path).get().execute_query()
@@ -1 +0,0 @@
1
- __version__ = "1.0.35" # pragma: no cover
@@ -1,57 +0,0 @@
1
- # https://developers.notion.com/reference/block#synced-block
2
- from dataclasses import dataclass, field
3
- from typing import List, Optional
4
-
5
- from htmlBuilder.tags import HtmlTag
6
-
7
- from unstructured_ingest.processes.connectors.notion.interfaces import BlockBase
8
-
9
-
10
- @dataclass
11
- class OriginalSyncedBlock(BlockBase):
12
- synced_from: Optional[str] = None
13
- children: List[dict] = field(default_factory=list)
14
-
15
- @staticmethod
16
- def can_have_children() -> bool:
17
- return True
18
-
19
- @classmethod
20
- def from_dict(cls, data: dict):
21
- return cls(children=data["children"])
22
-
23
- def get_html(self) -> Optional[HtmlTag]:
24
- return None
25
-
26
-
27
- @dataclass
28
- class DuplicateSyncedBlock(BlockBase):
29
- type: str
30
- block_id: str
31
-
32
- @staticmethod
33
- def can_have_children() -> bool:
34
- return True
35
-
36
- @classmethod
37
- def from_dict(cls, data: dict):
38
- return cls(**data)
39
-
40
- def get_html(self) -> Optional[HtmlTag]:
41
- return None
42
-
43
-
44
- class SyncBlock(BlockBase):
45
- @staticmethod
46
- def can_have_children() -> bool:
47
- return True
48
-
49
- @classmethod
50
- def from_dict(cls, data: dict):
51
- if "synced_from" in data:
52
- return OriginalSyncedBlock.from_dict(data)
53
- else:
54
- return DuplicateSyncedBlock.from_dict(data)
55
-
56
- def get_html(self) -> Optional[HtmlTag]:
57
- return None