unstructured-ingest 1.0.47__tar.gz → 1.0.48__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of unstructured-ingest might be problematic. Click here for more details.

Files changed (239)
  1. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/PKG-INFO +1 -1
  2. unstructured_ingest-1.0.48/unstructured_ingest/__version__.py +1 -0
  3. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/jira.py +61 -21
  4. unstructured_ingest-1.0.47/unstructured_ingest/__version__.py +0 -1
  5. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/.gitignore +0 -0
  6. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/LICENSE.md +0 -0
  7. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/README.md +0 -0
  8. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/pyproject.toml +0 -0
  9. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/__init__.py +0 -0
  10. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/README.md +0 -0
  11. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/__init__.py +0 -0
  12. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/base/__init__.py +0 -0
  13. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/base/cmd.py +0 -0
  14. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/base/dest.py +0 -0
  15. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/base/importer.py +0 -0
  16. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/base/src.py +0 -0
  17. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/cli.py +0 -0
  18. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/cmds.py +0 -0
  19. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/utils/__init__.py +0 -0
  20. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/utils/click.py +0 -0
  21. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/cli/utils/model_conversion.py +0 -0
  22. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/data_types/__init__.py +0 -0
  23. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/data_types/entities.py +0 -0
  24. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/data_types/file_data.py +0 -0
  25. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/__init__.py +0 -0
  26. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/azure_openai.py +0 -0
  27. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/bedrock.py +0 -0
  28. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/huggingface.py +0 -0
  29. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/interfaces.py +0 -0
  30. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/mixedbreadai.py +0 -0
  31. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/octoai.py +0 -0
  32. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/openai.py +0 -0
  33. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/togetherai.py +0 -0
  34. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/vertexai.py +0 -0
  35. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/embed/voyageai.py +0 -0
  36. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/error.py +0 -0
  37. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/errors_v2.py +0 -0
  38. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/__init__.py +0 -0
  39. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/connector.py +0 -0
  40. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/downloader.py +0 -0
  41. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/indexer.py +0 -0
  42. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/process.py +0 -0
  43. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/processor.py +0 -0
  44. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/upload_stager.py +0 -0
  45. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/interfaces/uploader.py +0 -0
  46. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/logger.py +0 -0
  47. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/main.py +0 -0
  48. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/otel.py +0 -0
  49. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/__init__.py +0 -0
  50. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/interfaces.py +0 -0
  51. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/otel.py +0 -0
  52. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/pipeline.py +0 -0
  53. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/__init__.py +0 -0
  54. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/chunk.py +0 -0
  55. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/download.py +0 -0
  56. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/embed.py +0 -0
  57. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/filter.py +0 -0
  58. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/index.py +0 -0
  59. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/partition.py +0 -0
  60. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/stage.py +0 -0
  61. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/uncompress.py +0 -0
  62. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/pipeline/steps/upload.py +0 -0
  63. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/__init__.py +0 -0
  64. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/chunker.py +0 -0
  65. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connector_registry.py +0 -0
  66. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/__init__.py +0 -0
  67. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/airtable.py +0 -0
  68. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/assets/__init__.py +0 -0
  69. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/assets/databricks_delta_table_schema.sql +0 -0
  70. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/assets/weaviate_collection_config.json +0 -0
  71. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/astradb.py +0 -0
  72. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/azure_ai_search.py +0 -0
  73. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/chroma.py +0 -0
  74. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/confluence.py +0 -0
  75. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/couchbase.py +0 -0
  76. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/__init__.py +0 -0
  77. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/volumes.py +0 -0
  78. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/volumes_aws.py +0 -0
  79. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/volumes_azure.py +0 -0
  80. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/volumes_gcp.py +0 -0
  81. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/volumes_native.py +0 -0
  82. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/databricks/volumes_table.py +0 -0
  83. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/delta_table.py +0 -0
  84. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/discord.py +0 -0
  85. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/duckdb/__init__.py +0 -0
  86. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/duckdb/base.py +0 -0
  87. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/duckdb/duckdb.py +0 -0
  88. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/duckdb/motherduck.py +0 -0
  89. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/elasticsearch/__init__.py +0 -0
  90. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/elasticsearch/elasticsearch.py +0 -0
  91. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/elasticsearch/opensearch.py +0 -0
  92. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/__init__.py +0 -0
  93. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/azure.py +0 -0
  94. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/box.py +0 -0
  95. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/dropbox.py +0 -0
  96. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/fsspec.py +0 -0
  97. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/gcs.py +0 -0
  98. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/s3.py +0 -0
  99. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/sftp.py +0 -0
  100. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/fsspec/utils.py +0 -0
  101. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/github.py +0 -0
  102. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/gitlab.py +0 -0
  103. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/google_drive.py +0 -0
  104. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/ibm_watsonx/__init__.py +0 -0
  105. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/ibm_watsonx/ibm_watsonx_s3.py +0 -0
  106. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/kafka/__init__.py +0 -0
  107. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/kafka/cloud.py +0 -0
  108. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/kafka/kafka.py +0 -0
  109. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/kafka/local.py +0 -0
  110. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/kdbai.py +0 -0
  111. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/__init__.py +0 -0
  112. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/aws.py +0 -0
  113. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/azure.py +0 -0
  114. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/cloud.py +0 -0
  115. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/gcp.py +0 -0
  116. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/lancedb.py +0 -0
  117. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/lancedb/local.py +0 -0
  118. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/local.py +0 -0
  119. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/milvus.py +0 -0
  120. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/mongodb.py +0 -0
  121. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/neo4j.py +0 -0
  122. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/__init__.py +0 -0
  123. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/client.py +0 -0
  124. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/connector.py +0 -0
  125. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/helpers.py +0 -0
  126. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/ingest_backoff/__init__.py +0 -0
  127. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_common.py +0 -0
  128. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/ingest_backoff/_wrapper.py +0 -0
  129. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/ingest_backoff/types.py +0 -0
  130. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/interfaces.py +0 -0
  131. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/__init__.py +0 -0
  132. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/block.py +0 -0
  133. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/__init__.py +0 -0
  134. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/bookmark.py +0 -0
  135. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/breadcrumb.py +0 -0
  136. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/bulleted_list_item.py +0 -0
  137. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/callout.py +0 -0
  138. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/child_database.py +0 -0
  139. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/child_page.py +0 -0
  140. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/code.py +0 -0
  141. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/column_list.py +0 -0
  142. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/divider.py +0 -0
  143. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/embed.py +0 -0
  144. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/equation.py +0 -0
  145. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/file.py +0 -0
  146. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/heading.py +0 -0
  147. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/image.py +0 -0
  148. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/link_preview.py +0 -0
  149. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/link_to_page.py +0 -0
  150. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/numbered_list.py +0 -0
  151. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/paragraph.py +0 -0
  152. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/pdf.py +0 -0
  153. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/quote.py +0 -0
  154. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/synced_block.py +0 -0
  155. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/table.py +0 -0
  156. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/table_of_contents.py +0 -0
  157. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/template.py +0 -0
  158. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/todo.py +0 -0
  159. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/toggle.py +0 -0
  160. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/unsupported.py +0 -0
  161. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/blocks/video.py +0 -0
  162. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database.py +0 -0
  163. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/__init__.py +0 -0
  164. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/checkbox.py +0 -0
  165. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_by.py +0 -0
  166. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/created_time.py +0 -0
  167. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/date.py +0 -0
  168. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/email.py +0 -0
  169. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/files.py +0 -0
  170. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/formula.py +0 -0
  171. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_by.py +0 -0
  172. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/last_edited_time.py +0 -0
  173. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/multiselect.py +0 -0
  174. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/number.py +0 -0
  175. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/people.py +0 -0
  176. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/phone_number.py +0 -0
  177. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/relation.py +0 -0
  178. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/rich_text.py +0 -0
  179. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/rollup.py +0 -0
  180. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/select.py +0 -0
  181. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/status.py +0 -0
  182. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/title.py +0 -0
  183. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/unique_id.py +0 -0
  184. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/url.py +0 -0
  185. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/database_properties/verification.py +0 -0
  186. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/date.py +0 -0
  187. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/file.py +0 -0
  188. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/page.py +0 -0
  189. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/parent.py +0 -0
  190. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/rich_text.py +0 -0
  191. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/notion/types/user.py +0 -0
  192. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/onedrive.py +0 -0
  193. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/outlook.py +0 -0
  194. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/pinecone.py +0 -0
  195. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/qdrant/__init__.py +0 -0
  196. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/qdrant/cloud.py +0 -0
  197. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/qdrant/local.py +0 -0
  198. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/qdrant/qdrant.py +0 -0
  199. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/qdrant/server.py +0 -0
  200. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/redisdb.py +0 -0
  201. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/salesforce.py +0 -0
  202. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sharepoint.py +0 -0
  203. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/slack.py +0 -0
  204. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/__init__.py +0 -0
  205. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/databricks_delta_tables.py +0 -0
  206. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/postgres.py +0 -0
  207. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/singlestore.py +0 -0
  208. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/snowflake.py +0 -0
  209. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/sql.py +0 -0
  210. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/sqlite.py +0 -0
  211. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/sql/vastdb.py +0 -0
  212. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/utils.py +0 -0
  213. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/vectara.py +0 -0
  214. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/weaviate/__init__.py +0 -0
  215. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/weaviate/cloud.py +0 -0
  216. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/weaviate/embedded.py +0 -0
  217. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/weaviate/local.py +0 -0
  218. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/weaviate/weaviate.py +0 -0
  219. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/zendesk/__init__.py +0 -0
  220. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/zendesk/client.py +0 -0
  221. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/connectors/zendesk/zendesk.py +0 -0
  222. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/embedder.py +0 -0
  223. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/filter.py +0 -0
  224. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/partitioner.py +0 -0
  225. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/uncompress.py +0 -0
  226. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/utils/__init__.py +0 -0
  227. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/processes/utils/blob_storage.py +0 -0
  228. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/unstructured_api.py +0 -0
  229. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/__init__.py +0 -0
  230. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/chunking.py +0 -0
  231. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/compression.py +0 -0
  232. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/constants.py +0 -0
  233. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/data_prep.py +0 -0
  234. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/dep_check.py +0 -0
  235. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/html.py +0 -0
  236. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/ndjson.py +0 -0
  237. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/pydantic_models.py +0 -0
  238. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/string_and_date_utils.py +0 -0
  239. {unstructured_ingest-1.0.47 → unstructured_ingest-1.0.48}/unstructured_ingest/utils/table.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: unstructured_ingest
3
- Version: 1.0.47
3
+ Version: 1.0.48
4
4
  Summary: Local ETL data pipeline to get data RAG ready
5
5
  Author-email: Unstructured Technologies <devops@unstructuredai.io>
6
6
  License-Expression: Apache-2.0
@@ -0,0 +1 @@
1
+ __version__ = "1.0.48" # pragma: no cover
@@ -41,10 +41,17 @@ DEFAULT_R_SEP = "\n"
41
41
  class JiraIssueMetadata(BaseModel):
42
42
  id: str
43
43
  key: str
44
+ fields: Optional[dict] = None # Add fields to capture attachment data
44
45
 
45
46
  def get_project_id(self) -> str:
46
47
  return self.key.split("-")[0]
47
48
 
49
+ def get_attachments(self) -> List[dict]:
50
+ """Extract attachment information from fields"""
51
+ if self.fields and "attachment" in self.fields:
52
+ return self.fields["attachment"]
53
+ return []
54
+
48
55
 
49
56
  class FieldGetter(dict):
50
57
  def __getitem__(self, key):
@@ -196,15 +203,17 @@ class JiraIndexer(Indexer):
196
203
  yield JiraIssueMetadata.model_validate(issue)
197
204
 
198
205
  def _get_issues_within_projects(self) -> Generator[JiraIssueMetadata, None, None]:
199
- fields = ["key", "id", "status"]
206
+ fields = ["key", "id", "status", "attachment"] # Add attachment field
200
207
  jql = "project in ({})".format(", ".join(self.index_config.projects))
201
208
  jql = self._update_jql(jql)
202
209
  logger.debug(f"running jql: {jql}")
203
210
  return self.run_jql(jql=jql, fields=fields)
204
211
 
205
- def _get_issues_within_single_board(self, board_id: str) -> List[JiraIssueMetadata]:
212
+ def _get_issues_within_single_board(
213
+ self, board_id: str
214
+ ) -> Generator[JiraIssueMetadata, None, None]:
206
215
  with self.connection_config.get_client() as client:
207
- fields = ["key", "id"]
216
+ fields = ["key", "id", "attachment"] # Add attachment field
208
217
  if self.index_config.status_filters:
209
218
  jql = "status in ({}) ORDER BY id".format(
210
219
  ", ".join([f'"{s}"' for s in self.index_config.status_filters])
@@ -233,23 +242,38 @@ class JiraIndexer(Indexer):
233
242
  return jql
234
243
 
235
244
  def _get_issues_by_keys(self) -> Generator[JiraIssueMetadata, None, None]:
236
- fields = ["key", "id"]
245
+ fields = ["key", "id", "attachment"] # Add attachment field
237
246
  jql = "key in ({})".format(", ".join(self.index_config.issues))
238
247
  jql = self._update_jql(jql)
239
248
  logger.debug(f"running jql: {jql}")
240
249
  return self.run_jql(jql=jql, fields=fields)
241
250
 
242
251
  def _create_file_data_from_issue(self, issue: JiraIssueMetadata) -> FileData:
243
- # Build metadata
252
+ # Construct relative path and filename first
253
+ filename = f"{issue.key}.txt"
254
+ relative_path = str(Path(issue.get_project_id()) / filename)
255
+
256
+ # Build metadata with attachments included in record_locator
257
+ record_locator = {"id": issue.id, "key": issue.key, "full_path": relative_path}
258
+
259
+ # Add attachments to record_locator if they exist
260
+ attachments = issue.get_attachments()
261
+ if attachments:
262
+ record_locator["attachments"] = [
263
+ {
264
+ "id": att["id"],
265
+ "filename": att["filename"],
266
+ "created": att.get("created"),
267
+ "mimeType": att.get("mimeType"),
268
+ }
269
+ for att in attachments
270
+ ]
271
+
244
272
  metadata = FileDataSourceMetadata(
245
273
  date_processed=str(time()),
246
- record_locator=issue.model_dump(),
274
+ record_locator=record_locator,
247
275
  )
248
276
 
249
- # Construct relative path and filename
250
- filename = f"{issue.id}.txt"
251
- relative_path = str(Path(issue.get_project_id()) / filename)
252
-
253
277
  source_identifiers = SourceIdentifiers(
254
278
  filename=filename,
255
279
  fullpath=relative_path,
@@ -400,21 +424,37 @@ class JiraDownloader(Downloader):
400
424
  self, attachment_dict: dict, parent_filedata: FileData
401
425
  ) -> FileData:
402
426
  new_filedata = parent_filedata.model_copy(deep=True)
403
- if new_filedata.metadata.record_locator is None:
404
- new_filedata.metadata.record_locator = {}
405
- new_filedata.metadata.record_locator["parent_issue"] = (
406
- parent_filedata.metadata.record_locator["id"]
407
- )
427
+
428
+ # Create attachment record_locator with parent context
429
+ attachment_record_locator = {
430
+ "id": attachment_dict["id"],
431
+ "filename": attachment_dict["filename"],
432
+ "created": attachment_dict.get("created"),
433
+ "mimeType": attachment_dict.get("mimeType"),
434
+ "parent": {
435
+ "id": parent_filedata.metadata.record_locator["id"],
436
+ "key": parent_filedata.metadata.record_locator["key"],
437
+ "full_path": parent_filedata.source_identifiers.fullpath,
438
+ },
439
+ }
440
+
408
441
  # Append an identifier for attachment to not conflict with issue ids
409
442
  new_filedata.identifier = "{}a".format(attachment_dict["id"])
410
- filename = attachment_dict["filename"]
411
- new_filedata.metadata.filesize_bytes = attachment_dict.pop("size", None)
412
- new_filedata.metadata.date_created = attachment_dict.pop("created", None)
413
- new_filedata.metadata.url = attachment_dict.pop("self", None)
414
- new_filedata.metadata.record_locator = attachment_dict
443
+ filename = f"{attachment_dict['filename']}.{attachment_dict['id']}"
444
+ new_filedata.metadata.filesize_bytes = attachment_dict.get("size")
445
+ new_filedata.metadata.date_created = attachment_dict.get("created")
446
+ new_filedata.metadata.url = attachment_dict.get("self")
447
+ new_filedata.metadata.record_locator = attachment_record_locator
448
+ full_path = (
449
+ Path(parent_filedata.source_identifiers.fullpath).with_suffix("") / Path(filename)
450
+ ).as_posix()
451
+ new_filedata.metadata.record_locator["full_path"] = full_path
415
452
  new_filedata.source_identifiers = SourceIdentifiers(
416
453
  filename=filename,
417
- fullpath=(Path(str(attachment_dict["id"])) / Path(filename)).as_posix(),
454
+ # add issue_parent to the fullpath and rel_path
455
+ # to ensure that the attachment is saved in the same folder as the parent issue
456
+ fullpath=full_path,
457
+ rel_path=full_path,
418
458
  )
419
459
  return new_filedata
420
460
 
@@ -1 +0,0 @@
1
- __version__ = "1.0.47" # pragma: no cover