llama-cloud 0.0.11__py3-none-any.whl → 0.0.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of llama-cloud might be problematic. More details were linked from the original page; the link target is not preserved in this text.

Files changed (51)
  1. llama_cloud/__init__.py +72 -10
  2. llama_cloud/client.py +3 -0
  3. llama_cloud/resources/__init__.py +11 -1
  4. llama_cloud/resources/auth/__init__.py +2 -0
  5. llama_cloud/resources/auth/client.py +124 -0
  6. llama_cloud/resources/data_sinks/types/data_sink_update_component_one.py +4 -0
  7. llama_cloud/resources/pipelines/__init__.py +12 -2
  8. llama_cloud/resources/pipelines/client.py +9 -47
  9. llama_cloud/resources/pipelines/types/__init__.py +11 -1
  10. llama_cloud/resources/pipelines/types/pipeline_update_transform_config.py +31 -0
  11. llama_cloud/types/__init__.py +70 -10
  12. llama_cloud/types/advanced_mode_transform_config.py +38 -0
  13. llama_cloud/types/advanced_mode_transform_config_chunking_config.py +67 -0
  14. llama_cloud/types/advanced_mode_transform_config_segmentation_config.py +45 -0
  15. llama_cloud/types/character_chunking_config.py +32 -0
  16. llama_cloud/types/{html_node_parser.py → character_splitter.py} +9 -9
  17. llama_cloud/types/chat_data.py +2 -0
  18. llama_cloud/types/cloud_az_storage_blob_data_source.py +11 -2
  19. llama_cloud/types/{transform_config.py → cloud_milvus_vector_store.py} +11 -7
  20. llama_cloud/types/cloud_mongo_db_atlas_vector_search.py +51 -0
  21. llama_cloud/types/configurable_data_sink_names.py +8 -0
  22. llama_cloud/types/configurable_transformation_names.py +8 -12
  23. llama_cloud/types/configured_transformation_item_component_one.py +4 -6
  24. llama_cloud/types/custom_claims.py +61 -0
  25. llama_cloud/types/data_sink_component_one.py +4 -0
  26. llama_cloud/types/data_sink_create_component_one.py +4 -0
  27. llama_cloud/types/element_segmentation_config.py +29 -0
  28. llama_cloud/types/embedding_config_component.py +2 -14
  29. llama_cloud/types/embedding_config_component_one.py +19 -0
  30. llama_cloud/types/eval_dataset_job_record.py +1 -0
  31. llama_cloud/types/ingestion_error_response.py +34 -0
  32. llama_cloud/types/job_name_mapping.py +45 -0
  33. llama_cloud/types/llama_parse_supported_file_extensions.py +32 -0
  34. llama_cloud/types/{simple_file_node_parser.py → llm_parameters.py} +6 -14
  35. llama_cloud/types/managed_ingestion_status_response.py +6 -0
  36. llama_cloud/types/none_chunking_config.py +29 -0
  37. llama_cloud/types/none_segmentation_config.py +29 -0
  38. llama_cloud/types/page_segmentation_config.py +29 -0
  39. llama_cloud/types/{json_node_parser.py → page_splitter_node_parser.py} +3 -8
  40. llama_cloud/types/parsing_job.py +2 -0
  41. llama_cloud/types/pipeline_create.py +2 -2
  42. llama_cloud/types/pipeline_create_transform_config.py +31 -0
  43. llama_cloud/types/semantic_chunking_config.py +32 -0
  44. llama_cloud/types/sentence_chunking_config.py +34 -0
  45. llama_cloud/types/token_chunking_config.py +33 -0
  46. llama_cloud/types/user.py +35 -0
  47. {llama_cloud-0.0.11.dist-info → llama_cloud-0.0.12.dist-info}/METADATA +1 -1
  48. {llama_cloud-0.0.11.dist-info → llama_cloud-0.0.12.dist-info}/RECORD +50 -30
  49. llama_cloud/types/transform_config_mode.py +0 -21
  50. {llama_cloud-0.0.11.dist-info → llama_cloud-0.0.12.dist-info}/LICENSE +0 -0
  51. {llama_cloud-0.0.11.dist-info → llama_cloud-0.0.12.dist-info}/WHEEL +0 -0
@@ -36,8 +36,8 @@ from ...types.preset_retrieval_params import PresetRetrievalParams
36
36
  from ...types.retrieval_mode import RetrievalMode
37
37
  from ...types.retrieve_results import RetrieveResults
38
38
  from ...types.text_node import TextNode
39
- from ...types.transform_config import TransformConfig
40
39
  from .types.pipeline_file_update_custom_metadata_value import PipelineFileUpdateCustomMetadataValue
40
+ from .types.pipeline_update_transform_config import PipelineUpdateTransformConfig
41
41
 
42
42
  try:
43
43
  import pydantic
@@ -119,7 +119,6 @@ class PipelinesClient:
119
119
  - request: PipelineCreate.
120
120
  ---
121
121
  from llama_cloud import (
122
- AutoTransformConfig,
123
122
  ConfigurableDataSinkNames,
124
123
  DataSinkCreate,
125
124
  EmbeddingConfig,
@@ -133,8 +132,6 @@ class PipelinesClient:
133
132
  PresetRetrievalParams,
134
133
  RetrievalMode,
135
134
  SupportedEvalLlmModelNames,
136
- TransformConfig,
137
- TransformConfigMode,
138
135
  )
139
136
  from llama_cloud.client import LlamaCloud
140
137
 
@@ -146,10 +143,6 @@ class PipelinesClient:
146
143
  embedding_config=EmbeddingConfig(
147
144
  type=EmbeddingConfigType.OPENAI_EMBEDDING,
148
145
  ),
149
- transform_config=TransformConfig(
150
- mode=TransformConfigMode.AUTO,
151
- config=AutoTransformConfig(),
152
- ),
153
146
  data_sink=DataSinkCreate(
154
147
  name="string",
155
148
  sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -199,7 +192,6 @@ class PipelinesClient:
199
192
  - request: PipelineCreate.
200
193
  ---
201
194
  from llama_cloud import (
202
- AutoTransformConfig,
203
195
  ConfigurableDataSinkNames,
204
196
  DataSinkCreate,
205
197
  EmbeddingConfig,
@@ -213,8 +205,6 @@ class PipelinesClient:
213
205
  PresetRetrievalParams,
214
206
  RetrievalMode,
215
207
  SupportedEvalLlmModelNames,
216
- TransformConfig,
217
- TransformConfigMode,
218
208
  )
219
209
  from llama_cloud.client import LlamaCloud
220
210
 
@@ -226,10 +216,6 @@ class PipelinesClient:
226
216
  embedding_config=EmbeddingConfig(
227
217
  type=EmbeddingConfigType.OPENAI_EMBEDDING,
228
218
  ),
229
- transform_config=TransformConfig(
230
- mode=TransformConfigMode.AUTO,
231
- config=AutoTransformConfig(),
232
- ),
233
219
  data_sink=DataSinkCreate(
234
220
  name="string",
235
221
  sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -305,7 +291,7 @@ class PipelinesClient:
305
291
  pipeline_id: str,
306
292
  *,
307
293
  embedding_config: typing.Optional[EmbeddingConfig] = OMIT,
308
- transform_config: typing.Optional[TransformConfig] = OMIT,
294
+ transform_config: typing.Optional[PipelineUpdateTransformConfig] = OMIT,
309
295
  configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]] = OMIT,
310
296
  data_sink_id: typing.Optional[str] = OMIT,
311
297
  data_sink: typing.Optional[DataSinkCreate] = OMIT,
@@ -323,7 +309,7 @@ class PipelinesClient:
323
309
 
324
310
  - embedding_config: typing.Optional[EmbeddingConfig]. Configuration for the embedding model.
325
311
 
326
- - transform_config: typing.Optional[TransformConfig]. Configuration for the transformation.
312
+ - transform_config: typing.Optional[PipelineUpdateTransformConfig]. Configuration for the transformation.
327
313
 
328
314
  - configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]]. List of configured transformations.
329
315
 
@@ -342,7 +328,6 @@ class PipelinesClient:
342
328
  - managed_pipeline_id: typing.Optional[str]. The ID of the ManagedPipeline this playground pipeline is linked to.
343
329
  ---
344
330
  from llama_cloud import (
345
- AutoTransformConfig,
346
331
  ConfigurableDataSinkNames,
347
332
  DataSinkCreate,
348
333
  EmbeddingConfig,
@@ -354,8 +339,6 @@ class PipelinesClient:
354
339
  PresetRetrievalParams,
355
340
  RetrievalMode,
356
341
  SupportedEvalLlmModelNames,
357
- TransformConfig,
358
- TransformConfigMode,
359
342
  )
360
343
  from llama_cloud.client import LlamaCloud
361
344
 
@@ -367,10 +350,6 @@ class PipelinesClient:
367
350
  embedding_config=EmbeddingConfig(
368
351
  type=EmbeddingConfigType.OPENAI_EMBEDDING,
369
352
  ),
370
- transform_config=TransformConfig(
371
- mode=TransformConfigMode.AUTO,
372
- config=AutoTransformConfig(),
373
- ),
374
353
  data_sink=DataSinkCreate(
375
354
  name="string",
376
355
  sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -1329,6 +1308,7 @@ class PipelinesClient:
1329
1308
  from llama_cloud import (
1330
1309
  ChatData,
1331
1310
  FilterCondition,
1311
+ LlmParameters,
1332
1312
  MetadataFilters,
1333
1313
  PresetRetrievalParams,
1334
1314
  RetrievalMode,
@@ -1349,6 +1329,7 @@ class PipelinesClient:
1349
1329
  ),
1350
1330
  retrieval_mode=RetrievalMode.CHUNKS,
1351
1331
  ),
1332
+ llm_parameters=LlmParameters(),
1352
1333
  ),
1353
1334
  )
1354
1335
  """
@@ -1724,7 +1705,6 @@ class AsyncPipelinesClient:
1724
1705
  - request: PipelineCreate.
1725
1706
  ---
1726
1707
  from llama_cloud import (
1727
- AutoTransformConfig,
1728
1708
  ConfigurableDataSinkNames,
1729
1709
  DataSinkCreate,
1730
1710
  EmbeddingConfig,
@@ -1738,8 +1718,6 @@ class AsyncPipelinesClient:
1738
1718
  PresetRetrievalParams,
1739
1719
  RetrievalMode,
1740
1720
  SupportedEvalLlmModelNames,
1741
- TransformConfig,
1742
- TransformConfigMode,
1743
1721
  )
1744
1722
  from llama_cloud.client import AsyncLlamaCloud
1745
1723
 
@@ -1751,10 +1729,6 @@ class AsyncPipelinesClient:
1751
1729
  embedding_config=EmbeddingConfig(
1752
1730
  type=EmbeddingConfigType.OPENAI_EMBEDDING,
1753
1731
  ),
1754
- transform_config=TransformConfig(
1755
- mode=TransformConfigMode.AUTO,
1756
- config=AutoTransformConfig(),
1757
- ),
1758
1732
  data_sink=DataSinkCreate(
1759
1733
  name="string",
1760
1734
  sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -1804,7 +1778,6 @@ class AsyncPipelinesClient:
1804
1778
  - request: PipelineCreate.
1805
1779
  ---
1806
1780
  from llama_cloud import (
1807
- AutoTransformConfig,
1808
1781
  ConfigurableDataSinkNames,
1809
1782
  DataSinkCreate,
1810
1783
  EmbeddingConfig,
@@ -1818,8 +1791,6 @@ class AsyncPipelinesClient:
1818
1791
  PresetRetrievalParams,
1819
1792
  RetrievalMode,
1820
1793
  SupportedEvalLlmModelNames,
1821
- TransformConfig,
1822
- TransformConfigMode,
1823
1794
  )
1824
1795
  from llama_cloud.client import AsyncLlamaCloud
1825
1796
 
@@ -1831,10 +1802,6 @@ class AsyncPipelinesClient:
1831
1802
  embedding_config=EmbeddingConfig(
1832
1803
  type=EmbeddingConfigType.OPENAI_EMBEDDING,
1833
1804
  ),
1834
- transform_config=TransformConfig(
1835
- mode=TransformConfigMode.AUTO,
1836
- config=AutoTransformConfig(),
1837
- ),
1838
1805
  data_sink=DataSinkCreate(
1839
1806
  name="string",
1840
1807
  sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -1910,7 +1877,7 @@ class AsyncPipelinesClient:
1910
1877
  pipeline_id: str,
1911
1878
  *,
1912
1879
  embedding_config: typing.Optional[EmbeddingConfig] = OMIT,
1913
- transform_config: typing.Optional[TransformConfig] = OMIT,
1880
+ transform_config: typing.Optional[PipelineUpdateTransformConfig] = OMIT,
1914
1881
  configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]] = OMIT,
1915
1882
  data_sink_id: typing.Optional[str] = OMIT,
1916
1883
  data_sink: typing.Optional[DataSinkCreate] = OMIT,
@@ -1928,7 +1895,7 @@ class AsyncPipelinesClient:
1928
1895
 
1929
1896
  - embedding_config: typing.Optional[EmbeddingConfig]. Configuration for the embedding model.
1930
1897
 
1931
- - transform_config: typing.Optional[TransformConfig]. Configuration for the transformation.
1898
+ - transform_config: typing.Optional[PipelineUpdateTransformConfig]. Configuration for the transformation.
1932
1899
 
1933
1900
  - configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]]. List of configured transformations.
1934
1901
 
@@ -1947,7 +1914,6 @@ class AsyncPipelinesClient:
1947
1914
  - managed_pipeline_id: typing.Optional[str]. The ID of the ManagedPipeline this playground pipeline is linked to.
1948
1915
  ---
1949
1916
  from llama_cloud import (
1950
- AutoTransformConfig,
1951
1917
  ConfigurableDataSinkNames,
1952
1918
  DataSinkCreate,
1953
1919
  EmbeddingConfig,
@@ -1959,8 +1925,6 @@ class AsyncPipelinesClient:
1959
1925
  PresetRetrievalParams,
1960
1926
  RetrievalMode,
1961
1927
  SupportedEvalLlmModelNames,
1962
- TransformConfig,
1963
- TransformConfigMode,
1964
1928
  )
1965
1929
  from llama_cloud.client import AsyncLlamaCloud
1966
1930
 
@@ -1972,10 +1936,6 @@ class AsyncPipelinesClient:
1972
1936
  embedding_config=EmbeddingConfig(
1973
1937
  type=EmbeddingConfigType.OPENAI_EMBEDDING,
1974
1938
  ),
1975
- transform_config=TransformConfig(
1976
- mode=TransformConfigMode.AUTO,
1977
- config=AutoTransformConfig(),
1978
- ),
1979
1939
  data_sink=DataSinkCreate(
1980
1940
  name="string",
1981
1941
  sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -2936,6 +2896,7 @@ class AsyncPipelinesClient:
2936
2896
  from llama_cloud import (
2937
2897
  ChatData,
2938
2898
  FilterCondition,
2899
+ LlmParameters,
2939
2900
  MetadataFilters,
2940
2901
  PresetRetrievalParams,
2941
2902
  RetrievalMode,
@@ -2956,6 +2917,7 @@ class AsyncPipelinesClient:
2956
2917
  ),
2957
2918
  retrieval_mode=RetrievalMode.CHUNKS,
2958
2919
  ),
2920
+ llm_parameters=LlmParameters(),
2959
2921
  ),
2960
2922
  )
2961
2923
  """
@@ -1,5 +1,15 @@
1
1
  # This file was auto-generated by Fern from our API Definition.
2
2
 
3
3
  from .pipeline_file_update_custom_metadata_value import PipelineFileUpdateCustomMetadataValue
4
+ from .pipeline_update_transform_config import (
5
+ PipelineUpdateTransformConfig,
6
+ PipelineUpdateTransformConfig_Advanced,
7
+ PipelineUpdateTransformConfig_Auto,
8
+ )
4
9
 
5
- __all__ = ["PipelineFileUpdateCustomMetadataValue"]
10
+ __all__ = [
11
+ "PipelineFileUpdateCustomMetadataValue",
12
+ "PipelineUpdateTransformConfig",
13
+ "PipelineUpdateTransformConfig_Advanced",
14
+ "PipelineUpdateTransformConfig_Auto",
15
+ ]
@@ -0,0 +1,31 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ from __future__ import annotations
4
+
5
+ import typing
6
+
7
+ import typing_extensions
8
+
9
+ from ....types.advanced_mode_transform_config import AdvancedModeTransformConfig
10
+ from ....types.auto_transform_config import AutoTransformConfig
11
+
12
+
13
+ class PipelineUpdateTransformConfig_Auto(AutoTransformConfig):
14
+ mode: typing_extensions.Literal["auto"]
15
+
16
+ class Config:
17
+ frozen = True
18
+ smart_union = True
19
+ allow_population_by_field_name = True
20
+
21
+
22
+ class PipelineUpdateTransformConfig_Advanced(AdvancedModeTransformConfig):
23
+ mode: typing_extensions.Literal["advanced"]
24
+
25
+ class Config:
26
+ frozen = True
27
+ smart_union = True
28
+ allow_population_by_field_name = True
29
+
30
+
31
+ PipelineUpdateTransformConfig = typing.Union[PipelineUpdateTransformConfig_Auto, PipelineUpdateTransformConfig_Advanced]
@@ -1,10 +1,27 @@
1
1
  # This file was auto-generated by Fern from our API Definition.
2
2
 
3
+ from .advanced_mode_transform_config import AdvancedModeTransformConfig
4
+ from .advanced_mode_transform_config_chunking_config import (
5
+ AdvancedModeTransformConfigChunkingConfig,
6
+ AdvancedModeTransformConfigChunkingConfig_Character,
7
+ AdvancedModeTransformConfigChunkingConfig_None,
8
+ AdvancedModeTransformConfigChunkingConfig_Semantic,
9
+ AdvancedModeTransformConfigChunkingConfig_Sentence,
10
+ AdvancedModeTransformConfigChunkingConfig_Token,
11
+ )
12
+ from .advanced_mode_transform_config_segmentation_config import (
13
+ AdvancedModeTransformConfigSegmentationConfig,
14
+ AdvancedModeTransformConfigSegmentationConfig_Element,
15
+ AdvancedModeTransformConfigSegmentationConfig_None,
16
+ AdvancedModeTransformConfigSegmentationConfig_Page,
17
+ )
3
18
  from .auto_transform_config import AutoTransformConfig
4
19
  from .azure_open_ai_embedding import AzureOpenAiEmbedding
5
20
  from .base import Base
6
21
  from .base_prompt_template import BasePromptTemplate
7
22
  from .bedrock_embedding import BedrockEmbedding
23
+ from .character_chunking_config import CharacterChunkingConfig
24
+ from .character_splitter import CharacterSplitter
8
25
  from .chat_data import ChatData
9
26
  from .chat_message import ChatMessage
10
27
  from .cloud_az_storage_blob_data_source import CloudAzStorageBlobDataSource
@@ -14,6 +31,8 @@ from .cloud_confluence_data_source import CloudConfluenceDataSource
14
31
  from .cloud_document import CloudDocument
15
32
  from .cloud_document_create import CloudDocumentCreate
16
33
  from .cloud_jira_data_source import CloudJiraDataSource
34
+ from .cloud_milvus_vector_store import CloudMilvusVectorStore
35
+ from .cloud_mongo_db_atlas_vector_search import CloudMongoDbAtlasVectorSearch
17
36
  from .cloud_notion_page_data_source import CloudNotionPageDataSource
18
37
  from .cloud_one_drive_data_source import CloudOneDriveDataSource
19
38
  from .cloud_pinecone_vector_store import CloudPineconeVectorStore
@@ -32,6 +51,7 @@ from .configurable_transformation_names import ConfigurableTransformationNames
32
51
  from .configured_transformation_item import ConfiguredTransformationItem
33
52
  from .configured_transformation_item_component import ConfiguredTransformationItemComponent
34
53
  from .configured_transformation_item_component_one import ConfiguredTransformationItemComponentOne
54
+ from .custom_claims import CustomClaims
35
55
  from .data_sink import DataSink
36
56
  from .data_sink_component import DataSinkComponent
37
57
  from .data_sink_component_one import DataSinkComponentOne
@@ -48,8 +68,10 @@ from .data_source_create_component_one import DataSourceCreateComponentOne
48
68
  from .data_source_create_custom_metadata_value import DataSourceCreateCustomMetadataValue
49
69
  from .data_source_custom_metadata_value import DataSourceCustomMetadataValue
50
70
  from .data_source_definition import DataSourceDefinition
71
+ from .element_segmentation_config import ElementSegmentationConfig
51
72
  from .embedding_config import EmbeddingConfig
52
73
  from .embedding_config_component import EmbeddingConfigComponent
74
+ from .embedding_config_component_one import EmbeddingConfigComponentOne
53
75
  from .embedding_config_type import EmbeddingConfigType
54
76
  from .eval_dataset import EvalDataset
55
77
  from .eval_dataset_job_params import EvalDatasetJobParams
@@ -70,14 +92,15 @@ from .file_resource_info_value import FileResourceInfoValue
70
92
  from .filter_condition import FilterCondition
71
93
  from .filter_operator import FilterOperator
72
94
  from .gemini_embedding import GeminiEmbedding
73
- from .html_node_parser import HtmlNodeParser
74
95
  from .http_validation_error import HttpValidationError
75
96
  from .hugging_face_inference_api_embedding import HuggingFaceInferenceApiEmbedding
76
97
  from .hugging_face_inference_api_embedding_token import HuggingFaceInferenceApiEmbeddingToken
77
- from .json_node_parser import JsonNodeParser
98
+ from .ingestion_error_response import IngestionErrorResponse
99
+ from .job_name_mapping import JobNameMapping
78
100
  from .llama_parse_parameters import LlamaParseParameters
79
101
  from .llama_parse_supported_file_extensions import LlamaParseSupportedFileExtensions
80
102
  from .llm import Llm
103
+ from .llm_parameters import LlmParameters
81
104
  from .local_eval import LocalEval
82
105
  from .local_eval_results import LocalEvalResults
83
106
  from .local_eval_sets import LocalEvalSets
@@ -92,10 +115,14 @@ from .metadata_filters import MetadataFilters
92
115
  from .metadata_filters_filters_item import MetadataFiltersFiltersItem
93
116
  from .metric_result import MetricResult
94
117
  from .node_parser import NodeParser
118
+ from .none_chunking_config import NoneChunkingConfig
119
+ from .none_segmentation_config import NoneSegmentationConfig
95
120
  from .object_type import ObjectType
96
121
  from .open_ai_embedding import OpenAiEmbedding
97
122
  from .organization import Organization
98
123
  from .organization_create import OrganizationCreate
124
+ from .page_segmentation_config import PageSegmentationConfig
125
+ from .page_splitter_node_parser import PageSplitterNodeParser
99
126
  from .parser_languages import ParserLanguages
100
127
  from .parsing_history_item import ParsingHistoryItem
101
128
  from .parsing_job import ParsingJob
@@ -105,6 +132,11 @@ from .parsing_job_text_result import ParsingJobTextResult
105
132
  from .parsing_usage import ParsingUsage
106
133
  from .pipeline import Pipeline
107
134
  from .pipeline_create import PipelineCreate
135
+ from .pipeline_create_transform_config import (
136
+ PipelineCreateTransformConfig,
137
+ PipelineCreateTransformConfig_Advanced,
138
+ PipelineCreateTransformConfig_Auto,
139
+ )
108
140
  from .pipeline_data_source import PipelineDataSource
109
141
  from .pipeline_data_source_component import PipelineDataSourceComponent
110
142
  from .pipeline_data_source_component_one import PipelineDataSourceComponentOne
@@ -128,18 +160,19 @@ from .pydantic_program_mode import PydanticProgramMode
128
160
  from .related_node_info import RelatedNodeInfo
129
161
  from .retrieval_mode import RetrievalMode
130
162
  from .retrieve_results import RetrieveResults
163
+ from .semantic_chunking_config import SemanticChunkingConfig
164
+ from .sentence_chunking_config import SentenceChunkingConfig
131
165
  from .sentence_splitter import SentenceSplitter
132
- from .simple_file_node_parser import SimpleFileNodeParser
133
166
  from .status_enum import StatusEnum
134
167
  from .supported_eval_llm_model import SupportedEvalLlmModel
135
168
  from .supported_eval_llm_model_names import SupportedEvalLlmModelNames
136
169
  from .text_node import TextNode
137
170
  from .text_node_relationships_value import TextNodeRelationshipsValue
138
171
  from .text_node_with_score import TextNodeWithScore
172
+ from .token_chunking_config import TokenChunkingConfig
139
173
  from .token_text_splitter import TokenTextSplitter
140
- from .transform_config import TransformConfig
141
- from .transform_config_mode import TransformConfigMode
142
174
  from .transformation_category_names import TransformationCategoryNames
175
+ from .user import User
143
176
  from .user_organization import UserOrganization
144
177
  from .user_organization_create import UserOrganizationCreate
145
178
  from .user_organization_delete import UserOrganizationDelete
@@ -147,11 +180,24 @@ from .validation_error import ValidationError
147
180
  from .validation_error_loc_item import ValidationErrorLocItem
148
181
 
149
182
  __all__ = [
183
+ "AdvancedModeTransformConfig",
184
+ "AdvancedModeTransformConfigChunkingConfig",
185
+ "AdvancedModeTransformConfigChunkingConfig_Character",
186
+ "AdvancedModeTransformConfigChunkingConfig_None",
187
+ "AdvancedModeTransformConfigChunkingConfig_Semantic",
188
+ "AdvancedModeTransformConfigChunkingConfig_Sentence",
189
+ "AdvancedModeTransformConfigChunkingConfig_Token",
190
+ "AdvancedModeTransformConfigSegmentationConfig",
191
+ "AdvancedModeTransformConfigSegmentationConfig_Element",
192
+ "AdvancedModeTransformConfigSegmentationConfig_None",
193
+ "AdvancedModeTransformConfigSegmentationConfig_Page",
150
194
  "AutoTransformConfig",
151
195
  "AzureOpenAiEmbedding",
152
196
  "Base",
153
197
  "BasePromptTemplate",
154
198
  "BedrockEmbedding",
199
+ "CharacterChunkingConfig",
200
+ "CharacterSplitter",
155
201
  "ChatData",
156
202
  "ChatMessage",
157
203
  "CloudAzStorageBlobDataSource",
@@ -161,6 +207,8 @@ __all__ = [
161
207
  "CloudDocument",
162
208
  "CloudDocumentCreate",
163
209
  "CloudJiraDataSource",
210
+ "CloudMilvusVectorStore",
211
+ "CloudMongoDbAtlasVectorSearch",
164
212
  "CloudNotionPageDataSource",
165
213
  "CloudOneDriveDataSource",
166
214
  "CloudPineconeVectorStore",
@@ -179,6 +227,7 @@ __all__ = [
179
227
  "ConfiguredTransformationItem",
180
228
  "ConfiguredTransformationItemComponent",
181
229
  "ConfiguredTransformationItemComponentOne",
230
+ "CustomClaims",
182
231
  "DataSink",
183
232
  "DataSinkComponent",
184
233
  "DataSinkComponentOne",
@@ -195,8 +244,10 @@ __all__ = [
195
244
  "DataSourceCreateCustomMetadataValue",
196
245
  "DataSourceCustomMetadataValue",
197
246
  "DataSourceDefinition",
247
+ "ElementSegmentationConfig",
198
248
  "EmbeddingConfig",
199
249
  "EmbeddingConfigComponent",
250
+ "EmbeddingConfigComponentOne",
200
251
  "EmbeddingConfigType",
201
252
  "EvalDataset",
202
253
  "EvalDatasetJobParams",
@@ -217,14 +268,15 @@ __all__ = [
217
268
  "FilterCondition",
218
269
  "FilterOperator",
219
270
  "GeminiEmbedding",
220
- "HtmlNodeParser",
221
271
  "HttpValidationError",
222
272
  "HuggingFaceInferenceApiEmbedding",
223
273
  "HuggingFaceInferenceApiEmbeddingToken",
224
- "JsonNodeParser",
274
+ "IngestionErrorResponse",
275
+ "JobNameMapping",
225
276
  "LlamaParseParameters",
226
277
  "LlamaParseSupportedFileExtensions",
227
278
  "Llm",
279
+ "LlmParameters",
228
280
  "LocalEval",
229
281
  "LocalEvalResults",
230
282
  "LocalEvalSets",
@@ -239,10 +291,14 @@ __all__ = [
239
291
  "MetadataFiltersFiltersItem",
240
292
  "MetricResult",
241
293
  "NodeParser",
294
+ "NoneChunkingConfig",
295
+ "NoneSegmentationConfig",
242
296
  "ObjectType",
243
297
  "OpenAiEmbedding",
244
298
  "Organization",
245
299
  "OrganizationCreate",
300
+ "PageSegmentationConfig",
301
+ "PageSplitterNodeParser",
246
302
  "ParserLanguages",
247
303
  "ParsingHistoryItem",
248
304
  "ParsingJob",
@@ -252,6 +308,9 @@ __all__ = [
252
308
  "ParsingUsage",
253
309
  "Pipeline",
254
310
  "PipelineCreate",
311
+ "PipelineCreateTransformConfig",
312
+ "PipelineCreateTransformConfig_Advanced",
313
+ "PipelineCreateTransformConfig_Auto",
255
314
  "PipelineDataSource",
256
315
  "PipelineDataSourceComponent",
257
316
  "PipelineDataSourceComponentOne",
@@ -275,18 +334,19 @@ __all__ = [
275
334
  "RelatedNodeInfo",
276
335
  "RetrievalMode",
277
336
  "RetrieveResults",
337
+ "SemanticChunkingConfig",
338
+ "SentenceChunkingConfig",
278
339
  "SentenceSplitter",
279
- "SimpleFileNodeParser",
280
340
  "StatusEnum",
281
341
  "SupportedEvalLlmModel",
282
342
  "SupportedEvalLlmModelNames",
283
343
  "TextNode",
284
344
  "TextNodeRelationshipsValue",
285
345
  "TextNodeWithScore",
346
+ "TokenChunkingConfig",
286
347
  "TokenTextSplitter",
287
- "TransformConfig",
288
- "TransformConfigMode",
289
348
  "TransformationCategoryNames",
349
+ "User",
290
350
  "UserOrganization",
291
351
  "UserOrganizationCreate",
292
352
  "UserOrganizationDelete",
@@ -0,0 +1,38 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ import datetime as dt
4
+ import typing
5
+
6
+ from ..core.datetime_utils import serialize_datetime
7
+ from .advanced_mode_transform_config_chunking_config import AdvancedModeTransformConfigChunkingConfig
8
+ from .advanced_mode_transform_config_segmentation_config import AdvancedModeTransformConfigSegmentationConfig
9
+
10
+ try:
11
+ import pydantic
12
+ if pydantic.__version__.startswith("1."):
13
+ raise ImportError
14
+ import pydantic.v1 as pydantic # type: ignore
15
+ except ImportError:
16
+ import pydantic # type: ignore
17
+
18
+
19
+ class AdvancedModeTransformConfig(pydantic.BaseModel):
20
+ segmentation_config: typing.Optional[AdvancedModeTransformConfigSegmentationConfig] = pydantic.Field(
21
+ description="Configuration for the segmentation."
22
+ )
23
+ chunking_config: typing.Optional[AdvancedModeTransformConfigChunkingConfig] = pydantic.Field(
24
+ description="Configuration for the chunking."
25
+ )
26
+
27
+ def json(self, **kwargs: typing.Any) -> str:
28
+ kwargs_with_defaults: typing.Any = {"by_alias": True, "exclude_unset": True, **kwargs}
29
+ return super().json(**kwargs_with_defaults)
30
+
31
+ def dict(self, **kwargs: typing.Any) -> typing.Dict[str, typing.Any]:
32
+ kwargs_with_defaults: typing.Any = {"by_alias": True, "exclude_unset": True, **kwargs}
33
+ return super().dict(**kwargs_with_defaults)
34
+
35
+ class Config:
36
+ frozen = True
37
+ smart_union = True
38
+ json_encoders = {dt.datetime: serialize_datetime}
@@ -0,0 +1,67 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ from __future__ import annotations
4
+
5
+ import typing
6
+
7
+ import typing_extensions
8
+
9
+ from .character_chunking_config import CharacterChunkingConfig
10
+ from .none_chunking_config import NoneChunkingConfig
11
+ from .semantic_chunking_config import SemanticChunkingConfig
12
+ from .sentence_chunking_config import SentenceChunkingConfig
13
+ from .token_chunking_config import TokenChunkingConfig
14
+
15
+
16
+ class AdvancedModeTransformConfigChunkingConfig_None(NoneChunkingConfig):
17
+ mode: typing_extensions.Literal["none"]
18
+
19
+ class Config:
20
+ frozen = True
21
+ smart_union = True
22
+ allow_population_by_field_name = True
23
+
24
+
25
+ class AdvancedModeTransformConfigChunkingConfig_Character(CharacterChunkingConfig):
26
+ mode: typing_extensions.Literal["character"]
27
+
28
+ class Config:
29
+ frozen = True
30
+ smart_union = True
31
+ allow_population_by_field_name = True
32
+
33
+
34
+ class AdvancedModeTransformConfigChunkingConfig_Token(TokenChunkingConfig):
35
+ mode: typing_extensions.Literal["token"]
36
+
37
+ class Config:
38
+ frozen = True
39
+ smart_union = True
40
+ allow_population_by_field_name = True
41
+
42
+
43
+ class AdvancedModeTransformConfigChunkingConfig_Sentence(SentenceChunkingConfig):
44
+ mode: typing_extensions.Literal["sentence"]
45
+
46
+ class Config:
47
+ frozen = True
48
+ smart_union = True
49
+ allow_population_by_field_name = True
50
+
51
+
52
+ class AdvancedModeTransformConfigChunkingConfig_Semantic(SemanticChunkingConfig):
53
+ mode: typing_extensions.Literal["semantic"]
54
+
55
+ class Config:
56
+ frozen = True
57
+ smart_union = True
58
+ allow_population_by_field_name = True
59
+
60
+
61
+ AdvancedModeTransformConfigChunkingConfig = typing.Union[
62
+ AdvancedModeTransformConfigChunkingConfig_None,
63
+ AdvancedModeTransformConfigChunkingConfig_Character,
64
+ AdvancedModeTransformConfigChunkingConfig_Token,
65
+ AdvancedModeTransformConfigChunkingConfig_Sentence,
66
+ AdvancedModeTransformConfigChunkingConfig_Semantic,
67
+ ]
@@ -0,0 +1,45 @@
1
+ # This file was auto-generated by Fern from our API Definition.
2
+
3
+ from __future__ import annotations
4
+
5
+ import typing
6
+
7
+ import typing_extensions
8
+
9
+ from .element_segmentation_config import ElementSegmentationConfig
10
+ from .none_segmentation_config import NoneSegmentationConfig
11
+ from .page_segmentation_config import PageSegmentationConfig
12
+
13
+
14
+ class AdvancedModeTransformConfigSegmentationConfig_None(NoneSegmentationConfig):
15
+ mode: typing_extensions.Literal["none"]
16
+
17
+ class Config:
18
+ frozen = True
19
+ smart_union = True
20
+ allow_population_by_field_name = True
21
+
22
+
23
+ class AdvancedModeTransformConfigSegmentationConfig_Page(PageSegmentationConfig):
24
+ mode: typing_extensions.Literal["page"]
25
+
26
+ class Config:
27
+ frozen = True
28
+ smart_union = True
29
+ allow_population_by_field_name = True
30
+
31
+
32
+ class AdvancedModeTransformConfigSegmentationConfig_Element(ElementSegmentationConfig):
33
+ mode: typing_extensions.Literal["element"]
34
+
35
+ class Config:
36
+ frozen = True
37
+ smart_union = True
38
+ allow_population_by_field_name = True
39
+
40
+
41
+ AdvancedModeTransformConfigSegmentationConfig = typing.Union[
42
+ AdvancedModeTransformConfigSegmentationConfig_None,
43
+ AdvancedModeTransformConfigSegmentationConfig_Page,
44
+ AdvancedModeTransformConfigSegmentationConfig_Element,
45
+ ]