PyPI - llama-cloud - Versions diffs - 0.0.10__py3-none-any.whl → 0.0.12__py3-none-any.whl - Mend

llama-cloud 0.0.10__py3-none-any.whl → 0.0.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of llama-cloud might be problematic. Click here for more details.

Files changed (57)

llama_cloud/__init__.py +82 -6
llama_cloud/client.py +3 -0
llama_cloud/resources/__init__.py +13 -2
llama_cloud/resources/auth/__init__.py +2 -0
llama_cloud/resources/auth/client.py +124 -0
llama_cloud/resources/data_sinks/types/data_sink_update_component_one.py +4 -0
llama_cloud/resources/extraction/__init__.py +2 -2
llama_cloud/resources/extraction/client.py +139 -48
llama_cloud/resources/extraction/types/__init__.py +2 -1
llama_cloud/resources/extraction/types/extraction_schema_create_data_schema_value.py +7 -0
llama_cloud/resources/pipelines/__init__.py +12 -2
llama_cloud/resources/pipelines/client.py +58 -2
llama_cloud/resources/pipelines/types/__init__.py +11 -1
llama_cloud/resources/pipelines/types/pipeline_update_transform_config.py +31 -0
llama_cloud/types/__init__.py +78 -6
llama_cloud/types/advanced_mode_transform_config.py +38 -0
llama_cloud/types/advanced_mode_transform_config_chunking_config.py +67 -0
llama_cloud/types/advanced_mode_transform_config_segmentation_config.py +45 -0
llama_cloud/types/auto_transform_config.py +32 -0
llama_cloud/types/character_chunking_config.py +32 -0
llama_cloud/types/{html_node_parser.py → character_splitter.py} +9 -9
llama_cloud/types/chat_data.py +2 -0
llama_cloud/types/cloud_az_storage_blob_data_source.py +11 -2
llama_cloud/types/{simple_file_node_parser.py → cloud_milvus_vector_store.py} +7 -14
llama_cloud/types/cloud_mongo_db_atlas_vector_search.py +51 -0
llama_cloud/types/configurable_data_sink_names.py +8 -0
llama_cloud/types/configurable_transformation_names.py +8 -12
llama_cloud/types/configured_transformation_item_component_one.py +4 -6
llama_cloud/types/custom_claims.py +61 -0
llama_cloud/types/data_sink_component_one.py +4 -0
llama_cloud/types/data_sink_create_component_one.py +4 -0
llama_cloud/types/element_segmentation_config.py +29 -0
llama_cloud/types/embedding_config.py +36 -0
llama_cloud/types/embedding_config_component.py +7 -0
llama_cloud/types/embedding_config_component_one.py +19 -0
llama_cloud/types/embedding_config_type.py +41 -0
llama_cloud/types/eval_dataset_job_record.py +1 -0
llama_cloud/types/ingestion_error_response.py +34 -0
llama_cloud/types/job_name_mapping.py +45 -0
llama_cloud/types/llama_parse_supported_file_extensions.py +32 -0
llama_cloud/types/llm_parameters.py +39 -0
llama_cloud/types/managed_ingestion_status_response.py +6 -0
llama_cloud/types/none_chunking_config.py +29 -0
llama_cloud/types/none_segmentation_config.py +29 -0
llama_cloud/types/page_segmentation_config.py +29 -0
llama_cloud/types/{json_node_parser.py → page_splitter_node_parser.py} +3 -8
llama_cloud/types/parsing_job.py +2 -0
llama_cloud/types/pipeline_create.py +8 -0
llama_cloud/types/pipeline_create_transform_config.py +31 -0
llama_cloud/types/semantic_chunking_config.py +32 -0
llama_cloud/types/sentence_chunking_config.py +34 -0
llama_cloud/types/token_chunking_config.py +33 -0
llama_cloud/types/user.py +35 -0
{llama_cloud-0.0.10.dist-info → llama_cloud-0.0.12.dist-info}/METADATA +1 -1
{llama_cloud-0.0.10.dist-info → llama_cloud-0.0.12.dist-info}/RECORD +57 -30
{llama_cloud-0.0.10.dist-info → llama_cloud-0.0.12.dist-info}/LICENSE +0 -0
{llama_cloud-0.0.10.dist-info → llama_cloud-0.0.12.dist-info}/WHEEL +0 -0

llama_cloud/resources/extraction/client.py CHANGED Viewed

@@ -13,6 +13,7 @@ from ...types.extraction_job import ExtractionJob
 from ...types.extraction_result import ExtractionResult
 from ...types.extraction_schema import ExtractionSchema
 from ...types.http_validation_error import HttpValidationError
+from .types.extraction_schema_create_data_schema_value import ExtractionSchemaCreateDataSchemaValue
 from .types.extraction_schema_update_data_schema_value import ExtractionSchemaUpdateDataSchemaValue
 try:
@@ -31,47 +32,66 @@ class ExtractionClient:
     def __init__(self, *, client_wrapper: SyncClientWrapper):
         self._client_wrapper = client_wrapper
-    def infer_schema(
+    def list_schemas(self, *, project_id: typing.Optional[str] = None) -> typing.List[ExtractionSchema]:
+        """
+        Parameters:
+            - project_id: typing.Optional[str].
+        ---
+        from llama_cloud.client import LlamaCloud
+        client = LlamaCloud(
+            token="YOUR_TOKEN",
+        )
+        client.extraction.list_schemas()
+        """
+        _response = self._client_wrapper.httpx_client.request(
+            "GET",
+            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas"),
+            params=remove_none_from_dict({"project_id": project_id}),
+            headers=self._client_wrapper.get_headers(),
+            timeout=60,
+        )
+        if 200 <= _response.status_code < 300:
+            return pydantic.parse_obj_as(typing.List[ExtractionSchema], _response.json())  # type: ignore
+        if _response.status_code == 422:
+            raise UnprocessableEntityError(pydantic.parse_obj_as(HttpValidationError, _response.json()))  # type: ignore
+        try:
+            _response_json = _response.json()
+        except JSONDecodeError:
+            raise ApiError(status_code=_response.status_code, body=_response.text)
+        raise ApiError(status_code=_response.status_code, body=_response_json)
+    def create_schema(
         self,
         *,
-        schema_id: typing.Optional[str] = OMIT,
         name: str,
         project_id: typing.Optional[str] = OMIT,
-        file_ids: typing.List[str],
-        stream: typing.Optional[bool] = OMIT,
+        data_schema: typing.Dict[str, ExtractionSchemaCreateDataSchemaValue],
     ) -> ExtractionSchema:
         """
         Parameters:
-            - schema_id: typing.Optional[str]. The ID of a schema to update with the new schema
             - name: str. The name of the extraction schema
             - project_id: typing.Optional[str]. The ID of the project that the extraction schema belongs to
-            - file_ids: typing.List[str]. The IDs of the files that the extraction schema contains
-            - stream: typing.Optional[bool]. Whether to stream the results of the extraction schema
+            - data_schema: typing.Dict[str, ExtractionSchemaCreateDataSchemaValue]. The schema of the data
         ---
         from llama_cloud.client import LlamaCloud
         client = LlamaCloud(
             token="YOUR_TOKEN",
         )
-        client.extraction.infer_schema(
+        client.extraction.create_schema(
             name="string",
-            file_ids=[],
+            data_schema={},
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"name": name, "file_ids": file_ids}
-        if schema_id is not OMIT:
-            _request["schema_id"] = schema_id
+        _request: typing.Dict[str, typing.Any] = {"name": name, "data_schema": data_schema}
         if project_id is not OMIT:
             _request["project_id"] = project_id
-        if stream is not OMIT:
-            _request["stream"] = stream
         _response = self._client_wrapper.httpx_client.request(
             "POST",
-            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas/infer"),
+            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas"),
             json=jsonable_encoder(_request),
             headers=self._client_wrapper.get_headers(),
             timeout=60,
@@ -86,27 +106,53 @@ class ExtractionClient:
             raise ApiError(status_code=_response.status_code, body=_response.text)
         raise ApiError(status_code=_response.status_code, body=_response_json)
-    def list_schemas(self, *, project_id: typing.Optional[str] = None) -> typing.List[ExtractionSchema]:
+    def infer_schema(
+        self,
+        *,
+        schema_id: typing.Optional[str] = OMIT,
+        name: str,
+        project_id: typing.Optional[str] = OMIT,
+        file_ids: typing.List[str],
+        stream: typing.Optional[bool] = OMIT,
+    ) -> ExtractionSchema:
         """
         Parameters:
-            - project_id: typing.Optional[str].
+            - schema_id: typing.Optional[str]. The ID of a schema to update with the new schema
+            - name: str. The name of the extraction schema
+            - project_id: typing.Optional[str]. The ID of the project that the extraction schema belongs to
+            - file_ids: typing.List[str]. The IDs of the files that the extraction schema contains
+            - stream: typing.Optional[bool]. Whether to stream the results of the extraction schema
         ---
         from llama_cloud.client import LlamaCloud
         client = LlamaCloud(
             token="YOUR_TOKEN",
         )
-        client.extraction.list_schemas()
+        client.extraction.infer_schema(
+            name="string",
+            file_ids=[],
+        )
         """
+        _request: typing.Dict[str, typing.Any] = {"name": name, "file_ids": file_ids}
+        if schema_id is not OMIT:
+            _request["schema_id"] = schema_id
+        if project_id is not OMIT:
+            _request["project_id"] = project_id
+        if stream is not OMIT:
+            _request["stream"] = stream
         _response = self._client_wrapper.httpx_client.request(
-            "GET",
-            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas"),
-            params=remove_none_from_dict({"project_id": project_id}),
+            "POST",
+            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas/infer"),
+            json=jsonable_encoder(_request),
             headers=self._client_wrapper.get_headers(),
             timeout=60,
         )
         if 200 <= _response.status_code < 300:
-            return pydantic.parse_obj_as(typing.List[ExtractionSchema], _response.json())  # type: ignore
+            return pydantic.parse_obj_as(ExtractionSchema, _response.json())  # type: ignore
         if _response.status_code == 422:
             raise UnprocessableEntityError(pydantic.parse_obj_as(HttpValidationError, _response.json()))  # type: ignore
         try:
@@ -350,47 +396,66 @@ class AsyncExtractionClient:
     def __init__(self, *, client_wrapper: AsyncClientWrapper):
         self._client_wrapper = client_wrapper
-    async def infer_schema(
+    async def list_schemas(self, *, project_id: typing.Optional[str] = None) -> typing.List[ExtractionSchema]:
+        """
+        Parameters:
+            - project_id: typing.Optional[str].
+        ---
+        from llama_cloud.client import AsyncLlamaCloud
+        client = AsyncLlamaCloud(
+            token="YOUR_TOKEN",
+        )
+        await client.extraction.list_schemas()
+        """
+        _response = await self._client_wrapper.httpx_client.request(
+            "GET",
+            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas"),
+            params=remove_none_from_dict({"project_id": project_id}),
+            headers=self._client_wrapper.get_headers(),
+            timeout=60,
+        )
+        if 200 <= _response.status_code < 300:
+            return pydantic.parse_obj_as(typing.List[ExtractionSchema], _response.json())  # type: ignore
+        if _response.status_code == 422:
+            raise UnprocessableEntityError(pydantic.parse_obj_as(HttpValidationError, _response.json()))  # type: ignore
+        try:
+            _response_json = _response.json()
+        except JSONDecodeError:
+            raise ApiError(status_code=_response.status_code, body=_response.text)
+        raise ApiError(status_code=_response.status_code, body=_response_json)
+    async def create_schema(
         self,
         *,
-        schema_id: typing.Optional[str] = OMIT,
         name: str,
         project_id: typing.Optional[str] = OMIT,
-        file_ids: typing.List[str],
-        stream: typing.Optional[bool] = OMIT,
+        data_schema: typing.Dict[str, ExtractionSchemaCreateDataSchemaValue],
     ) -> ExtractionSchema:
         """
         Parameters:
-            - schema_id: typing.Optional[str]. The ID of a schema to update with the new schema
             - name: str. The name of the extraction schema
             - project_id: typing.Optional[str]. The ID of the project that the extraction schema belongs to
-            - file_ids: typing.List[str]. The IDs of the files that the extraction schema contains
-            - stream: typing.Optional[bool]. Whether to stream the results of the extraction schema
+            - data_schema: typing.Dict[str, ExtractionSchemaCreateDataSchemaValue]. The schema of the data
         ---
         from llama_cloud.client import AsyncLlamaCloud
         client = AsyncLlamaCloud(
             token="YOUR_TOKEN",
         )
-        await client.extraction.infer_schema(
+        await client.extraction.create_schema(
             name="string",
-            file_ids=[],
+            data_schema={},
         )
         """
-        _request: typing.Dict[str, typing.Any] = {"name": name, "file_ids": file_ids}
-        if schema_id is not OMIT:
-            _request["schema_id"] = schema_id
+        _request: typing.Dict[str, typing.Any] = {"name": name, "data_schema": data_schema}
         if project_id is not OMIT:
             _request["project_id"] = project_id
-        if stream is not OMIT:
-            _request["stream"] = stream
         _response = await self._client_wrapper.httpx_client.request(
             "POST",
-            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas/infer"),
+            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas"),
             json=jsonable_encoder(_request),
             headers=self._client_wrapper.get_headers(),
             timeout=60,
@@ -405,27 +470,53 @@ class AsyncExtractionClient:
             raise ApiError(status_code=_response.status_code, body=_response.text)
         raise ApiError(status_code=_response.status_code, body=_response_json)
-    async def list_schemas(self, *, project_id: typing.Optional[str] = None) -> typing.List[ExtractionSchema]:
+    async def infer_schema(
+        self,
+        *,
+        schema_id: typing.Optional[str] = OMIT,
+        name: str,
+        project_id: typing.Optional[str] = OMIT,
+        file_ids: typing.List[str],
+        stream: typing.Optional[bool] = OMIT,
+    ) -> ExtractionSchema:
         """
         Parameters:
-            - project_id: typing.Optional[str].
+            - schema_id: typing.Optional[str]. The ID of a schema to update with the new schema
+            - name: str. The name of the extraction schema
+            - project_id: typing.Optional[str]. The ID of the project that the extraction schema belongs to
+            - file_ids: typing.List[str]. The IDs of the files that the extraction schema contains
+            - stream: typing.Optional[bool]. Whether to stream the results of the extraction schema
         ---
         from llama_cloud.client import AsyncLlamaCloud
         client = AsyncLlamaCloud(
             token="YOUR_TOKEN",
         )
-        await client.extraction.list_schemas()
+        await client.extraction.infer_schema(
+            name="string",
+            file_ids=[],
+        )
         """
+        _request: typing.Dict[str, typing.Any] = {"name": name, "file_ids": file_ids}
+        if schema_id is not OMIT:
+            _request["schema_id"] = schema_id
+        if project_id is not OMIT:
+            _request["project_id"] = project_id
+        if stream is not OMIT:
+            _request["stream"] = stream
         _response = await self._client_wrapper.httpx_client.request(
-            "GET",
-            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas"),
-            params=remove_none_from_dict({"project_id": project_id}),
+            "POST",
+            urllib.parse.urljoin(f"{self._client_wrapper.get_base_url()}/", "api/v1/extraction/schemas/infer"),
+            json=jsonable_encoder(_request),
             headers=self._client_wrapper.get_headers(),
             timeout=60,
         )
         if 200 <= _response.status_code < 300:
-            return pydantic.parse_obj_as(typing.List[ExtractionSchema], _response.json())  # type: ignore
+            return pydantic.parse_obj_as(ExtractionSchema, _response.json())  # type: ignore
         if _response.status_code == 422:
             raise UnprocessableEntityError(pydantic.parse_obj_as(HttpValidationError, _response.json()))  # type: ignore
         try:

llama_cloud/resources/extraction/types/__init__.py CHANGED Viewed

@@ -1,5 +1,6 @@
 # This file was auto-generated by Fern from our API Definition.
+from .extraction_schema_create_data_schema_value import ExtractionSchemaCreateDataSchemaValue
 from .extraction_schema_update_data_schema_value import ExtractionSchemaUpdateDataSchemaValue
-__all__ = ["ExtractionSchemaUpdateDataSchemaValue"]
+__all__ = ["ExtractionSchemaCreateDataSchemaValue", "ExtractionSchemaUpdateDataSchemaValue"]

llama_cloud/resources/extraction/types/extraction_schema_create_data_schema_value.py ADDED Viewed

@@ -0,0 +1,7 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+ExtractionSchemaCreateDataSchemaValue = typing.Union[
+    typing.Dict[str, typing.Any], typing.List[typing.Any], str, int, float, bool
+]

llama_cloud/resources/pipelines/__init__.py CHANGED Viewed

@@ -1,5 +1,15 @@
 # This file was auto-generated by Fern from our API Definition.
-from .types import PipelineFileUpdateCustomMetadataValue
+from .types import (
+    PipelineFileUpdateCustomMetadataValue,
+    PipelineUpdateTransformConfig,
+    PipelineUpdateTransformConfig_Advanced,
+    PipelineUpdateTransformConfig_Auto,
+)
-__all__ = ["PipelineFileUpdateCustomMetadataValue"]
+__all__ = [
+    "PipelineFileUpdateCustomMetadataValue",
+    "PipelineUpdateTransformConfig",
+    "PipelineUpdateTransformConfig_Advanced",
+    "PipelineUpdateTransformConfig_Auto",
+]

llama_cloud/resources/pipelines/client.py CHANGED Viewed

@@ -15,6 +15,7 @@ from ...types.cloud_document import CloudDocument
 from ...types.cloud_document_create import CloudDocumentCreate
 from ...types.configured_transformation_item import ConfiguredTransformationItem
 from ...types.data_sink_create import DataSinkCreate
+from ...types.embedding_config import EmbeddingConfig
 from ...types.eval_dataset_job_record import EvalDatasetJobRecord
 from ...types.eval_execution_params import EvalExecutionParams
 from ...types.eval_execution_params_override import EvalExecutionParamsOverride
@@ -36,6 +37,7 @@ from ...types.retrieval_mode import RetrievalMode
 from ...types.retrieve_results import RetrieveResults
 from ...types.text_node import TextNode
 from .types.pipeline_file_update_custom_metadata_value import PipelineFileUpdateCustomMetadataValue
+from .types.pipeline_update_transform_config import PipelineUpdateTransformConfig
 try:
     import pydantic
@@ -119,6 +121,8 @@ class PipelinesClient:
         from llama_cloud import (
             ConfigurableDataSinkNames,
             DataSinkCreate,
+            EmbeddingConfig,
+            EmbeddingConfigType,
             EvalExecutionParams,
             FilterCondition,
             LlamaParseParameters,
@@ -136,6 +140,9 @@ class PipelinesClient:
         )
         client.pipelines.create_pipeline(
             request=PipelineCreate(
+                embedding_config=EmbeddingConfig(
+                    type=EmbeddingConfigType.OPENAI_EMBEDDING,
+                ),
                 data_sink=DataSinkCreate(
                     name="string",
                     sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -187,6 +194,8 @@ class PipelinesClient:
         from llama_cloud import (
             ConfigurableDataSinkNames,
             DataSinkCreate,
+            EmbeddingConfig,
+            EmbeddingConfigType,
             EvalExecutionParams,
             FilterCondition,
             LlamaParseParameters,
@@ -204,6 +213,9 @@ class PipelinesClient:
         )
         client.pipelines.upsert_pipeline(
             request=PipelineCreate(
+                embedding_config=EmbeddingConfig(
+                    type=EmbeddingConfigType.OPENAI_EMBEDDING,
+                ),
                 data_sink=DataSinkCreate(
                     name="string",
                     sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -278,6 +290,8 @@ class PipelinesClient:
         self,
         pipeline_id: str,
         *,
+        embedding_config: typing.Optional[EmbeddingConfig] = OMIT,
+        transform_config: typing.Optional[PipelineUpdateTransformConfig] = OMIT,
         configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]] = OMIT,
         data_sink_id: typing.Optional[str] = OMIT,
         data_sink: typing.Optional[DataSinkCreate] = OMIT,
@@ -293,7 +307,11 @@ class PipelinesClient:
         Parameters:
             - pipeline_id: str.
-            - configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]].
+            - embedding_config: typing.Optional[EmbeddingConfig]. Configuration for the embedding model.
+            - transform_config: typing.Optional[PipelineUpdateTransformConfig]. Configuration for the transformation.
+            - configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]]. List of configured transformations.
             - data_sink_id: typing.Optional[str]. Data sink ID. When provided instead of data_sink, the data sink will be looked up by ID.
@@ -312,6 +330,8 @@ class PipelinesClient:
         from llama_cloud import (
             ConfigurableDataSinkNames,
             DataSinkCreate,
+            EmbeddingConfig,
+            EmbeddingConfigType,
             EvalExecutionParams,
             FilterCondition,
             LlamaParseParameters,
@@ -327,6 +347,9 @@ class PipelinesClient:
         )
         client.pipelines.update_existing_pipeline(
             pipeline_id="string",
+            embedding_config=EmbeddingConfig(
+                type=EmbeddingConfigType.OPENAI_EMBEDDING,
+            ),
             data_sink=DataSinkCreate(
                 name="string",
                 sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -345,6 +368,10 @@ class PipelinesClient:
         )
         """
         _request: typing.Dict[str, typing.Any] = {}
+        if embedding_config is not OMIT:
+            _request["embedding_config"] = embedding_config
+        if transform_config is not OMIT:
+            _request["transform_config"] = transform_config
         if configured_transformations is not OMIT:
             _request["configured_transformations"] = configured_transformations
         if data_sink_id is not OMIT:
@@ -1281,6 +1308,7 @@ class PipelinesClient:
         from llama_cloud import (
             ChatData,
             FilterCondition,
+            LlmParameters,
             MetadataFilters,
             PresetRetrievalParams,
             RetrievalMode,
@@ -1301,6 +1329,7 @@ class PipelinesClient:
                     ),
                     retrieval_mode=RetrievalMode.CHUNKS,
                 ),
+                llm_parameters=LlmParameters(),
             ),
         )
         """
@@ -1678,6 +1707,8 @@ class AsyncPipelinesClient:
         from llama_cloud import (
             ConfigurableDataSinkNames,
             DataSinkCreate,
+            EmbeddingConfig,
+            EmbeddingConfigType,
             EvalExecutionParams,
             FilterCondition,
             LlamaParseParameters,
@@ -1695,6 +1726,9 @@ class AsyncPipelinesClient:
         )
         await client.pipelines.create_pipeline(
             request=PipelineCreate(
+                embedding_config=EmbeddingConfig(
+                    type=EmbeddingConfigType.OPENAI_EMBEDDING,
+                ),
                 data_sink=DataSinkCreate(
                     name="string",
                     sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -1746,6 +1780,8 @@ class AsyncPipelinesClient:
         from llama_cloud import (
             ConfigurableDataSinkNames,
             DataSinkCreate,
+            EmbeddingConfig,
+            EmbeddingConfigType,
             EvalExecutionParams,
             FilterCondition,
             LlamaParseParameters,
@@ -1763,6 +1799,9 @@ class AsyncPipelinesClient:
         )
         await client.pipelines.upsert_pipeline(
             request=PipelineCreate(
+                embedding_config=EmbeddingConfig(
+                    type=EmbeddingConfigType.OPENAI_EMBEDDING,
+                ),
                 data_sink=DataSinkCreate(
                     name="string",
                     sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -1837,6 +1876,8 @@ class AsyncPipelinesClient:
         self,
         pipeline_id: str,
         *,
+        embedding_config: typing.Optional[EmbeddingConfig] = OMIT,
+        transform_config: typing.Optional[PipelineUpdateTransformConfig] = OMIT,
         configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]] = OMIT,
         data_sink_id: typing.Optional[str] = OMIT,
         data_sink: typing.Optional[DataSinkCreate] = OMIT,
@@ -1852,7 +1893,11 @@ class AsyncPipelinesClient:
         Parameters:
             - pipeline_id: str.
-            - configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]].
+            - embedding_config: typing.Optional[EmbeddingConfig]. Configuration for the embedding model.
+            - transform_config: typing.Optional[PipelineUpdateTransformConfig]. Configuration for the transformation.
+            - configured_transformations: typing.Optional[typing.List[ConfiguredTransformationItem]]. List of configured transformations.
             - data_sink_id: typing.Optional[str]. Data sink ID. When provided instead of data_sink, the data sink will be looked up by ID.
@@ -1871,6 +1916,8 @@ class AsyncPipelinesClient:
         from llama_cloud import (
             ConfigurableDataSinkNames,
             DataSinkCreate,
+            EmbeddingConfig,
+            EmbeddingConfigType,
             EvalExecutionParams,
             FilterCondition,
             LlamaParseParameters,
@@ -1886,6 +1933,9 @@ class AsyncPipelinesClient:
         )
         await client.pipelines.update_existing_pipeline(
             pipeline_id="string",
+            embedding_config=EmbeddingConfig(
+                type=EmbeddingConfigType.OPENAI_EMBEDDING,
+            ),
             data_sink=DataSinkCreate(
                 name="string",
                 sink_type=ConfigurableDataSinkNames.CHROMA,
@@ -1904,6 +1954,10 @@ class AsyncPipelinesClient:
         )
         """
         _request: typing.Dict[str, typing.Any] = {}
+        if embedding_config is not OMIT:
+            _request["embedding_config"] = embedding_config
+        if transform_config is not OMIT:
+            _request["transform_config"] = transform_config
         if configured_transformations is not OMIT:
             _request["configured_transformations"] = configured_transformations
         if data_sink_id is not OMIT:
@@ -2842,6 +2896,7 @@ class AsyncPipelinesClient:
         from llama_cloud import (
             ChatData,
             FilterCondition,
+            LlmParameters,
             MetadataFilters,
             PresetRetrievalParams,
             RetrievalMode,
@@ -2862,6 +2917,7 @@ class AsyncPipelinesClient:
                     ),
                     retrieval_mode=RetrievalMode.CHUNKS,
                 ),
+                llm_parameters=LlmParameters(),
             ),
         )
         """

llama_cloud/resources/pipelines/types/__init__.py CHANGED Viewed

@@ -1,5 +1,15 @@
 # This file was auto-generated by Fern from our API Definition.
 from .pipeline_file_update_custom_metadata_value import PipelineFileUpdateCustomMetadataValue
+from .pipeline_update_transform_config import (
+    PipelineUpdateTransformConfig,
+    PipelineUpdateTransformConfig_Advanced,
+    PipelineUpdateTransformConfig_Auto,
+)
-__all__ = ["PipelineFileUpdateCustomMetadataValue"]
+__all__ = [
+    "PipelineFileUpdateCustomMetadataValue",
+    "PipelineUpdateTransformConfig",
+    "PipelineUpdateTransformConfig_Advanced",
+    "PipelineUpdateTransformConfig_Auto",
+]

llama_cloud/resources/pipelines/types/pipeline_update_transform_config.py ADDED Viewed

@@ -0,0 +1,31 @@
+# This file was auto-generated by Fern from our API Definition.
+from __future__ import annotations
+import typing
+import typing_extensions
+from ....types.advanced_mode_transform_config import AdvancedModeTransformConfig
+from ....types.auto_transform_config import AutoTransformConfig
+class PipelineUpdateTransformConfig_Auto(AutoTransformConfig):
+    mode: typing_extensions.Literal["auto"]
+    class Config:
+        frozen = True
+        smart_union = True
+        allow_population_by_field_name = True
+class PipelineUpdateTransformConfig_Advanced(AdvancedModeTransformConfig):
+    mode: typing_extensions.Literal["advanced"]
+    class Config:
+        frozen = True
+        smart_union = True
+        allow_population_by_field_name = True
+PipelineUpdateTransformConfig = typing.Union[PipelineUpdateTransformConfig_Auto, PipelineUpdateTransformConfig_Advanced]

llama-cloud 0.0.10__py3-none-any.whl → 0.0.12__py3-none-any.whl

Potentially problematic release.

llama-cloud 0.0.10__py3-none-any.whl → 0.0.12__py3-none-any.whl