llama-stack 0.4.3__py3-none-any.whl → 0.5.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- llama_stack/cli/stack/_list_deps.py +11 -7
- llama_stack/cli/stack/run.py +3 -25
- llama_stack/core/access_control/datatypes.py +78 -0
- llama_stack/core/configure.py +2 -2
- {llama_stack_api/internal → llama_stack/core/connectors}/__init__.py +2 -2
- llama_stack/core/connectors/connectors.py +162 -0
- llama_stack/core/conversations/conversations.py +61 -58
- llama_stack/core/datatypes.py +54 -8
- llama_stack/core/library_client.py +60 -13
- llama_stack/core/prompts/prompts.py +43 -42
- llama_stack/core/routers/datasets.py +20 -17
- llama_stack/core/routers/eval_scoring.py +143 -53
- llama_stack/core/routers/inference.py +20 -9
- llama_stack/core/routers/safety.py +30 -42
- llama_stack/core/routers/vector_io.py +15 -7
- llama_stack/core/routing_tables/models.py +42 -3
- llama_stack/core/routing_tables/scoring_functions.py +19 -19
- llama_stack/core/routing_tables/shields.py +20 -17
- llama_stack/core/routing_tables/vector_stores.py +8 -5
- llama_stack/core/server/auth.py +192 -17
- llama_stack/core/server/fastapi_router_registry.py +40 -5
- llama_stack/core/server/server.py +24 -5
- llama_stack/core/stack.py +54 -10
- llama_stack/core/storage/datatypes.py +9 -0
- llama_stack/core/store/registry.py +1 -1
- llama_stack/core/utils/exec.py +2 -2
- llama_stack/core/utils/type_inspection.py +16 -2
- llama_stack/distributions/dell/config.yaml +4 -1
- llama_stack/distributions/dell/doc_template.md +209 -0
- llama_stack/distributions/dell/run-with-safety.yaml +4 -1
- llama_stack/distributions/nvidia/config.yaml +4 -1
- llama_stack/distributions/nvidia/doc_template.md +170 -0
- llama_stack/distributions/nvidia/run-with-safety.yaml +4 -1
- llama_stack/distributions/oci/config.yaml +4 -1
- llama_stack/distributions/oci/doc_template.md +140 -0
- llama_stack/distributions/open-benchmark/config.yaml +9 -1
- llama_stack/distributions/postgres-demo/config.yaml +1 -1
- llama_stack/distributions/starter/build.yaml +62 -0
- llama_stack/distributions/starter/config.yaml +22 -3
- llama_stack/distributions/starter/run-with-postgres-store.yaml +22 -3
- llama_stack/distributions/starter/starter.py +13 -1
- llama_stack/distributions/starter-gpu/build.yaml +62 -0
- llama_stack/distributions/starter-gpu/config.yaml +22 -3
- llama_stack/distributions/starter-gpu/run-with-postgres-store.yaml +22 -3
- llama_stack/distributions/template.py +10 -2
- llama_stack/distributions/watsonx/config.yaml +4 -1
- llama_stack/log.py +1 -0
- llama_stack/models/llama/resources/dog.jpg +0 -0
- llama_stack/models/llama/resources/pasta.jpeg +0 -0
- llama_stack/models/llama/resources/small_dog.jpg +0 -0
- llama_stack/providers/inline/agents/meta_reference/__init__.py +1 -0
- llama_stack/providers/inline/agents/meta_reference/agents.py +58 -61
- llama_stack/providers/inline/agents/meta_reference/responses/openai_responses.py +187 -60
- llama_stack/providers/inline/agents/meta_reference/responses/streaming.py +99 -22
- llama_stack/providers/inline/agents/meta_reference/responses/types.py +2 -1
- llama_stack/providers/inline/agents/meta_reference/responses/utils.py +4 -1
- llama_stack/providers/inline/agents/meta_reference/safety.py +2 -2
- llama_stack/providers/inline/batches/reference/batches.py +2 -1
- llama_stack/providers/inline/eval/meta_reference/eval.py +40 -32
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.h +9 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.swift +189 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl/Parsing.swift +238 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl/PromptTemplate.swift +12 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl/SystemPrompts.swift +89 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.pbxproj +550 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -0
- llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +8 -0
- llama_stack/providers/inline/post_training/huggingface/post_training.py +33 -38
- llama_stack/providers/inline/post_training/huggingface/utils.py +2 -5
- llama_stack/providers/inline/post_training/torchtune/common/utils.py +5 -9
- llama_stack/providers/inline/post_training/torchtune/post_training.py +28 -33
- llama_stack/providers/inline/post_training/torchtune/recipes/lora_finetuning_single_device.py +2 -4
- llama_stack/providers/inline/safety/code_scanner/code_scanner.py +12 -15
- llama_stack/providers/inline/safety/llama_guard/llama_guard.py +20 -24
- llama_stack/providers/inline/safety/prompt_guard/prompt_guard.py +11 -17
- llama_stack/providers/inline/scoring/basic/scoring.py +13 -17
- llama_stack/providers/inline/scoring/braintrust/braintrust.py +15 -15
- llama_stack/providers/inline/scoring/llm_as_judge/scoring.py +13 -17
- llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py +1 -1
- llama_stack/providers/registry/agents.py +1 -0
- llama_stack/providers/registry/inference.py +1 -9
- llama_stack/providers/registry/vector_io.py +136 -16
- llama_stack/providers/remote/datasetio/nvidia/README.md +74 -0
- llama_stack/providers/remote/eval/nvidia/README.md +134 -0
- llama_stack/providers/remote/eval/nvidia/eval.py +22 -21
- llama_stack/providers/remote/files/s3/README.md +266 -0
- llama_stack/providers/remote/files/s3/config.py +5 -3
- llama_stack/providers/remote/files/s3/files.py +2 -2
- llama_stack/providers/remote/inference/gemini/gemini.py +4 -0
- llama_stack/providers/remote/inference/nvidia/NVIDIA.md +203 -0
- llama_stack/providers/remote/inference/openai/openai.py +2 -0
- llama_stack/providers/remote/inference/together/together.py +4 -0
- llama_stack/providers/remote/inference/vertexai/config.py +3 -3
- llama_stack/providers/remote/inference/vertexai/vertexai.py +5 -2
- llama_stack/providers/remote/inference/vllm/config.py +37 -18
- llama_stack/providers/remote/inference/vllm/vllm.py +0 -3
- llama_stack/providers/remote/inference/watsonx/watsonx.py +4 -0
- llama_stack/providers/remote/post_training/nvidia/README.md +151 -0
- llama_stack/providers/remote/post_training/nvidia/models.py +3 -11
- llama_stack/providers/remote/post_training/nvidia/post_training.py +31 -33
- llama_stack/providers/remote/safety/bedrock/bedrock.py +10 -27
- llama_stack/providers/remote/safety/nvidia/README.md +78 -0
- llama_stack/providers/remote/safety/nvidia/nvidia.py +9 -25
- llama_stack/providers/remote/safety/sambanova/sambanova.py +13 -11
- llama_stack/providers/remote/vector_io/elasticsearch/__init__.py +17 -0
- llama_stack/providers/remote/vector_io/elasticsearch/config.py +32 -0
- llama_stack/providers/remote/vector_io/elasticsearch/elasticsearch.py +463 -0
- llama_stack/providers/remote/vector_io/oci/__init__.py +22 -0
- llama_stack/providers/remote/vector_io/oci/config.py +41 -0
- llama_stack/providers/remote/vector_io/oci/oci26ai.py +595 -0
- llama_stack/providers/remote/vector_io/pgvector/config.py +69 -2
- llama_stack/providers/remote/vector_io/pgvector/pgvector.py +255 -6
- llama_stack/providers/remote/vector_io/qdrant/qdrant.py +62 -38
- llama_stack/providers/utils/bedrock/client.py +3 -3
- llama_stack/providers/utils/bedrock/config.py +7 -7
- llama_stack/providers/utils/inference/__init__.py +0 -25
- llama_stack/providers/utils/inference/embedding_mixin.py +4 -0
- llama_stack/providers/utils/inference/http_client.py +239 -0
- llama_stack/providers/utils/inference/litellm_openai_mixin.py +6 -0
- llama_stack/providers/utils/inference/model_registry.py +148 -2
- llama_stack/providers/utils/inference/openai_compat.py +1 -158
- llama_stack/providers/utils/inference/openai_mixin.py +42 -2
- llama_stack/providers/utils/inference/prompt_adapter.py +0 -209
- llama_stack/providers/utils/memory/openai_vector_store_mixin.py +92 -5
- llama_stack/providers/utils/memory/vector_store.py +46 -19
- llama_stack/providers/utils/responses/responses_store.py +40 -6
- llama_stack/providers/utils/safety.py +114 -0
- llama_stack/providers/utils/tools/mcp.py +44 -3
- llama_stack/testing/api_recorder.py +9 -3
- {llama_stack-0.4.3.dist-info → llama_stack-0.5.0.dist-info}/METADATA +14 -2
- {llama_stack-0.4.3.dist-info → llama_stack-0.5.0.dist-info}/RECORD +135 -279
- llama_stack-0.5.0.dist-info/top_level.txt +1 -0
- llama_stack/distributions/meta-reference-gpu/__init__.py +0 -7
- llama_stack/distributions/meta-reference-gpu/config.yaml +0 -140
- llama_stack/distributions/meta-reference-gpu/meta_reference.py +0 -163
- llama_stack/distributions/meta-reference-gpu/run-with-safety.yaml +0 -155
- llama_stack/models/llama/hadamard_utils.py +0 -88
- llama_stack/models/llama/llama3/args.py +0 -74
- llama_stack/models/llama/llama3/generation.py +0 -378
- llama_stack/models/llama/llama3/model.py +0 -304
- llama_stack/models/llama/llama3/multimodal/__init__.py +0 -12
- llama_stack/models/llama/llama3/multimodal/encoder_utils.py +0 -180
- llama_stack/models/llama/llama3/multimodal/image_transform.py +0 -409
- llama_stack/models/llama/llama3/multimodal/model.py +0 -1430
- llama_stack/models/llama/llama3/multimodal/utils.py +0 -26
- llama_stack/models/llama/llama3/quantization/__init__.py +0 -5
- llama_stack/models/llama/llama3/quantization/loader.py +0 -316
- llama_stack/models/llama/llama3_1/__init__.py +0 -12
- llama_stack/models/llama/llama3_1/prompt_format.md +0 -358
- llama_stack/models/llama/llama3_1/prompts.py +0 -258
- llama_stack/models/llama/llama3_2/__init__.py +0 -5
- llama_stack/models/llama/llama3_2/prompts_text.py +0 -229
- llama_stack/models/llama/llama3_2/prompts_vision.py +0 -126
- llama_stack/models/llama/llama3_2/text_prompt_format.md +0 -286
- llama_stack/models/llama/llama3_2/vision_prompt_format.md +0 -141
- llama_stack/models/llama/llama3_3/__init__.py +0 -5
- llama_stack/models/llama/llama3_3/prompts.py +0 -259
- llama_stack/models/llama/llama4/args.py +0 -107
- llama_stack/models/llama/llama4/ffn.py +0 -58
- llama_stack/models/llama/llama4/moe.py +0 -214
- llama_stack/models/llama/llama4/preprocess.py +0 -435
- llama_stack/models/llama/llama4/quantization/__init__.py +0 -5
- llama_stack/models/llama/llama4/quantization/loader.py +0 -226
- llama_stack/models/llama/llama4/vision/__init__.py +0 -5
- llama_stack/models/llama/llama4/vision/embedding.py +0 -210
- llama_stack/models/llama/llama4/vision/encoder.py +0 -412
- llama_stack/models/llama/quantize_impls.py +0 -316
- llama_stack/providers/inline/inference/meta_reference/__init__.py +0 -20
- llama_stack/providers/inline/inference/meta_reference/common.py +0 -24
- llama_stack/providers/inline/inference/meta_reference/config.py +0 -68
- llama_stack/providers/inline/inference/meta_reference/generators.py +0 -201
- llama_stack/providers/inline/inference/meta_reference/inference.py +0 -542
- llama_stack/providers/inline/inference/meta_reference/model_parallel.py +0 -77
- llama_stack/providers/inline/inference/meta_reference/parallel_utils.py +0 -353
- llama_stack-0.4.3.dist-info/top_level.txt +0 -2
- llama_stack_api/__init__.py +0 -945
- llama_stack_api/admin/__init__.py +0 -45
- llama_stack_api/admin/api.py +0 -72
- llama_stack_api/admin/fastapi_routes.py +0 -117
- llama_stack_api/admin/models.py +0 -113
- llama_stack_api/agents.py +0 -173
- llama_stack_api/batches/__init__.py +0 -40
- llama_stack_api/batches/api.py +0 -53
- llama_stack_api/batches/fastapi_routes.py +0 -113
- llama_stack_api/batches/models.py +0 -78
- llama_stack_api/benchmarks/__init__.py +0 -43
- llama_stack_api/benchmarks/api.py +0 -39
- llama_stack_api/benchmarks/fastapi_routes.py +0 -109
- llama_stack_api/benchmarks/models.py +0 -109
- llama_stack_api/common/__init__.py +0 -5
- llama_stack_api/common/content_types.py +0 -101
- llama_stack_api/common/errors.py +0 -95
- llama_stack_api/common/job_types.py +0 -38
- llama_stack_api/common/responses.py +0 -77
- llama_stack_api/common/training_types.py +0 -47
- llama_stack_api/common/type_system.py +0 -146
- llama_stack_api/connectors.py +0 -146
- llama_stack_api/conversations.py +0 -270
- llama_stack_api/datasetio.py +0 -55
- llama_stack_api/datasets/__init__.py +0 -61
- llama_stack_api/datasets/api.py +0 -35
- llama_stack_api/datasets/fastapi_routes.py +0 -104
- llama_stack_api/datasets/models.py +0 -152
- llama_stack_api/datatypes.py +0 -373
- llama_stack_api/eval.py +0 -137
- llama_stack_api/file_processors/__init__.py +0 -27
- llama_stack_api/file_processors/api.py +0 -64
- llama_stack_api/file_processors/fastapi_routes.py +0 -78
- llama_stack_api/file_processors/models.py +0 -42
- llama_stack_api/files/__init__.py +0 -35
- llama_stack_api/files/api.py +0 -51
- llama_stack_api/files/fastapi_routes.py +0 -124
- llama_stack_api/files/models.py +0 -107
- llama_stack_api/inference.py +0 -1169
- llama_stack_api/inspect_api/__init__.py +0 -37
- llama_stack_api/inspect_api/api.py +0 -25
- llama_stack_api/inspect_api/fastapi_routes.py +0 -76
- llama_stack_api/inspect_api/models.py +0 -28
- llama_stack_api/internal/kvstore.py +0 -28
- llama_stack_api/internal/sqlstore.py +0 -81
- llama_stack_api/llama_stack_api/__init__.py +0 -945
- llama_stack_api/llama_stack_api/admin/__init__.py +0 -45
- llama_stack_api/llama_stack_api/admin/api.py +0 -72
- llama_stack_api/llama_stack_api/admin/fastapi_routes.py +0 -117
- llama_stack_api/llama_stack_api/admin/models.py +0 -113
- llama_stack_api/llama_stack_api/agents.py +0 -173
- llama_stack_api/llama_stack_api/batches/__init__.py +0 -40
- llama_stack_api/llama_stack_api/batches/api.py +0 -53
- llama_stack_api/llama_stack_api/batches/fastapi_routes.py +0 -113
- llama_stack_api/llama_stack_api/batches/models.py +0 -78
- llama_stack_api/llama_stack_api/benchmarks/__init__.py +0 -43
- llama_stack_api/llama_stack_api/benchmarks/api.py +0 -39
- llama_stack_api/llama_stack_api/benchmarks/fastapi_routes.py +0 -109
- llama_stack_api/llama_stack_api/benchmarks/models.py +0 -109
- llama_stack_api/llama_stack_api/common/__init__.py +0 -5
- llama_stack_api/llama_stack_api/common/content_types.py +0 -101
- llama_stack_api/llama_stack_api/common/errors.py +0 -95
- llama_stack_api/llama_stack_api/common/job_types.py +0 -38
- llama_stack_api/llama_stack_api/common/responses.py +0 -77
- llama_stack_api/llama_stack_api/common/training_types.py +0 -47
- llama_stack_api/llama_stack_api/common/type_system.py +0 -146
- llama_stack_api/llama_stack_api/connectors.py +0 -146
- llama_stack_api/llama_stack_api/conversations.py +0 -270
- llama_stack_api/llama_stack_api/datasetio.py +0 -55
- llama_stack_api/llama_stack_api/datasets/__init__.py +0 -61
- llama_stack_api/llama_stack_api/datasets/api.py +0 -35
- llama_stack_api/llama_stack_api/datasets/fastapi_routes.py +0 -104
- llama_stack_api/llama_stack_api/datasets/models.py +0 -152
- llama_stack_api/llama_stack_api/datatypes.py +0 -373
- llama_stack_api/llama_stack_api/eval.py +0 -137
- llama_stack_api/llama_stack_api/file_processors/__init__.py +0 -27
- llama_stack_api/llama_stack_api/file_processors/api.py +0 -64
- llama_stack_api/llama_stack_api/file_processors/fastapi_routes.py +0 -78
- llama_stack_api/llama_stack_api/file_processors/models.py +0 -42
- llama_stack_api/llama_stack_api/files/__init__.py +0 -35
- llama_stack_api/llama_stack_api/files/api.py +0 -51
- llama_stack_api/llama_stack_api/files/fastapi_routes.py +0 -124
- llama_stack_api/llama_stack_api/files/models.py +0 -107
- llama_stack_api/llama_stack_api/inference.py +0 -1169
- llama_stack_api/llama_stack_api/inspect_api/__init__.py +0 -37
- llama_stack_api/llama_stack_api/inspect_api/api.py +0 -25
- llama_stack_api/llama_stack_api/inspect_api/fastapi_routes.py +0 -76
- llama_stack_api/llama_stack_api/inspect_api/models.py +0 -28
- llama_stack_api/llama_stack_api/internal/__init__.py +0 -9
- llama_stack_api/llama_stack_api/internal/kvstore.py +0 -28
- llama_stack_api/llama_stack_api/internal/sqlstore.py +0 -81
- llama_stack_api/llama_stack_api/models.py +0 -171
- llama_stack_api/llama_stack_api/openai_responses.py +0 -1468
- llama_stack_api/llama_stack_api/post_training.py +0 -370
- llama_stack_api/llama_stack_api/prompts.py +0 -203
- llama_stack_api/llama_stack_api/providers/__init__.py +0 -33
- llama_stack_api/llama_stack_api/providers/api.py +0 -16
- llama_stack_api/llama_stack_api/providers/fastapi_routes.py +0 -57
- llama_stack_api/llama_stack_api/providers/models.py +0 -24
- llama_stack_api/llama_stack_api/py.typed +0 -0
- llama_stack_api/llama_stack_api/rag_tool.py +0 -168
- llama_stack_api/llama_stack_api/resource.py +0 -37
- llama_stack_api/llama_stack_api/router_utils.py +0 -160
- llama_stack_api/llama_stack_api/safety.py +0 -132
- llama_stack_api/llama_stack_api/schema_utils.py +0 -208
- llama_stack_api/llama_stack_api/scoring.py +0 -93
- llama_stack_api/llama_stack_api/scoring_functions.py +0 -211
- llama_stack_api/llama_stack_api/shields.py +0 -93
- llama_stack_api/llama_stack_api/tools.py +0 -226
- llama_stack_api/llama_stack_api/vector_io.py +0 -941
- llama_stack_api/llama_stack_api/vector_stores.py +0 -53
- llama_stack_api/llama_stack_api/version.py +0 -9
- llama_stack_api/models.py +0 -171
- llama_stack_api/openai_responses.py +0 -1468
- llama_stack_api/post_training.py +0 -370
- llama_stack_api/prompts.py +0 -203
- llama_stack_api/providers/__init__.py +0 -33
- llama_stack_api/providers/api.py +0 -16
- llama_stack_api/providers/fastapi_routes.py +0 -57
- llama_stack_api/providers/models.py +0 -24
- llama_stack_api/py.typed +0 -0
- llama_stack_api/rag_tool.py +0 -168
- llama_stack_api/resource.py +0 -37
- llama_stack_api/router_utils.py +0 -160
- llama_stack_api/safety.py +0 -132
- llama_stack_api/schema_utils.py +0 -208
- llama_stack_api/scoring.py +0 -93
- llama_stack_api/scoring_functions.py +0 -211
- llama_stack_api/shields.py +0 -93
- llama_stack_api/tools.py +0 -226
- llama_stack_api/vector_io.py +0 -941
- llama_stack_api/vector_stores.py +0 -53
- llama_stack_api/version.py +0 -9
- {llama_stack-0.4.3.dist-info → llama_stack-0.5.0.dist-info}/WHEEL +0 -0
- {llama_stack-0.4.3.dist-info → llama_stack-0.5.0.dist-info}/entry_points.txt +0 -0
- {llama_stack-0.4.3.dist-info → llama_stack-0.5.0.dist-info}/licenses/LICENSE +0 -0
@@ -1,941 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-from typing import Annotated, Any, Literal, Protocol, runtime_checkable
-
-from fastapi import Body, Query
-from pydantic import BaseModel, Field, field_validator
-
-from llama_stack_api.inference import InterleavedContent
-from llama_stack_api.schema_utils import json_schema_type, register_schema, webmethod
-from llama_stack_api.vector_stores import VectorStore
-from llama_stack_api.version import LLAMA_STACK_API_V1
-
-
-@json_schema_type
-class ChunkMetadata(BaseModel):
-    """
-    `ChunkMetadata` is backend metadata for a `Chunk` that is used to store additional information about the chunk that
-    will not be used in the context during inference, but is required for backend functionality. The `ChunkMetadata`
-    is set during chunk creation in `MemoryToolRuntimeImpl().insert()`and is not expected to change after.
-    Use `Chunk.metadata` for metadata that will be used in the context during inference.
-    :param chunk_id: The ID of the chunk. If not set, it will be generated based on the document ID and content.
-    :param document_id: The ID of the document this chunk belongs to.
-    :param source: The source of the content, such as a URL, file path, or other identifier.
-    :param created_timestamp: An optional timestamp indicating when the chunk was created.
-    :param updated_timestamp: An optional timestamp indicating when the chunk was last updated.
-    :param chunk_window: The window of the chunk, which can be used to group related chunks together.
-    :param chunk_tokenizer: The tokenizer used to create the chunk. Default is Tiktoken.
-    :param content_token_count: The number of tokens in the content of the chunk.
-    :param metadata_token_count: The number of tokens in the metadata of the chunk.
-    """
-
-    chunk_id: str | None = None
-    document_id: str | None = None
-    source: str | None = None
-    created_timestamp: int | None = None
-    updated_timestamp: int | None = None
-    chunk_window: str | None = None
-    chunk_tokenizer: str | None = None
-    content_token_count: int | None = None
-    metadata_token_count: int | None = None
-
-
-@json_schema_type
-class Chunk(BaseModel):
-    """
-    A chunk of content from file processing.
-    :param content: The content of the chunk, which can be interleaved text, images, or other types.
-    :param chunk_id: Unique identifier for the chunk. Must be provided explicitly.
-    :param metadata: Metadata associated with the chunk that will be used in the model context during inference.
-    :param chunk_metadata: Metadata for the chunk that will NOT be used in the context during inference.
-        The `chunk_metadata` is required backend functionality.
-    """
-
-    content: InterleavedContent
-    chunk_id: str
-    metadata: dict[str, Any] = Field(default_factory=dict)
-    chunk_metadata: ChunkMetadata
-
-    @property
-    def document_id(self) -> str | None:
-        """Returns the document_id from either metadata or chunk_metadata, with metadata taking precedence."""
-        # Check metadata first (takes precedence)
-        doc_id = self.metadata.get("document_id")
-        if doc_id is not None:
-            if not isinstance(doc_id, str):
-                raise TypeError(f"metadata['document_id'] must be a string, got {type(doc_id).__name__}: {doc_id!r}")
-            return doc_id
-
-        # Fall back to chunk_metadata if available (Pydantic ensures type safety)
-        if self.chunk_metadata is not None:
-            return self.chunk_metadata.document_id
-
-        return None
-
-
-@json_schema_type
-class EmbeddedChunk(Chunk):
-    """
-    A chunk of content with its embedding vector for vector database operations.
-    Inherits all fields from Chunk and adds embedding-related fields.
-    :param embedding: The embedding vector for the chunk content.
-    :param embedding_model: The model used to generate the embedding (e.g., 'openai/text-embedding-3-small').
-    :param embedding_dimension: The dimension of the embedding vector.
-    """
-
-    embedding: list[float]
-    embedding_model: str
-    embedding_dimension: int
-
-
-@json_schema_type
-class QueryChunksResponse(BaseModel):
-    """Response from querying chunks in a vector database.
-
-    :param chunks: List of embedded chunks returned from the query
-    :param scores: Relevance scores corresponding to each returned chunk
-    """
-
-    chunks: list[EmbeddedChunk]
-    scores: list[float]
-
-
-@json_schema_type
-class VectorStoreFileCounts(BaseModel):
-    """File processing status counts for a vector store.
-
-    :param completed: Number of files that have been successfully processed
-    :param cancelled: Number of files that had their processing cancelled
-    :param failed: Number of files that failed to process
-    :param in_progress: Number of files currently being processed
-    :param total: Total number of files in the vector store
-    """
-
-    completed: int
-    cancelled: int
-    failed: int
-    in_progress: int
-    total: int
-
-
-# TODO: rename this as OpenAIVectorStore
-@json_schema_type
-class VectorStoreObject(BaseModel):
-    """OpenAI Vector Store object.
-
-    :param id: Unique identifier for the vector store
-    :param object: Object type identifier, always "vector_store"
-    :param created_at: Timestamp when the vector store was created
-    :param name: (Optional) Name of the vector store
-    :param usage_bytes: Storage space used by the vector store in bytes
-    :param file_counts: File processing status counts for the vector store
-    :param status: Current status of the vector store
-    :param expires_after: (Optional) Expiration policy for the vector store
-    :param expires_at: (Optional) Timestamp when the vector store will expire
-    :param last_active_at: (Optional) Timestamp of last activity on the vector store
-    :param metadata: Set of key-value pairs that can be attached to the vector store
-    """
-
-    id: str
-    object: str = "vector_store"
-    created_at: int
-    name: str | None = None
-    usage_bytes: int = 0
-    file_counts: VectorStoreFileCounts
-    status: str = "completed"
-    expires_after: dict[str, Any] | None = None
-    expires_at: int | None = None
-    last_active_at: int | None = None
-    metadata: dict[str, Any] = Field(default_factory=dict)
-
-
-@json_schema_type
-class VectorStoreCreateRequest(BaseModel):
-    """Request to create a vector store.
-
-    :param name: (Optional) Name for the vector store
-    :param file_ids: List of file IDs to include in the vector store
-    :param expires_after: (Optional) Expiration policy for the vector store
-    :param chunking_strategy: (Optional) Strategy for splitting files into chunks
-    :param metadata: Set of key-value pairs that can be attached to the vector store
-    """
-
-    name: str | None = None
-    file_ids: list[str] = Field(default_factory=list)
-    expires_after: dict[str, Any] | None = None
-    chunking_strategy: dict[str, Any] | None = None
-    metadata: dict[str, Any] = Field(default_factory=dict)
-
-
-@json_schema_type
-class VectorStoreModifyRequest(BaseModel):
-    """Request to modify a vector store.
-
-    :param name: (Optional) Updated name for the vector store
-    :param expires_after: (Optional) Updated expiration policy for the vector store
-    :param metadata: (Optional) Updated set of key-value pairs for the vector store
-    """
-
-    name: str | None = None
-    expires_after: dict[str, Any] | None = None
-    metadata: dict[str, Any] | None = None
-
-
-@json_schema_type
-class VectorStoreListResponse(BaseModel):
-    """Response from listing vector stores.
-
-    :param object: Object type identifier, always "list"
-    :param data: List of vector store objects
-    :param first_id: (Optional) ID of the first vector store in the list for pagination
-    :param last_id: (Optional) ID of the last vector store in the list for pagination
-    :param has_more: Whether there are more vector stores available beyond this page
-    """
-
-    object: str = "list"
-    data: list[VectorStoreObject]
-    first_id: str | None = None
-    last_id: str | None = None
-    has_more: bool = False
-
-
-@json_schema_type
-class VectorStoreSearchRequest(BaseModel):
-    """Request to search a vector store.
-
-    :param query: Search query as a string or list of strings
-    :param filters: (Optional) Filters based on file attributes to narrow search results
-    :param max_num_results: Maximum number of results to return, defaults to 10
-    :param ranking_options: (Optional) Options for ranking and filtering search results
-    :param rewrite_query: Whether to rewrite the query for better vector search performance
-    """
-
-    query: str | list[str]
-    filters: dict[str, Any] | None = None
-    max_num_results: int = 10
-    ranking_options: dict[str, Any] | None = None
-    rewrite_query: bool = False
-
-
-@json_schema_type
-class VectorStoreContent(BaseModel):
-    """Content item from a vector store file or search result.
-
-    :param type: Content type, currently only "text" is supported
-    :param text: The actual text content
-    :param embedding: Optional embedding vector for this content chunk
-    :param chunk_metadata: Optional chunk metadata
-    :param metadata: Optional user-defined metadata
-    """
-
-    type: Literal["text"]
-    text: str
-    embedding: list[float] | None = None
-    chunk_metadata: ChunkMetadata | None = None
-    metadata: dict[str, Any] | None = None
-
-
-@json_schema_type
-class VectorStoreSearchResponse(BaseModel):
-    """Response from searching a vector store.
-
-    :param file_id: Unique identifier of the file containing the result
-    :param filename: Name of the file containing the result
-    :param score: Relevance score for this search result
-    :param attributes: (Optional) Key-value attributes associated with the file
-    :param content: List of content items matching the search query
-    """
-
-    file_id: str
-    filename: str
-    score: float
-    attributes: dict[str, str | float | bool] | None = None
-    content: list[VectorStoreContent]
-
-
-@json_schema_type
-class VectorStoreSearchResponsePage(BaseModel):
-    """Paginated response from searching a vector store.
-
-    :param object: Object type identifier for the search results page
-    :param search_query: The original search query that was executed
-    :param data: List of search result objects
-    :param has_more: Whether there are more results available beyond this page
-    :param next_page: (Optional) Token for retrieving the next page of results
-    """
-
-    object: str = "vector_store.search_results.page"
-    search_query: list[str]
-    data: list[VectorStoreSearchResponse]
-    has_more: bool = False
-    next_page: str | None = None
-
-
-@json_schema_type
-class VectorStoreDeleteResponse(BaseModel):
-    """Response from deleting a vector store.
-
-    :param id: Unique identifier of the deleted vector store
-    :param object: Object type identifier for the deletion response
-    :param deleted: Whether the deletion operation was successful
-    """
-
-    id: str
-    object: str = "vector_store.deleted"
-    deleted: bool = True
-
-
-@json_schema_type
-class VectorStoreFileContentResponse(BaseModel):
-    """Represents the parsed content of a vector store file.
-
-    :param object: The object type, which is always `vector_store.file_content.page`
-    :param data: Parsed content of the file
-    :param has_more: Indicates if there are more content pages to fetch
-    :param next_page: The token for the next page, if any
-    """
-
-    object: Literal["vector_store.file_content.page"] = "vector_store.file_content.page"
-    data: list[VectorStoreContent]
-    has_more: bool = False
-    next_page: str | None = None
-
-
-@json_schema_type
-class VectorStoreChunkingStrategyAuto(BaseModel):
-    """Automatic chunking strategy for vector store files.
-
-    :param type: Strategy type, always "auto" for automatic chunking
-    """
-
-    type: Literal["auto"] = "auto"
-
-
-@json_schema_type
-class VectorStoreChunkingStrategyStaticConfig(BaseModel):
-    """Configuration for static chunking strategy.
-
-    :param chunk_overlap_tokens: Number of tokens to overlap between adjacent chunks
-    :param max_chunk_size_tokens: Maximum number of tokens per chunk, must be between 100 and 4096
-    """
-
-    chunk_overlap_tokens: int = 400
-    max_chunk_size_tokens: int = Field(800, ge=100, le=4096)
-
-
-@json_schema_type
-class VectorStoreChunkingStrategyStatic(BaseModel):
-    """Static chunking strategy with configurable parameters.
-
-    :param type: Strategy type, always "static" for static chunking
-    :param static: Configuration parameters for the static chunking strategy
-    """
-
-    type: Literal["static"] = "static"
-    static: VectorStoreChunkingStrategyStaticConfig
-
-
-VectorStoreChunkingStrategy = Annotated[
-    VectorStoreChunkingStrategyAuto | VectorStoreChunkingStrategyStatic,
-    Field(discriminator="type"),
-]
-register_schema(VectorStoreChunkingStrategy, name="VectorStoreChunkingStrategy")
-
-
-class SearchRankingOptions(BaseModel):
-    """Options for ranking and filtering search results.
-
-    :param ranker: (Optional) Name of the ranking algorithm to use
-    :param score_threshold: (Optional) Minimum relevance score threshold for results
-    """
-
-    ranker: str | None = None
-    # NOTE: OpenAI File Search Tool requires threshold to be between 0 and 1, however
-    # we don't guarantee that the score is between 0 and 1, so will leave this unconstrained
-    # and let the provider handle it
-    score_threshold: float | None = Field(default=0.0)
-
-
-@json_schema_type
-class VectorStoreFileLastError(BaseModel):
-    """Error information for failed vector store file processing.
-
-    :param code: Error code indicating the type of failure
-    :param message: Human-readable error message describing the failure
-    """
-
-    code: Literal["server_error"] | Literal["rate_limit_exceeded"]
-    message: str
-
-
-VectorStoreFileStatus = Literal["completed"] | Literal["in_progress"] | Literal["cancelled"] | Literal["failed"]
-register_schema(VectorStoreFileStatus, name="VectorStoreFileStatus")
-
-
-# VectorStoreFileAttributes type with OpenAPI constraints
-VectorStoreFileAttributes = Annotated[
-    dict[str, Annotated[str, Field(max_length=512)] | float | bool],
-    Field(
-        max_length=16,
-        json_schema_extra={
-            "propertyNames": {"type": "string", "maxLength": 64},
-            "x-oaiTypeLabel": "map",
-        },
-        description=(
-            "Set of 16 key-value pairs that can be attached to an object. This can be "
-            "useful for storing additional information about the object in a structured "
-            "format, and querying for objects via API or the dashboard. Keys are strings "
-            "with a maximum length of 64 characters. Values are strings with a maximum "
-            "length of 512 characters, booleans, or numbers."
-        ),
-    ),
-]
-
-
-def _sanitize_vector_store_attributes(metadata: dict[str, Any] | None) -> dict[str, str | float | bool]:
-    """
-    Sanitize metadata to VectorStoreFileAttributes spec (max 16 properties, primitives only).
-
-    Converts dict[str, Any] to dict[str, str | float | bool]:
-    - Preserves: str (truncated to 512 chars), bool, int/float (as float)
-    - Converts: list -> comma-separated string
-    - Filters: dict, None, other types
-    - Enforces: max 16 properties, max 64 char keys, max 512 char string values
-    """
-    if not metadata:
-        return {}
-
-    sanitized: dict[str, str | float | bool] = {}
-    for key, value in metadata.items():
-        # Enforce max 16 properties
-        if len(sanitized) >= 16:
-            break
-
-        # Enforce max 64 char keys
-        if len(key) > 64:
-            continue
-
-        # Convert to supported primitive types
-        if isinstance(value, bool):
-            sanitized[key] = value
-        elif isinstance(value, int | float):
-            sanitized[key] = float(value)
-        elif isinstance(value, str):
-            # Enforce max 512 char string values
-            sanitized[key] = value[:512] if len(value) > 512 else value
-        elif isinstance(value, list):
-            # Convert lists to comma-separated strings (max 512 chars)
-            list_str = ", ".join(str(item) for item in value)
-            sanitized[key] = list_str[:512] if len(list_str) > 512 else list_str
-
-    return sanitized
-
-
-@json_schema_type
-class VectorStoreFileObject(BaseModel):
-    """OpenAI Vector Store File object.
-
-    :param id: Unique identifier for the file
-    :param object: Object type identifier, always "vector_store.file"
-    :param attributes: Key-value attributes associated with the file
-    :param chunking_strategy: Strategy used for splitting the file into chunks
-    :param created_at: Timestamp when the file was added to the vector store
-    :param last_error: (Optional) Error information if file processing failed
-    :param status: Current processing status of the file
-    :param usage_bytes: Storage space used by this file in bytes
-    :param vector_store_id: ID of the vector store containing this file
-    """
-
-    id: str
-    object: str = "vector_store.file"
-    attributes: VectorStoreFileAttributes = Field(default_factory=dict)
-    chunking_strategy: VectorStoreChunkingStrategy
-    created_at: int
-    last_error: VectorStoreFileLastError | None = None
-    status: VectorStoreFileStatus
-    usage_bytes: int = 0
-    vector_store_id: str
-
-    @field_validator("attributes", mode="before")
-    @classmethod
-    def _validate_attributes(cls, v: dict[str, Any] | None) -> dict[str, str | float | bool]:
-        """Sanitize attributes to match VectorStoreFileAttributes OpenAPI spec."""
-        return _sanitize_vector_store_attributes(v)
-
-
-@json_schema_type
-class VectorStoreListFilesResponse(BaseModel):
-    """Response from listing files in a vector store.
-
-    :param object: Object type identifier, always "list"
-    :param data: List of vector store file objects
-    :param first_id: (Optional) ID of the first file in the list for pagination
-    :param last_id: (Optional) ID of the last file in the list for pagination
-    :param has_more: Whether there are more files available beyond this page
-    """
-
-    object: str = "list"
-    data: list[VectorStoreFileObject]
-    first_id: str | None = None
-    last_id: str | None = None
-    has_more: bool = False
-
-
-@json_schema_type
-class VectorStoreFileDeleteResponse(BaseModel):
-    """Response from deleting a vector store file.
-
-    :param id: Unique identifier of the deleted file
-    :param object: Object type identifier for the deletion response
-    :param deleted: Whether the deletion operation was successful
-    """
-
-    id: str
-    object: str = "vector_store.file.deleted"
-    deleted: bool = True
-
-
-@json_schema_type
-class VectorStoreFileBatchObject(BaseModel):
-    """OpenAI Vector Store File Batch object.
-
-    :param id: Unique identifier for the file batch
-    :param object: Object type identifier, always "vector_store.file_batch"
-    :param created_at: Timestamp when the file batch was created
-    :param vector_store_id: ID of the vector store containing the file batch
-    :param status: Current processing status of the file batch
-    :param file_counts: File processing status counts for the batch
-    """
-
-    id: str
-    object: str = "vector_store.file_batch"
-    created_at: int
-    vector_store_id: str
-    status: VectorStoreFileStatus
-    file_counts: VectorStoreFileCounts
-
-
-@json_schema_type
-class VectorStoreFilesListInBatchResponse(BaseModel):
-    """Response from listing files in a vector store file batch.
-
-    :param object: Object type identifier, always "list"
-    :param data: List of vector store file objects in the batch
-    :param first_id: (Optional) ID of the first file in the list for pagination
-    :param last_id: (Optional) ID of the last file in the list for pagination
-    :param has_more: Whether there are more files available beyond this page
-    """
-
-    object: str = "list"
-    data: list[VectorStoreFileObject]
-    first_id: str | None = None
-    last_id: str | None = None
-    has_more: bool = False
-
-
-# extra_body can be accessed via .model_extra
-@json_schema_type
-class OpenAICreateVectorStoreRequestWithExtraBody(BaseModel, extra="allow"):
-    """Request to create a vector store with extra_body support.
-
-    :param name: (Optional) A name for the vector store
-    :param file_ids: List of file IDs to include in the vector store
-    :param expires_after: (Optional) Expiration policy for the vector store
-    :param chunking_strategy: (Optional) Strategy for splitting files into chunks
-    :param metadata: Set of key-value pairs that can be attached to the vector store
-    """
-
-    name: str | None = None
-    file_ids: list[str] | None = None
-    expires_after: dict[str, Any] | None = None
-    chunking_strategy: VectorStoreChunkingStrategy | None = None
-    metadata: dict[str, Any] | None = None
-
-
-# extra_body can be accessed via .model_extra
-@json_schema_type
-class OpenAICreateVectorStoreFileBatchRequestWithExtraBody(BaseModel, extra="allow"):
-    """Request to create a vector store file batch with extra_body support.
-
-    :param file_ids: A list of File IDs that the vector store should use
-    :param attributes: (Optional) Key-value attributes to store with the files
-    :param chunking_strategy: (Optional) The chunking strategy used to chunk the file(s). Defaults to auto
-    """
-
-    file_ids: list[str]
-    attributes: dict[str, Any] | None = None
-    chunking_strategy: VectorStoreChunkingStrategy | None = None
-
-
-class VectorStoreTable(Protocol):
-    def get_vector_store(self, vector_store_id: str) -> VectorStore | None: ...
-
-
-@runtime_checkable
-class VectorIO(Protocol):
-    vector_store_table: VectorStoreTable | None = None
-
-    # this will just block now until chunks are inserted, but it should
-    # probably return a Job instance which can be polled for completion
-    # TODO: rename vector_store_id to vector_store_id once Stainless is working
-    @webmethod(route="/vector-io/insert", method="POST", level=LLAMA_STACK_API_V1)
-    async def insert_chunks(
-        self,
-        vector_store_id: str,
-        chunks: list[EmbeddedChunk],
-        ttl_seconds: int | None = None,
-    ) -> None:
-        """Insert embedded chunks into a vector database.
-
-        :param vector_store_id: The identifier of the vector database to insert the chunks into.
-        :param chunks: The embedded chunks to insert. Each `EmbeddedChunk` contains the content, metadata,
-            and embedding vector ready for storage.
-        :param ttl_seconds: The time to live of the chunks.
-        """
-        ...
-
-    # TODO: rename vector_store_id to vector_store_id once Stainless is working
-    @webmethod(route="/vector-io/query", method="POST", level=LLAMA_STACK_API_V1)
-    async def query_chunks(
-        self,
-        vector_store_id: str,
-        query: InterleavedContent,
-        params: dict[str, Any] | None = None,
-    ) -> QueryChunksResponse:
-        """Query chunks from a vector database.
-
-        :param vector_store_id: The identifier of the vector database to query.
-        :param query: The query to search for.
-        :param params: The parameters of the query.
-        :returns: A QueryChunksResponse.
-        """
-        ...
-
-    # OpenAI Vector Stores API endpoints
-    @webmethod(route="/vector_stores", method="POST", level=LLAMA_STACK_API_V1)
-    async def openai_create_vector_store(
-        self,
-        params: Annotated[OpenAICreateVectorStoreRequestWithExtraBody, Body(...)],
-    ) -> VectorStoreObject:
-        """Creates a vector store.
-
-        Generate an OpenAI-compatible vector store with the given parameters.
-        :returns: A VectorStoreObject representing the created vector store.
-        """
-        ...
-
-    @webmethod(route="/vector_stores", method="GET", level=LLAMA_STACK_API_V1)
-    async def openai_list_vector_stores(
-        self,
-        limit: int | None = 20,
-        order: str | None = "desc",
-        after: str | None = None,
-        before: str | None = None,
-    ) -> VectorStoreListResponse:
-        """Returns a list of vector stores.
-
-        :param limit: A limit on the number of objects to be returned. Limit can range between 1 and 100, and the default is 20.
-        :param order: Sort order by the `created_at` timestamp of the objects. `asc` for ascending order and `desc` for descending order.
-        :param after: A cursor for use in pagination. `after` is an object ID that defines your place in the list.
-        :param before: A cursor for use in pagination. `before` is an object ID that defines your place in the list.
-        :returns: A VectorStoreListResponse containing the list of vector stores.
-        """
-        ...
-
-    @webmethod(route="/vector_stores/{vector_store_id}", method="GET", level=LLAMA_STACK_API_V1)
-    async def openai_retrieve_vector_store(
-        self,
-        vector_store_id: str,
-    ) -> VectorStoreObject:
-        """Retrieves a vector store.
-
-        :param vector_store_id: The ID of the vector store to retrieve.
-        :returns: A VectorStoreObject representing the vector store.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}",
-        method="POST",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_update_vector_store(
-        self,
-        vector_store_id: str,
-        name: str | None = None,
-        expires_after: dict[str, Any] | None = None,
-        metadata: dict[str, Any] | None = None,
-    ) -> VectorStoreObject:
-        """Updates a vector store.
-
-        :param vector_store_id: The ID of the vector store to update.
-        :param name: The name of the vector store.
-        :param expires_after: The expiration policy for a vector store.
-        :param metadata: Set of 16 key-value pairs that can be attached to an object.
-        :returns: A VectorStoreObject representing the updated vector store.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}",
-        method="DELETE",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_delete_vector_store(
-        self,
-        vector_store_id: str,
-    ) -> VectorStoreDeleteResponse:
-        """Delete a vector store.
-
-        :param vector_store_id: The ID of the vector store to delete.
-        :returns: A VectorStoreDeleteResponse indicating the deletion status.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/search",
-        method="POST",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_search_vector_store(
-        self,
-        vector_store_id: str,
-        query: str | list[str],
-        filters: dict[str, Any] | None = None,
-        max_num_results: int | None = 10,
-        ranking_options: SearchRankingOptions | None = None,
-        rewrite_query: bool | None = False,
-        search_mode: (
-            str | None
-        ) = "vector",  # Using str instead of Literal due to OpenAPI schema generator limitations
-    ) -> VectorStoreSearchResponsePage:
-        """Search for chunks in a vector store.
-
-        Searches a vector store for relevant chunks based on a query and optional file attribute filters.
-
-        :param vector_store_id: The ID of the vector store to search.
-        :param query: The query string or array for performing the search.
-        :param filters: Filters based on file attributes to narrow the search results.
-        :param max_num_results: Maximum number of results to return (1 to 50 inclusive, default 10).
-        :param ranking_options: Ranking options for fine-tuning the search results.
-        :param rewrite_query: Whether to rewrite the natural language query for vector search (default false)
-        :param search_mode: The search mode to use - "keyword", "vector", or "hybrid" (default "vector")
-        :returns: A VectorStoreSearchResponse containing the search results.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/files",
-        method="POST",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_attach_file_to_vector_store(
-        self,
-        vector_store_id: str,
-        file_id: str,
-        attributes: dict[str, Any] | None = None,
-        chunking_strategy: VectorStoreChunkingStrategy | None = None,
-    ) -> VectorStoreFileObject:
-        """Attach a file to a vector store.
-
-        :param vector_store_id: The ID of the vector store to attach the file to.
-        :param file_id: The ID of the file to attach to the vector store.
-        :param attributes: The key-value attributes stored with the file, which can be used for filtering.
-        :param chunking_strategy: The chunking strategy to use for the file.
-        :returns: A VectorStoreFileObject representing the attached file.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/files",
-        method="GET",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_list_files_in_vector_store(
-        self,
-        vector_store_id: str,
-        limit: int | None = 20,
-        order: str | None = "desc",
-        after: str | None = None,
-        before: str | None = None,
-        filter: VectorStoreFileStatus | None = None,
-    ) -> VectorStoreListFilesResponse:
-        """List files in a vector store.
-
-        :param vector_store_id: The ID of the vector store to list files from.
-        :param limit: (Optional) A limit on the number of objects to be returned. Limit can range between 1 and 100, and the default is 20.
-        :param order: (Optional) Sort order by the `created_at` timestamp of the objects. `asc` for ascending order and `desc` for descending order.
-        :param after: (Optional) A cursor for use in pagination. `after` is an object ID that defines your place in the list.
-        :param before: (Optional) A cursor for use in pagination. `before` is an object ID that defines your place in the list.
-        :param filter: (Optional) Filter by file status to only return files with the specified status.
-        :returns: A VectorStoreListFilesResponse containing the list of files.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/files/{file_id}",
-        method="GET",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_retrieve_vector_store_file(
-        self,
-        vector_store_id: str,
-        file_id: str,
-    ) -> VectorStoreFileObject:
-        """Retrieves a vector store file.
-
-        :param vector_store_id: The ID of the vector store containing the file to retrieve.
-        :param file_id: The ID of the file to retrieve.
-        :returns: A VectorStoreFileObject representing the file.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/files/{file_id}/content",
-        method="GET",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_retrieve_vector_store_file_contents(
-        self,
-        vector_store_id: str,
-        file_id: str,
-        include_embeddings: Annotated[bool | None, Query()] = False,
-        include_metadata: Annotated[bool | None, Query()] = False,
-    ) -> VectorStoreFileContentResponse:
-        """Retrieves the contents of a vector store file.
-
-        :param vector_store_id: The ID of the vector store containing the file to retrieve.
-        :param file_id: The ID of the file to retrieve.
-        :param include_embeddings: Whether to include embedding vectors in the response.
-        :param include_metadata: Whether to include chunk metadata in the response.
-        :returns: File contents, optionally with embeddings and metadata based on query parameters.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/files/{file_id}",
-        method="POST",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_update_vector_store_file(
-        self,
-        vector_store_id: str,
-        file_id: str,
-        attributes: dict[str, Any],
-    ) -> VectorStoreFileObject:
-        """Updates a vector store file.
-
-        :param vector_store_id: The ID of the vector store containing the file to update.
-        :param file_id: The ID of the file to update.
-        :param attributes: The updated key-value attributes to store with the file.
-        :returns: A VectorStoreFileObject representing the updated file.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/files/{file_id}",
-        method="DELETE",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_delete_vector_store_file(
-        self,
-        vector_store_id: str,
-        file_id: str,
-    ) -> VectorStoreFileDeleteResponse:
-        """Delete a vector store file.
-
-        :param vector_store_id: The ID of the vector store containing the file to delete.
-        :param file_id: The ID of the file to delete.
-        :returns: A VectorStoreFileDeleteResponse indicating the deletion status.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/file_batches",
-        method="POST",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_create_vector_store_file_batch(
-        self,
-        vector_store_id: str,
-        params: Annotated[OpenAICreateVectorStoreFileBatchRequestWithExtraBody, Body(...)],
-    ) -> VectorStoreFileBatchObject:
-        """Create a vector store file batch.
-
-        Generate an OpenAI-compatible vector store file batch for the given vector store.
-        :param vector_store_id: The ID of the vector store to create the file batch for.
-        :returns: A VectorStoreFileBatchObject representing the created file batch.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/file_batches/{batch_id}",
-        method="GET",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_retrieve_vector_store_file_batch(
-        self,
-        batch_id: str,
-        vector_store_id: str,
-    ) -> VectorStoreFileBatchObject:
-        """Retrieve a vector store file batch.
-
-        :param batch_id: The ID of the file batch to retrieve.
-        :param vector_store_id: The ID of the vector store containing the file batch.
-        :returns: A VectorStoreFileBatchObject representing the file batch.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/file_batches/{batch_id}/files",
-        method="GET",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_list_files_in_vector_store_file_batch(
-        self,
-        batch_id: str,
-        vector_store_id: str,
-        after: str | None = None,
-        before: str | None = None,
-        filter: str | None = None,
-        limit: int | None = 20,
-        order: str | None = "desc",
-    ) -> VectorStoreFilesListInBatchResponse:
-        """Returns a list of vector store files in a batch.
-
-        :param batch_id: The ID of the file batch to list files from.
-        :param vector_store_id: The ID of the vector store containing the file batch.
-        :param after: A cursor for use in pagination. `after` is an object ID that defines your place in the list.
-        :param before: A cursor for use in pagination. `before` is an object ID that defines your place in the list.
-        :param filter: Filter by file status. One of in_progress, completed, failed, cancelled.
-        :param limit: A limit on the number of objects to be returned. Limit can range between 1 and 100, and the default is 20.
-        :param order: Sort order by the `created_at` timestamp of the objects. `asc` for ascending order and `desc` for descending order.
-        :returns: A VectorStoreFilesListInBatchResponse containing the list of files in the batch.
-        """
-        ...
-
-    @webmethod(
-        route="/vector_stores/{vector_store_id}/file_batches/{batch_id}/cancel",
-        method="POST",
-        level=LLAMA_STACK_API_V1,
-    )
-    async def openai_cancel_vector_store_file_batch(
-        self,
-        batch_id: str,
-        vector_store_id: str,
-    ) -> VectorStoreFileBatchObject:
-        """Cancels a vector store file batch.
-
-        :param batch_id: The ID of the file batch to cancel.
-        :param vector_store_id: The ID of the vector store containing the file batch.
-        :returns: A VectorStoreFileBatchObject representing the cancelled file batch.
-        """
-        ...