PyPI - llama-stack - Versions diffs - 0.4.3__py3-none-any.whl → 0.5.0rc1__py3-none-any.whl - Mend

llama-stack 0.4.3__py3-none-any.whl → 0.5.0rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (307) hide show

llama_stack/cli/stack/_list_deps.py +11 -7
llama_stack/cli/stack/run.py +3 -25
llama_stack/core/access_control/datatypes.py +78 -0
llama_stack/core/configure.py +2 -2
{llama_stack_api/internal → llama_stack/core/connectors}/__init__.py +2 -2
llama_stack/core/connectors/connectors.py +162 -0
llama_stack/core/conversations/conversations.py +61 -58
llama_stack/core/datatypes.py +54 -8
llama_stack/core/library_client.py +60 -13
llama_stack/core/prompts/prompts.py +43 -42
llama_stack/core/routers/datasets.py +20 -17
llama_stack/core/routers/eval_scoring.py +143 -53
llama_stack/core/routers/inference.py +20 -9
llama_stack/core/routers/safety.py +30 -42
llama_stack/core/routers/vector_io.py +15 -7
llama_stack/core/routing_tables/models.py +42 -3
llama_stack/core/routing_tables/scoring_functions.py +19 -19
llama_stack/core/routing_tables/shields.py +20 -17
llama_stack/core/routing_tables/vector_stores.py +8 -5
llama_stack/core/server/auth.py +192 -17
llama_stack/core/server/fastapi_router_registry.py +40 -5
llama_stack/core/server/server.py +24 -5
llama_stack/core/stack.py +54 -10
llama_stack/core/storage/datatypes.py +9 -0
llama_stack/core/store/registry.py +1 -1
llama_stack/core/utils/exec.py +2 -2
llama_stack/core/utils/type_inspection.py +16 -2
llama_stack/distributions/dell/config.yaml +4 -1
llama_stack/distributions/dell/doc_template.md +209 -0
llama_stack/distributions/dell/run-with-safety.yaml +4 -1
llama_stack/distributions/nvidia/config.yaml +4 -1
llama_stack/distributions/nvidia/doc_template.md +170 -0
llama_stack/distributions/nvidia/run-with-safety.yaml +4 -1
llama_stack/distributions/oci/config.yaml +4 -1
llama_stack/distributions/oci/doc_template.md +140 -0
llama_stack/distributions/open-benchmark/config.yaml +9 -1
llama_stack/distributions/postgres-demo/config.yaml +1 -1
llama_stack/distributions/starter/build.yaml +62 -0
llama_stack/distributions/starter/config.yaml +22 -3
llama_stack/distributions/starter/run-with-postgres-store.yaml +22 -3
llama_stack/distributions/starter/starter.py +13 -1
llama_stack/distributions/starter-gpu/build.yaml +62 -0
llama_stack/distributions/starter-gpu/config.yaml +22 -3
llama_stack/distributions/starter-gpu/run-with-postgres-store.yaml +22 -3
llama_stack/distributions/template.py +10 -2
llama_stack/distributions/watsonx/config.yaml +4 -1
llama_stack/log.py +1 -0
llama_stack/models/llama/resources/dog.jpg +0 -0
llama_stack/models/llama/resources/pasta.jpeg +0 -0
llama_stack/models/llama/resources/small_dog.jpg +0 -0
llama_stack/providers/inline/agents/meta_reference/__init__.py +1 -0
llama_stack/providers/inline/agents/meta_reference/agents.py +57 -61
llama_stack/providers/inline/agents/meta_reference/responses/openai_responses.py +183 -60
llama_stack/providers/inline/agents/meta_reference/responses/streaming.py +94 -22
llama_stack/providers/inline/agents/meta_reference/responses/types.py +2 -1
llama_stack/providers/inline/agents/meta_reference/responses/utils.py +4 -1
llama_stack/providers/inline/agents/meta_reference/safety.py +2 -2
llama_stack/providers/inline/batches/reference/batches.py +2 -1
llama_stack/providers/inline/eval/meta_reference/eval.py +40 -32
llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.h +9 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.swift +189 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl/Parsing.swift +238 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl/PromptTemplate.swift +12 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl/SystemPrompts.swift +89 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.pbxproj +550 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -0
llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +8 -0
llama_stack/providers/inline/post_training/huggingface/post_training.py +33 -38
llama_stack/providers/inline/post_training/huggingface/utils.py +2 -5
llama_stack/providers/inline/post_training/torchtune/post_training.py +28 -33
llama_stack/providers/inline/post_training/torchtune/recipes/lora_finetuning_single_device.py +2 -4
llama_stack/providers/inline/safety/code_scanner/code_scanner.py +12 -15
llama_stack/providers/inline/safety/llama_guard/llama_guard.py +15 -18
llama_stack/providers/inline/safety/prompt_guard/prompt_guard.py +11 -17
llama_stack/providers/inline/scoring/basic/scoring.py +13 -17
llama_stack/providers/inline/scoring/braintrust/braintrust.py +15 -15
llama_stack/providers/inline/scoring/llm_as_judge/scoring.py +13 -17
llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py +1 -1
llama_stack/providers/registry/agents.py +1 -0
llama_stack/providers/registry/inference.py +1 -9
llama_stack/providers/registry/vector_io.py +136 -16
llama_stack/providers/remote/datasetio/nvidia/README.md +74 -0
llama_stack/providers/remote/eval/nvidia/README.md +134 -0
llama_stack/providers/remote/eval/nvidia/eval.py +22 -21
llama_stack/providers/remote/files/s3/README.md +266 -0
llama_stack/providers/remote/files/s3/config.py +5 -3
llama_stack/providers/remote/files/s3/files.py +2 -2
llama_stack/providers/remote/inference/gemini/gemini.py +4 -0
llama_stack/providers/remote/inference/nvidia/NVIDIA.md +203 -0
llama_stack/providers/remote/inference/openai/openai.py +2 -0
llama_stack/providers/remote/inference/together/together.py +4 -0
llama_stack/providers/remote/inference/vertexai/config.py +3 -3
llama_stack/providers/remote/inference/vertexai/vertexai.py +5 -2
llama_stack/providers/remote/inference/vllm/config.py +37 -18
llama_stack/providers/remote/inference/vllm/vllm.py +0 -3
llama_stack/providers/remote/inference/watsonx/watsonx.py +4 -0
llama_stack/providers/remote/post_training/nvidia/README.md +151 -0
llama_stack/providers/remote/post_training/nvidia/post_training.py +31 -33
llama_stack/providers/remote/safety/bedrock/bedrock.py +10 -27
llama_stack/providers/remote/safety/nvidia/README.md +78 -0
llama_stack/providers/remote/safety/nvidia/nvidia.py +9 -25
llama_stack/providers/remote/safety/sambanova/sambanova.py +13 -11
llama_stack/providers/remote/vector_io/elasticsearch/__init__.py +17 -0
llama_stack/providers/remote/vector_io/elasticsearch/config.py +32 -0
llama_stack/providers/remote/vector_io/elasticsearch/elasticsearch.py +463 -0
llama_stack/providers/remote/vector_io/oci/__init__.py +22 -0
llama_stack/providers/remote/vector_io/oci/config.py +41 -0
llama_stack/providers/remote/vector_io/oci/oci26ai.py +595 -0
llama_stack/providers/remote/vector_io/pgvector/config.py +69 -2
llama_stack/providers/remote/vector_io/pgvector/pgvector.py +255 -6
llama_stack/providers/remote/vector_io/qdrant/qdrant.py +62 -38
llama_stack/providers/utils/bedrock/client.py +3 -3
llama_stack/providers/utils/bedrock/config.py +7 -7
llama_stack/providers/utils/inference/embedding_mixin.py +4 -0
llama_stack/providers/utils/inference/http_client.py +239 -0
llama_stack/providers/utils/inference/litellm_openai_mixin.py +5 -0
llama_stack/providers/utils/inference/model_registry.py +148 -2
llama_stack/providers/utils/inference/openai_compat.py +2 -1
llama_stack/providers/utils/inference/openai_mixin.py +41 -2
llama_stack/providers/utils/memory/openai_vector_store_mixin.py +92 -5
llama_stack/providers/utils/memory/vector_store.py +46 -19
llama_stack/providers/utils/responses/responses_store.py +40 -6
llama_stack/providers/utils/safety.py +114 -0
llama_stack/providers/utils/tools/mcp.py +44 -3
llama_stack/testing/api_recorder.py +9 -3
{llama_stack-0.4.3.dist-info → llama_stack-0.5.0rc1.dist-info}/METADATA +14 -2
{llama_stack-0.4.3.dist-info → llama_stack-0.5.0rc1.dist-info}/RECORD +131 -275
llama_stack-0.5.0rc1.dist-info/top_level.txt +1 -0
llama_stack/distributions/meta-reference-gpu/__init__.py +0 -7
llama_stack/distributions/meta-reference-gpu/config.yaml +0 -140
llama_stack/distributions/meta-reference-gpu/meta_reference.py +0 -163
llama_stack/distributions/meta-reference-gpu/run-with-safety.yaml +0 -155
llama_stack/models/llama/hadamard_utils.py +0 -88
llama_stack/models/llama/llama3/args.py +0 -74
llama_stack/models/llama/llama3/generation.py +0 -378
llama_stack/models/llama/llama3/model.py +0 -304
llama_stack/models/llama/llama3/multimodal/__init__.py +0 -12
llama_stack/models/llama/llama3/multimodal/encoder_utils.py +0 -180
llama_stack/models/llama/llama3/multimodal/image_transform.py +0 -409
llama_stack/models/llama/llama3/multimodal/model.py +0 -1430
llama_stack/models/llama/llama3/multimodal/utils.py +0 -26
llama_stack/models/llama/llama3/quantization/__init__.py +0 -5
llama_stack/models/llama/llama3/quantization/loader.py +0 -316
llama_stack/models/llama/llama3_1/__init__.py +0 -12
llama_stack/models/llama/llama3_1/prompt_format.md +0 -358
llama_stack/models/llama/llama3_1/prompts.py +0 -258
llama_stack/models/llama/llama3_2/__init__.py +0 -5
llama_stack/models/llama/llama3_2/prompts_text.py +0 -229
llama_stack/models/llama/llama3_2/prompts_vision.py +0 -126
llama_stack/models/llama/llama3_2/text_prompt_format.md +0 -286
llama_stack/models/llama/llama3_2/vision_prompt_format.md +0 -141
llama_stack/models/llama/llama3_3/__init__.py +0 -5
llama_stack/models/llama/llama3_3/prompts.py +0 -259
llama_stack/models/llama/llama4/args.py +0 -107
llama_stack/models/llama/llama4/ffn.py +0 -58
llama_stack/models/llama/llama4/moe.py +0 -214
llama_stack/models/llama/llama4/preprocess.py +0 -435
llama_stack/models/llama/llama4/quantization/__init__.py +0 -5
llama_stack/models/llama/llama4/quantization/loader.py +0 -226
llama_stack/models/llama/llama4/vision/__init__.py +0 -5
llama_stack/models/llama/llama4/vision/embedding.py +0 -210
llama_stack/models/llama/llama4/vision/encoder.py +0 -412
llama_stack/models/llama/quantize_impls.py +0 -316
llama_stack/providers/inline/inference/meta_reference/__init__.py +0 -20
llama_stack/providers/inline/inference/meta_reference/common.py +0 -24
llama_stack/providers/inline/inference/meta_reference/config.py +0 -68
llama_stack/providers/inline/inference/meta_reference/generators.py +0 -201
llama_stack/providers/inline/inference/meta_reference/inference.py +0 -542
llama_stack/providers/inline/inference/meta_reference/model_parallel.py +0 -77
llama_stack/providers/inline/inference/meta_reference/parallel_utils.py +0 -353
llama_stack-0.4.3.dist-info/top_level.txt +0 -2
llama_stack_api/__init__.py +0 -945
llama_stack_api/admin/__init__.py +0 -45
llama_stack_api/admin/api.py +0 -72
llama_stack_api/admin/fastapi_routes.py +0 -117
llama_stack_api/admin/models.py +0 -113
llama_stack_api/agents.py +0 -173
llama_stack_api/batches/__init__.py +0 -40
llama_stack_api/batches/api.py +0 -53
llama_stack_api/batches/fastapi_routes.py +0 -113
llama_stack_api/batches/models.py +0 -78
llama_stack_api/benchmarks/__init__.py +0 -43
llama_stack_api/benchmarks/api.py +0 -39
llama_stack_api/benchmarks/fastapi_routes.py +0 -109
llama_stack_api/benchmarks/models.py +0 -109
llama_stack_api/common/__init__.py +0 -5
llama_stack_api/common/content_types.py +0 -101
llama_stack_api/common/errors.py +0 -95
llama_stack_api/common/job_types.py +0 -38
llama_stack_api/common/responses.py +0 -77
llama_stack_api/common/training_types.py +0 -47
llama_stack_api/common/type_system.py +0 -146
llama_stack_api/connectors.py +0 -146
llama_stack_api/conversations.py +0 -270
llama_stack_api/datasetio.py +0 -55
llama_stack_api/datasets/__init__.py +0 -61
llama_stack_api/datasets/api.py +0 -35
llama_stack_api/datasets/fastapi_routes.py +0 -104
llama_stack_api/datasets/models.py +0 -152
llama_stack_api/datatypes.py +0 -373
llama_stack_api/eval.py +0 -137
llama_stack_api/file_processors/__init__.py +0 -27
llama_stack_api/file_processors/api.py +0 -64
llama_stack_api/file_processors/fastapi_routes.py +0 -78
llama_stack_api/file_processors/models.py +0 -42
llama_stack_api/files/__init__.py +0 -35
llama_stack_api/files/api.py +0 -51
llama_stack_api/files/fastapi_routes.py +0 -124
llama_stack_api/files/models.py +0 -107
llama_stack_api/inference.py +0 -1169
llama_stack_api/inspect_api/__init__.py +0 -37
llama_stack_api/inspect_api/api.py +0 -25
llama_stack_api/inspect_api/fastapi_routes.py +0 -76
llama_stack_api/inspect_api/models.py +0 -28
llama_stack_api/internal/kvstore.py +0 -28
llama_stack_api/internal/sqlstore.py +0 -81
llama_stack_api/llama_stack_api/__init__.py +0 -945
llama_stack_api/llama_stack_api/admin/__init__.py +0 -45
llama_stack_api/llama_stack_api/admin/api.py +0 -72
llama_stack_api/llama_stack_api/admin/fastapi_routes.py +0 -117
llama_stack_api/llama_stack_api/admin/models.py +0 -113
llama_stack_api/llama_stack_api/agents.py +0 -173
llama_stack_api/llama_stack_api/batches/__init__.py +0 -40
llama_stack_api/llama_stack_api/batches/api.py +0 -53
llama_stack_api/llama_stack_api/batches/fastapi_routes.py +0 -113
llama_stack_api/llama_stack_api/batches/models.py +0 -78
llama_stack_api/llama_stack_api/benchmarks/__init__.py +0 -43
llama_stack_api/llama_stack_api/benchmarks/api.py +0 -39
llama_stack_api/llama_stack_api/benchmarks/fastapi_routes.py +0 -109
llama_stack_api/llama_stack_api/benchmarks/models.py +0 -109
llama_stack_api/llama_stack_api/common/__init__.py +0 -5
llama_stack_api/llama_stack_api/common/content_types.py +0 -101
llama_stack_api/llama_stack_api/common/errors.py +0 -95
llama_stack_api/llama_stack_api/common/job_types.py +0 -38
llama_stack_api/llama_stack_api/common/responses.py +0 -77
llama_stack_api/llama_stack_api/common/training_types.py +0 -47
llama_stack_api/llama_stack_api/common/type_system.py +0 -146
llama_stack_api/llama_stack_api/connectors.py +0 -146
llama_stack_api/llama_stack_api/conversations.py +0 -270
llama_stack_api/llama_stack_api/datasetio.py +0 -55
llama_stack_api/llama_stack_api/datasets/__init__.py +0 -61
llama_stack_api/llama_stack_api/datasets/api.py +0 -35
llama_stack_api/llama_stack_api/datasets/fastapi_routes.py +0 -104
llama_stack_api/llama_stack_api/datasets/models.py +0 -152
llama_stack_api/llama_stack_api/datatypes.py +0 -373
llama_stack_api/llama_stack_api/eval.py +0 -137
llama_stack_api/llama_stack_api/file_processors/__init__.py +0 -27
llama_stack_api/llama_stack_api/file_processors/api.py +0 -64
llama_stack_api/llama_stack_api/file_processors/fastapi_routes.py +0 -78
llama_stack_api/llama_stack_api/file_processors/models.py +0 -42
llama_stack_api/llama_stack_api/files/__init__.py +0 -35
llama_stack_api/llama_stack_api/files/api.py +0 -51
llama_stack_api/llama_stack_api/files/fastapi_routes.py +0 -124
llama_stack_api/llama_stack_api/files/models.py +0 -107
llama_stack_api/llama_stack_api/inference.py +0 -1169
llama_stack_api/llama_stack_api/inspect_api/__init__.py +0 -37
llama_stack_api/llama_stack_api/inspect_api/api.py +0 -25
llama_stack_api/llama_stack_api/inspect_api/fastapi_routes.py +0 -76
llama_stack_api/llama_stack_api/inspect_api/models.py +0 -28
llama_stack_api/llama_stack_api/internal/__init__.py +0 -9
llama_stack_api/llama_stack_api/internal/kvstore.py +0 -28
llama_stack_api/llama_stack_api/internal/sqlstore.py +0 -81
llama_stack_api/llama_stack_api/models.py +0 -171
llama_stack_api/llama_stack_api/openai_responses.py +0 -1468
llama_stack_api/llama_stack_api/post_training.py +0 -370
llama_stack_api/llama_stack_api/prompts.py +0 -203
llama_stack_api/llama_stack_api/providers/__init__.py +0 -33
llama_stack_api/llama_stack_api/providers/api.py +0 -16
llama_stack_api/llama_stack_api/providers/fastapi_routes.py +0 -57
llama_stack_api/llama_stack_api/providers/models.py +0 -24
llama_stack_api/llama_stack_api/py.typed +0 -0
llama_stack_api/llama_stack_api/rag_tool.py +0 -168
llama_stack_api/llama_stack_api/resource.py +0 -37
llama_stack_api/llama_stack_api/router_utils.py +0 -160
llama_stack_api/llama_stack_api/safety.py +0 -132
llama_stack_api/llama_stack_api/schema_utils.py +0 -208
llama_stack_api/llama_stack_api/scoring.py +0 -93
llama_stack_api/llama_stack_api/scoring_functions.py +0 -211
llama_stack_api/llama_stack_api/shields.py +0 -93
llama_stack_api/llama_stack_api/tools.py +0 -226
llama_stack_api/llama_stack_api/vector_io.py +0 -941
llama_stack_api/llama_stack_api/vector_stores.py +0 -53
llama_stack_api/llama_stack_api/version.py +0 -9
llama_stack_api/models.py +0 -171
llama_stack_api/openai_responses.py +0 -1468
llama_stack_api/post_training.py +0 -370
llama_stack_api/prompts.py +0 -203
llama_stack_api/providers/__init__.py +0 -33
llama_stack_api/providers/api.py +0 -16
llama_stack_api/providers/fastapi_routes.py +0 -57
llama_stack_api/providers/models.py +0 -24
llama_stack_api/py.typed +0 -0
llama_stack_api/rag_tool.py +0 -168
llama_stack_api/resource.py +0 -37
llama_stack_api/router_utils.py +0 -160
llama_stack_api/safety.py +0 -132
llama_stack_api/schema_utils.py +0 -208
llama_stack_api/scoring.py +0 -93
llama_stack_api/scoring_functions.py +0 -211
llama_stack_api/shields.py +0 -93
llama_stack_api/tools.py +0 -226
llama_stack_api/vector_io.py +0 -941
llama_stack_api/vector_stores.py +0 -53
llama_stack_api/version.py +0 -9
{llama_stack-0.4.3.dist-info → llama_stack-0.5.0rc1.dist-info}/WHEEL +0 -0
{llama_stack-0.4.3.dist-info → llama_stack-0.5.0rc1.dist-info}/entry_points.txt +0 -0
{llama_stack-0.4.3.dist-info → llama_stack-0.5.0rc1.dist-info}/licenses/LICENSE +0 -0

llama_stack_api/file_processors/models.py DELETED Viewed

@@ -1,42 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-"""Pydantic models for File Processors API responses.
-This module defines the response models for the File Processors API
-using Pydantic with Field descriptions for OpenAPI schema generation.
-Request models are not needed for this API since it uses multipart form data
-with individual parameters rather than a JSON request body.
-"""
-from typing import Any
-from pydantic import BaseModel, Field
-from llama_stack_api.schema_utils import json_schema_type
-from llama_stack_api.vector_io import Chunk
-@json_schema_type
-class ProcessFileResponse(BaseModel):
-    """Response model for file processing operation.
-    Returns a list of chunks ready for storage in vector databases.
-    Each chunk contains the content and metadata.
-    """
-    chunks: list[Chunk] = Field(..., description="Processed chunks from the file. Always returns at least one chunk.")
-    metadata: dict[str, Any] = Field(
-        ...,
-        description="Processing-run metadata such as processor name/version, processing_time_ms, page_count, extraction_method (e.g. docling/pypdf/ocr), confidence scores, plus provider-specific fields.",
-    )
-__all__ = [
-    "ProcessFileResponse",
-]

llama_stack_api/files/__init__.py DELETED Viewed

@@ -1,35 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-from . import fastapi_routes
-from .api import Files
-from .models import (
-    DeleteFileRequest,
-    ExpiresAfter,
-    ListFilesRequest,
-    ListOpenAIFileResponse,
-    OpenAIFileDeleteResponse,
-    OpenAIFileObject,
-    OpenAIFilePurpose,
-    RetrieveFileContentRequest,
-    RetrieveFileRequest,
-    UploadFileRequest,
-)
-__all__ = [
-    "DeleteFileRequest",
-    "ExpiresAfter",
-    "fastapi_routes",
-    "Files",
-    "ListFilesRequest",
-    "ListOpenAIFileResponse",
-    "OpenAIFileDeleteResponse",
-    "OpenAIFileObject",
-    "OpenAIFilePurpose",
-    "RetrieveFileContentRequest",
-    "RetrieveFileRequest",
-    "UploadFileRequest",
-]

llama_stack_api/files/api.py DELETED Viewed

@@ -1,51 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-from typing import Protocol, runtime_checkable
-from fastapi import Response, UploadFile
-from .models import (
-    DeleteFileRequest,
-    ListFilesRequest,
-    ListOpenAIFileResponse,
-    OpenAIFileDeleteResponse,
-    OpenAIFileObject,
-    RetrieveFileContentRequest,
-    RetrieveFileRequest,
-    UploadFileRequest,
-)
-@runtime_checkable
-class Files(Protocol):
-    """Files API for managing file uploads and retrieval."""
-    async def openai_upload_file(
-        self,
-        request: UploadFileRequest,
-        file: UploadFile,
-    ) -> OpenAIFileObject: ...
-    async def openai_list_files(
-        self,
-        request: ListFilesRequest,
-    ) -> ListOpenAIFileResponse: ...
-    async def openai_retrieve_file(
-        self,
-        request: RetrieveFileRequest,
-    ) -> OpenAIFileObject: ...
-    async def openai_delete_file(
-        self,
-        request: DeleteFileRequest,
-    ) -> OpenAIFileDeleteResponse: ...
-    async def openai_retrieve_file_content(
-        self,
-        request: RetrieveFileContentRequest,
-    ) -> Response: ...

llama_stack_api/files/fastapi_routes.py DELETED Viewed

@@ -1,124 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-from typing import Annotated
-from fastapi import APIRouter, Depends, UploadFile
-from fastapi.param_functions import File, Form
-from fastapi.responses import Response
-from llama_stack_api.router_utils import create_path_dependency, create_query_dependency, standard_responses
-from llama_stack_api.version import LLAMA_STACK_API_V1
-from .api import Files
-from .models import (
-    DeleteFileRequest,
-    ExpiresAfter,
-    ListFilesRequest,
-    ListOpenAIFileResponse,
-    OpenAIFileDeleteResponse,
-    OpenAIFileObject,
-    OpenAIFilePurpose,
-    RetrieveFileContentRequest,
-    RetrieveFileRequest,
-    UploadFileRequest,
-)
-# Automatically generate dependency functions from Pydantic models
-# This ensures the models are the single source of truth for descriptions
-get_list_files_request = create_query_dependency(ListFilesRequest)
-get_get_files_request = create_path_dependency(RetrieveFileRequest)
-get_delete_files_request = create_path_dependency(DeleteFileRequest)
-get_retrieve_file_content_request = create_path_dependency(RetrieveFileContentRequest)
-def create_router(impl: Files) -> APIRouter:
-    router = APIRouter(
-        prefix=f"/{LLAMA_STACK_API_V1}",
-        tags=["Files"],
-        responses=standard_responses,
-    )
-    @router.get(
-        "/files",
-        response_model=ListOpenAIFileResponse,
-        summary="List files",
-        description="List files",
-        responses={
-            200: {"description": "The list of files."},
-        },
-    )
-    async def list_files(
-        request: Annotated[ListFilesRequest, Depends(get_list_files_request)],
-    ) -> ListOpenAIFileResponse:
-        return await impl.openai_list_files(request)
-    @router.get(
-        "/files/{file_id}",
-        response_model=OpenAIFileObject,
-        summary="Get file",
-        description="Get file",
-        responses={
-            200: {"description": "The file."},
-        },
-    )
-    async def get_file(
-        request: Annotated[RetrieveFileRequest, Depends(get_get_files_request)],
-    ) -> OpenAIFileObject:
-        return await impl.openai_retrieve_file(request)
-    @router.delete(
-        "/files/{file_id}",
-        response_model=OpenAIFileDeleteResponse,
-        summary="Delete file",
-        description="Delete file",
-        responses={
-            200: {"description": "The file was deleted."},
-        },
-    )
-    async def delete_file(
-        request: Annotated[DeleteFileRequest, Depends(get_delete_files_request)],
-    ) -> OpenAIFileDeleteResponse:
-        return await impl.openai_delete_file(request)
-    @router.get(
-        "/files/{file_id}/content",
-        status_code=200,
-        summary="Retrieve file content",
-        description="Retrieve file content",
-        responses={
-            200: {
-                "description": "The raw file content as a binary response.",
-                "content": {"application/json": {"schema": {"$ref": "#/components/schemas/Response"}}},
-            },
-        },
-    )
-    async def retrieve_file_content(
-        request: Annotated[RetrieveFileContentRequest, Depends(get_retrieve_file_content_request)],
-    ) -> Response:
-        return await impl.openai_retrieve_file_content(request)
-    @router.post(
-        "/files",
-        response_model=OpenAIFileObject,
-        summary="Upload file",
-        description="Upload a file.",
-        responses={
-            200: {"description": "The uploaded file."},
-        },
-    )
-    async def upload_file(
-        file: Annotated[UploadFile, File(description="The file to upload.")],
-        purpose: Annotated[OpenAIFilePurpose, Form(description="The intended purpose of the uploaded file.")],
-        expires_after: Annotated[ExpiresAfter | None, Form(description="Optional expiration settings.")] = None,
-    ) -> OpenAIFileObject:
-        request = UploadFileRequest(
-            purpose=purpose,
-            expires_after=expires_after,
-        )
-        return await impl.openai_upload_file(request, file)
-    return router

llama_stack_api/files/models.py DELETED Viewed

@@ -1,107 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-from enum import StrEnum
-from typing import ClassVar, Literal
-from pydantic import BaseModel, Field
-from llama_stack_api.common.responses import Order
-from llama_stack_api.schema_utils import json_schema_type
-class OpenAIFilePurpose(StrEnum):
-    """
-    Valid purpose values for OpenAI Files API.
-    """
-    ASSISTANTS = "assistants"
-    BATCH = "batch"
-@json_schema_type
-class OpenAIFileObject(BaseModel):
-    """OpenAI File object as defined in the OpenAI Files API."""
-    object: Literal["file"] = Field(default="file", description="The object type, which is always 'file'.")
-    id: str = Field(..., description="The file identifier, which can be referenced in the API endpoints.")
-    bytes: int = Field(..., description="The size of the file, in bytes.")
-    created_at: int = Field(..., description="The Unix timestamp (in seconds) for when the file was created.")
-    expires_at: int = Field(..., description="The Unix timestamp (in seconds) for when the file expires.")
-    filename: str = Field(..., description="The name of the file.")
-    purpose: OpenAIFilePurpose = Field(..., description="The intended purpose of the file.")
-@json_schema_type
-class ExpiresAfter(BaseModel):
-    """Control expiration of uploaded files."""
-    MIN: ClassVar[int] = 3600  # 1 hour
-    MAX: ClassVar[int] = 2592000  # 30 days
-    anchor: Literal["created_at"] = Field(..., description="The anchor point for expiration, must be 'created_at'.")
-    seconds: int = Field(
-        ..., ge=MIN, le=MAX, description="Seconds until expiration, between 3600 (1 hour) and 2592000 (30 days)."
-    )
-@json_schema_type
-class ListOpenAIFileResponse(BaseModel):
-    """Response for listing files in OpenAI Files API."""
-    data: list[OpenAIFileObject] = Field(..., description="The list of files.")
-    has_more: bool = Field(..., description="Whether there are more files available beyond this page.")
-    first_id: str = Field(..., description="The ID of the first file in the list for pagination.")
-    last_id: str = Field(..., description="The ID of the last file in the list for pagination.")
-    object: Literal["list"] = Field(default="list", description="The object type, which is always 'list'.")
-@json_schema_type
-class OpenAIFileDeleteResponse(BaseModel):
-    """Response for deleting a file in OpenAI Files API."""
-    id: str = Field(..., description="The file identifier that was deleted.")
-    object: Literal["file"] = Field(default="file", description="The object type, which is always 'file'.")
-    deleted: bool = Field(..., description="Whether the file was successfully deleted.")
-@json_schema_type
-class ListFilesRequest(BaseModel):
-    """Request model for listing files."""
-    after: str | None = Field(default=None, description="A cursor for pagination. Returns files after this ID.")
-    limit: int | None = Field(default=10000, description="Maximum number of files to return (1-10,000).")
-    order: Order | None = Field(default=Order.desc, description="Sort order by created_at timestamp ('asc' or 'desc').")
-    purpose: OpenAIFilePurpose | None = Field(default=None, description="Filter files by purpose.")
-@json_schema_type
-class RetrieveFileRequest(BaseModel):
-    """Request model for retrieving a file."""
-    file_id: str = Field(..., description="The ID of the file to retrieve.")
-@json_schema_type
-class DeleteFileRequest(BaseModel):
-    """Request model for deleting a file."""
-    file_id: str = Field(..., description="The ID of the file to delete.")
-@json_schema_type
-class RetrieveFileContentRequest(BaseModel):
-    """Request model for retrieving file content."""
-    file_id: str = Field(..., description="The ID of the file to retrieve content from.")
-@json_schema_type
-class UploadFileRequest(BaseModel):
-    """Request model for uploading a file."""
-    purpose: OpenAIFilePurpose = Field(..., description="The intended purpose of the uploaded file.")
-    expires_after: ExpiresAfter | None = Field(default=None, description="Optional expiration settings for the file.")

llama-stack 0.4.3__py3-none-any.whl → 0.5.0rc1__py3-none-any.whl

llama-stack 0.4.3__py3-none-any.whl → 0.5.0rc1__py3-none-any.whl