llama-stack 0.4.2__py3-none-any.whl → 0.4.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (182)
  1. llama_stack/core/library_client.py +80 -3
  2. llama_stack/core/routing_tables/common.py +11 -0
  3. llama_stack/core/routing_tables/vector_stores.py +4 -0
  4. llama_stack/core/stack.py +16 -1
  5. llama_stack/core/storage/kvstore/kvstore.py +11 -0
  6. llama_stack/core/storage/kvstore/mongodb/mongodb.py +5 -0
  7. llama_stack/core/storage/kvstore/postgres/postgres.py +8 -0
  8. llama_stack/core/storage/kvstore/redis/redis.py +5 -0
  9. llama_stack/core/storage/sqlstore/sqlalchemy_sqlstore.py +8 -0
  10. llama_stack/core/storage/sqlstore/sqlstore.py +8 -0
  11. llama_stack/distributions/dell/doc_template.md +209 -0
  12. llama_stack/distributions/meta-reference-gpu/doc_template.md +119 -0
  13. llama_stack/distributions/nvidia/doc_template.md +170 -0
  14. llama_stack/distributions/oci/doc_template.md +140 -0
  15. llama_stack/models/llama/llama3/dog.jpg +0 -0
  16. llama_stack/models/llama/llama3/pasta.jpeg +0 -0
  17. llama_stack/models/llama/resources/dog.jpg +0 -0
  18. llama_stack/models/llama/resources/pasta.jpeg +0 -0
  19. llama_stack/models/llama/resources/small_dog.jpg +0 -0
  20. llama_stack/providers/inline/agents/meta_reference/responses/openai_responses.py +184 -33
  21. llama_stack/providers/inline/agents/meta_reference/responses/streaming.py +4 -0
  22. llama_stack/providers/inline/agents/meta_reference/responses/tool_executor.py +9 -1
  23. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.h +9 -0
  24. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/LocalInference.swift +189 -0
  25. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/Parsing.swift +238 -0
  26. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/PromptTemplate.swift +12 -0
  27. llama_stack/providers/inline/ios/inference/LocalInferenceImpl/SystemPrompts.swift +89 -0
  28. llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.pbxproj +550 -0
  29. llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -0
  30. llama_stack/providers/inline/ios/inference/LocalInferenceImpl.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +8 -0
  31. llama_stack/providers/remote/datasetio/nvidia/README.md +74 -0
  32. llama_stack/providers/remote/eval/nvidia/README.md +134 -0
  33. llama_stack/providers/remote/files/s3/README.md +266 -0
  34. llama_stack/providers/remote/inference/nvidia/NVIDIA.md +203 -0
  35. llama_stack/providers/remote/post_training/nvidia/README.md +151 -0
  36. llama_stack/providers/remote/safety/nvidia/README.md +78 -0
  37. llama_stack/providers/remote/vector_io/pgvector/pgvector.py +13 -1
  38. llama_stack/providers/utils/inference/embedding_mixin.py +20 -16
  39. llama_stack/providers/utils/memory/openai_vector_store_mixin.py +33 -0
  40. llama_stack/providers/utils/responses/responses_store.py +34 -0
  41. llama_stack/providers/utils/tools/mcp.py +258 -16
  42. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/METADATA +2 -2
  43. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/RECORD +47 -158
  44. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/WHEEL +1 -1
  45. llama_stack-0.4.4.dist-info/top_level.txt +1 -0
  46. llama_stack-0.4.2.dist-info/top_level.txt +0 -2
  47. llama_stack_api/__init__.py +0 -945
  48. llama_stack_api/admin/__init__.py +0 -45
  49. llama_stack_api/admin/api.py +0 -72
  50. llama_stack_api/admin/fastapi_routes.py +0 -117
  51. llama_stack_api/admin/models.py +0 -113
  52. llama_stack_api/agents.py +0 -173
  53. llama_stack_api/batches/__init__.py +0 -40
  54. llama_stack_api/batches/api.py +0 -53
  55. llama_stack_api/batches/fastapi_routes.py +0 -113
  56. llama_stack_api/batches/models.py +0 -78
  57. llama_stack_api/benchmarks/__init__.py +0 -43
  58. llama_stack_api/benchmarks/api.py +0 -39
  59. llama_stack_api/benchmarks/fastapi_routes.py +0 -109
  60. llama_stack_api/benchmarks/models.py +0 -109
  61. llama_stack_api/common/__init__.py +0 -5
  62. llama_stack_api/common/content_types.py +0 -101
  63. llama_stack_api/common/errors.py +0 -95
  64. llama_stack_api/common/job_types.py +0 -38
  65. llama_stack_api/common/responses.py +0 -77
  66. llama_stack_api/common/training_types.py +0 -47
  67. llama_stack_api/common/type_system.py +0 -146
  68. llama_stack_api/connectors.py +0 -146
  69. llama_stack_api/conversations.py +0 -270
  70. llama_stack_api/datasetio.py +0 -55
  71. llama_stack_api/datasets/__init__.py +0 -61
  72. llama_stack_api/datasets/api.py +0 -35
  73. llama_stack_api/datasets/fastapi_routes.py +0 -104
  74. llama_stack_api/datasets/models.py +0 -152
  75. llama_stack_api/datatypes.py +0 -373
  76. llama_stack_api/eval.py +0 -137
  77. llama_stack_api/file_processors/__init__.py +0 -27
  78. llama_stack_api/file_processors/api.py +0 -64
  79. llama_stack_api/file_processors/fastapi_routes.py +0 -78
  80. llama_stack_api/file_processors/models.py +0 -42
  81. llama_stack_api/files/__init__.py +0 -35
  82. llama_stack_api/files/api.py +0 -51
  83. llama_stack_api/files/fastapi_routes.py +0 -124
  84. llama_stack_api/files/models.py +0 -107
  85. llama_stack_api/inference.py +0 -1169
  86. llama_stack_api/inspect_api/__init__.py +0 -37
  87. llama_stack_api/inspect_api/api.py +0 -25
  88. llama_stack_api/inspect_api/fastapi_routes.py +0 -76
  89. llama_stack_api/inspect_api/models.py +0 -28
  90. llama_stack_api/internal/__init__.py +0 -9
  91. llama_stack_api/internal/kvstore.py +0 -26
  92. llama_stack_api/internal/sqlstore.py +0 -79
  93. llama_stack_api/llama_stack_api/__init__.py +0 -945
  94. llama_stack_api/llama_stack_api/admin/__init__.py +0 -45
  95. llama_stack_api/llama_stack_api/admin/api.py +0 -72
  96. llama_stack_api/llama_stack_api/admin/fastapi_routes.py +0 -117
  97. llama_stack_api/llama_stack_api/admin/models.py +0 -113
  98. llama_stack_api/llama_stack_api/agents.py +0 -173
  99. llama_stack_api/llama_stack_api/batches/__init__.py +0 -40
  100. llama_stack_api/llama_stack_api/batches/api.py +0 -53
  101. llama_stack_api/llama_stack_api/batches/fastapi_routes.py +0 -113
  102. llama_stack_api/llama_stack_api/batches/models.py +0 -78
  103. llama_stack_api/llama_stack_api/benchmarks/__init__.py +0 -43
  104. llama_stack_api/llama_stack_api/benchmarks/api.py +0 -39
  105. llama_stack_api/llama_stack_api/benchmarks/fastapi_routes.py +0 -109
  106. llama_stack_api/llama_stack_api/benchmarks/models.py +0 -109
  107. llama_stack_api/llama_stack_api/common/__init__.py +0 -5
  108. llama_stack_api/llama_stack_api/common/content_types.py +0 -101
  109. llama_stack_api/llama_stack_api/common/errors.py +0 -95
  110. llama_stack_api/llama_stack_api/common/job_types.py +0 -38
  111. llama_stack_api/llama_stack_api/common/responses.py +0 -77
  112. llama_stack_api/llama_stack_api/common/training_types.py +0 -47
  113. llama_stack_api/llama_stack_api/common/type_system.py +0 -146
  114. llama_stack_api/llama_stack_api/connectors.py +0 -146
  115. llama_stack_api/llama_stack_api/conversations.py +0 -270
  116. llama_stack_api/llama_stack_api/datasetio.py +0 -55
  117. llama_stack_api/llama_stack_api/datasets/__init__.py +0 -61
  118. llama_stack_api/llama_stack_api/datasets/api.py +0 -35
  119. llama_stack_api/llama_stack_api/datasets/fastapi_routes.py +0 -104
  120. llama_stack_api/llama_stack_api/datasets/models.py +0 -152
  121. llama_stack_api/llama_stack_api/datatypes.py +0 -373
  122. llama_stack_api/llama_stack_api/eval.py +0 -137
  123. llama_stack_api/llama_stack_api/file_processors/__init__.py +0 -27
  124. llama_stack_api/llama_stack_api/file_processors/api.py +0 -64
  125. llama_stack_api/llama_stack_api/file_processors/fastapi_routes.py +0 -78
  126. llama_stack_api/llama_stack_api/file_processors/models.py +0 -42
  127. llama_stack_api/llama_stack_api/files/__init__.py +0 -35
  128. llama_stack_api/llama_stack_api/files/api.py +0 -51
  129. llama_stack_api/llama_stack_api/files/fastapi_routes.py +0 -124
  130. llama_stack_api/llama_stack_api/files/models.py +0 -107
  131. llama_stack_api/llama_stack_api/inference.py +0 -1169
  132. llama_stack_api/llama_stack_api/inspect_api/__init__.py +0 -37
  133. llama_stack_api/llama_stack_api/inspect_api/api.py +0 -25
  134. llama_stack_api/llama_stack_api/inspect_api/fastapi_routes.py +0 -76
  135. llama_stack_api/llama_stack_api/inspect_api/models.py +0 -28
  136. llama_stack_api/llama_stack_api/internal/__init__.py +0 -9
  137. llama_stack_api/llama_stack_api/internal/kvstore.py +0 -26
  138. llama_stack_api/llama_stack_api/internal/sqlstore.py +0 -79
  139. llama_stack_api/llama_stack_api/models.py +0 -171
  140. llama_stack_api/llama_stack_api/openai_responses.py +0 -1468
  141. llama_stack_api/llama_stack_api/post_training.py +0 -370
  142. llama_stack_api/llama_stack_api/prompts.py +0 -203
  143. llama_stack_api/llama_stack_api/providers/__init__.py +0 -33
  144. llama_stack_api/llama_stack_api/providers/api.py +0 -16
  145. llama_stack_api/llama_stack_api/providers/fastapi_routes.py +0 -57
  146. llama_stack_api/llama_stack_api/providers/models.py +0 -24
  147. llama_stack_api/llama_stack_api/py.typed +0 -0
  148. llama_stack_api/llama_stack_api/rag_tool.py +0 -168
  149. llama_stack_api/llama_stack_api/resource.py +0 -37
  150. llama_stack_api/llama_stack_api/router_utils.py +0 -160
  151. llama_stack_api/llama_stack_api/safety.py +0 -132
  152. llama_stack_api/llama_stack_api/schema_utils.py +0 -208
  153. llama_stack_api/llama_stack_api/scoring.py +0 -93
  154. llama_stack_api/llama_stack_api/scoring_functions.py +0 -211
  155. llama_stack_api/llama_stack_api/shields.py +0 -93
  156. llama_stack_api/llama_stack_api/tools.py +0 -226
  157. llama_stack_api/llama_stack_api/vector_io.py +0 -941
  158. llama_stack_api/llama_stack_api/vector_stores.py +0 -51
  159. llama_stack_api/llama_stack_api/version.py +0 -9
  160. llama_stack_api/models.py +0 -171
  161. llama_stack_api/openai_responses.py +0 -1468
  162. llama_stack_api/post_training.py +0 -370
  163. llama_stack_api/prompts.py +0 -203
  164. llama_stack_api/providers/__init__.py +0 -33
  165. llama_stack_api/providers/api.py +0 -16
  166. llama_stack_api/providers/fastapi_routes.py +0 -57
  167. llama_stack_api/providers/models.py +0 -24
  168. llama_stack_api/py.typed +0 -0
  169. llama_stack_api/rag_tool.py +0 -168
  170. llama_stack_api/resource.py +0 -37
  171. llama_stack_api/router_utils.py +0 -160
  172. llama_stack_api/safety.py +0 -132
  173. llama_stack_api/schema_utils.py +0 -208
  174. llama_stack_api/scoring.py +0 -93
  175. llama_stack_api/scoring_functions.py +0 -211
  176. llama_stack_api/shields.py +0 -93
  177. llama_stack_api/tools.py +0 -226
  178. llama_stack_api/vector_io.py +0 -941
  179. llama_stack_api/vector_stores.py +0 -51
  180. llama_stack_api/version.py +0 -9
  181. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/entry_points.txt +0 -0
  182. {llama_stack-0.4.2.dist-info → llama_stack-0.4.4.dist-info}/licenses/LICENSE +0 -0
@@ -1,37 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- """Inspect API protocol and models.
-
- This module contains the Inspect protocol definition.
- Pydantic models are defined in llama_stack_api.inspect.models.
- The FastAPI router is defined in llama_stack_api.inspect.fastapi_routes.
- """
-
- # Import fastapi_routes for router factory access
- from . import fastapi_routes
-
- # Import protocol for re-export
- from .api import Inspect
-
- # Import models for re-export
- from .models import (
-     ApiFilter,
-     HealthInfo,
-     ListRoutesResponse,
-     RouteInfo,
-     VersionInfo,
- )
-
- __all__ = [
-     "Inspect",
-     "ApiFilter",
-     "HealthInfo",
-     "ListRoutesResponse",
-     "RouteInfo",
-     "VersionInfo",
-     "fastapi_routes",
- ]
@@ -1,25 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- from typing import Protocol, runtime_checkable
-
- from .models import (
-     ApiFilter,
-     HealthInfo,
-     ListRoutesResponse,
-     VersionInfo,
- )
-
-
- @runtime_checkable
- class Inspect(Protocol):
-     """APIs for inspecting the Llama Stack service, including health status, available API routes with methods and implementing providers."""
-
-     async def list_routes(self, api_filter: ApiFilter | None = None) -> ListRoutesResponse: ...
-
-     async def health(self) -> HealthInfo: ...
-
-     async def version(self) -> VersionInfo: ...
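The removed api.py in the hunk above defines Inspect as a runtime-checkable structural protocol: any object exposing async methods with the same names satisfies it, with no inheritance required. Below is a minimal, self-contained sketch of that pattern; HealthCheck and StaticHealth are stand-in names invented for illustration and are not part of the package.

from typing import Protocol, runtime_checkable


@runtime_checkable
class HealthCheck(Protocol):  # stand-in for the removed Inspect protocol
    async def health(self) -> dict: ...


class StaticHealth:  # hypothetical implementation, not shipped with llama-stack
    async def health(self) -> dict:
        return {"status": "OK"}


# Passes because @runtime_checkable isinstance checks match on method names,
# so StaticHealth counts as a HealthCheck without subclassing it.
assert isinstance(StaticHealth(), HealthCheck)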
@@ -1,76 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- """FastAPI router for the Inspect API.
-
- This module defines the FastAPI router for the Inspect API using standard
- FastAPI route decorators.
- """
-
- from typing import Annotated
-
- from fastapi import APIRouter, Query
-
- from llama_stack_api.router_utils import PUBLIC_ROUTE_KEY, standard_responses
- from llama_stack_api.version import LLAMA_STACK_API_V1
-
- from .api import Inspect
- from .models import (
-     ApiFilter,
-     HealthInfo,
-     ListRoutesResponse,
-     VersionInfo,
- )
-
-
- def create_router(impl: Inspect) -> APIRouter:
-     """Create a FastAPI router for the Inspect API."""
-     router = APIRouter(
-         prefix=f"/{LLAMA_STACK_API_V1}",
-         tags=["Inspect"],
-         responses=standard_responses,
-     )
-
-     @router.get(
-         "/inspect/routes",
-         response_model=ListRoutesResponse,
-         summary="List routes.",
-         description="List all available API routes with their methods and implementing providers.",
-         responses={200: {"description": "Response containing information about all available routes."}},
-     )
-     async def list_routes(
-         api_filter: Annotated[
-             ApiFilter | None,
-             Query(
-                 description="Optional filter to control which routes are returned. Can be an API level ('v1', 'v1alpha', 'v1beta') to show non-deprecated routes at that level, or 'deprecated' to show deprecated routes across all levels. If not specified, returns all non-deprecated routes."
-             ),
-         ] = None,
-     ) -> ListRoutesResponse:
-         return await impl.list_routes(api_filter)
-
-     @router.get(
-         "/health",
-         response_model=HealthInfo,
-         summary="Get health status.",
-         description="Get the current health status of the service.",
-         responses={200: {"description": "Health information indicating if the service is operational."}},
-         openapi_extra={PUBLIC_ROUTE_KEY: True},
-     )
-     async def health() -> HealthInfo:
-         return await impl.health()
-
-     @router.get(
-         "/version",
-         response_model=VersionInfo,
-         summary="Get version.",
-         description="Get the version of the service.",
-         responses={200: {"description": "Version information containing the service version number."}},
-         openapi_extra={PUBLIC_ROUTE_KEY: True},
-     )
-     async def version() -> VersionInfo:
-         return await impl.version()
-
-     return router
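Since the removed factory returns a plain APIRouter, the usual way to expose these endpoints before this release was to mount it on a FastAPI app. A hedged sketch follows: build_inspect_impl is a hypothetical placeholder for however the stack wires up an object satisfying Inspect, and the concrete /v1 prefix assumes LLAMA_STACK_API_V1 == "v1".

from fastapi import FastAPI

app = FastAPI()
impl = build_inspect_impl()  # hypothetical: any object satisfying the Inspect protocol
app.include_router(create_router(impl))
# Routes then appear under the version prefix, e.g. GET /v1/health and GET /v1/version.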
@@ -1,28 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- """Pydantic models for Inspect API requests and responses.
-
- This module re-exports models from llama_stack_api.admin.models to ensure
- a single source of truth and avoid type conflicts.
- """
-
- # Import and re-export shared models from admin
- from llama_stack_api.admin.models import (
-     ApiFilter,
-     HealthInfo,
-     ListRoutesResponse,
-     RouteInfo,
-     VersionInfo,
- )
-
- __all__ = [
-     "ApiFilter",
-     "RouteInfo",
-     "HealthInfo",
-     "VersionInfo",
-     "ListRoutesResponse",
- ]
@@ -1,9 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- # Internal subpackage for shared interfaces that are not part of the public API.
-
- __all__: list[str] = []
@@ -1,26 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- from datetime import datetime
- from typing import Protocol
-
-
- class KVStore(Protocol):
-     """Protocol for simple key/value storage backends."""
-
-     # TODO: make the value type bytes instead of str
-     async def set(self, key: str, value: str, expiration: datetime | None = None) -> None: ...
-
-     async def get(self, key: str) -> str | None: ...
-
-     async def delete(self, key: str) -> None: ...
-
-     async def values_in_range(self, start_key: str, end_key: str) -> list[str]: ...
-
-     async def keys_in_range(self, start_key: str, end_key: str) -> list[str]: ...
-
-
- __all__ = ["KVStore"]
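The KVStore protocol removed above is small enough that an in-memory stand-in can cover all five methods. The sketch below is illustrative only (InMemoryKVStore is not one of the package's backends), and it assumes the range queries are lexicographic and inclusive of both endpoints, which the protocol itself does not spell out.

from datetime import datetime


class InMemoryKVStore:
    """Illustrative in-memory stand-in for the removed KVStore protocol."""

    def __init__(self) -> None:
        self._data: dict[str, str] = {}

    async def set(self, key: str, value: str, expiration: datetime | None = None) -> None:
        self._data[key] = value  # expiration is ignored in this sketch

    async def get(self, key: str) -> str | None:
        return self._data.get(key)

    async def delete(self, key: str) -> None:
        self._data.pop(key, None)

    async def values_in_range(self, start_key: str, end_key: str) -> list[str]:
        # Assumed semantics: lexicographic ordering, both endpoints inclusive.
        return [v for k, v in sorted(self._data.items()) if start_key <= k <= end_key]

    async def keys_in_range(self, start_key: str, end_key: str) -> list[str]:
        return [k for k in sorted(self._data) if start_key <= k <= end_key]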
@@ -1,79 +0,0 @@
- # Copyright (c) Meta Platforms, Inc. and affiliates.
- # All rights reserved.
- #
- # This source code is licensed under the terms described in the LICENSE file in
- # the root directory of this source tree.
-
- from collections.abc import Mapping, Sequence
- from enum import Enum
- from typing import Any, Literal, Protocol
-
- from pydantic import BaseModel
-
- from llama_stack_api import PaginatedResponse
-
-
- class ColumnType(Enum):
-     INTEGER = "INTEGER"
-     STRING = "STRING"
-     TEXT = "TEXT"
-     FLOAT = "FLOAT"
-     BOOLEAN = "BOOLEAN"
-     JSON = "JSON"
-     DATETIME = "DATETIME"
-
-
- class ColumnDefinition(BaseModel):
-     type: ColumnType
-     primary_key: bool = False
-     nullable: bool = True
-     default: Any = None
-
-
- class SqlStore(Protocol):
-     """Protocol for common SQL-store functionality."""
-
-     async def create_table(self, table: str, schema: Mapping[str, ColumnType | ColumnDefinition]) -> None: ...
-
-     async def insert(self, table: str, data: Mapping[str, Any] | Sequence[Mapping[str, Any]]) -> None: ...
-
-     async def upsert(
-         self,
-         table: str,
-         data: Mapping[str, Any],
-         conflict_columns: list[str],
-         update_columns: list[str] | None = None,
-     ) -> None: ...
-
-     async def fetch_all(
-         self,
-         table: str,
-         where: Mapping[str, Any] | None = None,
-         where_sql: str | None = None,
-         limit: int | None = None,
-         order_by: list[tuple[str, Literal["asc", "desc"]]] | None = None,
-         cursor: tuple[str, str] | None = None,
-     ) -> PaginatedResponse: ...
-
-     async def fetch_one(
-         self,
-         table: str,
-         where: Mapping[str, Any] | None = None,
-         where_sql: str | None = None,
-         order_by: list[tuple[str, Literal["asc", "desc"]]] | None = None,
-     ) -> dict[str, Any] | None: ...
-
-     async def update(self, table: str, data: Mapping[str, Any], where: Mapping[str, Any]) -> None: ...
-
-     async def delete(self, table: str, where: Mapping[str, Any]) -> None: ...
-
-     async def add_column_if_not_exists(
-         self,
-         table: str,
-         column_name: str,
-         column_type: ColumnType,
-         nullable: bool = True,
-     ) -> None: ...
-
-
- __all__ = ["ColumnDefinition", "ColumnType", "SqlStore"]
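For orientation, the SqlStore protocol above pairs schemas declared as ColumnType/ColumnDefinition mappings with async CRUD calls that operate on plain dicts. The usage sketch below is hedged: store is assumed to come from some concrete backend (none is constructed here), and the table and column names are made up for the example.

async def record_run(store: SqlStore) -> dict | None:
    # Hypothetical table and data; only the call signatures mirror the protocol above.
    await store.create_table(
        "runs",
        {
            "id": ColumnDefinition(type=ColumnType.STRING, primary_key=True, nullable=False),
            "status": ColumnType.STRING,
            "score": ColumnType.FLOAT,
        },
    )
    await store.insert("runs", {"id": "run-1", "status": "done", "score": 0.92})
    # fetch_one returns a plain dict (or None), not a model instance.
    return await store.fetch_one("runs", where={"id": "run-1"})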