PyPI - agenta - Versions diffs - 0.12.7__py3-none-any.whl → 0.13.0__py3-none-any.whl - Mend

agenta 0.12.7__py3-none-any.whl → 0.13.0__py3-none-any.whl

This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of agenta might be problematic. Click here for more details.

Files changed (88)

agenta/__init__.py +3 -1
agenta/cli/helper.py +1 -1
agenta/cli/main.py +1 -1
agenta/cli/variant_commands.py +7 -5
agenta/client/api.py +1 -1
agenta/client/backend/__init__.py +78 -18
agenta/client/backend/client.py +1031 -5526
agenta/client/backend/resources/__init__.py +31 -0
agenta/client/backend/resources/apps/__init__.py +1 -0
agenta/client/backend/resources/apps/client.py +977 -0
agenta/client/backend/resources/bases/__init__.py +1 -0
agenta/client/backend/resources/bases/client.py +127 -0
agenta/client/backend/resources/configs/__init__.py +1 -0
agenta/client/backend/resources/configs/client.py +377 -0
agenta/client/backend/resources/containers/__init__.py +5 -0
agenta/client/backend/resources/containers/client.py +383 -0
agenta/client/backend/resources/containers/types/__init__.py +5 -0
agenta/client/backend/{types → resources/containers/types}/container_templates_response.py +1 -1
agenta/client/backend/resources/environments/__init__.py +1 -0
agenta/client/backend/resources/environments/client.py +131 -0
agenta/client/backend/resources/evaluations/__init__.py +1 -0
agenta/client/backend/resources/evaluations/client.py +1008 -0
agenta/client/backend/resources/evaluators/__init__.py +1 -0
agenta/client/backend/resources/evaluators/client.py +594 -0
agenta/client/backend/resources/observability/__init__.py +1 -0
agenta/client/backend/resources/observability/client.py +1184 -0
agenta/client/backend/resources/testsets/__init__.py +1 -0
agenta/client/backend/resources/testsets/client.py +689 -0
agenta/client/backend/resources/variants/__init__.py +5 -0
agenta/client/backend/resources/variants/client.py +796 -0
agenta/client/backend/resources/variants/types/__init__.py +7 -0
agenta/client/backend/resources/variants/types/add_variant_from_base_and_config_response.py +7 -0
agenta/client/backend/types/__init__.py +54 -22
agenta/client/backend/types/aggregated_result.py +2 -2
agenta/client/backend/types/aggregated_result_evaluator_config.py +9 -0
agenta/client/backend/types/{app_variant_output.py → app_variant_response.py} +4 -2
agenta/client/backend/types/{trace.py → create_span.py} +20 -10
agenta/client/backend/types/create_trace_response.py +37 -0
agenta/client/backend/types/environment_output.py +3 -1
agenta/client/backend/types/environment_output_extended.py +45 -0
agenta/client/backend/types/environment_revision.py +41 -0
agenta/client/backend/types/error.py +37 -0
agenta/client/backend/types/evaluation.py +6 -3
agenta/client/backend/types/evaluation_scenario_output.py +4 -2
agenta/client/backend/types/{delete_evaluation.py → evaluation_scenario_score_update.py} +2 -2
agenta/client/backend/types/evaluation_status_enum.py +4 -0
agenta/client/backend/types/evaluator.py +1 -0
agenta/client/backend/types/{get_config_reponse.py → get_config_response.py} +1 -2
agenta/client/backend/types/human_evaluation_scenario.py +2 -2
agenta/client/backend/types/{app_variant_output_extended.py → human_evaluation_scenario_update.py} +11 -16
agenta/client/backend/types/human_evaluation_update.py +37 -0
agenta/client/backend/types/image.py +1 -0
agenta/client/backend/types/invite_request.py +1 -0
agenta/client/backend/types/{list_api_keys_output.py → list_api_keys_response.py} +1 -1
agenta/client/backend/types/llm_tokens.py +38 -0
agenta/client/backend/types/new_human_evaluation.py +42 -0
agenta/client/backend/types/organization.py +1 -0
agenta/client/backend/types/permission.py +141 -0
agenta/client/backend/types/result.py +2 -0
agenta/client/backend/types/{human_evaluation_scenario_score.py → score.py} +1 -1
agenta/client/backend/types/span.py +18 -16
agenta/client/backend/types/span_detail.py +52 -0
agenta/client/backend/types/span_kind.py +49 -0
agenta/client/backend/types/span_status_code.py +29 -0
agenta/client/backend/types/span_variant.py +38 -0
agenta/client/backend/types/trace_detail.py +52 -0
agenta/client/backend/types/with_pagination.py +40 -0
agenta/client/backend/types/workspace_member_response.py +38 -0
agenta/client/backend/types/workspace_permission.py +40 -0
agenta/client/backend/types/workspace_response.py +44 -0
agenta/client/backend/types/workspace_role.py +41 -0
agenta/client/backend/types/workspace_role_response.py +38 -0
agenta/docker/docker_utils.py +1 -5
agenta/sdk/__init__.py +3 -1
agenta/sdk/agenta_decorator.py +68 -18
agenta/sdk/agenta_init.py +53 -21
agenta/sdk/tracing/context_manager.py +13 -0
agenta/sdk/tracing/decorators.py +41 -0
agenta/sdk/tracing/llm_tracing.py +220 -0
agenta/sdk/tracing/logger.py +19 -0
agenta/sdk/tracing/tasks_manager.py +130 -0
{agenta-0.12.7.dist-info → agenta-0.13.0.dist-info}/METADATA +47 -96
agenta-0.13.0.dist-info/RECORD +161 -0
agenta/client/backend/types/add_variant_from_base_and_config_response.py +0 -7
agenta/client/backend/types/human_evaluation_scenario_update_score.py +0 -5
agenta-0.12.7.dist-info/RECORD +0 -114
{agenta-0.12.7.dist-info → agenta-0.13.0.dist-info}/WHEEL +0 -0
{agenta-0.12.7.dist-info → agenta-0.13.0.dist-info}/entry_points.txt +0 -0

agenta/client/backend/resources/variants/types/__init__.py ADDED Viewed

@@ -0,0 +1,7 @@
+# This file was auto-generated by Fern from our API Definition.
+from .add_variant_from_base_and_config_response import (
+    AddVariantFromBaseAndConfigResponse,
+)
+__all__ = ["AddVariantFromBaseAndConfigResponse"]

agenta/client/backend/resources/variants/types/add_variant_from_base_and_config_response.py ADDED Viewed

@@ -0,0 +1,7 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+from ....types.app_variant_response import AppVariantResponse
+AddVariantFromBaseAndConfigResponse = typing.Union[AppVariantResponse, typing.Any]

agenta/client/backend/types/__init__.py CHANGED Viewed

@@ -1,113 +1,145 @@
 # This file was auto-generated by Fern from our API Definition.
-from .add_variant_from_base_and_config_response import (
-    AddVariantFromBaseAndConfigResponse,
-)
 from .aggregated_result import AggregatedResult
+from .aggregated_result_evaluator_config import AggregatedResultEvaluatorConfig
 from .app import App
-from .app_variant_output import AppVariantOutput
-from .app_variant_output_extended import AppVariantOutputExtended
+from .app_variant_response import AppVariantResponse
 from .app_variant_revision import AppVariantRevision
 from .base_output import BaseOutput
 from .body_import_testset import BodyImportTestset
 from .config_db import ConfigDb
-from .container_templates_response import ContainerTemplatesResponse
 from .create_app_output import CreateAppOutput
-from .delete_evaluation import DeleteEvaluation
+from .create_span import CreateSpan
+from .create_trace_response import CreateTraceResponse
 from .docker_env_vars import DockerEnvVars
 from .environment_output import EnvironmentOutput
+from .environment_output_extended import EnvironmentOutputExtended
+from .environment_revision import EnvironmentRevision
+from .error import Error
 from .evaluation import Evaluation
 from .evaluation_scenario import EvaluationScenario
 from .evaluation_scenario_input import EvaluationScenarioInput
 from .evaluation_scenario_output import EvaluationScenarioOutput
 from .evaluation_scenario_result import EvaluationScenarioResult
+from .evaluation_scenario_score_update import EvaluationScenarioScoreUpdate
 from .evaluation_status_enum import EvaluationStatusEnum
 from .evaluation_type import EvaluationType
 from .evaluation_webhook import EvaluationWebhook
 from .evaluator import Evaluator
 from .evaluator_config import EvaluatorConfig
 from .feedback import Feedback
-from .get_config_reponse import GetConfigReponse
+from .get_config_response import GetConfigResponse
 from .http_validation_error import HttpValidationError
 from .human_evaluation import HumanEvaluation
 from .human_evaluation_scenario import HumanEvaluationScenario
 from .human_evaluation_scenario_input import HumanEvaluationScenarioInput
 from .human_evaluation_scenario_output import HumanEvaluationScenarioOutput
-from .human_evaluation_scenario_score import HumanEvaluationScenarioScore
-from .human_evaluation_scenario_update_score import HumanEvaluationScenarioUpdateScore
+from .human_evaluation_scenario_update import HumanEvaluationScenarioUpdate
+from .human_evaluation_update import HumanEvaluationUpdate
 from .image import Image
 from .invite_request import InviteRequest
-from .list_api_keys_output import ListApiKeysOutput
+from .list_api_keys_response import ListApiKeysResponse
 from .llm_run_rate_limit import LlmRunRateLimit
+from .llm_tokens import LlmTokens
+from .new_human_evaluation import NewHumanEvaluation
 from .new_testset import NewTestset
 from .organization import Organization
 from .organization_output import OrganizationOutput
+from .permission import Permission
 from .result import Result
+from .score import Score
 from .simple_evaluation_output import SimpleEvaluationOutput
 from .span import Span
+from .span_detail import SpanDetail
+from .span_kind import SpanKind
+from .span_status_code import SpanStatusCode
+from .span_variant import SpanVariant
 from .template import Template
 from .template_image_info import TemplateImageInfo
 from .test_set_output_response import TestSetOutputResponse
 from .test_set_simple_response import TestSetSimpleResponse
-from .trace import Trace
+from .trace_detail import TraceDetail
 from .uri import Uri
 from .validation_error import ValidationError
 from .validation_error_loc_item import ValidationErrorLocItem
 from .variant_action import VariantAction
 from .variant_action_enum import VariantActionEnum
+from .with_pagination import WithPagination
+from .workspace_member_response import WorkspaceMemberResponse
+from .workspace_permission import WorkspacePermission
+from .workspace_response import WorkspaceResponse
+from .workspace_role import WorkspaceRole
+from .workspace_role_response import WorkspaceRoleResponse
 __all__ = [
-    "AddVariantFromBaseAndConfigResponse",
     "AggregatedResult",
+    "AggregatedResultEvaluatorConfig",
     "App",
-    "AppVariantOutput",
-    "AppVariantOutputExtended",
+    "AppVariantResponse",
     "AppVariantRevision",
     "BaseOutput",
     "BodyImportTestset",
     "ConfigDb",
-    "ContainerTemplatesResponse",
     "CreateAppOutput",
-    "DeleteEvaluation",
+    "CreateSpan",
+    "CreateTraceResponse",
     "DockerEnvVars",
     "EnvironmentOutput",
+    "EnvironmentOutputExtended",
+    "EnvironmentRevision",
+    "Error",
     "Evaluation",
     "EvaluationScenario",
     "EvaluationScenarioInput",
     "EvaluationScenarioOutput",
     "EvaluationScenarioResult",
+    "EvaluationScenarioScoreUpdate",
     "EvaluationStatusEnum",
     "EvaluationType",
     "EvaluationWebhook",
     "Evaluator",
     "EvaluatorConfig",
     "Feedback",
-    "GetConfigReponse",
+    "GetConfigResponse",
     "HttpValidationError",
     "HumanEvaluation",
     "HumanEvaluationScenario",
     "HumanEvaluationScenarioInput",
     "HumanEvaluationScenarioOutput",
-    "HumanEvaluationScenarioScore",
-    "HumanEvaluationScenarioUpdateScore",
+    "HumanEvaluationScenarioUpdate",
+    "HumanEvaluationUpdate",
     "Image",
     "InviteRequest",
-    "ListApiKeysOutput",
+    "ListApiKeysResponse",
     "LlmRunRateLimit",
+    "LlmTokens",
+    "NewHumanEvaluation",
     "NewTestset",
     "Organization",
     "OrganizationOutput",
+    "Permission",
     "Result",
+    "Score",
     "SimpleEvaluationOutput",
     "Span",
+    "SpanDetail",
+    "SpanKind",
+    "SpanStatusCode",
+    "SpanVariant",
     "Template",
     "TemplateImageInfo",
     "TestSetOutputResponse",
     "TestSetSimpleResponse",
-    "Trace",
+    "TraceDetail",
     "Uri",
     "ValidationError",
     "ValidationErrorLocItem",
     "VariantAction",
     "VariantActionEnum",
+    "WithPagination",
+    "WorkspaceMemberResponse",
+    "WorkspacePermission",
+    "WorkspaceResponse",
+    "WorkspaceRole",
+    "WorkspaceRoleResponse",
 ]

agenta/client/backend/types/aggregated_result.py CHANGED Viewed

@@ -4,7 +4,7 @@ import datetime as dt
 import typing
 from ..core.datetime_utils import serialize_datetime
-from .evaluator_config import EvaluatorConfig
+from .aggregated_result_evaluator_config import AggregatedResultEvaluatorConfig
 from .result import Result
 try:
@@ -14,7 +14,7 @@ except ImportError:
 class AggregatedResult(pydantic.BaseModel):
-    evaluator_config: EvaluatorConfig
+    evaluator_config: AggregatedResultEvaluatorConfig
     result: Result
     def json(self, **kwargs: typing.Any) -> str:

agenta/client/backend/types/aggregated_result_evaluator_config.py ADDED Viewed

@@ -0,0 +1,9 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+from .evaluator_config import EvaluatorConfig
+AggregatedResultEvaluatorConfig = typing.Union[
+    EvaluatorConfig, typing.Dict[str, typing.Any]
+]

agenta/client/backend/types/{app_variant_output.py → app_variant_response.py} RENAMED Viewed

@@ -11,19 +11,21 @@ except ImportError:
     import pydantic  # type: ignore
-class AppVariantOutput(pydantic.BaseModel):
+class AppVariantResponse(pydantic.BaseModel):
     app_id: str
     app_name: str
     variant_id: str
     variant_name: str
     parameters: typing.Optional[typing.Dict[str, typing.Any]]
     previous_variant_name: typing.Optional[str]
-    organization_id: typing.Optional[str]
     user_id: str
     base_name: str
     base_id: str
     config_name: str
     uri: typing.Optional[str]
+    revision: int
+    organization_id: typing.Optional[str]
+    workspace_id: typing.Optional[str]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/{trace.py → create_span.py} RENAMED Viewed

@@ -4,7 +4,9 @@ import datetime as dt
 import typing
 from ..core.datetime_utils import serialize_datetime
-from .feedback import Feedback
+from .llm_tokens import LlmTokens
+from .span_kind import SpanKind
+from .span_status_code import SpanStatusCode
 try:
     import pydantic.v1 as pydantic  # type: ignore
@@ -12,19 +14,27 @@ except ImportError:
     import pydantic  # type: ignore
-class Trace(pydantic.BaseModel):
+class CreateSpan(pydantic.BaseModel):
+    id: str
     app_id: typing.Optional[str]
     variant_id: typing.Optional[str]
-    cost: typing.Optional[float]
-    latency: float
-    status: str
-    token_consumption: typing.Optional[int]
+    variant_name: typing.Optional[str]
+    inputs: typing.Optional[typing.Dict[str, typing.Any]]
+    outputs: typing.Optional[typing.List[str]]
+    config: typing.Optional[typing.Dict[str, typing.Any]]
+    environment: typing.Optional[str]
     tags: typing.Optional[typing.List[str]]
+    token_consumption: typing.Optional[int]
+    name: str
+    parent_span_id: typing.Optional[str]
+    attributes: typing.Optional[typing.Dict[str, typing.Any]]
+    spankind: str
+    status: str
+    user: typing.Optional[str]
     start_time: dt.datetime
-    end_time: dt.datetime
-    trace_id: str
-    spans: typing.List[str]
-    feedbacks: typing.Optional[typing.List[Feedback]]
+    end_time: typing.Optional[dt.datetime]
+    tokens: typing.Optional[LlmTokens]
+    cost: typing.Optional[float]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/create_trace_response.py ADDED Viewed

@@ -0,0 +1,37 @@
+# This file was auto-generated by Fern from our API Definition.
+import datetime as dt
+import typing
+from ..core.datetime_utils import serialize_datetime
+try:
+    import pydantic.v1 as pydantic  # type: ignore
+except ImportError:
+    import pydantic  # type: ignore
+class CreateTraceResponse(pydantic.BaseModel):
+    message: str
+    data: typing.Dict[str, typing.Any]
+    def json(self, **kwargs: typing.Any) -> str:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().json(**kwargs_with_defaults)
+    def dict(self, **kwargs: typing.Any) -> typing.Dict[str, typing.Any]:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().dict(**kwargs_with_defaults)
+    class Config:
+        frozen = True
+        smart_union = True
+        json_encoders = {dt.datetime: serialize_datetime}

agenta/client/backend/types/environment_output.py CHANGED Viewed

@@ -17,7 +17,9 @@ class EnvironmentOutput(pydantic.BaseModel):
     deployed_app_variant_id: typing.Optional[str]
     deployed_variant_name: typing.Optional[str]
     deployed_app_variant_revision_id: typing.Optional[str]
-    revision: typing.Optional[str]
+    revision: typing.Optional[int]
+    organization_id: typing.Optional[str]
+    workspace_id: typing.Optional[str]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/environment_output_extended.py ADDED Viewed

@@ -0,0 +1,45 @@
+# This file was auto-generated by Fern from our API Definition.
+import datetime as dt
+import typing
+from ..core.datetime_utils import serialize_datetime
+from .environment_revision import EnvironmentRevision
+try:
+    import pydantic.v1 as pydantic  # type: ignore
+except ImportError:
+    import pydantic  # type: ignore
+class EnvironmentOutputExtended(pydantic.BaseModel):
+    name: str
+    app_id: str
+    deployed_app_variant_id: typing.Optional[str]
+    deployed_variant_name: typing.Optional[str]
+    deployed_app_variant_revision_id: typing.Optional[str]
+    revision: typing.Optional[int]
+    revisions: typing.List[EnvironmentRevision]
+    organization_id: typing.Optional[str]
+    workspace_id: typing.Optional[str]
+    def json(self, **kwargs: typing.Any) -> str:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().json(**kwargs_with_defaults)
+    def dict(self, **kwargs: typing.Any) -> typing.Dict[str, typing.Any]:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().dict(**kwargs_with_defaults)
+    class Config:
+        frozen = True
+        smart_union = True
+        json_encoders = {dt.datetime: serialize_datetime}

agenta/client/backend/types/environment_revision.py ADDED Viewed

@@ -0,0 +1,41 @@
+# This file was auto-generated by Fern from our API Definition.
+import datetime as dt
+import typing
+from ..core.datetime_utils import serialize_datetime
+try:
+    import pydantic.v1 as pydantic  # type: ignore
+except ImportError:
+    import pydantic  # type: ignore
+class EnvironmentRevision(pydantic.BaseModel):
+    id: str
+    revision: int
+    modified_by: str
+    deployed_app_variant_revision: typing.Optional[str]
+    deployment: typing.Optional[str]
+    created_at: dt.datetime
+    def json(self, **kwargs: typing.Any) -> str:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().json(**kwargs_with_defaults)
+    def dict(self, **kwargs: typing.Any) -> typing.Dict[str, typing.Any]:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().dict(**kwargs_with_defaults)
+    class Config:
+        frozen = True
+        smart_union = True
+        json_encoders = {dt.datetime: serialize_datetime}

agenta/client/backend/types/error.py ADDED Viewed

@@ -0,0 +1,37 @@
+# This file was auto-generated by Fern from our API Definition.
+import datetime as dt
+import typing
+from ..core.datetime_utils import serialize_datetime
+try:
+    import pydantic.v1 as pydantic  # type: ignore
+except ImportError:
+    import pydantic  # type: ignore
+class Error(pydantic.BaseModel):
+    message: str
+    stacktrace: typing.Optional[str]
+    def json(self, **kwargs: typing.Any) -> str:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().json(**kwargs_with_defaults)
+    def dict(self, **kwargs: typing.Any) -> typing.Dict[str, typing.Any]:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().dict(**kwargs_with_defaults)
+    class Config:
+        frozen = True
+        smart_union = True
+        json_encoders = {dt.datetime: serialize_datetime}

agenta/client/backend/types/evaluation.py CHANGED Viewed

@@ -5,6 +5,7 @@ import typing
 from ..core.datetime_utils import serialize_datetime
 from .aggregated_result import AggregatedResult
+from .result import Result
 try:
     import pydantic.v1 as pydantic  # type: ignore
@@ -21,10 +22,12 @@ class Evaluation(pydantic.BaseModel):
     variant_names: typing.List[str]
     variant_revision_ids: typing.List[str]
     revisions: typing.List[str]
-    testset_id: str
-    testset_name: str
-    status: str
+    testset_id: typing.Optional[str]
+    testset_name: typing.Optional[str]
+    status: Result
     aggregated_results: typing.List[AggregatedResult]
+    average_cost: typing.Optional[Result]
+    average_latency: typing.Optional[Result]
     created_at: dt.datetime
     updated_at: dt.datetime

agenta/client/backend/types/evaluation_scenario_output.py CHANGED Viewed

@@ -4,6 +4,7 @@ import datetime as dt
 import typing
 from ..core.datetime_utils import serialize_datetime
+from .result import Result
 try:
     import pydantic.v1 as pydantic  # type: ignore
@@ -12,8 +13,9 @@ except ImportError:
 class EvaluationScenarioOutput(pydantic.BaseModel):
-    type: str
-    value: typing.Optional[typing.Any]
+    result: Result
+    cost: typing.Optional[float]
+    latency: typing.Optional[float]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/{delete_evaluation.py → evaluation_scenario_score_update.py} RENAMED Viewed

@@ -11,8 +11,8 @@ except ImportError:
     import pydantic  # type: ignore
-class DeleteEvaluation(pydantic.BaseModel):
-    evaluations_ids: typing.List[str]
+class EvaluationScenarioScoreUpdate(pydantic.BaseModel):
+    score: float
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/evaluation_status_enum.py CHANGED Viewed

@@ -14,6 +14,7 @@ class EvaluationStatusEnum(str, enum.Enum):
     EVALUATION_INITIALIZED = "EVALUATION_INITIALIZED"
     EVALUATION_STARTED = "EVALUATION_STARTED"
     EVALUATION_FINISHED = "EVALUATION_FINISHED"
+    EVALUATION_FINISHED_WITH_ERRORS = "EVALUATION_FINISHED_WITH_ERRORS"
     EVALUATION_FAILED = "EVALUATION_FAILED"
     def visit(
@@ -21,6 +22,7 @@ class EvaluationStatusEnum(str, enum.Enum):
         evaluation_initialized: typing.Callable[[], T_Result],
         evaluation_started: typing.Callable[[], T_Result],
         evaluation_finished: typing.Callable[[], T_Result],
+        evaluation_finished_with_errors: typing.Callable[[], T_Result],
         evaluation_failed: typing.Callable[[], T_Result],
     ) -> T_Result:
         if self is EvaluationStatusEnum.EVALUATION_INITIALIZED:
@@ -29,5 +31,7 @@ class EvaluationStatusEnum(str, enum.Enum):
             return evaluation_started()
         if self is EvaluationStatusEnum.EVALUATION_FINISHED:
             return evaluation_finished()
+        if self is EvaluationStatusEnum.EVALUATION_FINISHED_WITH_ERRORS:
+            return evaluation_finished_with_errors()
         if self is EvaluationStatusEnum.EVALUATION_FAILED:
             return evaluation_failed()

agenta/client/backend/types/evaluator.py CHANGED Viewed

@@ -16,6 +16,7 @@ class Evaluator(pydantic.BaseModel):
     key: str
     direct_use: bool
     settings_template: typing.Dict[str, typing.Any]
+    description: typing.Optional[str]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/{get_config_reponse.py → get_config_response.py} RENAMED Viewed

@@ -11,8 +11,7 @@ except ImportError:
     import pydantic  # type: ignore
-class GetConfigReponse(pydantic.BaseModel):
-    config_id: str
+class GetConfigResponse(pydantic.BaseModel):
     config_name: str
     current_version: int
     parameters: typing.Dict[str, typing.Any]

agenta/client/backend/types/human_evaluation_scenario.py CHANGED Viewed

@@ -6,7 +6,7 @@ import typing
 from ..core.datetime_utils import serialize_datetime
 from .human_evaluation_scenario_input import HumanEvaluationScenarioInput
 from .human_evaluation_scenario_output import HumanEvaluationScenarioOutput
-from .human_evaluation_scenario_score import HumanEvaluationScenarioScore
+from .score import Score
 try:
     import pydantic.v1 as pydantic  # type: ignore
@@ -20,7 +20,7 @@ class HumanEvaluationScenario(pydantic.BaseModel):
     inputs: typing.List[HumanEvaluationScenarioInput]
     outputs: typing.List[HumanEvaluationScenarioOutput]
     vote: typing.Optional[str]
-    score: typing.Optional[HumanEvaluationScenarioScore]
+    score: typing.Optional[Score]
     evaluation: typing.Optional[str]
     correct_answer: typing.Optional[str]
     is_pinned: typing.Optional[bool]

agenta/client/backend/types/{app_variant_output_extended.py → human_evaluation_scenario_update.py} RENAMED Viewed

@@ -4,7 +4,9 @@ import datetime as dt
 import typing
 from ..core.datetime_utils import serialize_datetime
-from .app_variant_revision import AppVariantRevision
+from .human_evaluation_scenario_input import HumanEvaluationScenarioInput
+from .human_evaluation_scenario_output import HumanEvaluationScenarioOutput
+from .score import Score
 try:
     import pydantic.v1 as pydantic  # type: ignore
@@ -12,21 +14,14 @@ except ImportError:
     import pydantic  # type: ignore
-class AppVariantOutputExtended(pydantic.BaseModel):
-    app_id: str
-    app_name: str
-    variant_id: str
-    variant_name: str
-    parameters: typing.Optional[typing.Dict[str, typing.Any]]
-    previous_variant_name: typing.Optional[str]
-    organization_id: str
-    user_id: str
-    base_name: str
-    base_id: str
-    config_name: str
-    uri: typing.Optional[str]
-    revision: int
-    revisions: typing.List[AppVariantRevision]
+class HumanEvaluationScenarioUpdate(pydantic.BaseModel):
+    vote: typing.Optional[str]
+    score: typing.Optional[Score]
+    correct_answer: typing.Optional[str]
+    outputs: typing.Optional[typing.List[HumanEvaluationScenarioOutput]]
+    inputs: typing.Optional[typing.List[HumanEvaluationScenarioInput]]
+    is_pinned: typing.Optional[bool]
+    note: typing.Optional[str]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta/client/backend/types/human_evaluation_update.py ADDED Viewed

@@ -0,0 +1,37 @@
+# This file was auto-generated by Fern from our API Definition.
+import datetime as dt
+import typing
+from ..core.datetime_utils import serialize_datetime
+from .evaluation_status_enum import EvaluationStatusEnum
+try:
+    import pydantic.v1 as pydantic  # type: ignore
+except ImportError:
+    import pydantic  # type: ignore
+class HumanEvaluationUpdate(pydantic.BaseModel):
+    status: typing.Optional[EvaluationStatusEnum]
+    def json(self, **kwargs: typing.Any) -> str:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().json(**kwargs_with_defaults)
+    def dict(self, **kwargs: typing.Any) -> typing.Dict[str, typing.Any]:
+        kwargs_with_defaults: typing.Any = {
+            "by_alias": True,
+            "exclude_unset": True,
+            **kwargs,
+        }
+        return super().dict(**kwargs_with_defaults)
+    class Config:
+        frozen = True
+        smart_union = True
+        json_encoders = {dt.datetime: serialize_datetime}

agenta/client/backend/types/image.py CHANGED Viewed

@@ -16,6 +16,7 @@ class Image(pydantic.BaseModel):
     docker_id: str
     tags: str
     organization_id: typing.Optional[str]
+    workspace_id: typing.Optional[str]
     def json(self, **kwargs: typing.Any) -> str:
         kwargs_with_defaults: typing.Any = {

agenta 0.12.7__py3-none-any.whl → 0.13.0__py3-none-any.whl

Potentially problematic release.

agenta 0.12.7__py3-none-any.whl → 0.13.0__py3-none-any.whl