PyPI - arize-phoenix - Versions diffs - 5.5.2__py3-none-any.whl → 5.7.0__py3-none-any.whl - Mend

arize-phoenix 5.5.2__py3-none-any.whl → 5.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of arize-phoenix might be problematic. Click here for more details.

Files changed (186) hide show

{arize_phoenix-5.5.2.dist-info → arize_phoenix-5.7.0.dist-info}/METADATA +4 -7
arize_phoenix-5.7.0.dist-info/RECORD +330 -0
phoenix/config.py +50 -8
phoenix/core/model.py +3 -3
phoenix/core/model_schema.py +41 -50
phoenix/core/model_schema_adapter.py +17 -16
phoenix/datetime_utils.py +2 -2
phoenix/db/bulk_inserter.py +10 -20
phoenix/db/engines.py +2 -1
phoenix/db/enums.py +2 -2
phoenix/db/helpers.py +8 -7
phoenix/db/insertion/dataset.py +9 -19
phoenix/db/insertion/document_annotation.py +14 -13
phoenix/db/insertion/helpers.py +6 -16
phoenix/db/insertion/span_annotation.py +14 -13
phoenix/db/insertion/trace_annotation.py +14 -13
phoenix/db/insertion/types.py +19 -30
phoenix/db/migrations/versions/3be8647b87d8_add_token_columns_to_spans_table.py +8 -8
phoenix/db/models.py +28 -28
phoenix/experiments/evaluators/base.py +2 -1
phoenix/experiments/evaluators/code_evaluators.py +4 -5
phoenix/experiments/evaluators/llm_evaluators.py +157 -4
phoenix/experiments/evaluators/utils.py +3 -2
phoenix/experiments/functions.py +10 -21
phoenix/experiments/tracing.py +2 -1
phoenix/experiments/types.py +20 -29
phoenix/experiments/utils.py +2 -1
phoenix/inferences/errors.py +6 -5
phoenix/inferences/fixtures.py +6 -5
phoenix/inferences/inferences.py +37 -37
phoenix/inferences/schema.py +11 -10
phoenix/inferences/validation.py +13 -14
phoenix/logging/_formatter.py +3 -3
phoenix/metrics/__init__.py +5 -4
phoenix/metrics/binning.py +2 -1
phoenix/metrics/metrics.py +2 -1
phoenix/metrics/mixins.py +7 -6
phoenix/metrics/retrieval_metrics.py +2 -1
phoenix/metrics/timeseries.py +5 -4
phoenix/metrics/wrappers.py +2 -2
phoenix/pointcloud/clustering.py +3 -4
phoenix/pointcloud/pointcloud.py +7 -5
phoenix/pointcloud/umap_parameters.py +2 -1
phoenix/server/api/dataloaders/annotation_summaries.py +12 -19
phoenix/server/api/dataloaders/average_experiment_run_latency.py +2 -2
phoenix/server/api/dataloaders/cache/two_tier_cache.py +3 -2
phoenix/server/api/dataloaders/dataset_example_revisions.py +3 -8
phoenix/server/api/dataloaders/dataset_example_spans.py +2 -5
phoenix/server/api/dataloaders/document_evaluation_summaries.py +12 -18
phoenix/server/api/dataloaders/document_evaluations.py +3 -7
phoenix/server/api/dataloaders/document_retrieval_metrics.py +6 -13
phoenix/server/api/dataloaders/experiment_annotation_summaries.py +4 -8
phoenix/server/api/dataloaders/experiment_error_rates.py +2 -5
phoenix/server/api/dataloaders/experiment_run_annotations.py +3 -7
phoenix/server/api/dataloaders/experiment_run_counts.py +1 -5
phoenix/server/api/dataloaders/experiment_sequence_number.py +2 -5
phoenix/server/api/dataloaders/latency_ms_quantile.py +21 -30
phoenix/server/api/dataloaders/min_start_or_max_end_times.py +7 -13
phoenix/server/api/dataloaders/project_by_name.py +3 -3
phoenix/server/api/dataloaders/record_counts.py +11 -18
phoenix/server/api/dataloaders/span_annotations.py +3 -7
phoenix/server/api/dataloaders/span_dataset_examples.py +3 -8
phoenix/server/api/dataloaders/span_descendants.py +3 -7
phoenix/server/api/dataloaders/span_projects.py +2 -2
phoenix/server/api/dataloaders/token_counts.py +12 -19
phoenix/server/api/dataloaders/trace_row_ids.py +3 -7
phoenix/server/api/dataloaders/user_roles.py +3 -3
phoenix/server/api/dataloaders/users.py +3 -3
phoenix/server/api/helpers/__init__.py +4 -3
phoenix/server/api/helpers/dataset_helpers.py +10 -9
phoenix/server/api/helpers/playground_clients.py +671 -0
phoenix/server/api/helpers/playground_registry.py +70 -0
phoenix/server/api/helpers/playground_spans.py +325 -0
phoenix/server/api/input_types/AddExamplesToDatasetInput.py +2 -2
phoenix/server/api/input_types/AddSpansToDatasetInput.py +2 -2
phoenix/server/api/input_types/ChatCompletionInput.py +38 -0
phoenix/server/api/input_types/ChatCompletionMessageInput.py +13 -1
phoenix/server/api/input_types/ClusterInput.py +2 -2
phoenix/server/api/input_types/DeleteAnnotationsInput.py +1 -3
phoenix/server/api/input_types/DeleteDatasetExamplesInput.py +2 -2
phoenix/server/api/input_types/DeleteExperimentsInput.py +1 -3
phoenix/server/api/input_types/DimensionFilter.py +4 -4
phoenix/server/api/input_types/GenerativeModelInput.py +17 -0
phoenix/server/api/input_types/Granularity.py +1 -1
phoenix/server/api/input_types/InvocationParameters.py +156 -13
phoenix/server/api/input_types/PatchDatasetExamplesInput.py +2 -2
phoenix/server/api/input_types/TemplateOptions.py +10 -0
phoenix/server/api/mutations/__init__.py +4 -0
phoenix/server/api/mutations/chat_mutations.py +374 -0
phoenix/server/api/mutations/dataset_mutations.py +4 -4
phoenix/server/api/mutations/experiment_mutations.py +1 -2
phoenix/server/api/mutations/export_events_mutations.py +7 -7
phoenix/server/api/mutations/span_annotations_mutations.py +4 -4
phoenix/server/api/mutations/trace_annotations_mutations.py +4 -4
phoenix/server/api/mutations/user_mutations.py +4 -4
phoenix/server/api/openapi/schema.py +2 -2
phoenix/server/api/queries.py +61 -72
phoenix/server/api/routers/oauth2.py +4 -4
phoenix/server/api/routers/v1/datasets.py +22 -36
phoenix/server/api/routers/v1/evaluations.py +6 -5
phoenix/server/api/routers/v1/experiment_evaluations.py +2 -2
phoenix/server/api/routers/v1/experiment_runs.py +2 -2
phoenix/server/api/routers/v1/experiments.py +4 -4
phoenix/server/api/routers/v1/spans.py +13 -12
phoenix/server/api/routers/v1/traces.py +5 -5
phoenix/server/api/routers/v1/utils.py +5 -5
phoenix/server/api/schema.py +42 -10
phoenix/server/api/subscriptions.py +347 -494
phoenix/server/api/types/AnnotationSummary.py +3 -3
phoenix/server/api/types/ChatCompletionSubscriptionPayload.py +44 -0
phoenix/server/api/types/Cluster.py +8 -7
phoenix/server/api/types/Dataset.py +5 -4
phoenix/server/api/types/Dimension.py +3 -3
phoenix/server/api/types/DocumentEvaluationSummary.py +8 -7
phoenix/server/api/types/EmbeddingDimension.py +6 -5
phoenix/server/api/types/EvaluationSummary.py +3 -3
phoenix/server/api/types/Event.py +7 -7
phoenix/server/api/types/Experiment.py +3 -3
phoenix/server/api/types/ExperimentComparison.py +2 -4
phoenix/server/api/types/GenerativeProvider.py +27 -3
phoenix/server/api/types/Inferences.py +9 -8
phoenix/server/api/types/InferencesRole.py +2 -2
phoenix/server/api/types/Model.py +2 -2
phoenix/server/api/types/Project.py +11 -18
phoenix/server/api/types/Segments.py +3 -3
phoenix/server/api/types/Span.py +45 -7
phoenix/server/api/types/TemplateLanguage.py +9 -0
phoenix/server/api/types/TimeSeries.py +8 -7
phoenix/server/api/types/Trace.py +2 -2
phoenix/server/api/types/UMAPPoints.py +6 -6
phoenix/server/api/types/User.py +3 -3
phoenix/server/api/types/node.py +1 -3
phoenix/server/api/types/pagination.py +4 -4
phoenix/server/api/utils.py +2 -4
phoenix/server/app.py +76 -37
phoenix/server/bearer_auth.py +4 -10
phoenix/server/dml_event.py +3 -3
phoenix/server/dml_event_handler.py +10 -24
phoenix/server/grpc_server.py +3 -2
phoenix/server/jwt_store.py +22 -21
phoenix/server/main.py +17 -4
phoenix/server/oauth2.py +3 -2
phoenix/server/rate_limiters.py +5 -8
phoenix/server/static/.vite/manifest.json +31 -31
phoenix/server/static/assets/components-Csu8UKOs.js +1612 -0
phoenix/server/static/assets/{index-DCzakdJq.js → index-Bk5C9EA7.js} +2 -2
phoenix/server/static/assets/{pages-CAL1FDMt.js → pages-UeWaKXNs.js} +337 -442
phoenix/server/static/assets/{vendor-6IcPAw_j.js → vendor-CtqfhlbC.js} +6 -6
phoenix/server/static/assets/{vendor-arizeai-DRZuoyuF.js → vendor-arizeai-C_3SBz56.js} +2 -2
phoenix/server/static/assets/{vendor-codemirror-DVE2_WBr.js → vendor-codemirror-wfdk9cjp.js} +1 -1
phoenix/server/static/assets/{vendor-recharts-DwrexFA4.js → vendor-recharts-BiVnSv90.js} +1 -1
phoenix/server/templates/index.html +1 -0
phoenix/server/thread_server.py +1 -1
phoenix/server/types.py +17 -29
phoenix/services.py +8 -3
phoenix/session/client.py +12 -24
phoenix/session/data_extractor.py +3 -3
phoenix/session/evaluation.py +1 -2
phoenix/session/session.py +26 -21
phoenix/trace/attributes.py +16 -28
phoenix/trace/dsl/filter.py +17 -21
phoenix/trace/dsl/helpers.py +3 -3
phoenix/trace/dsl/query.py +13 -22
phoenix/trace/fixtures.py +11 -17
phoenix/trace/otel.py +5 -15
phoenix/trace/projects.py +3 -2
phoenix/trace/schemas.py +2 -2
phoenix/trace/span_evaluations.py +9 -8
phoenix/trace/span_json_decoder.py +3 -3
phoenix/trace/span_json_encoder.py +2 -2
phoenix/trace/trace_dataset.py +6 -5
phoenix/trace/utils.py +6 -6
phoenix/utilities/deprecation.py +3 -2
phoenix/utilities/error_handling.py +3 -2
phoenix/utilities/json.py +2 -1
phoenix/utilities/logging.py +2 -2
phoenix/utilities/project.py +1 -1
phoenix/utilities/re.py +3 -4
phoenix/utilities/template_formatters.py +16 -5
phoenix/version.py +1 -1
arize_phoenix-5.5.2.dist-info/RECORD +0 -321
phoenix/server/static/assets/components-hX0LgYz3.js +0 -1428
{arize_phoenix-5.5.2.dist-info → arize_phoenix-5.7.0.dist-info}/WHEEL +0 -0
{arize_phoenix-5.5.2.dist-info → arize_phoenix-5.7.0.dist-info}/entry_points.txt +0 -0
{arize_phoenix-5.5.2.dist-info → arize_phoenix-5.7.0.dist-info}/licenses/IP_NOTICE +0 -0
{arize_phoenix-5.5.2.dist-info → arize_phoenix-5.7.0.dist-info}/licenses/LICENSE +0 -0

phoenix/server/api/input_types/InvocationParameters.py CHANGED Viewed

@@ -1,20 +1,163 @@
-from typing import List, Optional
+from enum import Enum
+from typing import Annotated, Any, Mapping, Optional, Union
 import strawberry
 from strawberry import UNSET
 from strawberry.scalars import JSON
+@strawberry.enum
+class CanonicalParameterName(str, Enum):
+    TEMPERATURE = "temperature"
+    MAX_COMPLETION_TOKENS = "max_completion_tokens"
+    STOP_SEQUENCES = "stop_sequences"
+    TOP_P = "top_p"
+    RANDOM_SEED = "random_seed"
+    TOOL_CHOICE = "tool_choice"
+    RESPONSE_FORMAT = "response_format"
+@strawberry.enum
+class InvocationInputField(str, Enum):
+    value_int = "value_int"
+    value_float = "value_float"
+    value_bool = "value_bool"
+    value_string = "value_string"
+    value_json = "value_json"
+    value_string_list = "value_string_list"
+    value_boolean = "value_boolean"
 @strawberry.input
-class InvocationParameters:
-    """
-    Invocation parameters interface shared between different providers.
-    """
-    temperature: Optional[float] = UNSET
-    max_completion_tokens: Optional[int] = UNSET
-    max_tokens: Optional[int] = UNSET
-    top_p: Optional[float] = UNSET
-    stop: Optional[List[str]] = UNSET
-    seed: Optional[int] = UNSET
-    tool_choice: Optional[JSON] = UNSET
+class InvocationParameterInput:
+    invocation_name: str
+    canonical_name: Optional[CanonicalParameterName] = None
+    value_int: Optional[int] = UNSET
+    value_float: Optional[float] = UNSET
+    value_bool: Optional[bool] = UNSET
+    value_string: Optional[str] = UNSET
+    value_json: Optional[JSON] = UNSET
+    value_string_list: Optional[list[str]] = UNSET
+    value_boolean: Optional[bool] = UNSET
+@strawberry.interface
+class InvocationParameterBase:
+    invocation_name: str
+    canonical_name: Optional[CanonicalParameterName] = None
+    label: str
+    required: bool = False
+    hidden: bool = False
+@strawberry.type
+class IntInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_int
+    default_value: Optional[int] = UNSET
+@strawberry.type
+class FloatInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_float
+    default_value: Optional[float] = UNSET
+@strawberry.type
+class BoundedFloatInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_float
+    default_value: Optional[float] = UNSET
+    min_value: float
+    max_value: float
+@strawberry.type
+class StringInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_string
+    default_value: Optional[str] = UNSET
+@strawberry.type
+class JSONInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_json
+    default_value: Optional[JSON] = UNSET
+@strawberry.type
+class StringListInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_string_list
+    default_value: Optional[list[str]] = UNSET
+@strawberry.type
+class BooleanInvocationParameter(InvocationParameterBase):
+    invocation_input_field: InvocationInputField = InvocationInputField.value_bool
+    default_value: Optional[bool] = UNSET
+def extract_parameter(
+    param_def: InvocationParameterBase, param_input: InvocationParameterInput
+) -> Any:
+    if isinstance(param_def, IntInvocationParameter):
+        return (
+            param_input.value_int if param_input.value_int is not UNSET else param_def.default_value
+        )
+    elif isinstance(param_def, FloatInvocationParameter):
+        return (
+            param_input.value_float
+            if param_input.value_float is not UNSET
+            else param_def.default_value
+        )
+    elif isinstance(param_def, BoundedFloatInvocationParameter):
+        return (
+            param_input.value_float
+            if param_input.value_float is not UNSET
+            else param_def.default_value
+        )
+    elif isinstance(param_def, StringInvocationParameter):
+        return (
+            param_input.value_string
+            if param_input.value_string is not UNSET
+            else param_def.default_value
+        )
+    elif isinstance(param_def, JSONInvocationParameter):
+        return (
+            param_input.value_json
+            if param_input.value_json is not UNSET
+            else param_def.default_value
+        )
+    elif isinstance(param_def, StringListInvocationParameter):
+        return (
+            param_input.value_string_list
+            if param_input.value_string_list is not UNSET
+            else param_def.default_value
+        )
+    elif isinstance(param_def, BooleanInvocationParameter):
+        return (
+            param_input.value_bool
+            if param_input.value_bool is not UNSET
+            else param_def.default_value
+        )
+def validate_invocation_parameters(
+    parameters: list["InvocationParameter"],
+    input: Mapping[str, Any],
+) -> None:
+    for param_def in parameters:
+        if param_def.required and param_def.invocation_name not in input:
+            raise ValueError(f"Required parameter {param_def.invocation_name} not provided")
+# Create the union for output types
+InvocationParameter = Annotated[
+    Union[
+        IntInvocationParameter,
+        FloatInvocationParameter,
+        BoundedFloatInvocationParameter,
+        StringInvocationParameter,
+        JSONInvocationParameter,
+        StringListInvocationParameter,
+        BooleanInvocationParameter,
+    ],
+    strawberry.union("InvocationParameter"),
+]

phoenix/server/api/input_types/PatchDatasetExamplesInput.py CHANGED Viewed

@@ -1,4 +1,4 @@
-from typing import List, Optional
+from typing import Optional
 import strawberry
 from strawberry import UNSET
@@ -30,6 +30,6 @@ class PatchDatasetExamplesInput:
     Input type to the patchDatasetExamples mutation.
     """
-    patches: List[DatasetExamplePatch]
+    patches: list[DatasetExamplePatch]
     version_description: Optional[str] = UNSET
     version_metadata: Optional[JSON] = UNSET

phoenix/server/api/input_types/TemplateOptions.py ADDED Viewed

@@ -0,0 +1,10 @@
+import strawberry
+from strawberry.scalars import JSON
+from phoenix.server.api.types.TemplateLanguage import TemplateLanguage
+@strawberry.input
+class TemplateOptions:
+    variables: JSON
+    language: TemplateLanguage

phoenix/server/api/mutations/__init__.py CHANGED Viewed

@@ -1,6 +1,9 @@
 import strawberry
 from phoenix.server.api.mutations.api_key_mutations import ApiKeyMutationMixin
+from phoenix.server.api.mutations.chat_mutations import (
+    ChatCompletionMutationMixin,
+)
 from phoenix.server.api.mutations.dataset_mutations import DatasetMutationMixin
 from phoenix.server.api.mutations.experiment_mutations import ExperimentMutationMixin
 from phoenix.server.api.mutations.export_events_mutations import ExportEventsMutationMixin
@@ -20,5 +23,6 @@ class Mutation(
     SpanAnnotationMutationMixin,
     TraceAnnotationMutationMixin,
     UserMutationMixin,
+    ChatCompletionMutationMixin,
 ):
     pass

phoenix/server/api/mutations/chat_mutations.py ADDED Viewed

@@ -0,0 +1,374 @@
+import json
+from dataclasses import asdict
+from datetime import datetime, timezone
+from itertools import chain
+from traceback import format_exc
+from typing import Any, Iterable, Iterator, List, Optional
+import strawberry
+from openinference.semconv.trace import (
+    MessageAttributes,
+    OpenInferenceMimeTypeValues,
+    OpenInferenceSpanKindValues,
+    SpanAttributes,
+    ToolAttributes,
+    ToolCallAttributes,
+)
+from opentelemetry.sdk.trace.id_generator import RandomIdGenerator as DefaultOTelIDGenerator
+from opentelemetry.trace import StatusCode
+from sqlalchemy import insert, select
+from strawberry.types import Info
+from typing_extensions import assert_never
+from phoenix.datetime_utils import local_now, normalize_datetime
+from phoenix.db import models
+from phoenix.server.api.context import Context
+from phoenix.server.api.exceptions import BadRequest
+from phoenix.server.api.helpers.playground_clients import initialize_playground_clients
+from phoenix.server.api.helpers.playground_registry import PLAYGROUND_CLIENT_REGISTRY
+from phoenix.server.api.input_types.ChatCompletionInput import ChatCompletionInput
+from phoenix.server.api.input_types.TemplateOptions import TemplateOptions
+from phoenix.server.api.types.ChatCompletionMessageRole import ChatCompletionMessageRole
+from phoenix.server.api.types.ChatCompletionSubscriptionPayload import (
+    TextChunk,
+    ToolCallChunk,
+)
+from phoenix.server.api.types.Span import Span, to_gql_span
+from phoenix.server.api.types.TemplateLanguage import TemplateLanguage
+from phoenix.server.dml_event import SpanInsertEvent
+from phoenix.trace.attributes import unflatten
+from phoenix.trace.schemas import SpanException
+from phoenix.utilities.template_formatters import (
+    FStringTemplateFormatter,
+    MustacheTemplateFormatter,
+    TemplateFormatter,
+)
+initialize_playground_clients()
+ChatCompletionMessage = tuple[ChatCompletionMessageRole, str, Optional[str], Optional[List[Any]]]
+@strawberry.type
+class ChatCompletionFunctionCall:
+    name: str
+    arguments: str
+@strawberry.type
+class ChatCompletionToolCall:
+    id: str
+    function: ChatCompletionFunctionCall
+@strawberry.type
+class ChatCompletionMutationPayload:
+    content: Optional[str]
+    tool_calls: List[ChatCompletionToolCall]
+    span: Span
+    error_message: Optional[str]
+@strawberry.type
+class ChatCompletionMutationMixin:
+    @strawberry.mutation
+    async def chat_completion(
+        self, info: Info[Context, None], input: ChatCompletionInput
+    ) -> ChatCompletionMutationPayload:
+        provider_key = input.model.provider_key
+        llm_client_class = PLAYGROUND_CLIENT_REGISTRY.get_client(provider_key, input.model.name)
+        if llm_client_class is None:
+            raise BadRequest(f"No LLM client registered for provider '{provider_key}'")
+        attributes: dict[str, Any] = {}
+        llm_client = llm_client_class(
+            model=input.model,
+            api_key=input.api_key,
+        )
+        messages = [
+            (
+                message.role,
+                message.content,
+                message.tool_call_id if isinstance(message.tool_call_id, str) else None,
+                message.tool_calls if isinstance(message.tool_calls, list) else None,
+            )
+            for message in input.messages
+        ]
+        if template_options := input.template:
+            messages = list(_formatted_messages(messages, template_options))
+        invocation_parameters = llm_client.construct_invocation_parameters(
+            input.invocation_parameters
+        )
+        text_content = ""
+        tool_calls = []
+        events = []
+        attributes.update(
+            chain(
+                _llm_span_kind(),
+                _llm_model_name(input.model.name),
+                _llm_tools(input.tools or []),
+                _llm_input_messages(messages),
+                _llm_invocation_parameters(invocation_parameters),
+                _input_value_and_mime_type(input),
+                **llm_client.attributes,
+            )
+        )
+        start_time = normalize_datetime(dt=local_now(), tz=timezone.utc)
+        status_code = StatusCode.OK
+        status_message = ""
+        try:
+            async for chunk in llm_client.chat_completion_create(
+                messages=messages, tools=input.tools or [], **invocation_parameters
+            ):
+                # Process the chunk
+                if isinstance(chunk, TextChunk):
+                    text_content += chunk.content
+                elif isinstance(chunk, ToolCallChunk):
+                    tool_call = ChatCompletionToolCall(
+                        id=chunk.id,
+                        function=ChatCompletionFunctionCall(
+                            name=chunk.function.name,
+                            arguments=chunk.function.arguments,
+                        ),
+                    )
+                    tool_calls.append(tool_call)
+                else:
+                    assert_never(chunk)
+        except Exception as e:
+            # Handle exceptions and record exception event
+            status_code = StatusCode.ERROR
+            status_message = str(e)
+            end_time = normalize_datetime(dt=local_now(), tz=timezone.utc)
+            assert end_time is not None
+            events.append(
+                SpanException(
+                    timestamp=end_time,
+                    message=status_message,
+                    exception_type=type(e).__name__,
+                    exception_escaped=False,
+                    exception_stacktrace=format_exc(),
+                )
+            )
+        else:
+            end_time = normalize_datetime(dt=local_now(), tz=timezone.utc)
+        if text_content or tool_calls:
+            attributes.update(
+                chain(
+                    _output_value_and_mime_type({"text": text_content, "tool_calls": tool_calls}),
+                    _llm_output_messages(text_content, tool_calls),
+                )
+            )
+        # Now write the span to the database
+        trace_id = _generate_trace_id()
+        span_id = _generate_span_id()
+        async with info.context.db() as session:
+            # Get or create the project ID
+            if (
+                project_id := await session.scalar(
+                    select(models.Project.id).where(models.Project.name == PLAYGROUND_PROJECT_NAME)
+                )
+            ) is None:
+                project_id = await session.scalar(
+                    insert(models.Project)
+                    .returning(models.Project.id)
+                    .values(
+                        name=PLAYGROUND_PROJECT_NAME,
+                        description="Traces from prompt playground",
+                    )
+                )
+            trace = models.Trace(
+                project_rowid=project_id,
+                trace_id=trace_id,
+                start_time=start_time,
+                end_time=end_time,
+            )
+            span = models.Span(
+                trace_rowid=trace.id,
+                span_id=span_id,
+                parent_id=None,
+                name="ChatCompletion",
+                span_kind=LLM,
+                start_time=start_time,
+                end_time=end_time,
+                attributes=unflatten(attributes.items()),
+                events=[_serialize_event(event) for event in events],
+                status_code=status_code.name,
+                status_message=status_message,
+                cumulative_error_count=int(status_code is StatusCode.ERROR),
+                cumulative_llm_token_count_prompt=attributes.get(LLM_TOKEN_COUNT_PROMPT, 0),
+                cumulative_llm_token_count_completion=attributes.get(LLM_TOKEN_COUNT_COMPLETION, 0),
+                llm_token_count_prompt=attributes.get(LLM_TOKEN_COUNT_PROMPT, 0),
+                llm_token_count_completion=attributes.get(LLM_TOKEN_COUNT_COMPLETION, 0),
+                trace=trace,
+            )
+            session.add(trace)
+            session.add(span)
+            await session.flush()
+        gql_span = to_gql_span(span)
+        info.context.event_queue.put(SpanInsertEvent(ids=(project_id,)))
+        if status_code is StatusCode.ERROR:
+            return ChatCompletionMutationPayload(
+                content=None,
+                tool_calls=[],
+                span=gql_span,
+                error_message=status_message,
+            )
+        else:
+            return ChatCompletionMutationPayload(
+                content=text_content if text_content else None,
+                tool_calls=tool_calls,
+                span=gql_span,
+                error_message=None,
+            )
+def _formatted_messages(
+    messages: Iterable[ChatCompletionMessage],
+    template_options: TemplateOptions,
+) -> Iterator[ChatCompletionMessage]:
+    """
+    Formats the messages using the given template options.
+    """
+    template_formatter = _template_formatter(template_language=template_options.language)
+    (
+        roles,
+        templates,
+        tool_call_id,
+        tool_calls,
+    ) = zip(*messages)
+    formatted_templates = map(
+        lambda template: template_formatter.format(template, **template_options.variables),
+        templates,
+    )
+    formatted_messages = zip(roles, formatted_templates, tool_call_id, tool_calls)
+    return formatted_messages
+def _template_formatter(template_language: TemplateLanguage) -> TemplateFormatter:
+    """
+    Instantiates the appropriate template formatter for the template language.
+    """
+    if template_language is TemplateLanguage.MUSTACHE:
+        return MustacheTemplateFormatter()
+    if template_language is TemplateLanguage.F_STRING:
+        return FStringTemplateFormatter()
+    assert_never(template_language)
+def _llm_span_kind() -> Iterator[tuple[str, Any]]:
+    yield OPENINFERENCE_SPAN_KIND, LLM
+def _llm_model_name(model_name: str) -> Iterator[tuple[str, Any]]:
+    yield LLM_MODEL_NAME, model_name
+def _llm_invocation_parameters(invocation_parameters: dict[str, Any]) -> Iterator[tuple[str, Any]]:
+    yield LLM_INVOCATION_PARAMETERS, json.dumps(invocation_parameters)
+def _llm_tools(tools: List[Any]) -> Iterator[tuple[str, Any]]:
+    for tool_index, tool in enumerate(tools):
+        yield f"{LLM_TOOLS}.{tool_index}.{TOOL_JSON_SCHEMA}", json.dumps(tool)
+def _input_value_and_mime_type(input: ChatCompletionInput) -> Iterator[tuple[str, Any]]:
+    input_data = input.__dict__.copy()
+    input_data.pop("api_key", None)
+    yield INPUT_MIME_TYPE, JSON
+    yield INPUT_VALUE, json.dumps(input_data)
+def _output_value_and_mime_type(output: Any) -> Iterator[tuple[str, Any]]:
+    yield OUTPUT_MIME_TYPE, JSON
+    yield OUTPUT_VALUE, json.dumps(output)
+def _llm_input_messages(
+    messages: Iterable[ChatCompletionMessage],
+) -> Iterator[tuple[str, Any]]:
+    for i, (role, content, _tool_call_id, tool_calls) in enumerate(messages):
+        yield f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_ROLE}", role.value.lower()
+        yield f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_CONTENT}", content
+        if tool_calls:
+            for tool_call_index, tool_call in enumerate(tool_calls):
+                yield (
+                    f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_NAME}",
+                    tool_call["function"]["name"],
+                )
+                if arguments := tool_call["function"]["arguments"]:
+                    yield (
+                        f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_ARGUMENTS_JSON}",
+                        json.dumps(arguments),
+                    )
+def _llm_output_messages(
+    text_content: str, tool_calls: List[ChatCompletionToolCall]
+) -> Iterator[tuple[str, Any]]:
+    yield f"{LLM_OUTPUT_MESSAGES}.0.{MESSAGE_ROLE}", "assistant"
+    if text_content:
+        yield f"{LLM_OUTPUT_MESSAGES}.0.{MESSAGE_CONTENT}", text_content
+    for tool_call_index, tool_call in enumerate(tool_calls):
+        yield (
+            f"{LLM_OUTPUT_MESSAGES}.0.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_NAME}",
+            tool_call.function.name,
+        )
+        if arguments := tool_call.function.arguments:
+            yield (
+                f"{LLM_OUTPUT_MESSAGES}.0.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_ARGUMENTS_JSON}",
+                json.dumps(arguments),
+            )
+def _generate_trace_id() -> str:
+    return _hex(DefaultOTelIDGenerator().generate_trace_id())
+def _generate_span_id() -> str:
+    return _hex(DefaultOTelIDGenerator().generate_span_id())
+def _hex(number: int) -> str:
+    return hex(number)[2:]
+def _serialize_event(event: SpanException) -> dict[str, Any]:
+    return {k: (v.isoformat() if isinstance(v, datetime) else v) for k, v in asdict(event).items()}
+JSON = OpenInferenceMimeTypeValues.JSON.value
+LLM = OpenInferenceSpanKindValues.LLM.value
+OPENINFERENCE_SPAN_KIND = SpanAttributes.OPENINFERENCE_SPAN_KIND
+INPUT_MIME_TYPE = SpanAttributes.INPUT_MIME_TYPE
+INPUT_VALUE = SpanAttributes.INPUT_VALUE
+OUTPUT_MIME_TYPE = SpanAttributes.OUTPUT_MIME_TYPE
+OUTPUT_VALUE = SpanAttributes.OUTPUT_VALUE
+LLM_INPUT_MESSAGES = SpanAttributes.LLM_INPUT_MESSAGES
+LLM_OUTPUT_MESSAGES = SpanAttributes.LLM_OUTPUT_MESSAGES
+LLM_MODEL_NAME = SpanAttributes.LLM_MODEL_NAME
+LLM_INVOCATION_PARAMETERS = SpanAttributes.LLM_INVOCATION_PARAMETERS
+LLM_TOOLS = SpanAttributes.LLM_TOOLS
+LLM_TOKEN_COUNT_PROMPT = SpanAttributes.LLM_TOKEN_COUNT_PROMPT
+LLM_TOKEN_COUNT_COMPLETION = SpanAttributes.LLM_TOKEN_COUNT_COMPLETION
+MESSAGE_CONTENT = MessageAttributes.MESSAGE_CONTENT
+MESSAGE_ROLE = MessageAttributes.MESSAGE_ROLE
+MESSAGE_TOOL_CALLS = MessageAttributes.MESSAGE_TOOL_CALLS
+TOOL_CALL_FUNCTION_NAME = ToolCallAttributes.TOOL_CALL_FUNCTION_NAME
+TOOL_CALL_FUNCTION_ARGUMENTS_JSON = ToolCallAttributes.TOOL_CALL_FUNCTION_ARGUMENTS_JSON
+TOOL_JSON_SCHEMA = ToolAttributes.TOOL_JSON_SCHEMA
+PLAYGROUND_PROJECT_NAME = "playground"

phoenix/server/api/mutations/dataset_mutations.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import asyncio
 from datetime import datetime
-from typing import Any, Dict
+from typing import Any
 import strawberry
 from openinference.semconv.trace import (
@@ -175,7 +175,7 @@ class DatasetMutationMixin:
                 )
             ).all()
-            span_annotations_by_span: Dict[int, Dict[Any, Any]] = {span.id: {} for span in spans}
+            span_annotations_by_span: dict[int, dict[Any, Any]] = {span.id: {} for span in spans}
             for annotation in span_annotations:
                 span_id = annotation.span_rowid
                 if span_id not in span_annotations_by_span:
@@ -287,7 +287,7 @@ class DatasetMutationMixin:
                 )
             ).all()
-            span_annotations_by_span: Dict[int, Dict[Any, Any]] = {span.id: {} for span in spans}
+            span_annotations_by_span: dict[int, dict[Any, Any]] = {span.id: {} for span in spans}
             for annotation in span_annotations:
                 span_id = annotation.span_rowid
                 if span_id not in span_annotations_by_span:
@@ -577,7 +577,7 @@ def _to_orm_revision(
     patch: DatasetExamplePatch,
     example_id: int,
     version_id: int,
-) -> Dict[str, Any]:
+) -> dict[str, Any]:
     """
     Creates a new revision from an existing revision and a patch. The output is a
     dictionary suitable for insertion into the database using the sqlalchemy

phoenix/server/api/mutations/experiment_mutations.py CHANGED Viewed

@@ -1,5 +1,4 @@
 import asyncio
-from typing import List
 import strawberry
 from sqlalchemy import delete
@@ -20,7 +19,7 @@ from phoenix.server.dml_event import ExperimentDeleteEvent
 @strawberry.type
 class ExperimentMutationPayload:
-    experiments: List[Experiment]
+    experiments: list[Experiment]
 @strawberry.type

phoenix/server/api/mutations/export_events_mutations.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import asyncio
 from collections import defaultdict
 from datetime import datetime
-from typing import Dict, List, Optional, Tuple
+from typing import Optional
 import strawberry
 from strawberry import ID, UNSET
@@ -29,7 +29,7 @@ class ExportEventsMutationMixin:
     async def export_events(
         self,
         info: Info[Context, None],
-        event_ids: List[ID],
+        event_ids: list[ID],
         file_name: Optional[str] = UNSET,
     ) -> ExportedFile:
         if not isinstance(file_name, str):
@@ -61,7 +61,7 @@ class ExportEventsMutationMixin:
     async def export_clusters(
         self,
         info: Info[Context, None],
-        clusters: List[ClusterInput],
+        clusters: list[ClusterInput],
         file_name: Optional[str] = UNSET,
     ) -> ExportedFile:
         if not isinstance(file_name, str):
@@ -81,10 +81,10 @@ class ExportEventsMutationMixin:
 def _unpack_clusters(
-    clusters: List[ClusterInput],
-) -> Tuple[Dict[ms.InferencesRole, List[int]], Dict[ms.InferencesRole, Dict[int, str]]]:
-    row_numbers: Dict[ms.InferencesRole, List[int]] = defaultdict(list)
-    cluster_ids: Dict[ms.InferencesRole, Dict[int, str]] = defaultdict(dict)
+    clusters: list[ClusterInput],
+) -> tuple[dict[ms.InferencesRole, list[int]], dict[ms.InferencesRole, dict[int, str]]]:
+    row_numbers: dict[ms.InferencesRole, list[int]] = defaultdict(list)
+    cluster_ids: dict[ms.InferencesRole, dict[int, str]] = defaultdict(dict)
     for i, cluster in enumerate(clusters):
         for row_number, inferences_role in map(unpack_event_id, cluster.event_ids):
             if isinstance(inferences_role, AncillaryInferencesRole):

arize-phoenix 5.5.2__py3-none-any.whl → 5.7.0__py3-none-any.whl

Potentially problematic release.

arize-phoenix 5.5.2__py3-none-any.whl → 5.7.0__py3-none-any.whl