arize-phoenix 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of arize-phoenix might be problematic; consult the registry's security advisory for details.
- arize_phoenix-7.7.0.dist-info/METADATA +261 -0
- arize_phoenix-7.7.0.dist-info/RECORD +345 -0
- {arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/WHEEL +1 -1
- arize_phoenix-7.7.0.dist-info/entry_points.txt +3 -0
- phoenix/__init__.py +86 -14
- phoenix/auth.py +309 -0
- phoenix/config.py +675 -45
- phoenix/core/model.py +32 -30
- phoenix/core/model_schema.py +102 -109
- phoenix/core/model_schema_adapter.py +48 -45
- phoenix/datetime_utils.py +24 -3
- phoenix/db/README.md +54 -0
- phoenix/db/__init__.py +4 -0
- phoenix/db/alembic.ini +85 -0
- phoenix/db/bulk_inserter.py +294 -0
- phoenix/db/engines.py +208 -0
- phoenix/db/enums.py +20 -0
- phoenix/db/facilitator.py +113 -0
- phoenix/db/helpers.py +159 -0
- phoenix/db/insertion/constants.py +2 -0
- phoenix/db/insertion/dataset.py +227 -0
- phoenix/db/insertion/document_annotation.py +171 -0
- phoenix/db/insertion/evaluation.py +191 -0
- phoenix/db/insertion/helpers.py +98 -0
- phoenix/db/insertion/span.py +193 -0
- phoenix/db/insertion/span_annotation.py +158 -0
- phoenix/db/insertion/trace_annotation.py +158 -0
- phoenix/db/insertion/types.py +256 -0
- phoenix/db/migrate.py +86 -0
- phoenix/db/migrations/data_migration_scripts/populate_project_sessions.py +199 -0
- phoenix/db/migrations/env.py +114 -0
- phoenix/db/migrations/script.py.mako +26 -0
- phoenix/db/migrations/versions/10460e46d750_datasets.py +317 -0
- phoenix/db/migrations/versions/3be8647b87d8_add_token_columns_to_spans_table.py +126 -0
- phoenix/db/migrations/versions/4ded9e43755f_create_project_sessions_table.py +66 -0
- phoenix/db/migrations/versions/cd164e83824f_users_and_tokens.py +157 -0
- phoenix/db/migrations/versions/cf03bd6bae1d_init.py +280 -0
- phoenix/db/models.py +807 -0
- phoenix/exceptions.py +5 -1
- phoenix/experiments/__init__.py +6 -0
- phoenix/experiments/evaluators/__init__.py +29 -0
- phoenix/experiments/evaluators/base.py +158 -0
- phoenix/experiments/evaluators/code_evaluators.py +184 -0
- phoenix/experiments/evaluators/llm_evaluators.py +473 -0
- phoenix/experiments/evaluators/utils.py +236 -0
- phoenix/experiments/functions.py +772 -0
- phoenix/experiments/tracing.py +86 -0
- phoenix/experiments/types.py +726 -0
- phoenix/experiments/utils.py +25 -0
- phoenix/inferences/__init__.py +0 -0
- phoenix/{datasets → inferences}/errors.py +6 -5
- phoenix/{datasets → inferences}/fixtures.py +49 -42
- phoenix/{datasets/dataset.py → inferences/inferences.py} +121 -105
- phoenix/{datasets → inferences}/schema.py +11 -11
- phoenix/{datasets → inferences}/validation.py +13 -14
- phoenix/logging/__init__.py +3 -0
- phoenix/logging/_config.py +90 -0
- phoenix/logging/_filter.py +6 -0
- phoenix/logging/_formatter.py +69 -0
- phoenix/metrics/__init__.py +5 -4
- phoenix/metrics/binning.py +4 -3
- phoenix/metrics/metrics.py +2 -1
- phoenix/metrics/mixins.py +7 -6
- phoenix/metrics/retrieval_metrics.py +2 -1
- phoenix/metrics/timeseries.py +5 -4
- phoenix/metrics/wrappers.py +9 -3
- phoenix/pointcloud/clustering.py +5 -5
- phoenix/pointcloud/pointcloud.py +7 -5
- phoenix/pointcloud/projectors.py +5 -6
- phoenix/pointcloud/umap_parameters.py +53 -52
- phoenix/server/api/README.md +28 -0
- phoenix/server/api/auth.py +44 -0
- phoenix/server/api/context.py +152 -9
- phoenix/server/api/dataloaders/__init__.py +91 -0
- phoenix/server/api/dataloaders/annotation_summaries.py +139 -0
- phoenix/server/api/dataloaders/average_experiment_run_latency.py +54 -0
- phoenix/server/api/dataloaders/cache/__init__.py +3 -0
- phoenix/server/api/dataloaders/cache/two_tier_cache.py +68 -0
- phoenix/server/api/dataloaders/dataset_example_revisions.py +131 -0
- phoenix/server/api/dataloaders/dataset_example_spans.py +38 -0
- phoenix/server/api/dataloaders/document_evaluation_summaries.py +144 -0
- phoenix/server/api/dataloaders/document_evaluations.py +31 -0
- phoenix/server/api/dataloaders/document_retrieval_metrics.py +89 -0
- phoenix/server/api/dataloaders/experiment_annotation_summaries.py +79 -0
- phoenix/server/api/dataloaders/experiment_error_rates.py +58 -0
- phoenix/server/api/dataloaders/experiment_run_annotations.py +36 -0
- phoenix/server/api/dataloaders/experiment_run_counts.py +49 -0
- phoenix/server/api/dataloaders/experiment_sequence_number.py +44 -0
- phoenix/server/api/dataloaders/latency_ms_quantile.py +188 -0
- phoenix/server/api/dataloaders/min_start_or_max_end_times.py +85 -0
- phoenix/server/api/dataloaders/project_by_name.py +31 -0
- phoenix/server/api/dataloaders/record_counts.py +116 -0
- phoenix/server/api/dataloaders/session_io.py +79 -0
- phoenix/server/api/dataloaders/session_num_traces.py +30 -0
- phoenix/server/api/dataloaders/session_num_traces_with_error.py +32 -0
- phoenix/server/api/dataloaders/session_token_usages.py +41 -0
- phoenix/server/api/dataloaders/session_trace_latency_ms_quantile.py +55 -0
- phoenix/server/api/dataloaders/span_annotations.py +26 -0
- phoenix/server/api/dataloaders/span_dataset_examples.py +31 -0
- phoenix/server/api/dataloaders/span_descendants.py +57 -0
- phoenix/server/api/dataloaders/span_projects.py +33 -0
- phoenix/server/api/dataloaders/token_counts.py +124 -0
- phoenix/server/api/dataloaders/trace_by_trace_ids.py +25 -0
- phoenix/server/api/dataloaders/trace_root_spans.py +32 -0
- phoenix/server/api/dataloaders/user_roles.py +30 -0
- phoenix/server/api/dataloaders/users.py +33 -0
- phoenix/server/api/exceptions.py +48 -0
- phoenix/server/api/helpers/__init__.py +12 -0
- phoenix/server/api/helpers/dataset_helpers.py +217 -0
- phoenix/server/api/helpers/experiment_run_filters.py +763 -0
- phoenix/server/api/helpers/playground_clients.py +948 -0
- phoenix/server/api/helpers/playground_registry.py +70 -0
- phoenix/server/api/helpers/playground_spans.py +455 -0
- phoenix/server/api/input_types/AddExamplesToDatasetInput.py +16 -0
- phoenix/server/api/input_types/AddSpansToDatasetInput.py +14 -0
- phoenix/server/api/input_types/ChatCompletionInput.py +38 -0
- phoenix/server/api/input_types/ChatCompletionMessageInput.py +24 -0
- phoenix/server/api/input_types/ClearProjectInput.py +15 -0
- phoenix/server/api/input_types/ClusterInput.py +2 -2
- phoenix/server/api/input_types/CreateDatasetInput.py +12 -0
- phoenix/server/api/input_types/CreateSpanAnnotationInput.py +18 -0
- phoenix/server/api/input_types/CreateTraceAnnotationInput.py +18 -0
- phoenix/server/api/input_types/DataQualityMetricInput.py +5 -2
- phoenix/server/api/input_types/DatasetExampleInput.py +14 -0
- phoenix/server/api/input_types/DatasetSort.py +17 -0
- phoenix/server/api/input_types/DatasetVersionSort.py +16 -0
- phoenix/server/api/input_types/DeleteAnnotationsInput.py +7 -0
- phoenix/server/api/input_types/DeleteDatasetExamplesInput.py +13 -0
- phoenix/server/api/input_types/DeleteDatasetInput.py +7 -0
- phoenix/server/api/input_types/DeleteExperimentsInput.py +7 -0
- phoenix/server/api/input_types/DimensionFilter.py +4 -4
- phoenix/server/api/input_types/GenerativeModelInput.py +17 -0
- phoenix/server/api/input_types/Granularity.py +1 -1
- phoenix/server/api/input_types/InvocationParameters.py +162 -0
- phoenix/server/api/input_types/PatchAnnotationInput.py +19 -0
- phoenix/server/api/input_types/PatchDatasetExamplesInput.py +35 -0
- phoenix/server/api/input_types/PatchDatasetInput.py +14 -0
- phoenix/server/api/input_types/PerformanceMetricInput.py +5 -2
- phoenix/server/api/input_types/ProjectSessionSort.py +29 -0
- phoenix/server/api/input_types/SpanAnnotationSort.py +17 -0
- phoenix/server/api/input_types/SpanSort.py +134 -69
- phoenix/server/api/input_types/TemplateOptions.py +10 -0
- phoenix/server/api/input_types/TraceAnnotationSort.py +17 -0
- phoenix/server/api/input_types/UserRoleInput.py +9 -0
- phoenix/server/api/mutations/__init__.py +28 -0
- phoenix/server/api/mutations/api_key_mutations.py +167 -0
- phoenix/server/api/mutations/chat_mutations.py +593 -0
- phoenix/server/api/mutations/dataset_mutations.py +591 -0
- phoenix/server/api/mutations/experiment_mutations.py +75 -0
- phoenix/server/api/{types/ExportEventsMutation.py → mutations/export_events_mutations.py} +21 -18
- phoenix/server/api/mutations/project_mutations.py +57 -0
- phoenix/server/api/mutations/span_annotations_mutations.py +128 -0
- phoenix/server/api/mutations/trace_annotations_mutations.py +127 -0
- phoenix/server/api/mutations/user_mutations.py +329 -0
- phoenix/server/api/openapi/__init__.py +0 -0
- phoenix/server/api/openapi/main.py +17 -0
- phoenix/server/api/openapi/schema.py +16 -0
- phoenix/server/api/queries.py +738 -0
- phoenix/server/api/routers/__init__.py +11 -0
- phoenix/server/api/routers/auth.py +284 -0
- phoenix/server/api/routers/embeddings.py +26 -0
- phoenix/server/api/routers/oauth2.py +488 -0
- phoenix/server/api/routers/v1/__init__.py +64 -0
- phoenix/server/api/routers/v1/datasets.py +1017 -0
- phoenix/server/api/routers/v1/evaluations.py +362 -0
- phoenix/server/api/routers/v1/experiment_evaluations.py +115 -0
- phoenix/server/api/routers/v1/experiment_runs.py +167 -0
- phoenix/server/api/routers/v1/experiments.py +308 -0
- phoenix/server/api/routers/v1/pydantic_compat.py +78 -0
- phoenix/server/api/routers/v1/spans.py +267 -0
- phoenix/server/api/routers/v1/traces.py +208 -0
- phoenix/server/api/routers/v1/utils.py +95 -0
- phoenix/server/api/schema.py +44 -241
- phoenix/server/api/subscriptions.py +597 -0
- phoenix/server/api/types/Annotation.py +21 -0
- phoenix/server/api/types/AnnotationSummary.py +55 -0
- phoenix/server/api/types/AnnotatorKind.py +16 -0
- phoenix/server/api/types/ApiKey.py +27 -0
- phoenix/server/api/types/AuthMethod.py +9 -0
- phoenix/server/api/types/ChatCompletionMessageRole.py +11 -0
- phoenix/server/api/types/ChatCompletionSubscriptionPayload.py +46 -0
- phoenix/server/api/types/Cluster.py +25 -24
- phoenix/server/api/types/CreateDatasetPayload.py +8 -0
- phoenix/server/api/types/DataQualityMetric.py +31 -13
- phoenix/server/api/types/Dataset.py +288 -63
- phoenix/server/api/types/DatasetExample.py +85 -0
- phoenix/server/api/types/DatasetExampleRevision.py +34 -0
- phoenix/server/api/types/DatasetVersion.py +14 -0
- phoenix/server/api/types/Dimension.py +32 -31
- phoenix/server/api/types/DocumentEvaluationSummary.py +9 -8
- phoenix/server/api/types/EmbeddingDimension.py +56 -49
- phoenix/server/api/types/Evaluation.py +25 -31
- phoenix/server/api/types/EvaluationSummary.py +30 -50
- phoenix/server/api/types/Event.py +20 -20
- phoenix/server/api/types/ExampleRevisionInterface.py +14 -0
- phoenix/server/api/types/Experiment.py +152 -0
- phoenix/server/api/types/ExperimentAnnotationSummary.py +13 -0
- phoenix/server/api/types/ExperimentComparison.py +17 -0
- phoenix/server/api/types/ExperimentRun.py +119 -0
- phoenix/server/api/types/ExperimentRunAnnotation.py +56 -0
- phoenix/server/api/types/GenerativeModel.py +9 -0
- phoenix/server/api/types/GenerativeProvider.py +85 -0
- phoenix/server/api/types/Inferences.py +80 -0
- phoenix/server/api/types/InferencesRole.py +23 -0
- phoenix/server/api/types/LabelFraction.py +7 -0
- phoenix/server/api/types/MimeType.py +2 -2
- phoenix/server/api/types/Model.py +54 -54
- phoenix/server/api/types/PerformanceMetric.py +8 -5
- phoenix/server/api/types/Project.py +407 -142
- phoenix/server/api/types/ProjectSession.py +139 -0
- phoenix/server/api/types/Segments.py +4 -4
- phoenix/server/api/types/Span.py +221 -176
- phoenix/server/api/types/SpanAnnotation.py +43 -0
- phoenix/server/api/types/SpanIOValue.py +15 -0
- phoenix/server/api/types/SystemApiKey.py +9 -0
- phoenix/server/api/types/TemplateLanguage.py +10 -0
- phoenix/server/api/types/TimeSeries.py +19 -15
- phoenix/server/api/types/TokenUsage.py +11 -0
- phoenix/server/api/types/Trace.py +154 -0
- phoenix/server/api/types/TraceAnnotation.py +45 -0
- phoenix/server/api/types/UMAPPoints.py +7 -7
- phoenix/server/api/types/User.py +60 -0
- phoenix/server/api/types/UserApiKey.py +45 -0
- phoenix/server/api/types/UserRole.py +15 -0
- phoenix/server/api/types/node.py +4 -112
- phoenix/server/api/types/pagination.py +156 -57
- phoenix/server/api/utils.py +34 -0
- phoenix/server/app.py +864 -115
- phoenix/server/bearer_auth.py +163 -0
- phoenix/server/dml_event.py +136 -0
- phoenix/server/dml_event_handler.py +256 -0
- phoenix/server/email/__init__.py +0 -0
- phoenix/server/email/sender.py +97 -0
- phoenix/server/email/templates/__init__.py +0 -0
- phoenix/server/email/templates/password_reset.html +19 -0
- phoenix/server/email/types.py +11 -0
- phoenix/server/grpc_server.py +102 -0
- phoenix/server/jwt_store.py +505 -0
- phoenix/server/main.py +305 -116
- phoenix/server/oauth2.py +52 -0
- phoenix/server/openapi/__init__.py +0 -0
- phoenix/server/prometheus.py +111 -0
- phoenix/server/rate_limiters.py +188 -0
- phoenix/server/static/.vite/manifest.json +87 -0
- phoenix/server/static/assets/components-Cy9nwIvF.js +2125 -0
- phoenix/server/static/assets/index-BKvHIxkk.js +113 -0
- phoenix/server/static/assets/pages-CUi2xCVQ.js +4449 -0
- phoenix/server/static/assets/vendor-DvC8cT4X.js +894 -0
- phoenix/server/static/assets/vendor-DxkFTwjz.css +1 -0
- phoenix/server/static/assets/vendor-arizeai-Do1793cv.js +662 -0
- phoenix/server/static/assets/vendor-codemirror-BzwZPyJM.js +24 -0
- phoenix/server/static/assets/vendor-recharts-_Jb7JjhG.js +59 -0
- phoenix/server/static/assets/vendor-shiki-Cl9QBraO.js +5 -0
- phoenix/server/static/assets/vendor-three-DwGkEfCM.js +2998 -0
- phoenix/server/telemetry.py +68 -0
- phoenix/server/templates/index.html +82 -23
- phoenix/server/thread_server.py +3 -3
- phoenix/server/types.py +275 -0
- phoenix/services.py +27 -18
- phoenix/session/client.py +743 -68
- phoenix/session/data_extractor.py +31 -7
- phoenix/session/evaluation.py +3 -9
- phoenix/session/session.py +263 -219
- phoenix/settings.py +22 -0
- phoenix/trace/__init__.py +2 -22
- phoenix/trace/attributes.py +338 -0
- phoenix/trace/dsl/README.md +116 -0
- phoenix/trace/dsl/filter.py +663 -213
- phoenix/trace/dsl/helpers.py +73 -21
- phoenix/trace/dsl/query.py +574 -201
- phoenix/trace/exporter.py +24 -19
- phoenix/trace/fixtures.py +368 -32
- phoenix/trace/otel.py +71 -219
- phoenix/trace/projects.py +3 -2
- phoenix/trace/schemas.py +33 -11
- phoenix/trace/span_evaluations.py +21 -16
- phoenix/trace/span_json_decoder.py +6 -4
- phoenix/trace/span_json_encoder.py +2 -2
- phoenix/trace/trace_dataset.py +47 -32
- phoenix/trace/utils.py +21 -4
- phoenix/utilities/__init__.py +0 -26
- phoenix/utilities/client.py +132 -0
- phoenix/utilities/deprecation.py +31 -0
- phoenix/utilities/error_handling.py +3 -2
- phoenix/utilities/json.py +109 -0
- phoenix/utilities/logging.py +8 -0
- phoenix/utilities/project.py +2 -2
- phoenix/utilities/re.py +49 -0
- phoenix/utilities/span_store.py +0 -23
- phoenix/utilities/template_formatters.py +99 -0
- phoenix/version.py +1 -1
- arize_phoenix-3.16.1.dist-info/METADATA +0 -495
- arize_phoenix-3.16.1.dist-info/RECORD +0 -178
- phoenix/core/project.py +0 -619
- phoenix/core/traces.py +0 -96
- phoenix/experimental/evals/__init__.py +0 -73
- phoenix/experimental/evals/evaluators.py +0 -413
- phoenix/experimental/evals/functions/__init__.py +0 -4
- phoenix/experimental/evals/functions/classify.py +0 -453
- phoenix/experimental/evals/functions/executor.py +0 -353
- phoenix/experimental/evals/functions/generate.py +0 -138
- phoenix/experimental/evals/functions/processing.py +0 -76
- phoenix/experimental/evals/models/__init__.py +0 -14
- phoenix/experimental/evals/models/anthropic.py +0 -175
- phoenix/experimental/evals/models/base.py +0 -170
- phoenix/experimental/evals/models/bedrock.py +0 -221
- phoenix/experimental/evals/models/litellm.py +0 -134
- phoenix/experimental/evals/models/openai.py +0 -448
- phoenix/experimental/evals/models/rate_limiters.py +0 -246
- phoenix/experimental/evals/models/vertex.py +0 -173
- phoenix/experimental/evals/models/vertexai.py +0 -186
- phoenix/experimental/evals/retrievals.py +0 -96
- phoenix/experimental/evals/templates/__init__.py +0 -50
- phoenix/experimental/evals/templates/default_templates.py +0 -472
- phoenix/experimental/evals/templates/template.py +0 -195
- phoenix/experimental/evals/utils/__init__.py +0 -172
- phoenix/experimental/evals/utils/threads.py +0 -27
- phoenix/server/api/helpers.py +0 -11
- phoenix/server/api/routers/evaluation_handler.py +0 -109
- phoenix/server/api/routers/span_handler.py +0 -70
- phoenix/server/api/routers/trace_handler.py +0 -60
- phoenix/server/api/types/DatasetRole.py +0 -23
- phoenix/server/static/index.css +0 -6
- phoenix/server/static/index.js +0 -7447
- phoenix/storage/span_store/__init__.py +0 -23
- phoenix/storage/span_store/text_file.py +0 -85
- phoenix/trace/dsl/missing.py +0 -60
- phoenix/trace/langchain/__init__.py +0 -3
- phoenix/trace/langchain/instrumentor.py +0 -35
- phoenix/trace/llama_index/__init__.py +0 -3
- phoenix/trace/llama_index/callback.py +0 -102
- phoenix/trace/openai/__init__.py +0 -3
- phoenix/trace/openai/instrumentor.py +0 -30
- {arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/licenses/IP_NOTICE +0 -0
- {arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/licenses/LICENSE +0 -0
- /phoenix/{datasets → db/insertion}/__init__.py +0 -0
- /phoenix/{experimental → db/migrations}/__init__.py +0 -0
- /phoenix/{storage → db/migrations/data_migration_scripts}/__init__.py +0 -0
|
@@ -0,0 +1,70 @@
|
|
|
1
|
+
from typing import TYPE_CHECKING, Any, Callable, Optional, Union
|
|
2
|
+
|
|
3
|
+
from phoenix.server.api.types.GenerativeProvider import GenerativeProviderKey
|
|
4
|
+
|
|
5
|
+
if TYPE_CHECKING:
|
|
6
|
+
from phoenix.server.api.helpers.playground_clients import PlaygroundStreamingClient
|
|
7
|
+
|
|
8
|
+
# A model is addressed by an optional name; ``None`` selects the provider's
# default entry (see ``PROVIDER_DEFAULT`` below).
ModelName = Union[str, None]
# (provider key, model name) pair used to address one registry entry.
ModelKey = tuple[GenerativeProviderKey, ModelName]

# Sentinel model name under which a provider's fallback client is registered.
# Deliberately ``None`` so a plain ``provider_registry[None]`` lookup finds it.
PROVIDER_DEFAULT = None
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
class SingletonMeta(type):
    """Metaclass giving each class that uses it exactly one shared instance.

    The first call to the class constructs and caches an instance; every
    later call returns that same cached object, ignoring any new arguments.
    Instances are keyed by class, so distinct classes do not share state.
    """

    _instances: dict[Any, Any] = dict()

    def __call__(cls, *args: Any, **kwargs: Any) -> Any:
        # EAFP: the common case after startup is a cache hit.
        try:
            return cls._instances[cls]
        except KeyError:
            instance = super().__call__(*args, **kwargs)
            cls._instances[cls] = instance
            return instance
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
class PlaygroundClientRegistry(metaclass=SingletonMeta):
    """Process-wide lookup table of playground streaming-client classes.

    Entries are stored per provider, keyed by model name; a ``None`` model
    name (``PROVIDER_DEFAULT``) marks the provider's fallback client.
    Singleton by metaclass: every construction returns the same registry.
    """

    def __init__(self) -> None:
        self._registry: dict[
            GenerativeProviderKey, dict[ModelName, Optional[type["PlaygroundStreamingClient"]]]
        ] = {}

    def get_client(
        self,
        provider_key: GenerativeProviderKey,
        model_name: ModelName,
    ) -> Optional[type["PlaygroundStreamingClient"]]:
        """Return the client class for (provider, model), or the provider's
        default entry when no exact match exists, or ``None`` if neither."""
        models_for_provider = self._registry.get(provider_key, {})
        client_class = models_for_provider.get(model_name)
        if client_class is None and None in models_for_provider:
            # No model-specific client registered: use the provider default.
            client_class = models_for_provider[PROVIDER_DEFAULT]
        return client_class

    def list_all_providers(
        self,
    ) -> list[GenerativeProviderKey]:
        """Return every provider key that has at least one registered entry."""
        return list(self._registry)

    def list_models(self, provider_key: GenerativeProviderKey) -> list[str]:
        """Return the concrete model names for *provider_key*; the ``None``
        default-entry key is excluded."""
        models_for_provider = self._registry.get(provider_key, {})
        return [name for name in models_for_provider if name is not None]

    def list_all_models(self) -> list[ModelKey]:
        """Return (provider, model-name) pairs for every registered entry,
        including each provider's ``None`` default entry."""
        pairs: list[ModelKey] = []
        for provider_key, models_for_provider in self._registry.items():
            for name in models_for_provider:
                pairs.append((provider_key, name))
        return pairs
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
# The module-level singleton registry; ``register_llm_client`` writes into it
# and the GraphQL layer reads from it.
PLAYGROUND_CLIENT_REGISTRY: PlaygroundClientRegistry = PlaygroundClientRegistry()


def register_llm_client(
    provider_key: GenerativeProviderKey,
    model_names: list[ModelName],
) -> Callable[[type["PlaygroundStreamingClient"]], type["PlaygroundStreamingClient"]]:
    """Class decorator that registers a streaming client for the given models.

    Each name in *model_names* is mapped to the decorated class under
    *provider_key* in the global registry; a ``None`` name registers the
    class as the provider's default. The class itself is returned unchanged.
    """

    def decorator(cls: type["PlaygroundStreamingClient"]) -> type["PlaygroundStreamingClient"]:
        models_for_provider = PLAYGROUND_CLIENT_REGISTRY._registry.setdefault(provider_key, {})
        models_for_provider.update((name, cls) for name in model_names)
        return cls

    return decorator
|
@@ -0,0 +1,455 @@
|
|
|
1
|
+
import json
|
|
2
|
+
from collections import defaultdict
|
|
3
|
+
from collections.abc import Mapping
|
|
4
|
+
from dataclasses import asdict
|
|
5
|
+
from datetime import datetime, timezone
|
|
6
|
+
from itertools import chain
|
|
7
|
+
from traceback import format_exc
|
|
8
|
+
from types import TracebackType
|
|
9
|
+
from typing import (
|
|
10
|
+
Any,
|
|
11
|
+
Iterable,
|
|
12
|
+
Iterator,
|
|
13
|
+
Optional,
|
|
14
|
+
Union,
|
|
15
|
+
cast,
|
|
16
|
+
)
|
|
17
|
+
|
|
18
|
+
from openinference.instrumentation import safe_json_dumps
|
|
19
|
+
from openinference.semconv.trace import (
|
|
20
|
+
MessageAttributes,
|
|
21
|
+
OpenInferenceMimeTypeValues,
|
|
22
|
+
OpenInferenceSpanKindValues,
|
|
23
|
+
SpanAttributes,
|
|
24
|
+
ToolAttributes,
|
|
25
|
+
ToolCallAttributes,
|
|
26
|
+
)
|
|
27
|
+
from opentelemetry.sdk.trace.id_generator import RandomIdGenerator as DefaultOTelIDGenerator
|
|
28
|
+
from opentelemetry.trace import StatusCode
|
|
29
|
+
from strawberry.scalars import JSON as JSONScalarType
|
|
30
|
+
from typing_extensions import Self, TypeAlias, assert_never
|
|
31
|
+
|
|
32
|
+
from phoenix.datetime_utils import local_now, normalize_datetime
|
|
33
|
+
from phoenix.db import models
|
|
34
|
+
from phoenix.server.api.helpers.dataset_helpers import get_dataset_example_output
|
|
35
|
+
from phoenix.server.api.input_types.ChatCompletionInput import (
|
|
36
|
+
ChatCompletionInput,
|
|
37
|
+
ChatCompletionOverDatasetInput,
|
|
38
|
+
)
|
|
39
|
+
from phoenix.server.api.types.ChatCompletionMessageRole import ChatCompletionMessageRole
|
|
40
|
+
from phoenix.server.api.types.ChatCompletionSubscriptionPayload import (
|
|
41
|
+
TextChunk,
|
|
42
|
+
ToolCallChunk,
|
|
43
|
+
)
|
|
44
|
+
from phoenix.trace.attributes import get_attribute_value, unflatten
|
|
45
|
+
from phoenix.trace.schemas import (
|
|
46
|
+
SpanEvent,
|
|
47
|
+
SpanException,
|
|
48
|
+
)
|
|
49
|
+
from phoenix.utilities.json import jsonify
|
|
50
|
+
|
|
51
|
+
# Presumably (role, content, optional tool-call id, optional tool-call JSON
# strings) — TODO confirm field meaning against the producers of this tuple.
ChatCompletionMessage: TypeAlias = tuple[
    ChatCompletionMessageRole, str, Optional[str], Optional[list[str]]
]
# Identifier a provider assigns to one streamed tool call.
ToolCallID: TypeAlias = str
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
class streaming_llm_span:
    """
    A context manager that records OpenInference attributes for streaming chat
    completion LLM spans.

    Use ``async with`` around the streaming call and feed each received chunk
    to :meth:`add_response_chunk`. On exit the span stamps its end time, folds
    the accumulated chunks into OpenInference output attributes, and records
    any exception as a ``SpanException`` event.

    NOTE: ``__aexit__`` returns ``True``, so an exception raised inside the
    ``async with`` block is suppressed after being recorded — callers must
    inspect :attr:`status_code` to detect failure.
    """

    def __init__(
        self,
        *,
        input: Union[ChatCompletionInput, ChatCompletionOverDatasetInput],
        messages: list[ChatCompletionMessage],
        invocation_parameters: Mapping[str, Any],
        attributes: Optional[dict[str, Any]] = None,
    ) -> None:
        """Seed the span's flat attribute dict from the request.

        Args:
            input: the chat-completion request being traced.
            messages: input messages in ``ChatCompletionMessage`` tuple form.
            invocation_parameters: provider invocation parameters to record.
            attributes: optional pre-existing flat attributes; this dict is
                mutated in place when provided.
        """
        self._input = input
        self._attributes: dict[str, Any] = attributes if attributes is not None else {}
        # Pre-populate the OpenInference *input-side* attributes; output-side
        # attributes are added in __aexit__ once chunks have been collected.
        self._attributes.update(
            chain(
                llm_span_kind(),
                llm_model_name(input.model.name),
                llm_tools(input.tools or []),
                llm_input_messages(messages),
                llm_invocation_parameters(invocation_parameters),
                input_value_and_mime_type(input),
            )
        )
        self._events: list[SpanEvent] = []
        self._start_time: Optional[datetime] = None
        self._end_time: Optional[datetime] = None
        # Streamed response accumulators: text chunks in arrival order, and
        # tool-call chunks grouped by the provider-assigned tool-call id.
        self._text_chunks: list[TextChunk] = []
        self._tool_call_chunks: defaultdict[ToolCallID, list[ToolCallChunk]] = defaultdict(list)
        self._status_code: StatusCode = StatusCode.UNSET
        self._status_message: Optional[str] = None
        # IDs are generated up front (helpers defined elsewhere in this
        # module) so they are available before the span finishes.
        self._trace_id = _generate_trace_id()
        self._span_id = _generate_span_id()

    async def __aenter__(self) -> Self:
        # Record a timezone-aware (UTC) start timestamp.
        self._start_time = cast(datetime, normalize_datetime(dt=local_now(), tz=timezone.utc))
        return self

    async def __aexit__(
        self,
        exc_type: Optional[type[BaseException]],
        exc_value: Optional[BaseException],
        traceback: Optional[TracebackType],
    ) -> bool:
        """Finalize the span; always returns True, suppressing any exception."""
        self._end_time = cast(datetime, normalize_datetime(dt=local_now(), tz=timezone.utc))
        self._status_code = StatusCode.OK
        if exc_type is not None:
            # Record the failure as status + a SpanException event instead of
            # letting it propagate.
            self._status_code = StatusCode.ERROR
            self._status_message = str(exc_value)
            self._events.append(
                SpanException(
                    timestamp=self._end_time,
                    message=self._status_message,
                    exception_type=type(exc_value).__name__,
                    exception_escaped=False,
                    exception_stacktrace=format_exc(),
                )
            )
        if self._text_chunks or self._tool_call_chunks:
            # Fold whatever streamed back (even on error) into the
            # OpenInference output attributes.
            self._attributes.update(
                chain(
                    _output_value_and_mime_type(self._text_chunks, self._tool_call_chunks),
                    _llm_output_messages(self._text_chunks, self._tool_call_chunks),
                )
            )
        return True

    def set_attributes(self, attributes: Mapping[str, Any]) -> None:
        """Merge extra flat attributes into the span (later keys win)."""
        self._attributes.update(attributes)

    def add_response_chunk(self, chunk: Union[TextChunk, ToolCallChunk]) -> None:
        """Accumulate one streamed response chunk (text or tool call)."""
        if isinstance(chunk, TextChunk):
            self._text_chunks.append(chunk)
        elif isinstance(chunk, ToolCallChunk):
            self._tool_call_chunks[chunk.id].append(chunk)
        else:
            assert_never(chunk)

    @property
    def span_id(self) -> str:
        return self._span_id

    @property
    def trace_id(self) -> str:
        return self._trace_id

    @property
    def start_time(self) -> datetime:
        # Only valid after __aenter__ has run.
        if self._start_time is None:
            raise ValueError("Cannot access start time before the context manager is entered")
        return self._start_time

    @property
    def end_time(self) -> datetime:
        # Only valid after __aexit__ has run.
        if self._end_time is None:
            raise ValueError("Cannot access end time before the context manager is exited")
        return self._end_time

    @property
    def status_code(self) -> StatusCode:
        return self._status_code

    @property
    def status_message(self) -> Optional[str]:
        # UNSET means __aexit__ has not run yet, so there is no message.
        if self._status_code is StatusCode.UNSET:
            raise ValueError("Cannot access status message before the context manager is exited")
        return self._status_message

    @property
    def events(self) -> list[SpanEvent]:
        return self._events

    @property
    def attributes(self) -> dict[str, Any]:
        # Returns a fresh nested dict built from the flat attribute mapping.
        return unflatten(self._attributes.items())
|
|
174
|
+
|
|
175
|
+
|
|
176
|
+
def get_db_trace(span: streaming_llm_span, project_id: int) -> models.Trace:
    """Build the ORM ``Trace`` row for a finished streaming span.

    Args:
        span: the completed streaming LLM span (times must be stamped).
        project_id: row id of the project the trace belongs to.
    """
    trace_fields = dict(
        project_rowid=project_id,
        trace_id=span.trace_id,
        start_time=span.start_time,
        end_time=span.end_time,
    )
    return models.Trace(**trace_fields)
|
|
183
|
+
|
|
184
|
+
|
|
185
|
+
def get_db_span(
    span: streaming_llm_span,
    db_trace: models.Trace,
) -> models.Span:
    """Convert a finished streaming span into an ORM ``Span`` row on *db_trace*.

    Token counts default to 0 when the attribute is missing; since this is a
    root span with no children, the cumulative counts equal its own counts.
    """
    token_attributes = span.attributes
    prompt_tokens = get_attribute_value(token_attributes, LLM_TOKEN_COUNT_PROMPT) or 0
    completion_tokens = get_attribute_value(token_attributes, LLM_TOKEN_COUNT_COMPLETION) or 0
    serialized_events = [_serialize_event(event) for event in span.events]
    had_error = span.status_code is StatusCode.ERROR
    return models.Span(
        trace_rowid=db_trace.id,
        span_id=span.span_id,
        parent_id=None,  # root span of its trace
        name="ChatCompletion",
        span_kind=LLM,
        start_time=span.start_time,
        end_time=span.end_time,
        attributes=span.attributes,
        events=serialized_events,
        status_code=span.status_code.name,
        status_message=span.status_message or "",
        cumulative_error_count=int(had_error),
        cumulative_llm_token_count_prompt=prompt_tokens,
        cumulative_llm_token_count_completion=completion_tokens,
        llm_token_count_prompt=prompt_tokens,
        llm_token_count_completion=completion_tokens,
        trace=db_trace,
    )
|
|
210
|
+
|
|
211
|
+
|
|
212
|
+
def get_db_experiment_run(
    db_span: models.Span,
    db_trace: models.Trace,
    *,
    experiment_id: int,
    example_id: int,
) -> models.ExperimentRun:
    """Build the ORM ``ExperimentRun`` row recording *db_span* as the task run
    for one dataset example of an experiment.

    Token counts are taken straight from the span's attributes (may be None);
    a non-empty span status message is recorded as the run's error.
    """
    span_attributes = db_span.attributes
    run_output = models.ExperimentRunOutput(
        task_output=get_dataset_example_output(db_span),
    )
    return models.ExperimentRun(
        experiment_id=experiment_id,
        dataset_example_id=example_id,
        trace_id=db_trace.trace_id,
        output=run_output,
        repetition_number=1,  # playground runs are single-shot
        start_time=db_span.start_time,
        end_time=db_span.end_time,
        error=db_span.status_message or None,
        prompt_token_count=get_attribute_value(span_attributes, LLM_TOKEN_COUNT_PROMPT),
        completion_token_count=get_attribute_value(span_attributes, LLM_TOKEN_COUNT_COMPLETION),
        trace=db_trace,
    )
|
|
234
|
+
|
|
235
|
+
|
|
236
|
+
def llm_span_kind() -> Iterator[tuple[str, Any]]:
    """Yield the single attribute marking this span as an LLM span."""
    yield from ((OPENINFERENCE_SPAN_KIND, LLM),)
|
|
238
|
+
|
|
239
|
+
|
|
240
|
+
def llm_model_name(model_name: str) -> Iterator[tuple[str, Any]]:
    """Yield the OpenInference model-name attribute."""
    yield from ((LLM_MODEL_NAME, model_name),)
|
|
242
|
+
|
|
243
|
+
|
|
244
|
+
def llm_invocation_parameters(
    invocation_parameters: Mapping[str, Any],
) -> Iterator[tuple[str, Any]]:
    """Yield the invocation parameters as one JSON-serialized attribute.

    An empty mapping yields nothing, so no empty attribute is recorded.
    """
    if not invocation_parameters:
        return
    yield LLM_INVOCATION_PARAMETERS, safe_json_dumps(invocation_parameters)
|
|
249
|
+
|
|
250
|
+
|
|
251
|
+
def llm_tools(tools: list[JSONScalarType]) -> Iterator[tuple[str, Any]]:
    """Yield one JSON-schema attribute per tool, indexed by list position."""
    for tool_index, tool in enumerate(tools):
        attribute_key = f"{LLM_TOOLS}.{tool_index}.{TOOL_JSON_SCHEMA}"
        yield attribute_key, json.dumps(tool)
|
|
254
|
+
|
|
255
|
+
|
|
256
|
+
def input_value_and_mime_type(
    input: Union[ChatCompletionInput, ChatCompletionOverDatasetInput],
) -> Iterator[tuple[str, Any]]:
    """Yield the span's input value (sanitized request JSON) and mime type.

    The API key and the invocation parameters are stripped from the recorded
    payload; sanity asserts guard against the key ever being recorded.
    """
    payload = jsonify(input)
    # Sanity check: the serialized request is expected to carry the key field.
    assert "api_key" in payload
    payload = {
        key: value
        for key, value in payload.items()
        if key not in {"api_key", "invocation_parameters"}
    }
    # Never record the API key on the span.
    assert "api_key" not in payload
    yield INPUT_MIME_TYPE, JSON
    yield INPUT_VALUE, safe_json_dumps(payload)
|
|
265
|
+
|
|
266
|
+
|
|
267
|
+
def _merge_tool_call_chunks(
    chunks_by_id: defaultdict[str, list[ToolCallChunk]],
) -> list[dict[str, Any]]:
    """
    Collapse streamed tool-call chunks into one dict per tool-call ID.

    Entries whose first chunk is missing, falsy, or lacks a named function are
    skipped. Argument text arrives split across chunks and is stitched back
    together; an empty argument stream is normalized to ``"{}"``.
    """
    merged: list[dict[str, Any]] = []
    for call_id, chunk_list in chunks_by_id.items():
        if not chunk_list:
            continue
        head = chunk_list[0]
        if not head:
            continue
        if not (hasattr(head, "function") and hasattr(head.function, "name")):
            continue
        # Stitch the streamed argument fragments back into one string.
        fragments = [
            c.function.arguments
            for c in chunk_list
            if c and hasattr(c, "function") and hasattr(c.function, "arguments")
        ]
        arguments = "".join(fragments)
        merged.append(
            {
                "id": call_id,
                "function": {
                    # Only the first chunk carries the tool name.
                    "name": head.function.name,
                    "arguments": arguments or "{}",
                },
            }
        )
    return merged
|
|
300
|
+
|
|
301
|
+
|
|
302
|
+
def _output_value_and_mime_type(
    text_chunks: list[TextChunk],
    tool_call_chunks: defaultdict[ToolCallID, list[ToolCallChunk]],
) -> Iterator[tuple[str, Any]]:
    """
    Yield output-value and output-mime-type attributes for a streamed response.

    Emits JSON when tool calls are present (combined with the text content if
    any), plain text when only text was produced, and nothing when the stream
    was empty.
    """
    text = "".join(piece.content for piece in text_chunks)
    tool_calls = _merge_tool_call_chunks(tool_call_chunks)
    if not text and not tool_calls:
        # Empty stream: no output attributes at all.
        return
    if not tool_calls:
        # Text only: record it verbatim as plain text.
        yield OUTPUT_MIME_TYPE, TEXT
        yield OUTPUT_VALUE, text
        return
    # Tool calls present: serialize as JSON, wrapping with the text content
    # only when there is any.
    if text:
        payload: Any = {"content": text, "tool_calls": jsonify(tool_calls)}
    else:
        payload = jsonify(tool_calls)
    yield OUTPUT_MIME_TYPE, JSON
    yield OUTPUT_VALUE, safe_json_dumps(payload)
|
|
327
|
+
|
|
328
|
+
|
|
329
|
+
def llm_input_messages(
    messages: Iterable[
        tuple[ChatCompletionMessageRole, str, Optional[str], Optional[list[JSONScalarType]]]
    ],
) -> Iterator[tuple[str, Any]]:
    """
    Flatten chat messages into OpenInference span attributes.

    Every message yields role and content attributes. A TOOL-role message with
    a tool-call ID additionally yields that ID (tool result). Messages that
    carry tool calls yield per-call name/arguments/ID attributes, recognizing
    both Anthropic-style ("tool_use") and OpenAI-style ("function") payloads.
    """
    for i, (role, content, tool_call_id, tool_calls) in enumerate(messages):
        yield f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_ROLE}", role.value.lower()
        yield f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_CONTENT}", content
        if role == ChatCompletionMessageRole.TOOL and tool_call_id:
            # Anthropic tool result spans
            yield f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALL_ID}", tool_call_id

        if tool_calls is not None:
            for tool_call_index, tool_call in enumerate(tool_calls):
                if tool_call.get("type") == "tool_use":
                    # Anthropic tool call spans
                    yield (
                        f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_NAME}",
                        tool_call["name"],
                    )
                    yield (
                        f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_ARGUMENTS_JSON}",
                        safe_json_dumps(jsonify(tool_call["input"])),
                    )
                    yield (
                        f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_ID}",
                        tool_call["id"],
                    )
                elif tool_call_function := tool_call.get("function"):
                    # OpenAI tool call spans
                    yield (
                        f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_NAME}",
                        tool_call_function["name"],
                    )
                    if arguments := tool_call_function["arguments"]:
                        yield (
                            f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_FUNCTION_ARGUMENTS_JSON}",
                            safe_json_dumps(jsonify(arguments)),
                        )
                    # Renamed from `tool_call_id` — the original walrus here
                    # shadowed the message-level `tool_call_id` unpacked in the
                    # outer loop, which is fragile under reordering.
                    if openai_tool_call_id := tool_call.get("id"):
                        yield (
                            f"{LLM_INPUT_MESSAGES}.{i}.{MESSAGE_TOOL_CALLS}.{tool_call_index}.{TOOL_CALL_ID}",
                            openai_tool_call_id,
                        )
|
|
373
|
+
|
|
374
|
+
|
|
375
|
+
def _llm_output_messages(
    text_chunks: list[TextChunk],
    tool_call_chunks: defaultdict[ToolCallID, list[ToolCallChunk]],
) -> Iterator[tuple[str, Any]]:
    """
    Yield span attributes describing the single assistant output message,
    including any tool calls reconstructed from their streamed chunks.
    """
    message_prefix = f"{LLM_OUTPUT_MESSAGES}.0"
    yield f"{message_prefix}.{MESSAGE_ROLE}", "assistant"
    content = "".join(chunk.content for chunk in text_chunks)
    if content:
        yield f"{message_prefix}.{MESSAGE_CONTENT}", content
    for index, (call_id, chunks) in enumerate(tool_call_chunks.items()):
        call_prefix = f"{message_prefix}.{MESSAGE_TOOL_CALLS}.{index}"
        if call_id:
            yield f"{call_prefix}.{TOOL_CALL_ID}", call_id
        if chunks:
            # Only the first chunk carries the tool name.
            name = chunks[0].function.name
            if name:
                yield f"{call_prefix}.{TOOL_CALL_FUNCTION_NAME}", name
        arguments = "".join(chunk.function.arguments for chunk in chunks)
        if arguments:
            yield f"{call_prefix}.{TOOL_CALL_FUNCTION_ARGUMENTS_JSON}", arguments
|
|
398
|
+
|
|
399
|
+
|
|
400
|
+
def _generate_trace_id() -> str:
    """Return a freshly generated OTel trace ID rendered as a hexadecimal string."""
    generator = DefaultOTelIDGenerator()
    return _hex(generator.generate_trace_id())
|
|
405
|
+
|
|
406
|
+
|
|
407
|
+
def _generate_span_id() -> str:
    """Return a freshly generated OTel span ID rendered as a hexadecimal string."""
    generator = DefaultOTelIDGenerator()
    return _hex(generator.generate_span_id())
|
|
412
|
+
|
|
413
|
+
|
|
414
|
+
def _hex(number: int) -> str:
|
|
415
|
+
"""
|
|
416
|
+
Converts an integer to a hexadecimal string.
|
|
417
|
+
"""
|
|
418
|
+
return hex(number)[2:]
|
|
419
|
+
|
|
420
|
+
|
|
421
|
+
def _serialize_event(event: SpanEvent) -> dict[str, Any]:
    """
    Convert a SpanEvent dataclass into a plain dict, rendering any datetime
    field values as ISO-8601 strings.
    """
    serialized: dict[str, Any] = {}
    for key, value in asdict(event).items():
        if isinstance(value, datetime):
            value = value.isoformat()
        serialized[key] = value
    return serialized
|
|
426
|
+
|
|
427
|
+
|
|
428
|
+
# Local aliases for the OpenInference semantic-convention values used above.
JSON = OpenInferenceMimeTypeValues.JSON.value
TEXT = OpenInferenceMimeTypeValues.TEXT.value

LLM = OpenInferenceSpanKindValues.LLM.value

OPENINFERENCE_SPAN_KIND = SpanAttributes.OPENINFERENCE_SPAN_KIND
INPUT_MIME_TYPE = SpanAttributes.INPUT_MIME_TYPE
INPUT_VALUE = SpanAttributes.INPUT_VALUE
OUTPUT_MIME_TYPE = SpanAttributes.OUTPUT_MIME_TYPE
OUTPUT_VALUE = SpanAttributes.OUTPUT_VALUE
LLM_INPUT_MESSAGES = SpanAttributes.LLM_INPUT_MESSAGES
LLM_OUTPUT_MESSAGES = SpanAttributes.LLM_OUTPUT_MESSAGES
LLM_MODEL_NAME = SpanAttributes.LLM_MODEL_NAME
LLM_INVOCATION_PARAMETERS = SpanAttributes.LLM_INVOCATION_PARAMETERS
LLM_TOOLS = SpanAttributes.LLM_TOOLS
LLM_TOKEN_COUNT_PROMPT = SpanAttributes.LLM_TOKEN_COUNT_PROMPT
LLM_TOKEN_COUNT_COMPLETION = SpanAttributes.LLM_TOKEN_COUNT_COMPLETION

MESSAGE_CONTENT = MessageAttributes.MESSAGE_CONTENT
MESSAGE_ROLE = MessageAttributes.MESSAGE_ROLE
MESSAGE_TOOL_CALLS = MessageAttributes.MESSAGE_TOOL_CALLS
MESSAGE_TOOL_CALL_ID = MessageAttributes.MESSAGE_TOOL_CALL_ID

# NOTE: the original assigned TOOL_CALL_ID twice with the identical value;
# the redundant duplicate has been removed.
TOOL_CALL_ID = ToolCallAttributes.TOOL_CALL_ID
TOOL_CALL_FUNCTION_NAME = ToolCallAttributes.TOOL_CALL_FUNCTION_NAME
TOOL_CALL_FUNCTION_ARGUMENTS_JSON = ToolCallAttributes.TOOL_CALL_FUNCTION_ARGUMENTS_JSON

TOOL_JSON_SCHEMA = ToolAttributes.TOOL_JSON_SCHEMA
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
import strawberry
|
|
4
|
+
from strawberry import UNSET
|
|
5
|
+
from strawberry.relay import GlobalID
|
|
6
|
+
from strawberry.scalars import JSON
|
|
7
|
+
|
|
8
|
+
from .DatasetExampleInput import DatasetExampleInput
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
# GraphQL input for appending examples to an existing dataset.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class AddExamplesToDatasetInput:
    # Relay ID of the dataset that will receive the new examples.
    dataset_id: GlobalID
    # Examples to append, each with its own payload.
    examples: list[DatasetExampleInput]
    # Optional description for the dataset version this mutation creates.
    dataset_version_description: Optional[str] = UNSET
    # Optional metadata for the dataset version this mutation creates.
    dataset_version_metadata: Optional[JSON] = UNSET
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
import strawberry
|
|
4
|
+
from strawberry import UNSET
|
|
5
|
+
from strawberry.relay import GlobalID
|
|
6
|
+
from strawberry.scalars import JSON
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
# GraphQL input for creating dataset examples from existing spans.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class AddSpansToDatasetInput:
    # Relay ID of the target dataset.
    dataset_id: GlobalID
    # Relay IDs of the spans to turn into dataset examples.
    span_ids: list[GlobalID]
    # Optional description for the dataset version this mutation creates.
    dataset_version_description: Optional[str] = UNSET
    # Optional metadata for the dataset version this mutation creates.
    dataset_version_metadata: Optional[JSON] = UNSET
|
|
@@ -0,0 +1,38 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
import strawberry
|
|
4
|
+
from strawberry import UNSET
|
|
5
|
+
from strawberry.relay.types import GlobalID
|
|
6
|
+
from strawberry.scalars import JSON
|
|
7
|
+
|
|
8
|
+
from phoenix.server.api.types.TemplateLanguage import TemplateLanguage
|
|
9
|
+
|
|
10
|
+
from .ChatCompletionMessageInput import ChatCompletionMessageInput
|
|
11
|
+
from .GenerativeModelInput import GenerativeModelInput
|
|
12
|
+
from .InvocationParameters import InvocationParameterInput
|
|
13
|
+
from .TemplateOptions import TemplateOptions
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
# GraphQL input for a single ad-hoc chat completion request.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class ChatCompletionInput:
    # Conversation history to send to the model.
    messages: list[ChatCompletionMessageInput]
    # Provider/model selection.
    model: GenerativeModelInput
    # Model invocation parameters (e.g. temperature); empty list by default.
    invocation_parameters: list[InvocationParameterInput] = strawberry.field(default_factory=list)
    # Optional tool definitions as raw JSON schemas.
    tools: Optional[list[JSON]] = UNSET
    # Client-supplied provider API key; optional.
    api_key: Optional[str] = strawberry.field(default=None)
    # Optional templating options applied to message content.
    template: Optional[TemplateOptions] = UNSET
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
# GraphQL input for running chat completions over a dataset's examples,
# recording the runs as an experiment.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class ChatCompletionOverDatasetInput:
    # Prompt messages; content may contain template variables filled per example.
    messages: list[ChatCompletionMessageInput]
    # Provider/model selection.
    model: GenerativeModelInput
    # Model invocation parameters; empty list by default.
    invocation_parameters: list[InvocationParameterInput] = strawberry.field(default_factory=list)
    # Optional tool definitions as raw JSON schemas.
    tools: Optional[list[JSON]] = UNSET
    # Client-supplied provider API key; optional.
    api_key: Optional[str] = strawberry.field(default=None)
    # Templating syntax used to substitute example fields into the messages.
    template_language: TemplateLanguage
    # Dataset whose examples drive the runs.
    dataset_id: GlobalID
    # Specific dataset version; None presumably selects the latest — confirm.
    dataset_version_id: Optional[GlobalID] = None
    # Optional naming/description/metadata for the resulting experiment.
    experiment_name: Optional[str] = None
    experiment_description: Optional[str] = None
    experiment_metadata: Optional[JSON] = strawberry.field(default_factory=dict)
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
import strawberry
|
|
4
|
+
from strawberry import UNSET
|
|
5
|
+
from strawberry.scalars import JSON
|
|
6
|
+
|
|
7
|
+
from phoenix.server.api.types.ChatCompletionMessageRole import ChatCompletionMessageRole
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
# GraphQL input representing one chat message in a completion request.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class ChatCompletionMessageInput:
    # Speaker role of the message.
    role: ChatCompletionMessageRole
    content: JSON = strawberry.field(
        default="",
        description="The content of the message as JSON to support various kinds of text",
    )
    tool_calls: Optional[list[JSON]] = strawberry.field(
        description="The tool calls that were made in the message",
        default=UNSET,
    )
    tool_call_id: Optional[str] = strawberry.field(
        description="The ID that corresponds to a prior tool call. Used to link a tool message to a pre-existing tool call.",  # noqa: E501
        default=UNSET,
    )
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
from datetime import datetime
|
|
2
|
+
from typing import Optional
|
|
3
|
+
|
|
4
|
+
import strawberry
|
|
5
|
+
from strawberry import UNSET
|
|
6
|
+
from strawberry.relay import GlobalID
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
# GraphQL input for purging trace data from a project.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class ClearProjectInput:
    # Relay ID of the project to clear.
    id: GlobalID
    end_time: Optional[datetime] = strawberry.field(
        default=UNSET,
        description="The time up to which to purge data. Time is right-open /non-inclusive.",
    )
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
from typing import
|
|
1
|
+
from typing import Optional
|
|
2
2
|
|
|
3
3
|
import strawberry
|
|
4
4
|
from strawberry import ID, UNSET
|
|
@@ -6,5 +6,5 @@ from strawberry import ID, UNSET
|
|
|
6
6
|
|
|
7
7
|
# GraphQL input identifying a cluster of events, with an optional cluster ID.
# (No class docstring: strawberry would surface it as the schema description.)
@strawberry.input
class ClusterInput:
    # IDs of the events belonging to this cluster.
    event_ids: list[ID]
    # Optional identifier for the cluster itself.
    id: Optional[ID] = UNSET
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
import strawberry
|
|
4
|
+
from strawberry import UNSET
|
|
5
|
+
from strawberry.scalars import JSON
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
@strawberry.input
|
|
9
|
+
class CreateDatasetInput:
|
|
10
|
+
name: str
|
|
11
|
+
description: Optional[str] = UNSET
|
|
12
|
+
metadata: Optional[JSON] = UNSET
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
import strawberry
|
|
4
|
+
from strawberry.relay import GlobalID
|
|
5
|
+
from strawberry.scalars import JSON
|
|
6
|
+
|
|
7
|
+
from phoenix.server.api.types.AnnotatorKind import AnnotatorKind
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
@strawberry.input
|
|
11
|
+
class CreateSpanAnnotationInput:
|
|
12
|
+
span_id: GlobalID
|
|
13
|
+
name: str
|
|
14
|
+
annotator_kind: AnnotatorKind
|
|
15
|
+
label: Optional[str] = None
|
|
16
|
+
score: Optional[float] = None
|
|
17
|
+
explanation: Optional[str] = None
|
|
18
|
+
metadata: JSON = strawberry.field(default_factory=dict)
|