PyPI - arize-phoenix - Versions diffs - 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl - Mend

arize-phoenix 3.16.1-py3-none-any.whl → 7.7.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of arize-phoenix might be problematic. Click here for more details.

Files changed (338) hide show

arize_phoenix-7.7.0.dist-info/METADATA +261 -0
arize_phoenix-7.7.0.dist-info/RECORD +345 -0
{arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/WHEEL +1 -1
arize_phoenix-7.7.0.dist-info/entry_points.txt +3 -0
phoenix/__init__.py +86 -14
phoenix/auth.py +309 -0
phoenix/config.py +675 -45
phoenix/core/model.py +32 -30
phoenix/core/model_schema.py +102 -109
phoenix/core/model_schema_adapter.py +48 -45
phoenix/datetime_utils.py +24 -3
phoenix/db/README.md +54 -0
phoenix/db/__init__.py +4 -0
phoenix/db/alembic.ini +85 -0
phoenix/db/bulk_inserter.py +294 -0
phoenix/db/engines.py +208 -0
phoenix/db/enums.py +20 -0
phoenix/db/facilitator.py +113 -0
phoenix/db/helpers.py +159 -0
phoenix/db/insertion/constants.py +2 -0
phoenix/db/insertion/dataset.py +227 -0
phoenix/db/insertion/document_annotation.py +171 -0
phoenix/db/insertion/evaluation.py +191 -0
phoenix/db/insertion/helpers.py +98 -0
phoenix/db/insertion/span.py +193 -0
phoenix/db/insertion/span_annotation.py +158 -0
phoenix/db/insertion/trace_annotation.py +158 -0
phoenix/db/insertion/types.py +256 -0
phoenix/db/migrate.py +86 -0
phoenix/db/migrations/data_migration_scripts/populate_project_sessions.py +199 -0
phoenix/db/migrations/env.py +114 -0
phoenix/db/migrations/script.py.mako +26 -0
phoenix/db/migrations/versions/10460e46d750_datasets.py +317 -0
phoenix/db/migrations/versions/3be8647b87d8_add_token_columns_to_spans_table.py +126 -0
phoenix/db/migrations/versions/4ded9e43755f_create_project_sessions_table.py +66 -0
phoenix/db/migrations/versions/cd164e83824f_users_and_tokens.py +157 -0
phoenix/db/migrations/versions/cf03bd6bae1d_init.py +280 -0
phoenix/db/models.py +807 -0
phoenix/exceptions.py +5 -1
phoenix/experiments/__init__.py +6 -0
phoenix/experiments/evaluators/__init__.py +29 -0
phoenix/experiments/evaluators/base.py +158 -0
phoenix/experiments/evaluators/code_evaluators.py +184 -0
phoenix/experiments/evaluators/llm_evaluators.py +473 -0
phoenix/experiments/evaluators/utils.py +236 -0
phoenix/experiments/functions.py +772 -0
phoenix/experiments/tracing.py +86 -0
phoenix/experiments/types.py +726 -0
phoenix/experiments/utils.py +25 -0
phoenix/inferences/__init__.py +0 -0
phoenix/{datasets → inferences}/errors.py +6 -5
phoenix/{datasets → inferences}/fixtures.py +49 -42
phoenix/{datasets/dataset.py → inferences/inferences.py} +121 -105
phoenix/{datasets → inferences}/schema.py +11 -11
phoenix/{datasets → inferences}/validation.py +13 -14
phoenix/logging/__init__.py +3 -0
phoenix/logging/_config.py +90 -0
phoenix/logging/_filter.py +6 -0
phoenix/logging/_formatter.py +69 -0
phoenix/metrics/__init__.py +5 -4
phoenix/metrics/binning.py +4 -3
phoenix/metrics/metrics.py +2 -1
phoenix/metrics/mixins.py +7 -6
phoenix/metrics/retrieval_metrics.py +2 -1
phoenix/metrics/timeseries.py +5 -4
phoenix/metrics/wrappers.py +9 -3
phoenix/pointcloud/clustering.py +5 -5
phoenix/pointcloud/pointcloud.py +7 -5
phoenix/pointcloud/projectors.py +5 -6
phoenix/pointcloud/umap_parameters.py +53 -52
phoenix/server/api/README.md +28 -0
phoenix/server/api/auth.py +44 -0
phoenix/server/api/context.py +152 -9
phoenix/server/api/dataloaders/__init__.py +91 -0
phoenix/server/api/dataloaders/annotation_summaries.py +139 -0
phoenix/server/api/dataloaders/average_experiment_run_latency.py +54 -0
phoenix/server/api/dataloaders/cache/__init__.py +3 -0
phoenix/server/api/dataloaders/cache/two_tier_cache.py +68 -0
phoenix/server/api/dataloaders/dataset_example_revisions.py +131 -0
phoenix/server/api/dataloaders/dataset_example_spans.py +38 -0
phoenix/server/api/dataloaders/document_evaluation_summaries.py +144 -0
phoenix/server/api/dataloaders/document_evaluations.py +31 -0
phoenix/server/api/dataloaders/document_retrieval_metrics.py +89 -0
phoenix/server/api/dataloaders/experiment_annotation_summaries.py +79 -0
phoenix/server/api/dataloaders/experiment_error_rates.py +58 -0
phoenix/server/api/dataloaders/experiment_run_annotations.py +36 -0
phoenix/server/api/dataloaders/experiment_run_counts.py +49 -0
phoenix/server/api/dataloaders/experiment_sequence_number.py +44 -0
phoenix/server/api/dataloaders/latency_ms_quantile.py +188 -0
phoenix/server/api/dataloaders/min_start_or_max_end_times.py +85 -0
phoenix/server/api/dataloaders/project_by_name.py +31 -0
phoenix/server/api/dataloaders/record_counts.py +116 -0
phoenix/server/api/dataloaders/session_io.py +79 -0
phoenix/server/api/dataloaders/session_num_traces.py +30 -0
phoenix/server/api/dataloaders/session_num_traces_with_error.py +32 -0
phoenix/server/api/dataloaders/session_token_usages.py +41 -0
phoenix/server/api/dataloaders/session_trace_latency_ms_quantile.py +55 -0
phoenix/server/api/dataloaders/span_annotations.py +26 -0
phoenix/server/api/dataloaders/span_dataset_examples.py +31 -0
phoenix/server/api/dataloaders/span_descendants.py +57 -0
phoenix/server/api/dataloaders/span_projects.py +33 -0
phoenix/server/api/dataloaders/token_counts.py +124 -0
phoenix/server/api/dataloaders/trace_by_trace_ids.py +25 -0
phoenix/server/api/dataloaders/trace_root_spans.py +32 -0
phoenix/server/api/dataloaders/user_roles.py +30 -0
phoenix/server/api/dataloaders/users.py +33 -0
phoenix/server/api/exceptions.py +48 -0
phoenix/server/api/helpers/__init__.py +12 -0
phoenix/server/api/helpers/dataset_helpers.py +217 -0
phoenix/server/api/helpers/experiment_run_filters.py +763 -0
phoenix/server/api/helpers/playground_clients.py +948 -0
phoenix/server/api/helpers/playground_registry.py +70 -0
phoenix/server/api/helpers/playground_spans.py +455 -0
phoenix/server/api/input_types/AddExamplesToDatasetInput.py +16 -0
phoenix/server/api/input_types/AddSpansToDatasetInput.py +14 -0
phoenix/server/api/input_types/ChatCompletionInput.py +38 -0
phoenix/server/api/input_types/ChatCompletionMessageInput.py +24 -0
phoenix/server/api/input_types/ClearProjectInput.py +15 -0
phoenix/server/api/input_types/ClusterInput.py +2 -2
phoenix/server/api/input_types/CreateDatasetInput.py +12 -0
phoenix/server/api/input_types/CreateSpanAnnotationInput.py +18 -0
phoenix/server/api/input_types/CreateTraceAnnotationInput.py +18 -0
phoenix/server/api/input_types/DataQualityMetricInput.py +5 -2
phoenix/server/api/input_types/DatasetExampleInput.py +14 -0
phoenix/server/api/input_types/DatasetSort.py +17 -0
phoenix/server/api/input_types/DatasetVersionSort.py +16 -0
phoenix/server/api/input_types/DeleteAnnotationsInput.py +7 -0
phoenix/server/api/input_types/DeleteDatasetExamplesInput.py +13 -0
phoenix/server/api/input_types/DeleteDatasetInput.py +7 -0
phoenix/server/api/input_types/DeleteExperimentsInput.py +7 -0
phoenix/server/api/input_types/DimensionFilter.py +4 -4
phoenix/server/api/input_types/GenerativeModelInput.py +17 -0
phoenix/server/api/input_types/Granularity.py +1 -1
phoenix/server/api/input_types/InvocationParameters.py +162 -0
phoenix/server/api/input_types/PatchAnnotationInput.py +19 -0
phoenix/server/api/input_types/PatchDatasetExamplesInput.py +35 -0
phoenix/server/api/input_types/PatchDatasetInput.py +14 -0
phoenix/server/api/input_types/PerformanceMetricInput.py +5 -2
phoenix/server/api/input_types/ProjectSessionSort.py +29 -0
phoenix/server/api/input_types/SpanAnnotationSort.py +17 -0
phoenix/server/api/input_types/SpanSort.py +134 -69
phoenix/server/api/input_types/TemplateOptions.py +10 -0
phoenix/server/api/input_types/TraceAnnotationSort.py +17 -0
phoenix/server/api/input_types/UserRoleInput.py +9 -0
phoenix/server/api/mutations/__init__.py +28 -0
phoenix/server/api/mutations/api_key_mutations.py +167 -0
phoenix/server/api/mutations/chat_mutations.py +593 -0
phoenix/server/api/mutations/dataset_mutations.py +591 -0
phoenix/server/api/mutations/experiment_mutations.py +75 -0
phoenix/server/api/{types/ExportEventsMutation.py → mutations/export_events_mutations.py} +21 -18
phoenix/server/api/mutations/project_mutations.py +57 -0
phoenix/server/api/mutations/span_annotations_mutations.py +128 -0
phoenix/server/api/mutations/trace_annotations_mutations.py +127 -0
phoenix/server/api/mutations/user_mutations.py +329 -0
phoenix/server/api/openapi/__init__.py +0 -0
phoenix/server/api/openapi/main.py +17 -0
phoenix/server/api/openapi/schema.py +16 -0
phoenix/server/api/queries.py +738 -0
phoenix/server/api/routers/__init__.py +11 -0
phoenix/server/api/routers/auth.py +284 -0
phoenix/server/api/routers/embeddings.py +26 -0
phoenix/server/api/routers/oauth2.py +488 -0
phoenix/server/api/routers/v1/__init__.py +64 -0
phoenix/server/api/routers/v1/datasets.py +1017 -0
phoenix/server/api/routers/v1/evaluations.py +362 -0
phoenix/server/api/routers/v1/experiment_evaluations.py +115 -0
phoenix/server/api/routers/v1/experiment_runs.py +167 -0
phoenix/server/api/routers/v1/experiments.py +308 -0
phoenix/server/api/routers/v1/pydantic_compat.py +78 -0
phoenix/server/api/routers/v1/spans.py +267 -0
phoenix/server/api/routers/v1/traces.py +208 -0
phoenix/server/api/routers/v1/utils.py +95 -0
phoenix/server/api/schema.py +44 -241
phoenix/server/api/subscriptions.py +597 -0
phoenix/server/api/types/Annotation.py +21 -0
phoenix/server/api/types/AnnotationSummary.py +55 -0
phoenix/server/api/types/AnnotatorKind.py +16 -0
phoenix/server/api/types/ApiKey.py +27 -0
phoenix/server/api/types/AuthMethod.py +9 -0
phoenix/server/api/types/ChatCompletionMessageRole.py +11 -0
phoenix/server/api/types/ChatCompletionSubscriptionPayload.py +46 -0
phoenix/server/api/types/Cluster.py +25 -24
phoenix/server/api/types/CreateDatasetPayload.py +8 -0
phoenix/server/api/types/DataQualityMetric.py +31 -13
phoenix/server/api/types/Dataset.py +288 -63
phoenix/server/api/types/DatasetExample.py +85 -0
phoenix/server/api/types/DatasetExampleRevision.py +34 -0
phoenix/server/api/types/DatasetVersion.py +14 -0
phoenix/server/api/types/Dimension.py +32 -31
phoenix/server/api/types/DocumentEvaluationSummary.py +9 -8
phoenix/server/api/types/EmbeddingDimension.py +56 -49
phoenix/server/api/types/Evaluation.py +25 -31
phoenix/server/api/types/EvaluationSummary.py +30 -50
phoenix/server/api/types/Event.py +20 -20
phoenix/server/api/types/ExampleRevisionInterface.py +14 -0
phoenix/server/api/types/Experiment.py +152 -0
phoenix/server/api/types/ExperimentAnnotationSummary.py +13 -0
phoenix/server/api/types/ExperimentComparison.py +17 -0
phoenix/server/api/types/ExperimentRun.py +119 -0
phoenix/server/api/types/ExperimentRunAnnotation.py +56 -0
phoenix/server/api/types/GenerativeModel.py +9 -0
phoenix/server/api/types/GenerativeProvider.py +85 -0
phoenix/server/api/types/Inferences.py +80 -0
phoenix/server/api/types/InferencesRole.py +23 -0
phoenix/server/api/types/LabelFraction.py +7 -0
phoenix/server/api/types/MimeType.py +2 -2
phoenix/server/api/types/Model.py +54 -54
phoenix/server/api/types/PerformanceMetric.py +8 -5
phoenix/server/api/types/Project.py +407 -142
phoenix/server/api/types/ProjectSession.py +139 -0
phoenix/server/api/types/Segments.py +4 -4
phoenix/server/api/types/Span.py +221 -176
phoenix/server/api/types/SpanAnnotation.py +43 -0
phoenix/server/api/types/SpanIOValue.py +15 -0
phoenix/server/api/types/SystemApiKey.py +9 -0
phoenix/server/api/types/TemplateLanguage.py +10 -0
phoenix/server/api/types/TimeSeries.py +19 -15
phoenix/server/api/types/TokenUsage.py +11 -0
phoenix/server/api/types/Trace.py +154 -0
phoenix/server/api/types/TraceAnnotation.py +45 -0
phoenix/server/api/types/UMAPPoints.py +7 -7
phoenix/server/api/types/User.py +60 -0
phoenix/server/api/types/UserApiKey.py +45 -0
phoenix/server/api/types/UserRole.py +15 -0
phoenix/server/api/types/node.py +4 -112
phoenix/server/api/types/pagination.py +156 -57
phoenix/server/api/utils.py +34 -0
phoenix/server/app.py +864 -115
phoenix/server/bearer_auth.py +163 -0
phoenix/server/dml_event.py +136 -0
phoenix/server/dml_event_handler.py +256 -0
phoenix/server/email/__init__.py +0 -0
phoenix/server/email/sender.py +97 -0
phoenix/server/email/templates/__init__.py +0 -0
phoenix/server/email/templates/password_reset.html +19 -0
phoenix/server/email/types.py +11 -0
phoenix/server/grpc_server.py +102 -0
phoenix/server/jwt_store.py +505 -0
phoenix/server/main.py +305 -116
phoenix/server/oauth2.py +52 -0
phoenix/server/openapi/__init__.py +0 -0
phoenix/server/prometheus.py +111 -0
phoenix/server/rate_limiters.py +188 -0
phoenix/server/static/.vite/manifest.json +87 -0
phoenix/server/static/assets/components-Cy9nwIvF.js +2125 -0
phoenix/server/static/assets/index-BKvHIxkk.js +113 -0
phoenix/server/static/assets/pages-CUi2xCVQ.js +4449 -0
phoenix/server/static/assets/vendor-DvC8cT4X.js +894 -0
phoenix/server/static/assets/vendor-DxkFTwjz.css +1 -0
phoenix/server/static/assets/vendor-arizeai-Do1793cv.js +662 -0
phoenix/server/static/assets/vendor-codemirror-BzwZPyJM.js +24 -0
phoenix/server/static/assets/vendor-recharts-_Jb7JjhG.js +59 -0
phoenix/server/static/assets/vendor-shiki-Cl9QBraO.js +5 -0
phoenix/server/static/assets/vendor-three-DwGkEfCM.js +2998 -0
phoenix/server/telemetry.py +68 -0
phoenix/server/templates/index.html +82 -23
phoenix/server/thread_server.py +3 -3
phoenix/server/types.py +275 -0
phoenix/services.py +27 -18
phoenix/session/client.py +743 -68
phoenix/session/data_extractor.py +31 -7
phoenix/session/evaluation.py +3 -9
phoenix/session/session.py +263 -219
phoenix/settings.py +22 -0
phoenix/trace/__init__.py +2 -22
phoenix/trace/attributes.py +338 -0
phoenix/trace/dsl/README.md +116 -0
phoenix/trace/dsl/filter.py +663 -213
phoenix/trace/dsl/helpers.py +73 -21
phoenix/trace/dsl/query.py +574 -201
phoenix/trace/exporter.py +24 -19
phoenix/trace/fixtures.py +368 -32
phoenix/trace/otel.py +71 -219
phoenix/trace/projects.py +3 -2
phoenix/trace/schemas.py +33 -11
phoenix/trace/span_evaluations.py +21 -16
phoenix/trace/span_json_decoder.py +6 -4
phoenix/trace/span_json_encoder.py +2 -2
phoenix/trace/trace_dataset.py +47 -32
phoenix/trace/utils.py +21 -4
phoenix/utilities/__init__.py +0 -26
phoenix/utilities/client.py +132 -0
phoenix/utilities/deprecation.py +31 -0
phoenix/utilities/error_handling.py +3 -2
phoenix/utilities/json.py +109 -0
phoenix/utilities/logging.py +8 -0
phoenix/utilities/project.py +2 -2
phoenix/utilities/re.py +49 -0
phoenix/utilities/span_store.py +0 -23
phoenix/utilities/template_formatters.py +99 -0
phoenix/version.py +1 -1
arize_phoenix-3.16.1.dist-info/METADATA +0 -495
arize_phoenix-3.16.1.dist-info/RECORD +0 -178
phoenix/core/project.py +0 -619
phoenix/core/traces.py +0 -96
phoenix/experimental/evals/__init__.py +0 -73
phoenix/experimental/evals/evaluators.py +0 -413
phoenix/experimental/evals/functions/__init__.py +0 -4
phoenix/experimental/evals/functions/classify.py +0 -453
phoenix/experimental/evals/functions/executor.py +0 -353
phoenix/experimental/evals/functions/generate.py +0 -138
phoenix/experimental/evals/functions/processing.py +0 -76
phoenix/experimental/evals/models/__init__.py +0 -14
phoenix/experimental/evals/models/anthropic.py +0 -175
phoenix/experimental/evals/models/base.py +0 -170
phoenix/experimental/evals/models/bedrock.py +0 -221
phoenix/experimental/evals/models/litellm.py +0 -134
phoenix/experimental/evals/models/openai.py +0 -448
phoenix/experimental/evals/models/rate_limiters.py +0 -246
phoenix/experimental/evals/models/vertex.py +0 -173
phoenix/experimental/evals/models/vertexai.py +0 -186
phoenix/experimental/evals/retrievals.py +0 -96
phoenix/experimental/evals/templates/__init__.py +0 -50
phoenix/experimental/evals/templates/default_templates.py +0 -472
phoenix/experimental/evals/templates/template.py +0 -195
phoenix/experimental/evals/utils/__init__.py +0 -172
phoenix/experimental/evals/utils/threads.py +0 -27
phoenix/server/api/helpers.py +0 -11
phoenix/server/api/routers/evaluation_handler.py +0 -109
phoenix/server/api/routers/span_handler.py +0 -70
phoenix/server/api/routers/trace_handler.py +0 -60
phoenix/server/api/types/DatasetRole.py +0 -23
phoenix/server/static/index.css +0 -6
phoenix/server/static/index.js +0 -7447
phoenix/storage/span_store/__init__.py +0 -23
phoenix/storage/span_store/text_file.py +0 -85
phoenix/trace/dsl/missing.py +0 -60
phoenix/trace/langchain/__init__.py +0 -3
phoenix/trace/langchain/instrumentor.py +0 -35
phoenix/trace/llama_index/__init__.py +0 -3
phoenix/trace/llama_index/callback.py +0 -102
phoenix/trace/openai/__init__.py +0 -3
phoenix/trace/openai/instrumentor.py +0 -30
{arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/licenses/IP_NOTICE +0 -0
{arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/licenses/LICENSE +0 -0
/phoenix/{datasets → db/insertion}/__init__.py +0 -0
/phoenix/{experimental → db/migrations}/__init__.py +0 -0
/phoenix/{storage → db/migrations/data_migration_scripts}/__init__.py +0 -0

phoenix/trace/otel.py CHANGED Viewed

@@ -1,39 +1,34 @@
-import inspect
 import json
 from binascii import hexlify, unhexlify
+from collections.abc import Iterable, Iterator, Mapping, Sequence
 from datetime import datetime, timezone
 from types import MappingProxyType
-from typing import (
-    Any,
-    DefaultDict,
-    Dict,
-    Iterable,
-    Iterator,
-    List,
-    Mapping,
-    Optional,
-    Sequence,
-    Set,
-    SupportsFloat,
-    Tuple,
-    Union,
-    cast,
-)
+from typing import Any, Optional, SupportsFloat, cast
 import numpy as np
 import opentelemetry.proto.trace.v1.trace_pb2 as otlp
-from openinference.semconv import trace
-from openinference.semconv.trace import DocumentAttributes, SpanAttributes
+from openinference.semconv.trace import (
+    DocumentAttributes,
+    OpenInferenceMimeTypeValues,
+    SpanAttributes,
+)
 from opentelemetry.proto.common.v1.common_pb2 import AnyValue, ArrayValue, KeyValue
 from opentelemetry.util.types import Attributes, AttributeValue
 from typing_extensions import TypeAlias, assert_never
+from phoenix.trace.attributes import (
+    JSON_STRING_ATTRIBUTES,
+    flatten,
+    get_attribute_value,
+    has_mapping,
+    load_json_strings,
+    unflatten,
+)
 from phoenix.trace.schemas import (
     EXCEPTION_ESCAPED,
     EXCEPTION_MESSAGE,
     EXCEPTION_STACKTRACE,
     EXCEPTION_TYPE,
-    MimeType,
     Span,
     SpanContext,
     SpanEvent,
@@ -43,6 +38,7 @@ from phoenix.trace.schemas import (
     SpanStatusCode,
     TraceID,
 )
+from phoenix.utilities.json import jsonify
 DOCUMENT_METADATA = DocumentAttributes.DOCUMENT_METADATA
 INPUT_MIME_TYPE = SpanAttributes.INPUT_MIME_TYPE
@@ -53,28 +49,45 @@ OUTPUT_MIME_TYPE = SpanAttributes.OUTPUT_MIME_TYPE
 OUTPUT_VALUE = SpanAttributes.OUTPUT_VALUE
 TOOL_PARAMETERS = SpanAttributes.TOOL_PARAMETERS
 LLM_PROMPT_TEMPLATE_VARIABLES = SpanAttributes.LLM_PROMPT_TEMPLATE_VARIABLES
+LLM_TOKEN_COUNT_PROMPT = SpanAttributes.LLM_TOKEN_COUNT_PROMPT
+LLM_TOKEN_COUNT_COMPLETION = SpanAttributes.LLM_TOKEN_COUNT_COMPLETION
+LLM_TOKEN_COUNT_TOTAL = SpanAttributes.LLM_TOKEN_COUNT_TOTAL
-def decode(otlp_span: otlp.Span) -> Span:
+def coerce_otlp_span_attributes(
+    decoded_attributes: Iterable[tuple[str, Any]],
+) -> Iterator[tuple[str, Any]]:
+    for key, value in decoded_attributes:
+        if key in (LLM_TOKEN_COUNT_PROMPT, LLM_TOKEN_COUNT_COMPLETION, LLM_TOKEN_COUNT_TOTAL):
+            try:
+                value = int(value)
+            except BaseException:
+                pass
+        yield key, value
+def decode_otlp_span(otlp_span: otlp.Span) -> Span:
     trace_id = cast(TraceID, _decode_identifier(otlp_span.trace_id))
     span_id = cast(SpanID, _decode_identifier(otlp_span.span_id))
     parent_id = _decode_identifier(otlp_span.parent_span_id)
     start_time = _decode_unix_nano(otlp_span.start_time_unix_nano)
-    end_time = (
-        _decode_unix_nano(otlp_span.end_time_unix_nano) if otlp_span.end_time_unix_nano else None
-    )
+    end_time = _decode_unix_nano(otlp_span.end_time_unix_nano)
-    attributes = dict(_unflatten(_load_json_strings(_decode_key_values(otlp_span.attributes))))
-    span_kind = SpanKind(attributes.pop(OPENINFERENCE_SPAN_KIND, None))
-    for mime_type in (INPUT_MIME_TYPE, OUTPUT_MIME_TYPE):
-        if mime_type in attributes:
-            attributes[mime_type] = MimeType(attributes[mime_type])
+    attributes = unflatten(
+        load_json_strings(coerce_otlp_span_attributes(_decode_key_values(otlp_span.attributes)))
+    )
+    span_kind = SpanKind(get_attribute_value(attributes, OPENINFERENCE_SPAN_KIND))
     status_code, status_message = _decode_status(otlp_span.status)
     events = [_decode_event(event) for event in otlp_span.events]
+    if (input_value := get_attribute_value(attributes, INPUT_VALUE)) and not isinstance(
+        input_value, str
+    ):
+        attributes["input"]["value"] = json.dumps(input_value)
+        attributes["input"]["mime_type"] = OpenInferenceMimeTypeValues.JSON.value
     return Span(
         name=otlp_span.name,
         context=SpanContext(
@@ -127,7 +140,7 @@ def _decode_unix_nano(time_unix_nano: int) -> datetime:
 def _decode_key_values(
     key_values: Iterable[KeyValue],
-) -> Iterator[Tuple[str, Any]]:
+) -> Iterator[tuple[str, Any]]:
     return ((kv.key, _decode_value(kv.value)) for kv in key_values)
@@ -152,28 +165,6 @@ def _decode_value(any_value: AnyValue) -> Any:
     assert_never(which)
-_JSON_STRING_ATTRIBUTES = (
-    DOCUMENT_METADATA,
-    LLM_PROMPT_TEMPLATE_VARIABLES,
-    METADATA,
-    TOOL_PARAMETERS,
-)
-def _load_json_strings(key_values: Iterable[Tuple[str, Any]]) -> Iterator[Tuple[str, Any]]:
-    for key, value in key_values:
-        if key.endswith(_JSON_STRING_ATTRIBUTES):
-            try:
-                dict_value = json.loads(value)
-            except Exception:
-                yield key, value
-            else:
-                if dict_value:
-                    yield key, dict_value
-        else:
-            yield key, value
 StatusMessage: TypeAlias = str
 _STATUS_DECODING = MappingProxyType(
@@ -185,129 +176,15 @@ _STATUS_DECODING = MappingProxyType(
 )
-def _decode_status(otlp_status: otlp.Status) -> Tuple[SpanStatusCode, StatusMessage]:
+def _decode_status(otlp_status: otlp.Status) -> tuple[SpanStatusCode, StatusMessage]:
     status_code = _STATUS_DECODING.get(otlp_status.code, SpanStatusCode.UNSET)
     return status_code, otlp_status.message
-_SEMANTIC_CONVENTIONS: List[str] = sorted(
-    (
-        getattr(klass, attr)
-        for name in dir(trace)
-        if name.endswith("Attributes") and inspect.isclass(klass := getattr(trace, name))
-        for attr in dir(klass)
-        if attr.isupper()
-    ),
-    reverse=True,
-)  # sorted so the longer strings go first
-def _semantic_convention_prefix_partition(key: str, separator: str = ".") -> Tuple[str, str, str]:
-    """Return the longest prefix of `key` that is a semantic convention, and the remaining suffix
-    separated by `.`. For example, if `key` is "retrieval.documents.2.document.score", return
-    ("retrieval.documents", ".", "2.document.score"). The return signature is based on Python's
-    `.partition` method for strings.
-    """
-    for prefix in _SEMANTIC_CONVENTIONS:
-        if key == prefix:
-            return key, "", ""
-        if key.startswith(prefix) and key[len(prefix) :].startswith(separator):
-            return prefix, separator, key[len(prefix) + len(separator) :]
-    return "", "", ""
-class _Trie(DefaultDict[Union[str, int], "_Trie"]):
-    """Prefix Tree with special handling for indices (i.e. all-digit keys)."""
-    def __init__(self) -> None:
-        super().__init__(_Trie)
-        self.value: Any = None
-        self.indices: Set[int] = set()
-        self.branches: Set[Union[str, int]] = set()
-    def set_value(self, value: Any) -> None:
-        self.value = value
-        # value and indices must not coexist
-        self.branches.update(self.indices)
-        self.indices.clear()
-    def add_index(self, index: int) -> "_Trie":
-        if self.value is not None:
-            self.branches.add(index)
-        elif index not in self.branches:
-            self.indices.add(index)
-        return self[index]
-    def add_branch(self, branch: Union[str, int]) -> "_Trie":
-        if branch in self.indices:
-            self.indices.discard(cast(int, branch))
-        self.branches.add(branch)
-        return self[branch]
-# FIXME: Ideally we should not need something so complicated as a Trie, but it's useful here
-# for backward compatibility reasons regarding some deeply nested objects such as TOOL_PARAMETERS.
-# In the future, we should `json_dumps` them and not let things get too deeply nested.
-def _build_trie(
-    key_value_pairs: Iterable[Tuple[str, Any]],
-    separator: str = ".",
-) -> _Trie:
-    """Build a Trie (a.k.a. prefix tree) from `key_value_pairs`, by partitioning the keys by
-    separator. Each partition is a branch in the Trie. Special handling is done for partitions
-    that are all digits, e.g. "0", "12", etc., which are converted to integers and collected
-    as indices.
-    """
-    trie = _Trie()
-    for key, value in key_value_pairs:
-        if value is None:
-            continue
-        t = trie
-        while True:
-            prefix, _, suffix = _semantic_convention_prefix_partition(key, separator)
-            if prefix:
-                t = t.add_branch(prefix)
-            else:
-                prefix, _, suffix = key.partition(separator)
-                if prefix.isdigit():
-                    index = int(prefix)
-                    t = t.add_index(index) if suffix else t.add_branch(index)
-                else:
-                    t = t.add_branch(prefix)
-            if not suffix:
-                break
-            key = suffix
-        t.set_value(value)
-    return trie
-def _walk(trie: _Trie, prefix: str = "") -> Iterator[Tuple[str, Any]]:
-    if trie.value is not None:
-        yield prefix, trie.value
-    elif prefix and trie.indices:
-        yield prefix, [dict(_walk(trie[index])) for index in sorted(trie.indices)]
-    elif trie.indices:
-        for index in trie.indices:
-            yield from _walk(trie[index], prefix=f"{index}")
-    elif prefix:
-        yield prefix, dict(_walk(trie))
-        return
-    for branch in trie.branches:
-        new_prefix = f"{prefix}.{branch}" if prefix else f"{branch}"
-        yield from _walk(trie[branch], new_prefix)
-def _unflatten(
-    key_value_pairs: Iterable[Tuple[str, Any]],
-    separator: str = ".",
-) -> Iterator[Tuple[str, Any]]:
-    trie = _build_trie(key_value_pairs, separator)
-    yield from _walk(trie)
 _BILLION = 1_000_000_000  # for converting seconds to nanoseconds
-def encode(span: Span) -> otlp.Span:
+def encode_span_to_otlp(span: Span) -> otlp.Span:
     trace_id: bytes = _encode_identifier(span.context.trace_id)
     span_id: bytes = _encode_identifier(span.context.span_id)
     parent_span_id: bytes = _encode_identifier(span.parent_id)
@@ -316,11 +193,7 @@ def encode(span: Span) -> otlp.Span:
     start_time_unix_nano: int = int(span.start_time.timestamp() * _BILLION)
     end_time_unix_nano: int = int(span.end_time.timestamp() * _BILLION) if span.end_time else 0
-    attributes: Dict[str, Any] = span.attributes.copy()
-    for mime_type in (INPUT_MIME_TYPE, OUTPUT_MIME_TYPE):
-        if mime_type in attributes:
-            attributes[mime_type] = attributes[mime_type].value
+    attributes: dict[str, Any] = dict(span.attributes)
     for key, value in span.attributes.items():
         if value is None:
@@ -328,19 +201,34 @@ def encode(span: Span) -> otlp.Span:
             attributes.pop(key, None)
         elif isinstance(value, Mapping):
             attributes.pop(key, None)
-            if key.endswith(_JSON_STRING_ATTRIBUTES):
-                attributes[key] = json.dumps(value)
+            if key.endswith(JSON_STRING_ATTRIBUTES):
+                attributes[key] = json.dumps(jsonify(value))
             else:
-                attributes.update(_flatten_mapping(value, key))
+                attributes.update(
+                    flatten(
+                        value,
+                        prefix=key,
+                        recurse_on_sequence=True,
+                        json_string_attributes=JSON_STRING_ATTRIBUTES,
+                    )
+                )
         elif (
             not isinstance(value, str)
             and (isinstance(value, Sequence) or isinstance(value, np.ndarray))
-            and _has_mapping(value)
+            and has_mapping(value)
         ):
             attributes.pop(key, None)
-            attributes.update(_flatten_sequence(value, key))
-    attributes[OPENINFERENCE_SPAN_KIND] = span.span_kind.value
+            attributes.update(
+                flatten(
+                    value,
+                    prefix=key,
+                    recurse_on_sequence=True,
+                    json_string_attributes=JSON_STRING_ATTRIBUTES,
+                )
+            )
+    if OPENINFERENCE_SPAN_KIND not in attributes:
+        attributes[OPENINFERENCE_SPAN_KIND] = span.span_kind.value
     status = _encode_status(span.status_code, span.status_message)
     events = map(_encode_event, span.events)
@@ -381,42 +269,6 @@ def _encode_identifier(identifier: Optional[str]) -> bytes:
     return unhexlify(identifier)
-def _has_mapping(sequence: Sequence[Any]) -> bool:
-    for item in sequence:
-        if isinstance(item, Mapping):
-            return True
-    return False
-def _flatten_mapping(
-    mapping: Mapping[str, Any],
-    prefix: str,
-) -> Iterator[Tuple[str, Any]]:
-    for key, value in mapping.items():
-        prefixed_key = f"{prefix}.{key}"
-        if isinstance(value, Mapping):
-            if key.endswith(_JSON_STRING_ATTRIBUTES):
-                yield prefixed_key, json.dumps(value)
-            else:
-                yield from _flatten_mapping(value, prefixed_key)
-        elif isinstance(value, Sequence):
-            yield from _flatten_sequence(value, prefixed_key)
-        elif value is not None:
-            yield prefixed_key, value
-def _flatten_sequence(
-    sequence: Sequence[Any],
-    prefix: str,
-) -> Iterator[Tuple[str, Any]]:
-    if isinstance(sequence, str) or not _has_mapping(sequence):
-        yield prefix, sequence
-    for idx, obj in enumerate(sequence):
-        if not isinstance(obj, Mapping):
-            continue
-        yield from _flatten_mapping(obj, f"{prefix}.{idx}")
 def _encode_event(event: SpanEvent) -> otlp.Span.Event:
     return otlp.Span.Event(
         name=event.name,
@@ -451,6 +303,6 @@ def _encode_value(value: AttributeValue) -> AnyValue:
 __all__ = [
-    "encode",
-    "decode",
+    "encode_span_to_otlp",
+    "decode_otlp_span",
 ]

phoenix/trace/projects.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import types
-from typing import Any, Callable, Optional, Type
+from collections.abc import Callable
+from typing import Any, Optional
 from openinference.semconv.resource import ResourceAttributes
 from opentelemetry.sdk import trace
@@ -58,7 +59,7 @@ class using_project:
     def __exit__(
         self,
-        exc_type: Optional[Type[BaseException]],
+        exc_type: Optional[type[BaseException]],
         exc_value: Optional[BaseException],
         traceback: Optional[types.TracebackType],
     ) -> None:

phoenix/trace/schemas.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from dataclasses import dataclass
 from datetime import datetime
 from enum import Enum
-from typing import Any, Dict, List, Optional, Union
+from typing import Any, Mapping, NamedTuple, Optional
 from uuid import UUID
 EXCEPTION_TYPE = "exception.type"
@@ -29,8 +29,6 @@ class SpanKind(Enum):
     """
     SpanKind is loosely inspired by OpenTelemetry's SpanKind
     It captures the type of work that a Span encapsulates.
-    NB: this is actively under construction
     """
     TOOL = "TOOL"
@@ -40,6 +38,8 @@ class SpanKind(Enum):
     EMBEDDING = "EMBEDDING"
     AGENT = "AGENT"
     RERANKER = "RERANKER"
+    EVALUATOR = "EVALUATOR"
+    GUARDRAIL = "GUARDRAIL"
     UNKNOWN = "UNKNOWN"
     def __str__(self) -> str:
@@ -47,16 +47,14 @@ class SpanKind(Enum):
     @classmethod
     def _missing_(cls, v: Any) -> Optional["SpanKind"]:
-        if v and isinstance(v, str) and not v.isupper():
+        if v and isinstance(v, str) and v.isascii() and not v.isupper():
             return cls(v.upper())
-        return None if v else cls.UNKNOWN
+        return cls.UNKNOWN
 TraceID = str
 SpanID = str
-AttributePrimitiveValue = Union[str, bool, float, int]
-AttributeValue = Union[AttributePrimitiveValue, List[AttributePrimitiveValue]]
-SpanAttributes = Dict[str, AttributeValue]
+SpanAttributes = Mapping[str, Any]
 @dataclass(frozen=True)
@@ -73,7 +71,7 @@ class SpanConversationAttributes:
 @dataclass(frozen=True)
-class SpanEvent(Dict[str, Any]):
+class SpanEvent:
     """
     A Span Event can be thought of as a structured log message (or annotation)
     on a Span, typically used to denote a meaningful, singular point in time
@@ -142,7 +140,7 @@ class Span:
     "If the parent_id is None, this is the root span"
     parent_id: Optional[SpanID]
     start_time: datetime
-    end_time: Optional[datetime]
+    end_time: datetime
     status_code: SpanStatusCode
     status_message: str
     """
@@ -171,7 +169,7 @@ class Span:
     OpenTelemetry Inspiration:
     https://opentelemetry.io/docs/concepts/signals/traces/#span-events
     """
-    events: List[SpanEvent]
+    events: list[SpanEvent]
     """
     An extension of the OpenTelemetry Span interface to include the
@@ -189,6 +187,22 @@ class MimeType(Enum):
         return None if v else cls.TEXT
+@dataclass(frozen=True)
+class SpanIOValue:
+    value: str
+    mime_type: MimeType = MimeType.TEXT
+@dataclass(frozen=True)
+class TokenUsage:
+    prompt: int = 0
+    completion: int = 0
+    def __post_init__(self) -> None:
+        assert self.prompt >= 0, "prompt must be non-negative"
+        assert self.completion >= 0, "completion must be non-negative"
 ATTRIBUTE_PREFIX = "attributes."
 CONTEXT_PREFIX = "context."
 COMPUTED_PREFIX = "__computed__."
@@ -202,3 +216,11 @@ class ComputedAttributes(Enum):
     CUMULATIVE_LLM_TOKEN_COUNT_COMPLETION = "cumulative_token_count.completion"
     ERROR_COUNT = "error_count"
     CUMULATIVE_ERROR_COUNT = "cumulative_error_count"
+class ComputedValues(NamedTuple):
+    latency_ms: float
+    cumulative_error_count: int
+    cumulative_llm_token_count_prompt: int
+    cumulative_llm_token_count_completion: int
+    cumulative_llm_token_count_total: int

phoenix/trace/span_evaluations.py CHANGED Viewed

@@ -1,17 +1,19 @@
 import json
 from abc import ABC
+from collections.abc import Callable, Mapping, Sequence
 from dataclasses import dataclass, field
 from itertools import product
 from pathlib import Path
 from types import MappingProxyType
-from typing import Any, Callable, List, Mapping, Optional, Sequence, Set, Tuple, Type, Union
+from typing import Any, Optional, Union
 from uuid import UUID, uuid4
 import pandas as pd
 from pandas.api.types import is_integer_dtype, is_numeric_dtype, is_string_dtype
 from pyarrow import RecordBatchStreamReader, Schema, Table, parquet
-from phoenix.config import TRACE_DATASET_DIR
+from phoenix.config import TRACE_DATASETS_DIR
+from phoenix.exceptions import PhoenixEvaluationNameIsMissing
 from phoenix.trace.errors import InvalidParquetMetadataError
 EVAL_NAME_COLUMN_PREFIX = "eval."
@@ -19,11 +21,11 @@ EVAL_PARQUET_FILE_NAME = "evaluations-{id}.parquet"
 class NeedsNamedIndex(ABC):
-    index_names: Mapping[Tuple[str, ...], Callable[[Any], bool]]
-    all_valid_index_name_sorted_combos: Set[Tuple[str, ...]]
+    index_names: Mapping[tuple[str, ...], Callable[[Any], bool]]
+    all_valid_index_name_sorted_combos: set[tuple[str, ...]]
     @classmethod
-    def preferred_names(cls) -> List[str]:
+    def preferred_names(cls) -> list[str]:
         return [choices[0] for choices in cls.index_names.keys()]
     @classmethod
@@ -42,7 +44,7 @@ class NeedsNamedIndex(ABC):
         )
     @classmethod
-    def find_valid_index_names(cls, dtypes: "pd.Series[Any]") -> Optional[List[str]]:
+    def find_valid_index_names(cls, dtypes: "pd.Series[Any]") -> Optional[list[str]]:
         valid_names = []
         for names, check_type in cls.index_names.items():
             for name in names:
@@ -64,14 +66,15 @@ class NeedsResultColumns(ABC):
     )
     @classmethod
-    def is_valid_result_columns(cls, dtypes: "pd.Series[Any]") -> bool:
+    def is_valid_result_columns(cls, df: pd.DataFrame) -> bool:
+        dtypes = df.dtypes
         names = cls.result_column_names.keys()
         intersection = dtypes.index.intersection(names)  # type: ignore
         if not len(intersection):
             return False
         for name in intersection:
             check_type = cls.result_column_names[name]
-            if not check_type(dtypes[name]):
+            if not check_type(dtypes[name]) and not df.loc[:, name].isna().all():
                 return False
         return True
@@ -91,7 +94,7 @@ class Evaluations(NeedsNamedIndex, NeedsResultColumns, ABC):
             f"dataframe=<rows: {len(self.dataframe)!r}>)"
         )
-    def __dir__(self) -> List[str]:
+    def __dir__(self) -> list[str]:
         return ["get_dataframe"]
     def get_dataframe(self, prefix_columns_with_name: bool = True) -> pd.DataFrame:
@@ -136,7 +139,7 @@ class Evaluations(NeedsNamedIndex, NeedsResultColumns, ABC):
             )
         # Validate that the dataframe contains result columns of appropriate types.
-        if not self.is_valid_result_columns(dataframe.dtypes):
+        if not self.is_valid_result_columns(dataframe):
             raise ValueError(
                 f"The dataframe must contain one of these columns with appropriate "
                 f"value types: {self.result_column_names.keys()} "
@@ -152,7 +155,7 @@ class Evaluations(NeedsNamedIndex, NeedsResultColumns, ABC):
     def __init_subclass__(
         cls,
-        index_names: Mapping[Tuple[str, ...], Callable[[Any], bool]],
+        index_names: Mapping[tuple[str, ...], Callable[[Any], bool]],
         **kwargs: Any,
     ) -> None:
         super().__init_subclass__(**kwargs)
@@ -200,7 +203,7 @@ class Evaluations(NeedsNamedIndex, NeedsResultColumns, ABC):
             UUID: The ID of the evaluations, which can be used as a key to load
             the evaluations from disk using `load`.
         """
-        directory = Path(directory) if directory else TRACE_DATASET_DIR
+        directory = Path(directory) if directory else TRACE_DATASETS_DIR
         path = directory / EVAL_PARQUET_FILE_NAME.format(id=self.id)
         table = self.to_pyarrow_table()
         parquet.write_table(table, path)
@@ -228,7 +231,7 @@ class Evaluations(NeedsNamedIndex, NeedsResultColumns, ABC):
         """
         if not isinstance(id, UUID):
             id = UUID(id)
-        path = Path(directory or TRACE_DATASET_DIR) / EVAL_PARQUET_FILE_NAME.format(id=id)
+        path = Path(directory or TRACE_DATASETS_DIR) / EVAL_PARQUET_FILE_NAME.format(id=id)
         schema = parquet.read_schema(path)
         eval_id, eval_name, evaluations_cls = _parse_schema_metadata(schema)
         if id != eval_id:
@@ -326,7 +329,7 @@ class TraceEvaluations(
 ): ...
-def _parse_schema_metadata(schema: Schema) -> Tuple[UUID, str, Type[Evaluations]]:
+def _parse_schema_metadata(schema: Schema) -> tuple[UUID, str, type[Evaluations]]:
     """
     Validates and parses the pyarrow schema metadata.
     """
@@ -335,8 +338,10 @@ def _parse_schema_metadata(schema: Schema) -> Tuple[UUID, str, Type[Evaluations]
         arize_metadata = json.loads(metadata[b"arize"])
         eval_classes = {subclass.__name__: subclass for subclass in Evaluations.__subclasses__()}
         eval_id = UUID(arize_metadata["eval_id"])
-        if not isinstance((eval_name := arize_metadata["eval_name"]), str):
-            raise ValueError('Arize metadata must contain a string value for key "eval_name"')
+        if not isinstance((eval_name := arize_metadata["eval_name"]), str) or not eval_name.strip():
+            raise PhoenixEvaluationNameIsMissing(
+                'Arize metadata must contain a non-empty string value for key "eval_name"'
+            )
         evaluations_cls = eval_classes[arize_metadata["eval_type"]]
         return eval_id, eval_name, evaluations_cls
     except Exception as err:

phoenix/trace/span_json_decoder.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import json
 from datetime import datetime
-from typing import Any, Dict, Optional
+from typing import Any, Optional
 from openinference.semconv.trace import SpanAttributes
@@ -22,7 +22,7 @@ INPUT_MIME_TYPE = SpanAttributes.INPUT_MIME_TYPE
 OUTPUT_MIME_TYPE = SpanAttributes.OUTPUT_MIME_TYPE
-def json_to_attributes(obj: Optional[Dict[str, Any]]) -> Dict[str, Any]:
+def json_to_attributes(obj: Optional[dict[str, Any]]) -> dict[str, Any]:
     if obj is None:
         return {}
     if not isinstance(obj, dict):
@@ -34,7 +34,7 @@ def json_to_attributes(obj: Optional[Dict[str, Any]]) -> Dict[str, Any]:
     return obj
-def json_to_span(data: Dict[str, Any]) -> Any:
+def json_to_span(data: dict[str, Any]) -> Any:
     """
     A hook for json.loads to convert a dict to a Span object.
     """
@@ -80,7 +80,9 @@ def json_to_span(data: Dict[str, Any]) -> Any:
                 attributes=event.get("attributes") or {},
                 timestamp=datetime.fromisoformat(event["timestamp"]),
             )
-            for event in data["events"]
+            for event in (
+                json.loads(data["events"]) if isinstance(data["events"], str) else data["events"]
+            )
         ]
         data["conversation"] = (
             SpanConversationAttributes(**data["conversation"])

arize-phoenix 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl

Potentially problematic release.

arize-phoenix 3.16.1py3-none-any.whl → 7.7.0py3-none-any.whl