arize-phoenix 3.16.1__py3-none-any.whl → 7.7.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of arize-phoenix might be problematic.
- arize_phoenix-7.7.1.dist-info/METADATA +261 -0
- arize_phoenix-7.7.1.dist-info/RECORD +345 -0
- {arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.1.dist-info}/WHEEL +1 -1
- arize_phoenix-7.7.1.dist-info/entry_points.txt +3 -0
- phoenix/__init__.py +86 -14
- phoenix/auth.py +309 -0
- phoenix/config.py +675 -45
- phoenix/core/model.py +32 -30
- phoenix/core/model_schema.py +102 -109
- phoenix/core/model_schema_adapter.py +48 -45
- phoenix/datetime_utils.py +24 -3
- phoenix/db/README.md +54 -0
- phoenix/db/__init__.py +4 -0
- phoenix/db/alembic.ini +85 -0
- phoenix/db/bulk_inserter.py +294 -0
- phoenix/db/engines.py +208 -0
- phoenix/db/enums.py +20 -0
- phoenix/db/facilitator.py +113 -0
- phoenix/db/helpers.py +159 -0
- phoenix/db/insertion/constants.py +2 -0
- phoenix/db/insertion/dataset.py +227 -0
- phoenix/db/insertion/document_annotation.py +171 -0
- phoenix/db/insertion/evaluation.py +191 -0
- phoenix/db/insertion/helpers.py +98 -0
- phoenix/db/insertion/span.py +193 -0
- phoenix/db/insertion/span_annotation.py +158 -0
- phoenix/db/insertion/trace_annotation.py +158 -0
- phoenix/db/insertion/types.py +256 -0
- phoenix/db/migrate.py +86 -0
- phoenix/db/migrations/data_migration_scripts/populate_project_sessions.py +199 -0
- phoenix/db/migrations/env.py +114 -0
- phoenix/db/migrations/script.py.mako +26 -0
- phoenix/db/migrations/versions/10460e46d750_datasets.py +317 -0
- phoenix/db/migrations/versions/3be8647b87d8_add_token_columns_to_spans_table.py +126 -0
- phoenix/db/migrations/versions/4ded9e43755f_create_project_sessions_table.py +66 -0
- phoenix/db/migrations/versions/cd164e83824f_users_and_tokens.py +157 -0
- phoenix/db/migrations/versions/cf03bd6bae1d_init.py +280 -0
- phoenix/db/models.py +807 -0
- phoenix/exceptions.py +5 -1
- phoenix/experiments/__init__.py +6 -0
- phoenix/experiments/evaluators/__init__.py +29 -0
- phoenix/experiments/evaluators/base.py +158 -0
- phoenix/experiments/evaluators/code_evaluators.py +184 -0
- phoenix/experiments/evaluators/llm_evaluators.py +473 -0
- phoenix/experiments/evaluators/utils.py +236 -0
- phoenix/experiments/functions.py +772 -0
- phoenix/experiments/tracing.py +86 -0
- phoenix/experiments/types.py +726 -0
- phoenix/experiments/utils.py +25 -0
- phoenix/inferences/__init__.py +0 -0
- phoenix/{datasets → inferences}/errors.py +6 -5
- phoenix/{datasets → inferences}/fixtures.py +49 -42
- phoenix/{datasets/dataset.py → inferences/inferences.py} +121 -105
- phoenix/{datasets → inferences}/schema.py +11 -11
- phoenix/{datasets → inferences}/validation.py +13 -14
- phoenix/logging/__init__.py +3 -0
- phoenix/logging/_config.py +90 -0
- phoenix/logging/_filter.py +6 -0
- phoenix/logging/_formatter.py +69 -0
- phoenix/metrics/__init__.py +5 -4
- phoenix/metrics/binning.py +4 -3
- phoenix/metrics/metrics.py +2 -1
- phoenix/metrics/mixins.py +7 -6
- phoenix/metrics/retrieval_metrics.py +2 -1
- phoenix/metrics/timeseries.py +5 -4
- phoenix/metrics/wrappers.py +9 -3
- phoenix/pointcloud/clustering.py +5 -5
- phoenix/pointcloud/pointcloud.py +7 -5
- phoenix/pointcloud/projectors.py +5 -6
- phoenix/pointcloud/umap_parameters.py +53 -52
- phoenix/server/api/README.md +28 -0
- phoenix/server/api/auth.py +44 -0
- phoenix/server/api/context.py +152 -9
- phoenix/server/api/dataloaders/__init__.py +91 -0
- phoenix/server/api/dataloaders/annotation_summaries.py +139 -0
- phoenix/server/api/dataloaders/average_experiment_run_latency.py +54 -0
- phoenix/server/api/dataloaders/cache/__init__.py +3 -0
- phoenix/server/api/dataloaders/cache/two_tier_cache.py +68 -0
- phoenix/server/api/dataloaders/dataset_example_revisions.py +131 -0
- phoenix/server/api/dataloaders/dataset_example_spans.py +38 -0
- phoenix/server/api/dataloaders/document_evaluation_summaries.py +144 -0
- phoenix/server/api/dataloaders/document_evaluations.py +31 -0
- phoenix/server/api/dataloaders/document_retrieval_metrics.py +89 -0
- phoenix/server/api/dataloaders/experiment_annotation_summaries.py +79 -0
- phoenix/server/api/dataloaders/experiment_error_rates.py +58 -0
- phoenix/server/api/dataloaders/experiment_run_annotations.py +36 -0
- phoenix/server/api/dataloaders/experiment_run_counts.py +49 -0
- phoenix/server/api/dataloaders/experiment_sequence_number.py +44 -0
- phoenix/server/api/dataloaders/latency_ms_quantile.py +188 -0
- phoenix/server/api/dataloaders/min_start_or_max_end_times.py +85 -0
- phoenix/server/api/dataloaders/project_by_name.py +31 -0
- phoenix/server/api/dataloaders/record_counts.py +116 -0
- phoenix/server/api/dataloaders/session_io.py +79 -0
- phoenix/server/api/dataloaders/session_num_traces.py +30 -0
- phoenix/server/api/dataloaders/session_num_traces_with_error.py +32 -0
- phoenix/server/api/dataloaders/session_token_usages.py +41 -0
- phoenix/server/api/dataloaders/session_trace_latency_ms_quantile.py +55 -0
- phoenix/server/api/dataloaders/span_annotations.py +26 -0
- phoenix/server/api/dataloaders/span_dataset_examples.py +31 -0
- phoenix/server/api/dataloaders/span_descendants.py +57 -0
- phoenix/server/api/dataloaders/span_projects.py +33 -0
- phoenix/server/api/dataloaders/token_counts.py +124 -0
- phoenix/server/api/dataloaders/trace_by_trace_ids.py +25 -0
- phoenix/server/api/dataloaders/trace_root_spans.py +32 -0
- phoenix/server/api/dataloaders/user_roles.py +30 -0
- phoenix/server/api/dataloaders/users.py +33 -0
- phoenix/server/api/exceptions.py +48 -0
- phoenix/server/api/helpers/__init__.py +12 -0
- phoenix/server/api/helpers/dataset_helpers.py +217 -0
- phoenix/server/api/helpers/experiment_run_filters.py +763 -0
- phoenix/server/api/helpers/playground_clients.py +948 -0
- phoenix/server/api/helpers/playground_registry.py +70 -0
- phoenix/server/api/helpers/playground_spans.py +455 -0
- phoenix/server/api/input_types/AddExamplesToDatasetInput.py +16 -0
- phoenix/server/api/input_types/AddSpansToDatasetInput.py +14 -0
- phoenix/server/api/input_types/ChatCompletionInput.py +38 -0
- phoenix/server/api/input_types/ChatCompletionMessageInput.py +24 -0
- phoenix/server/api/input_types/ClearProjectInput.py +15 -0
- phoenix/server/api/input_types/ClusterInput.py +2 -2
- phoenix/server/api/input_types/CreateDatasetInput.py +12 -0
- phoenix/server/api/input_types/CreateSpanAnnotationInput.py +18 -0
- phoenix/server/api/input_types/CreateTraceAnnotationInput.py +18 -0
- phoenix/server/api/input_types/DataQualityMetricInput.py +5 -2
- phoenix/server/api/input_types/DatasetExampleInput.py +14 -0
- phoenix/server/api/input_types/DatasetSort.py +17 -0
- phoenix/server/api/input_types/DatasetVersionSort.py +16 -0
- phoenix/server/api/input_types/DeleteAnnotationsInput.py +7 -0
- phoenix/server/api/input_types/DeleteDatasetExamplesInput.py +13 -0
- phoenix/server/api/input_types/DeleteDatasetInput.py +7 -0
- phoenix/server/api/input_types/DeleteExperimentsInput.py +7 -0
- phoenix/server/api/input_types/DimensionFilter.py +4 -4
- phoenix/server/api/input_types/GenerativeModelInput.py +17 -0
- phoenix/server/api/input_types/Granularity.py +1 -1
- phoenix/server/api/input_types/InvocationParameters.py +162 -0
- phoenix/server/api/input_types/PatchAnnotationInput.py +19 -0
- phoenix/server/api/input_types/PatchDatasetExamplesInput.py +35 -0
- phoenix/server/api/input_types/PatchDatasetInput.py +14 -0
- phoenix/server/api/input_types/PerformanceMetricInput.py +5 -2
- phoenix/server/api/input_types/ProjectSessionSort.py +29 -0
- phoenix/server/api/input_types/SpanAnnotationSort.py +17 -0
- phoenix/server/api/input_types/SpanSort.py +134 -69
- phoenix/server/api/input_types/TemplateOptions.py +10 -0
- phoenix/server/api/input_types/TraceAnnotationSort.py +17 -0
- phoenix/server/api/input_types/UserRoleInput.py +9 -0
- phoenix/server/api/mutations/__init__.py +28 -0
- phoenix/server/api/mutations/api_key_mutations.py +167 -0
- phoenix/server/api/mutations/chat_mutations.py +593 -0
- phoenix/server/api/mutations/dataset_mutations.py +591 -0
- phoenix/server/api/mutations/experiment_mutations.py +75 -0
- phoenix/server/api/{types/ExportEventsMutation.py → mutations/export_events_mutations.py} +21 -18
- phoenix/server/api/mutations/project_mutations.py +57 -0
- phoenix/server/api/mutations/span_annotations_mutations.py +128 -0
- phoenix/server/api/mutations/trace_annotations_mutations.py +127 -0
- phoenix/server/api/mutations/user_mutations.py +329 -0
- phoenix/server/api/openapi/__init__.py +0 -0
- phoenix/server/api/openapi/main.py +17 -0
- phoenix/server/api/openapi/schema.py +16 -0
- phoenix/server/api/queries.py +738 -0
- phoenix/server/api/routers/__init__.py +11 -0
- phoenix/server/api/routers/auth.py +284 -0
- phoenix/server/api/routers/embeddings.py +26 -0
- phoenix/server/api/routers/oauth2.py +488 -0
- phoenix/server/api/routers/v1/__init__.py +64 -0
- phoenix/server/api/routers/v1/datasets.py +1017 -0
- phoenix/server/api/routers/v1/evaluations.py +362 -0
- phoenix/server/api/routers/v1/experiment_evaluations.py +115 -0
- phoenix/server/api/routers/v1/experiment_runs.py +167 -0
- phoenix/server/api/routers/v1/experiments.py +308 -0
- phoenix/server/api/routers/v1/pydantic_compat.py +78 -0
- phoenix/server/api/routers/v1/spans.py +267 -0
- phoenix/server/api/routers/v1/traces.py +208 -0
- phoenix/server/api/routers/v1/utils.py +95 -0
- phoenix/server/api/schema.py +44 -241
- phoenix/server/api/subscriptions.py +597 -0
- phoenix/server/api/types/Annotation.py +21 -0
- phoenix/server/api/types/AnnotationSummary.py +55 -0
- phoenix/server/api/types/AnnotatorKind.py +16 -0
- phoenix/server/api/types/ApiKey.py +27 -0
- phoenix/server/api/types/AuthMethod.py +9 -0
- phoenix/server/api/types/ChatCompletionMessageRole.py +11 -0
- phoenix/server/api/types/ChatCompletionSubscriptionPayload.py +46 -0
- phoenix/server/api/types/Cluster.py +25 -24
- phoenix/server/api/types/CreateDatasetPayload.py +8 -0
- phoenix/server/api/types/DataQualityMetric.py +31 -13
- phoenix/server/api/types/Dataset.py +288 -63
- phoenix/server/api/types/DatasetExample.py +85 -0
- phoenix/server/api/types/DatasetExampleRevision.py +34 -0
- phoenix/server/api/types/DatasetVersion.py +14 -0
- phoenix/server/api/types/Dimension.py +32 -31
- phoenix/server/api/types/DocumentEvaluationSummary.py +9 -8
- phoenix/server/api/types/EmbeddingDimension.py +56 -49
- phoenix/server/api/types/Evaluation.py +25 -31
- phoenix/server/api/types/EvaluationSummary.py +30 -50
- phoenix/server/api/types/Event.py +20 -20
- phoenix/server/api/types/ExampleRevisionInterface.py +14 -0
- phoenix/server/api/types/Experiment.py +152 -0
- phoenix/server/api/types/ExperimentAnnotationSummary.py +13 -0
- phoenix/server/api/types/ExperimentComparison.py +17 -0
- phoenix/server/api/types/ExperimentRun.py +119 -0
- phoenix/server/api/types/ExperimentRunAnnotation.py +56 -0
- phoenix/server/api/types/GenerativeModel.py +9 -0
- phoenix/server/api/types/GenerativeProvider.py +85 -0
- phoenix/server/api/types/Inferences.py +80 -0
- phoenix/server/api/types/InferencesRole.py +23 -0
- phoenix/server/api/types/LabelFraction.py +7 -0
- phoenix/server/api/types/MimeType.py +2 -2
- phoenix/server/api/types/Model.py +54 -54
- phoenix/server/api/types/PerformanceMetric.py +8 -5
- phoenix/server/api/types/Project.py +407 -142
- phoenix/server/api/types/ProjectSession.py +139 -0
- phoenix/server/api/types/Segments.py +4 -4
- phoenix/server/api/types/Span.py +221 -176
- phoenix/server/api/types/SpanAnnotation.py +43 -0
- phoenix/server/api/types/SpanIOValue.py +15 -0
- phoenix/server/api/types/SystemApiKey.py +9 -0
- phoenix/server/api/types/TemplateLanguage.py +10 -0
- phoenix/server/api/types/TimeSeries.py +19 -15
- phoenix/server/api/types/TokenUsage.py +11 -0
- phoenix/server/api/types/Trace.py +154 -0
- phoenix/server/api/types/TraceAnnotation.py +45 -0
- phoenix/server/api/types/UMAPPoints.py +7 -7
- phoenix/server/api/types/User.py +60 -0
- phoenix/server/api/types/UserApiKey.py +45 -0
- phoenix/server/api/types/UserRole.py +15 -0
- phoenix/server/api/types/node.py +4 -112
- phoenix/server/api/types/pagination.py +156 -57
- phoenix/server/api/utils.py +34 -0
- phoenix/server/app.py +864 -115
- phoenix/server/bearer_auth.py +163 -0
- phoenix/server/dml_event.py +136 -0
- phoenix/server/dml_event_handler.py +256 -0
- phoenix/server/email/__init__.py +0 -0
- phoenix/server/email/sender.py +97 -0
- phoenix/server/email/templates/__init__.py +0 -0
- phoenix/server/email/templates/password_reset.html +19 -0
- phoenix/server/email/types.py +11 -0
- phoenix/server/grpc_server.py +102 -0
- phoenix/server/jwt_store.py +505 -0
- phoenix/server/main.py +305 -116
- phoenix/server/oauth2.py +52 -0
- phoenix/server/openapi/__init__.py +0 -0
- phoenix/server/prometheus.py +111 -0
- phoenix/server/rate_limiters.py +188 -0
- phoenix/server/static/.vite/manifest.json +87 -0
- phoenix/server/static/assets/components-Cy9nwIvF.js +2125 -0
- phoenix/server/static/assets/index-BKvHIxkk.js +113 -0
- phoenix/server/static/assets/pages-CUi2xCVQ.js +4449 -0
- phoenix/server/static/assets/vendor-DvC8cT4X.js +894 -0
- phoenix/server/static/assets/vendor-DxkFTwjz.css +1 -0
- phoenix/server/static/assets/vendor-arizeai-Do1793cv.js +662 -0
- phoenix/server/static/assets/vendor-codemirror-BzwZPyJM.js +24 -0
- phoenix/server/static/assets/vendor-recharts-_Jb7JjhG.js +59 -0
- phoenix/server/static/assets/vendor-shiki-Cl9QBraO.js +5 -0
- phoenix/server/static/assets/vendor-three-DwGkEfCM.js +2998 -0
- phoenix/server/telemetry.py +68 -0
- phoenix/server/templates/index.html +82 -23
- phoenix/server/thread_server.py +3 -3
- phoenix/server/types.py +275 -0
- phoenix/services.py +27 -18
- phoenix/session/client.py +743 -68
- phoenix/session/data_extractor.py +31 -7
- phoenix/session/evaluation.py +3 -9
- phoenix/session/session.py +263 -219
- phoenix/settings.py +22 -0
- phoenix/trace/__init__.py +2 -22
- phoenix/trace/attributes.py +338 -0
- phoenix/trace/dsl/README.md +116 -0
- phoenix/trace/dsl/filter.py +663 -213
- phoenix/trace/dsl/helpers.py +73 -21
- phoenix/trace/dsl/query.py +574 -201
- phoenix/trace/exporter.py +24 -19
- phoenix/trace/fixtures.py +368 -32
- phoenix/trace/otel.py +71 -219
- phoenix/trace/projects.py +3 -2
- phoenix/trace/schemas.py +33 -11
- phoenix/trace/span_evaluations.py +21 -16
- phoenix/trace/span_json_decoder.py +6 -4
- phoenix/trace/span_json_encoder.py +2 -2
- phoenix/trace/trace_dataset.py +47 -32
- phoenix/trace/utils.py +21 -4
- phoenix/utilities/__init__.py +0 -26
- phoenix/utilities/client.py +132 -0
- phoenix/utilities/deprecation.py +31 -0
- phoenix/utilities/error_handling.py +3 -2
- phoenix/utilities/json.py +109 -0
- phoenix/utilities/logging.py +8 -0
- phoenix/utilities/project.py +2 -2
- phoenix/utilities/re.py +49 -0
- phoenix/utilities/span_store.py +0 -23
- phoenix/utilities/template_formatters.py +99 -0
- phoenix/version.py +1 -1
- arize_phoenix-3.16.1.dist-info/METADATA +0 -495
- arize_phoenix-3.16.1.dist-info/RECORD +0 -178
- phoenix/core/project.py +0 -619
- phoenix/core/traces.py +0 -96
- phoenix/experimental/evals/__init__.py +0 -73
- phoenix/experimental/evals/evaluators.py +0 -413
- phoenix/experimental/evals/functions/__init__.py +0 -4
- phoenix/experimental/evals/functions/classify.py +0 -453
- phoenix/experimental/evals/functions/executor.py +0 -353
- phoenix/experimental/evals/functions/generate.py +0 -138
- phoenix/experimental/evals/functions/processing.py +0 -76
- phoenix/experimental/evals/models/__init__.py +0 -14
- phoenix/experimental/evals/models/anthropic.py +0 -175
- phoenix/experimental/evals/models/base.py +0 -170
- phoenix/experimental/evals/models/bedrock.py +0 -221
- phoenix/experimental/evals/models/litellm.py +0 -134
- phoenix/experimental/evals/models/openai.py +0 -448
- phoenix/experimental/evals/models/rate_limiters.py +0 -246
- phoenix/experimental/evals/models/vertex.py +0 -173
- phoenix/experimental/evals/models/vertexai.py +0 -186
- phoenix/experimental/evals/retrievals.py +0 -96
- phoenix/experimental/evals/templates/__init__.py +0 -50
- phoenix/experimental/evals/templates/default_templates.py +0 -472
- phoenix/experimental/evals/templates/template.py +0 -195
- phoenix/experimental/evals/utils/__init__.py +0 -172
- phoenix/experimental/evals/utils/threads.py +0 -27
- phoenix/server/api/helpers.py +0 -11
- phoenix/server/api/routers/evaluation_handler.py +0 -109
- phoenix/server/api/routers/span_handler.py +0 -70
- phoenix/server/api/routers/trace_handler.py +0 -60
- phoenix/server/api/types/DatasetRole.py +0 -23
- phoenix/server/static/index.css +0 -6
- phoenix/server/static/index.js +0 -7447
- phoenix/storage/span_store/__init__.py +0 -23
- phoenix/storage/span_store/text_file.py +0 -85
- phoenix/trace/dsl/missing.py +0 -60
- phoenix/trace/langchain/__init__.py +0 -3
- phoenix/trace/langchain/instrumentor.py +0 -35
- phoenix/trace/llama_index/__init__.py +0 -3
- phoenix/trace/llama_index/callback.py +0 -102
- phoenix/trace/openai/__init__.py +0 -3
- phoenix/trace/openai/instrumentor.py +0 -30
- {arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.1.dist-info}/licenses/IP_NOTICE +0 -0
- {arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.1.dist-info}/licenses/LICENSE +0 -0
- /phoenix/{datasets → db/insertion}/__init__.py +0 -0
- /phoenix/{experimental → db/migrations}/__init__.py +0 -0
- /phoenix/{storage → db/migrations/data_migration_scripts}/__init__.py +0 -0
phoenix/trace/exporter.py
CHANGED
@@ -7,16 +7,19 @@ from types import MethodType
 from typing import Any, Optional
 from urllib.parse import urljoin
 
-import
+import httpx
 from opentelemetry.exporter.otlp.proto.http.trace_exporter import OTLPSpanExporter
-from requests import Session
 from typing_extensions import TypeAlias, assert_never
 
 import phoenix.trace.v1 as pb
-from phoenix.config import
+from phoenix.config import (
+    get_env_client_headers,
+    get_env_collector_endpoint,
+    get_env_host,
+    get_env_port,
+)
 
 logger = logging.getLogger(__name__)
-logger.addHandler(logging.NullHandler())
 
 END_OF_QUEUE = None  # sentinel value for queue termination
 
@@ -33,11 +36,11 @@ class _OpenInferenceExporter(OTLPSpanExporter):
         host = get_env_host()
         if host == "0.0.0.0":
             host = "127.0.0.1"
-
-
-
-
-
+        base_url = get_env_collector_endpoint() or f"http://{host}:{get_env_port()}"
+        base_url = base_url if base_url.endswith("/") else base_url + "/"
+        _warn_if_phoenix_is_not_running(base_url)
+
+        endpoint = urljoin(base_url, "v1/traces")
         super().__init__(endpoint)
 
 
@@ -68,15 +71,17 @@ class HttpExporter:
         """
         self._host = host or get_env_host()
         self._port = port or get_env_port()
-
+        base_url = (
             endpoint
             or get_env_collector_endpoint()
             or f"http://{'127.0.0.1' if self._host == '0.0.0.0' else self._host}:{self._port}"
         )
+        self._base_url = base_url if base_url.endswith("/") else base_url + "/"
         _warn_if_phoenix_is_not_running(self._base_url)
-
-
-        self.
+        headers = get_env_client_headers()
+        self._client = httpx.Client(headers=headers)
+        weakref.finalize(self, self._client.close)
+        self._client.headers.update(
             {
                 "content-type": "application/x-protobuf",
                 "content-encoding": "gzip",
@@ -109,24 +114,24 @@ class HttpExporter:
 
     def _send(self, message: Message) -> None:
         serialized = message.SerializeToString()
-
+        content = gzip.compress(serialized)
         try:
-            self.
+            self._client.post(self._url(message), content=content).raise_for_status()
         except Exception as e:
             logger.exception(e)
 
     def _url(self, message: Message) -> str:
         if isinstance(message, pb.Evaluation):
-            return urljoin(self._base_url, "
+            return urljoin(self._base_url, "v1/evaluations")
         logger.exception(f"unrecognized message type: {type(message)}")
         assert_never(message)
 
 
-def _warn_if_phoenix_is_not_running(
+def _warn_if_phoenix_is_not_running(base_url: str) -> None:
     try:
-
+        httpx.get(urljoin(base_url, "arize_phoenix_version")).raise_for_status()
     except Exception:
         logger.warning(
-            f"Arize Phoenix is not running on {
+            f"Arize Phoenix is not running on {base_url}. Launch Phoenix "
             f"with `import phoenix as px; px.launch_app()`"
         )
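The main behavioral change above is that the exporter now resolves its base URL from `get_env_collector_endpoint()` (falling back to host and port), normalizes the trailing slash, and joins the `v1/traces` / `v1/evaluations` paths with `urljoin`. The sketch below isolates that resolution logic; it is a minimal illustration rather than code from the package, and the helper name and default port are assumptions.

```python
# Minimal sketch of the endpoint resolution the updated exporter performs.
# resolve_traces_endpoint and the default port 6006 are illustrative
# assumptions; in the diff the values come from phoenix.config helpers
# (get_env_collector_endpoint, get_env_host, get_env_port).
from urllib.parse import urljoin


def resolve_traces_endpoint(collector_endpoint=None, host="127.0.0.1", port=6006):
    # Prefer an explicit collector endpoint, otherwise fall back to host/port.
    base_url = collector_endpoint or f"http://{host}:{port}"
    # Normalize the trailing slash so urljoin preserves the base path.
    base_url = base_url if base_url.endswith("/") else base_url + "/"
    return urljoin(base_url, "v1/traces")


assert resolve_traces_endpoint() == "http://127.0.0.1:6006/v1/traces"
assert resolve_traces_endpoint("http://phoenix.example.com:6006") == (
    "http://phoenix.example.com:6006/v1/traces"
)
```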
phoenix/trace/fixtures.py
CHANGED
@@ -1,13 +1,37 @@
-
-
-from
+import logging
+import shutil
+from binascii import hexlify
+from collections import defaultdict
+from collections.abc import Iterable, Iterator, Sequence
+from dataclasses import dataclass, field, replace
+from datetime import datetime, timezone
+from io import StringIO
+from random import getrandbits
+from tempfile import NamedTemporaryFile
+from time import sleep, time
+from typing import (
+    NamedTuple,
+    Optional,
+    cast,
+)
+from urllib.parse import urljoin
 
+import httpx
 import pandas as pd
 from google.protobuf.wrappers_pb2 import DoubleValue, StringValue
+from httpx import ConnectError, HTTPStatusError
 
 import phoenix.trace.v1 as pb
+from phoenix.session.client import Client
+from phoenix.trace.schemas import Span
 from phoenix.trace.trace_dataset import TraceDataset
-from phoenix.trace.utils import
+from phoenix.trace.utils import (
+    download_json_traces_fixture,
+    json_lines_to_df,
+    parse_file_extension,
+)
+
+logger = logging.getLogger(__name__)
 
 
 class EvaluationResultSchema(NamedTuple):
@@ -28,18 +52,130 @@ class DocumentEvaluationFixture(EvaluationFixture):
     document_position: str = "document_position"
 
 
+@dataclass(frozen=True)
+class DatasetFixture:
+    file_name: str
+    name: str
+    input_keys: Sequence[str]
+    output_keys: Sequence[str]
+    metadata_keys: Sequence[str] = ()
+    description: Optional[str] = field(default=None)
+    _df: Optional[pd.DataFrame] = field(default=None, init=False, repr=False)
+    _csv: Optional[str] = field(default=None, init=False, repr=False)
+
+    def load(self) -> "DatasetFixture":
+        if self._df is None:
+            url = _url(self.file_name)
+
+            if parse_file_extension(self.file_name) == ".jsonl":
+                df = json_lines_to_df(download_json_traces_fixture(url))
+            elif parse_file_extension(self.file_name) == ".csv":
+                df = pd.read_csv(_url(self.file_name))
+            else:
+                try:
+                    df = pd.read_parquet(url)
+                except Exception:
+                    logger.warning(
+                        f"Failed to download example traces from {url=} "
+                        "due to exception {e=}. "
+                        "Returning empty dataframe for DatasetFixture"
+                    )
+                    df = pd.DataFrame()
+
+            object.__setattr__(self, "_df", df)
+        return self
+
+    @property
+    def dataframe(self) -> pd.DataFrame:
+        self.load()
+        return cast(pd.DataFrame, self._df).copy(deep=False)
+
+    @property
+    def csv(self) -> StringIO:
+        if self._csv is None:
+            with StringIO() as buffer:
+                self.dataframe.to_csv(buffer, index=False)
+                object.__setattr__(self, "_csv", buffer.getvalue())
+        return StringIO(self._csv)
+
+
 @dataclass(frozen=True)
 class TracesFixture:
     name: str
     description: str
     file_name: str
     evaluation_fixtures: Iterable[EvaluationFixture] = ()
+    dataset_fixtures: Iterable[DatasetFixture] = ()
+    project_name: Optional[str] = None
+
+
+demo_llama_index_rag_fixture = TracesFixture(
+    name="demo_llama_index_rag",
+    project_name="demo_llama_index",
+    description="Traces and evaluations of a RAG chatbot using LlamaIndex.",
+    file_name="demo_llama_index_rag_traces.parquet",
+    evaluation_fixtures=(
+        EvaluationFixture(
+            evaluation_name="Q&A Correctness",
+            file_name="demo_llama_index_rag_qa_correctness_eval.parquet",
+        ),
+        EvaluationFixture(
+            evaluation_name="Hallucination",
+            file_name="demo_llama_index_rag_hallucination_eval.parquet",
+        ),
+        DocumentEvaluationFixture(
+            evaluation_name="Relevance",
+            file_name="demo_llama_index_rag_doc_relevance_eval.parquet",
+        ),
+    ),
+    dataset_fixtures=(
+        DatasetFixture(
+            file_name="demo_llama_index_finetune_dataset.jsonl",
+            input_keys=("messages",),
+            output_keys=("messages",),
+            name="Demo LlamaIndex: RAG Q&A",
+            description="OpenAI GPT-3.5 LLM dataset for LlamaIndex demo",
+        ),
+    ),
+)
+
+demo_code_based_agent_fixture = TracesFixture(
+    name="demo_code_based_agent",
+    project_name="demo_agents",
+    description="LangGraph, LlamaIndex, and Code-based agent traces",
+    file_name="agent-demo-traces.parquet",
+)
+demo_langgraph_agent_fixture = TracesFixture(
+    name="demo_langgraph_agent",
+    project_name="demo_agents",
+    description="LangGraph, LlamaIndex, and Code-based agent traces",
+    file_name="langgraph-demo-traces-format-updated.parquet",
+)
+demo_llamaindex_workflows_agent_fixture = TracesFixture(
+    name="demo_llamaindex_workflows_agent",
+    project_name="demo_agents",
+    description="LangGraph, LlamaIndex, and Code-based agent traces",
+    file_name="llamaindex-workflow-demo-traces.parquet",
+)
+
+demo_o1_preview_timeseries_testing_fixture = TracesFixture(
+    name="demo_o1_preview_timeseries_evals",
+    project_name="demo_o1_preview_timeseries",
+    description="Shows the traces for a timeseries evaluation of o1-preview",
+    file_name="o1-traces-preview-testing.parquet",
+)
 
+demo_llama_index_rag_llm_fixture = TracesFixture(
+    name="demo_llama_index_rag_llm",
+    project_name="demo_llama_index_rag_llm",
+    description="LLM traces for RAG chatbot using LlamaIndex.",
+    file_name="demo_llama_index_llm_all_spans.parquet",
+)
 
 llama_index_rag_fixture = TracesFixture(
     name="llama_index_rag",
     description="Traces from running the llama_index on a RAG use case.",
-    file_name="llama_index_rag_v8.
+    file_name="llama_index_rag_v8.parquet",
     evaluation_fixtures=(
         EvaluationFixture(
             evaluation_name="Q&A Correctness",
@@ -54,45 +190,104 @@ llama_index_rag_fixture = TracesFixture(
             file_name="llama_index_rag_v8.retrieved_documents_eval.parquet",
         ),
     ),
+    dataset_fixtures=(
+        DatasetFixture(
+            file_name="hybridial_samples.csv.gz",
+            input_keys=("messages", "ctxs"),
+            output_keys=("answers",),
+            name="ChatRAG-Bench: Hybrid Dialogue (samples)",
+            description="https://huggingface.co/datasets/nvidia/ChatRAG-Bench/viewer/hybridial",
+        ),
+        DatasetFixture(
+            file_name="sqa_samples.csv.gz",
+            input_keys=("messages", "ctxs"),
+            output_keys=("answers",),
+            name="ChatRAG-Bench: SQA (samples)",
+            description="https://huggingface.co/datasets/nvidia/ChatRAG-Bench/viewer/sqa",
+        ),
+        DatasetFixture(
+            file_name="doqa_cooking_samples.csv.gz",
+            input_keys=("messages", "ctxs"),
+            output_keys=("answers",),
+            name="ChatRAG-Bench: DoQA Cooking (samples)",
+            description="https://huggingface.co/datasets/nvidia/ChatRAG-Bench/viewer/doqa_cooking",
+        ),
+        DatasetFixture(
+            file_name="synthetic_convqa_samples.csv.gz",
+            input_keys=("messages", "document"),
+            output_keys=("answers",),
+            name="ChatQA-Train: Synthetic ConvQA (samples)",
+            description="https://huggingface.co/datasets/nvidia/ChatQA-Training-Data/viewer/synthetic_convqa",
+        ),
+    ),
+)
+
+project_sessions_llama_index_rag_arize_docs_fixture = TracesFixture(
+    name="project_sessions_llama_index_rag_arize_docs",
+    project_name="SESSIONS-DEMO",
+    file_name="project_sessions_demo_llama_index_query_engine_arize_docs.parquet",
+    description="RAG queries grouped by session.id and user.id.",
 )
 
 llama_index_calculator_agent_fixture = TracesFixture(
     name="llama_index_calculator_agent",
     description="Traces from running the llama_index with calculator tools.",
-    file_name="llama_index_calculator_agent_v3.
+    file_name="llama_index_calculator_agent_v3.parquet",
 )
 
 llama_index_rag_fixture_with_davinci = TracesFixture(
     name="llama_index_rag_with_davinci",
     description="Traces from running llama_index on a RAG use case with the completions API.",
-    file_name="llama_index_rag_with_davinci_v0.
+    file_name="llama_index_rag_with_davinci_v0.parquet",
 )
 
 langchain_rag_stuff_document_chain_fixture = TracesFixture(
     name="langchain_rag_stuff_document_chain",
+    project_name="demo_langchain_rag",
     description="LangChain RAG data",
-    file_name="langchain_rag.
+    file_name="langchain_rag.parquet",
 )
 
 langchain_titanic_csv_agent_evaluator_fixture = TracesFixture(
     name="lc_titanic",
     description="LangChain titanic.csv Agent Evaluator",
-    file_name="lc_titanic.
+    file_name="lc_titanic.parquet",
 )
 
 langchain_qa_with_sources_fixture = TracesFixture(
     name="langchain_qa_with_sources",
     description="LangChain QA with sources on financial data",
-    file_name="langchain_qa_with_sources_chain.
+    file_name="langchain_qa_with_sources_chain.parquet",
+)
+
+vision_fixture = TracesFixture(
+    name="vision",
+    project_name="demo_multimodal",
+    description="Vision LLM Requests",
+    file_name="vision_fixture_trace_datasets.parquet",
+)
+
+anthropic_tools_fixture = TracesFixture(
+    name="anthropic_tools",
+    project_name="anthropic_tools",
+    description="Anthropic tools traces",
+    file_name="anthropic_tools.parquet",
 )
 
 random_fixture = TracesFixture(
     name="random",
+    project_name="demo_random",
     description="Randomly generated traces",
     file_name="random.jsonl",
 )
 
-TRACES_FIXTURES:
+TRACES_FIXTURES: list[TracesFixture] = [
+    demo_llama_index_rag_fixture,
+    demo_llama_index_rag_llm_fixture,
+    demo_langgraph_agent_fixture,
+    demo_code_based_agent_fixture,
+    demo_llamaindex_workflows_agent_fixture,
+    demo_o1_preview_timeseries_testing_fixture,
     llama_index_rag_fixture,
     llama_index_rag_fixture_with_davinci,
     langchain_rag_stuff_document_chain_fixture,
@@ -100,14 +295,23 @@ TRACES_FIXTURES: List[TracesFixture] = [
     random_fixture,
     langchain_qa_with_sources_fixture,
     llama_index_calculator_agent_fixture,
+    vision_fixture,
+    anthropic_tools_fixture,
+    project_sessions_llama_index_rag_arize_docs_fixture,
 ]
 
-NAME_TO_TRACES_FIXTURE
+NAME_TO_TRACES_FIXTURE: dict[str, TracesFixture] = {
+    fixture.name: fixture for fixture in TRACES_FIXTURES
+}
+PROJ_NAME_TO_TRACES_FIXTURE: defaultdict[str, list[TracesFixture]] = defaultdict(list)
+for fixture in TRACES_FIXTURES:
+    if fixture.project_name:
+        PROJ_NAME_TO_TRACES_FIXTURE[fixture.project_name].append(fixture)
 
 
-def
+def get_trace_fixture_by_name(fixture_name: str) -> TracesFixture:
     """
-    Returns the fixture whose name matches the input name.
+    Returns the trace fixture whose name matches the input name.
 
     Raises
     ------
@@ -120,31 +324,105 @@ def _get_trace_fixture_by_name(fixture_name: str) -> TracesFixture:
     return NAME_TO_TRACES_FIXTURE[fixture_name]
 
 
-def
-    fixture: TracesFixture,
-    host: Optional[str] = "https://storage.googleapis.com/",
-    bucket: Optional[str] = "arize-assets",
-    prefix: Optional[str] = "phoenix/traces/",
-) -> List[str]:
+def get_trace_fixtures_by_project_name(proj_name: str) -> list[TracesFixture]:
     """
-
+    Returns a dictionary of project name (key) and set of TracesFixtures (value)
+    whose project name matches the input name.
+
+    Raises
+    ------
+    ValueError
+        if the input fixture name does not match any known project names.
     """
-
-
-
+    if proj_name not in PROJ_NAME_TO_TRACES_FIXTURE:
+        valid_fixture_proj_names = ", ".join(PROJ_NAME_TO_TRACES_FIXTURE.keys())
+        raise ValueError(
+            f'"{proj_name}" is invalid. Valid project names are: {valid_fixture_proj_names}'
+        )
+    return PROJ_NAME_TO_TRACES_FIXTURE[proj_name]
 
 
-def load_example_traces(
+def load_example_traces(fixture_name: str) -> TraceDataset:
     """
     Loads a trace dataframe by name.
     """
-    fixture =
-
+    fixture = get_trace_fixture_by_name(fixture_name)
+    url = _url(fixture.file_name)
+
+    if parse_file_extension(fixture.file_name) == ".jsonl":
+        return TraceDataset(json_lines_to_df(download_json_traces_fixture(url)))
+
+    try:
+        df = pd.read_parquet(url)
+    except Exception as e:
+        logger.warning(
+            f"Failed to download example traces from {url=} due to exception {e=}. "
+            "Returning empty TraceDataset"
+        )
+        df = pd.DataFrame()
+
+    return TraceDataset(df)
+
+
+def get_dataset_fixtures(fixture_name: str) -> Iterable[DatasetFixture]:
+    return (fixture.load() for fixture in get_trace_fixture_by_name(fixture_name).dataset_fixtures)
+
+
+def send_dataset_fixtures(
+    endpoint: str,
+    fixtures: Iterable[DatasetFixture],
+) -> None:
+    expiration = time() + 5
+    while time() < expiration:
+        try:
+            url = urljoin(endpoint, "/healthz")
+            httpx.get(url=url).raise_for_status()
+        except ConnectError:
+            sleep(0.1)
+            continue
+        except Exception as e:
+            print(str(e))
+            raise
+        break
+    client = Client(endpoint=endpoint)
+    for i, fixture in enumerate(fixtures):
+        try:
+            if i % 2:
+                client.upload_dataset(
+                    dataset_name=fixture.name,
+                    dataframe=fixture.dataframe,
+                    input_keys=fixture.input_keys,
+                    output_keys=fixture.output_keys,
+                    metadata_keys=fixture.metadata_keys,
+                    dataset_description=fixture.description,
+                )
+            else:
+                with NamedTemporaryFile() as tf:
+                    with open(tf.name, "w") as f:
+                        shutil.copyfileobj(fixture.csv, f)
+                        f.flush()
+                    client.upload_dataset(
+                        dataset_name=fixture.name,
+                        csv_file_path=tf.name,
+                        input_keys=fixture.input_keys,
+                        output_keys=fixture.output_keys,
+                        metadata_keys=fixture.metadata_keys,
+                        dataset_description=fixture.description,
+                    )
        except HTTPStatusError as e:
+            print(e.response.content.decode())
+            pass
+        else:
+            name, df = fixture.name, fixture.dataframe
+            print(f"Dataset sent: {name=}, {len(df)=}")
 
 
-def get_evals_from_fixture(
-    fixture =
+def get_evals_from_fixture(fixture_name: str) -> Iterator[pb.Evaluation]:
+    fixture = get_trace_fixture_by_name(fixture_name)
     for eval_fixture in fixture.evaluation_fixtures:
+        logger.info(
+            f"Loading eval fixture '{eval_fixture.evaluation_name}' from '{eval_fixture.file_name}'"
+        )
         yield from _read_eval_fixture(eval_fixture)
 
 
@@ -161,7 +439,7 @@ def _read_eval_fixture(eval_fixture: EvaluationFixture) -> Iterator[pb.Evaluation]:
             explanation=StringValue(value=cast(str, explanation)) if explanation else None,
         )
         if isinstance(eval_fixture, DocumentEvaluationFixture):
-            span_id, document_position = cast(
+            span_id, document_position = cast(tuple[str, int], index)
             # Legacy fixture files contain UUID strings for span_ids. The hyphens in these
             # strings need to be removed because we are also removing the hyphens from the
             # span_ids of their corresponding traces. In general, hyphen is not an allowed
@@ -191,7 +469,65 @@ def _read_eval_fixture(eval_fixture: EvaluationFixture) -> Iterator[pb.Evaluation]:
 def _url(
     file_name: str,
     host: Optional[str] = "https://storage.googleapis.com/",
-    bucket: Optional[str] = "arize-assets",
-    prefix: Optional[str] = "
+    bucket: Optional[str] = "arize-phoenix-assets",
+    prefix: Optional[str] = "traces/",
 ) -> str:
     return f"{host}{bucket}/{prefix}{file_name}"
+
+
+def reset_fixture_span_ids_and_timestamps(
+    spans: Iterable[Span],
+    evals: Iterable[pb.Evaluation] = (),
+) -> tuple[list[Span], list[pb.Evaluation]]:
+    old_spans, old_evals = list(spans), list(evals)
+    new_trace_ids: dict[str, str] = {}
+    new_span_ids: dict[str, str] = {}
+    for old_span in old_spans:
+        new_trace_ids[old_span.context.trace_id] = _new_trace_id()
+        new_span_ids[old_span.context.span_id] = _new_span_id()
+        if old_span.parent_id:
+            new_span_ids[old_span.parent_id] = _new_span_id()
+    for old_eval in old_evals:
+        subject_id = old_eval.subject_id
+        if trace_id := subject_id.trace_id:
+            new_trace_ids[trace_id] = _new_trace_id()
+        elif span_id := subject_id.span_id:
+            new_span_ids[span_id] = _new_span_id()
+        elif span_id := subject_id.document_retrieval_id.span_id:
+            new_span_ids[span_id] = _new_span_id()
+    max_end_time = max(old_span.end_time for old_span in old_spans)
+    time_diff = datetime.now(timezone.utc) - max_end_time
+    new_spans: list[Span] = []
+    new_evals: list[pb.Evaluation] = []
+    for old_span in old_spans:
+        new_trace_id = new_trace_ids[old_span.context.trace_id]
+        new_span_id = new_span_ids[old_span.context.span_id]
+        new_parent_id = new_span_ids[old_span.parent_id] if old_span.parent_id else None
+        new_span = replace(
+            old_span,
+            context=replace(old_span.context, trace_id=new_trace_id, span_id=new_span_id),
+            parent_id=new_parent_id,
+            start_time=old_span.start_time + time_diff,
+            end_time=old_span.end_time + time_diff,
+        )
+        new_spans.append(new_span)
+    for old_eval in old_evals:
+        new_eval = pb.Evaluation()
+        new_eval.CopyFrom(old_eval)
+        subject_id = new_eval.subject_id
+        if trace_id := subject_id.trace_id:
+            subject_id.trace_id = new_trace_ids[trace_id]
+        elif span_id := subject_id.span_id:
+            subject_id.span_id = new_span_ids[span_id]
+        elif span_id := subject_id.document_retrieval_id.span_id:
+            subject_id.document_retrieval_id.span_id = new_span_ids[span_id]
+        new_evals.append(new_eval)
+    return new_spans, new_evals
+
+
+def _new_trace_id() -> str:
+    return hexlify(getrandbits(128).to_bytes(16, "big")).decode()
+
+
+def _new_span_id() -> str:
+    return hexlify(getrandbits(64).to_bytes(8, "big")).decode()