arize-phoenix 4.4.4rc4__py3-none-any.whl → 4.4.4rc6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of arize-phoenix might be problematic.

Files changed (52)
  1. {arize_phoenix-4.4.4rc4.dist-info → arize_phoenix-4.4.4rc6.dist-info}/METADATA +12 -6
  2. {arize_phoenix-4.4.4rc4.dist-info → arize_phoenix-4.4.4rc6.dist-info}/RECORD +47 -42
  3. phoenix/config.py +21 -0
  4. phoenix/datetime_utils.py +4 -0
  5. phoenix/db/insertion/dataset.py +19 -16
  6. phoenix/db/insertion/evaluation.py +4 -4
  7. phoenix/db/insertion/helpers.py +4 -12
  8. phoenix/db/insertion/span.py +3 -3
  9. phoenix/db/migrations/versions/10460e46d750_datasets.py +2 -2
  10. phoenix/db/models.py +8 -3
  11. phoenix/experiments/__init__.py +6 -0
  12. phoenix/experiments/evaluators/__init__.py +29 -0
  13. phoenix/experiments/evaluators/base.py +153 -0
  14. phoenix/{datasets → experiments}/evaluators/code_evaluators.py +25 -53
  15. phoenix/{datasets → experiments}/evaluators/llm_evaluators.py +62 -31
  16. phoenix/experiments/evaluators/utils.py +189 -0
  17. phoenix/experiments/functions.py +616 -0
  18. phoenix/{datasets → experiments}/tracing.py +19 -0
  19. phoenix/experiments/types.py +722 -0
  20. phoenix/experiments/utils.py +9 -0
  21. phoenix/server/api/context.py +4 -0
  22. phoenix/server/api/dataloaders/__init__.py +4 -0
  23. phoenix/server/api/dataloaders/average_experiment_run_latency.py +54 -0
  24. phoenix/server/api/dataloaders/experiment_run_counts.py +42 -0
  25. phoenix/server/api/helpers/dataset_helpers.py +8 -7
  26. phoenix/server/api/input_types/ClearProjectInput.py +15 -0
  27. phoenix/server/api/mutations/project_mutations.py +9 -4
  28. phoenix/server/api/routers/v1/__init__.py +1 -1
  29. phoenix/server/api/routers/v1/dataset_examples.py +10 -10
  30. phoenix/server/api/routers/v1/datasets.py +152 -48
  31. phoenix/server/api/routers/v1/evaluations.py +4 -11
  32. phoenix/server/api/routers/v1/experiment_evaluations.py +23 -23
  33. phoenix/server/api/routers/v1/experiment_runs.py +5 -17
  34. phoenix/server/api/routers/v1/experiments.py +5 -5
  35. phoenix/server/api/routers/v1/spans.py +6 -4
  36. phoenix/server/api/types/Experiment.py +12 -0
  37. phoenix/server/api/types/ExperimentRun.py +1 -1
  38. phoenix/server/api/types/ExperimentRunAnnotation.py +1 -1
  39. phoenix/server/app.py +4 -0
  40. phoenix/server/static/index.js +712 -588
  41. phoenix/session/client.py +321 -28
  42. phoenix/trace/fixtures.py +6 -6
  43. phoenix/utilities/json.py +8 -8
  44. phoenix/version.py +1 -1
  45. phoenix/datasets/__init__.py +0 -0
  46. phoenix/datasets/evaluators/__init__.py +0 -18
  47. phoenix/datasets/evaluators/_utils.py +0 -13
  48. phoenix/datasets/experiments.py +0 -485
  49. phoenix/datasets/types.py +0 -212
  50. {arize_phoenix-4.4.4rc4.dist-info → arize_phoenix-4.4.4rc6.dist-info}/WHEEL +0 -0
  51. {arize_phoenix-4.4.4rc4.dist-info → arize_phoenix-4.4.4rc6.dist-info}/licenses/IP_NOTICE +0 -0
  52. {arize_phoenix-4.4.4rc4.dist-info → arize_phoenix-4.4.4rc6.dist-info}/licenses/LICENSE +0 -0
phoenix/experiments/utils.py
@@ -0,0 +1,9 @@
+from phoenix.config import get_web_base_url
+
+
+def get_experiment_url(*, dataset_id: str, experiment_id: str) -> str:
+    return f"{get_web_base_url()}datasets/{dataset_id}/compare?experimentId={experiment_id}"
+
+
+def get_dataset_experiments_url(*, dataset_id: str) -> str:
+    return f"{get_web_base_url()}datasets/{dataset_id}/experiments"
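Note: for reference, a quick sketch of the URLs these helpers produce; the base URL below is an assumption (get_web_base_url() returns whatever root the Phoenix server is configured with), and the IDs are made-up example GlobalIDs.

    # Hypothetical output, assuming get_web_base_url() == "http://localhost:6006/"
    from phoenix.experiments.utils import get_dataset_experiments_url, get_experiment_url

    get_experiment_url(dataset_id="RGF0YXNldDox", experiment_id="RXhwZXJpbWVudDoy")
    # -> "http://localhost:6006/datasets/RGF0YXNldDox/compare?experimentId=RXhwZXJpbWVudDoy"
    get_dataset_experiments_url(dataset_id="RGF0YXNldDox")
    # -> "http://localhost:6006/datasets/RGF0YXNldDox/experiments"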
phoenix/server/api/context.py
@@ -11,6 +11,7 @@ from typing_extensions import TypeAlias
 
 from phoenix.core.model_schema import Model
 from phoenix.server.api.dataloaders import (
+    AverageExperimentRunLatencyDataLoader,
     CacheForDataLoaders,
     DatasetExampleRevisionsDataLoader,
     DatasetExampleSpansDataLoader,
@@ -20,6 +21,7 @@ from phoenix.server.api.dataloaders import (
     EvaluationSummaryDataLoader,
     ExperimentAnnotationSummaryDataLoader,
     ExperimentErrorRatesDataLoader,
+    ExperimentRunCountsDataLoader,
     ExperimentSequenceNumberDataLoader,
     LatencyMsQuantileDataLoader,
     MinStartOrMaxEndTimeDataLoader,
@@ -36,6 +38,7 @@ from phoenix.server.api.dataloaders import (
 
 @dataclass
 class DataLoaders:
+    average_experiment_run_latency: AverageExperimentRunLatencyDataLoader
     dataset_example_revisions: DatasetExampleRevisionsDataLoader
     dataset_example_spans: DatasetExampleSpansDataLoader
     document_evaluation_summaries: DocumentEvaluationSummaryDataLoader
@@ -44,6 +47,7 @@ class DataLoaders:
     evaluation_summaries: EvaluationSummaryDataLoader
     experiment_annotation_summaries: ExperimentAnnotationSummaryDataLoader
     experiment_error_rates: ExperimentErrorRatesDataLoader
+    experiment_run_counts: ExperimentRunCountsDataLoader
     experiment_sequence_number: ExperimentSequenceNumberDataLoader
     latency_ms_quantile: LatencyMsQuantileDataLoader
     min_start_or_max_end_times: MinStartOrMaxEndTimeDataLoader
phoenix/server/api/dataloaders/__init__.py
@@ -8,6 +8,7 @@ from phoenix.db.insertion.evaluation import (
 )
 from phoenix.db.insertion.span import ClearProjectSpansEvent, SpanInsertionEvent
 
+from .average_experiment_run_latency import AverageExperimentRunLatencyDataLoader
 from .dataset_example_revisions import DatasetExampleRevisionsDataLoader
 from .dataset_example_spans import DatasetExampleSpansDataLoader
 from .document_evaluation_summaries import (
@@ -19,6 +20,7 @@ from .document_retrieval_metrics import DocumentRetrievalMetricsDataLoader
 from .evaluation_summaries import EvaluationSummaryCache, EvaluationSummaryDataLoader
 from .experiment_annotation_summaries import ExperimentAnnotationSummaryDataLoader
 from .experiment_error_rates import ExperimentErrorRatesDataLoader
+from .experiment_run_counts import ExperimentRunCountsDataLoader
 from .experiment_sequence_number import ExperimentSequenceNumberDataLoader
 from .latency_ms_quantile import LatencyMsQuantileCache, LatencyMsQuantileDataLoader
 from .min_start_or_max_end_times import MinStartOrMaxEndTimeCache, MinStartOrMaxEndTimeDataLoader
@@ -33,6 +35,7 @@ from .trace_row_ids import TraceRowIdsDataLoader
 
 __all__ = [
     "CacheForDataLoaders",
+    "AverageExperimentRunLatencyDataLoader",
    "DatasetExampleRevisionsDataLoader",
    "DatasetExampleSpansDataLoader",
    "DocumentEvaluationSummaryDataLoader",
@@ -41,6 +44,7 @@ __all__ = [
    "EvaluationSummaryDataLoader",
    "ExperimentAnnotationSummaryDataLoader",
    "ExperimentErrorRatesDataLoader",
+    "ExperimentRunCountsDataLoader",
    "ExperimentSequenceNumberDataLoader",
    "LatencyMsQuantileDataLoader",
    "MinStartOrMaxEndTimeDataLoader",
phoenix/server/api/dataloaders/average_experiment_run_latency.py
@@ -0,0 +1,54 @@
+from typing import (
+    AsyncContextManager,
+    Callable,
+    List,
+)
+
+from sqlalchemy import func, select
+from sqlalchemy.ext.asyncio import AsyncSession
+from strawberry.dataloader import DataLoader
+from typing_extensions import TypeAlias
+
+from phoenix.db import models
+
+ExperimentID: TypeAlias = int
+RunLatency: TypeAlias = float
+Key: TypeAlias = ExperimentID
+Result: TypeAlias = RunLatency
+
+
+class AverageExperimentRunLatencyDataLoader(DataLoader[Key, Result]):
+    def __init__(
+        self,
+        db: Callable[[], AsyncContextManager[AsyncSession]],
+    ) -> None:
+        super().__init__(load_fn=self._load_fn)
+        self._db = db
+
+    async def _load_fn(self, keys: List[Key]) -> List[Result]:
+        experiment_ids = keys
+        async with self._db() as session:
+            avg_latencies = {
+                experiment_id: avg_latency
+                async for experiment_id, avg_latency in await session.stream(
+                    select(
+                        models.ExperimentRun.experiment_id,
+                        func.avg(
+                            func.extract(
+                                "epoch",
+                                models.ExperimentRun.end_time,
+                            )
+                            - func.extract(
+                                "epoch",
+                                models.ExperimentRun.start_time,
+                            )
+                        ),
+                    )
+                    .where(models.ExperimentRun.experiment_id.in_(set(experiment_ids)))
+                    .group_by(models.ExperimentRun.experiment_id)
+                )
+            }
+        return [
+            avg_latencies.get(experiment_id, ValueError(f"Unknown experiment: {experiment_id}"))
+            for experiment_id in experiment_ids
+        ]
phoenix/server/api/dataloaders/experiment_run_counts.py
@@ -0,0 +1,42 @@
+from typing import (
+    AsyncContextManager,
+    Callable,
+    List,
+)
+
+from sqlalchemy import func, select
+from sqlalchemy.ext.asyncio import AsyncSession
+from strawberry.dataloader import DataLoader
+from typing_extensions import TypeAlias
+
+from phoenix.db import models
+
+ExperimentID: TypeAlias = int
+RunCount: TypeAlias = int
+Key: TypeAlias = ExperimentID
+Result: TypeAlias = RunCount
+
+
+class ExperimentRunCountsDataLoader(DataLoader[Key, Result]):
+    def __init__(
+        self,
+        db: Callable[[], AsyncContextManager[AsyncSession]],
+    ) -> None:
+        super().__init__(load_fn=self._load_fn)
+        self._db = db
+
+    async def _load_fn(self, keys: List[Key]) -> List[Result]:
+        experiment_ids = keys
+        async with self._db() as session:
+            run_counts = {
+                experiment_id: run_count
+                async for experiment_id, run_count in await session.stream(
+                    select(models.ExperimentRun.experiment_id, func.count())
+                    .where(models.ExperimentRun.experiment_id.in_(set(experiment_ids)))
+                    .group_by(models.ExperimentRun.experiment_id)
+                )
+            }
+        return [
+            run_counts.get(experiment_id, ValueError(f"Unknown experiment: {experiment_id}"))
+            for experiment_id in experiment_ids
+        ]
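Note: both new loaders follow the same batch-and-group pattern, where DataLoader.load() queues keys and _load_fn resolves the whole batch with a single grouped SQL query. A minimal sketch of exercising one of them directly, outside Phoenix's actual GraphQL wiring; the db argument is assumed to be the same async-session factory the server passes in:

    # Minimal sketch, assuming `db` is a Callable[[], AsyncContextManager[AsyncSession]].
    import asyncio

    from phoenix.server.api.dataloaders import ExperimentRunCountsDataLoader

    async def demo(db):
        loader = ExperimentRunCountsDataLoader(db)
        # Both keys are gathered into one batch, so only one grouped query is issued.
        counts = await asyncio.gather(loader.load(1), loader.load(2))
        print(counts)  # e.g. [10, 25] -- run counts for experiments 1 and 2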
phoenix/server/api/helpers/dataset_helpers.py
@@ -1,3 +1,4 @@
+import json
 from typing import Any, Dict, Literal, Mapping, Optional, Protocol
 
 from openinference.semconv.trace import (
@@ -128,14 +129,14 @@ def _get_generic_io_value(
     Makes a best-effort attempt to extract the input or output value from a span
     and returns it as a dictionary.
     """
-    if isinstance(io_value, str) and (
-        mime_type == OpenInferenceMimeTypeValues.TEXT.value or mime_type is None
-    ):
+    if mime_type == OpenInferenceMimeTypeValues.JSON.value:
+        parsed_value = json.loads(io_value)
+        if isinstance(parsed_value, dict):
+            return parsed_value
+        else:
+            return {kind: parsed_value}
+    if isinstance(io_value, str):
         return {kind: io_value}
-    if isinstance(io_value, dict) and (
-        mime_type == OpenInferenceMimeTypeValues.JSON.value or mime_type is None
-    ):
-        return io_value
     return {}
 
 
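Note: JSON-typed span values are now parsed before being wrapped. A hedged illustration of the new branch; the helper is private and its full signature is truncated in the hunk header, so the keyword names below are taken from the body and should be treated as an assumption:

    # Hypothetical calls against the reworked helper above.
    from phoenix.server.api.helpers.dataset_helpers import _get_generic_io_value

    _get_generic_io_value(io_value='{"query": "hi"}', mime_type="application/json", kind="input")
    # -> {"query": "hi"}  (a JSON object is returned as-is)
    _get_generic_io_value(io_value="[1, 2, 3]", mime_type="application/json", kind="output")
    # -> {"output": [1, 2, 3]}  (non-dict JSON is wrapped under the kind)
    _get_generic_io_value(io_value="plain text", mime_type="text/plain", kind="input")
    # -> {"input": "plain text"}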
phoenix/server/api/input_types/ClearProjectInput.py
@@ -0,0 +1,15 @@
+from datetime import datetime
+from typing import Optional
+
+import strawberry
+from strawberry import UNSET
+from strawberry.relay import GlobalID
+
+
+@strawberry.input
+class ClearProjectInput:
+    id: GlobalID
+    end_time: Optional[datetime] = strawberry.field(
+        default=UNSET,
+        description="The time up to which to purge data. Time is right-open /non-inclusive.",
+    )
phoenix/server/api/mutations/project_mutations.py
@@ -8,6 +8,7 @@ from phoenix.config import DEFAULT_PROJECT_NAME
 from phoenix.db import models
 from phoenix.db.insertion.span import ClearProjectSpansEvent
 from phoenix.server.api.context import Context
+from phoenix.server.api.input_types.ClearProjectInput import ClearProjectInput
 from phoenix.server.api.mutations.auth import IsAuthenticated
 from phoenix.server.api.queries import Query
 from phoenix.server.api.types.node import from_global_id_with_expected_type
@@ -32,11 +33,15 @@ class ProjectMutationMixin:
         return Query()
 
     @strawberry.mutation(permission_classes=[IsAuthenticated])  # type: ignore
-    async def clear_project(self, info: Info[Context, None], id: GlobalID) -> Query:
-        project_id = from_global_id_with_expected_type(global_id=id, expected_type_name="Project")
+    async def clear_project(self, info: Info[Context, None], input: ClearProjectInput) -> Query:
+        project_id = from_global_id_with_expected_type(
+            global_id=input.id, expected_type_name="Project"
+        )
         delete_statement = delete(models.Trace).where(models.Trace.project_rowid == project_id)
+        if input.end_time is not None:
+            delete_statement = delete_statement.where(models.Trace.start_time < input.end_time)
         async with info.context.db() as session:
             await session.execute(delete_statement)
-            if cache := info.context.cache_for_dataloaders:
-                cache.invalidate(ClearProjectSpansEvent(project_rowid=project_id))
+        if cache := info.context.cache_for_dataloaders:
+            cache.invalidate(ClearProjectSpansEvent(project_rowid=project_id))
         return Query()
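Note: clearProject now takes a single input object, which is what gives callers the optional end_time cutoff. A hedged sketch of the corresponding call from Python; the /graphql path, the camelCase field names, and the example GlobalID are assumptions, not part of this diff:

    # Hypothetical client-side call; assumes the Phoenix server exposes GraphQL at /graphql.
    import httpx

    mutation = """
    mutation ClearProject($input: ClearProjectInput!) {
      clearProject(input: $input) { __typename }
    }
    """
    variables = {"input": {"id": "UHJvamVjdDox", "endTime": "2024-06-01T00:00:00+00:00"}}
    httpx.post("http://localhost:6006/graphql", json={"query": mutation, "variables": variables})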
phoenix/server/api/routers/v1/__init__.py
@@ -80,7 +80,7 @@ V1_ROUTES = [
     ),
     Route(
         "/v1/experiment_evaluations",
-        experiment_evaluations.create_experiment_evaluation,
+        experiment_evaluations.upsert_experiment_evaluation,
         methods=["POST"],
     ),
 ]
phoenix/server/api/routers/v1/dataset_examples.py
@@ -21,7 +21,7 @@ async def list_dataset_examples(request: Request) -> Response:
          type: string
        description: Dataset ID
      - in: query
-        name: version-id
+        name: version_id
        schema:
          type: string
        description: Dataset version ID. If omitted, returns the latest version.
@@ -79,7 +79,7 @@ async def list_dataset_examples(request: Request) -> Response:
        description: Dataset does not exist.
    """
    dataset_id = GlobalID.from_id(request.path_params["id"])
-    raw_version_id = request.query_params.get("version-id")
+    raw_version_id = request.query_params.get("version_id")
    version_id = GlobalID.from_id(raw_version_id) if raw_version_id else None
 
    if (dataset_type := dataset_id.type_name) != "Dataset":
@@ -167,12 +167,12 @@ async def list_dataset_examples(request: Request) -> Response:
            }
            async for example, revision in await session.stream(query)
        ]
-        return JSONResponse(
-            {
-                "data": {
-                    "dataset_id": str(GlobalID("Dataset", str(resolved_dataset_id))),
-                    "version_id": str(GlobalID("DatasetVersion", str(resolved_version_id))),
-                    "examples": examples,
-                }
+    return JSONResponse(
+        {
+            "data": {
+                "dataset_id": str(GlobalID("Dataset", str(resolved_dataset_id))),
+                "version_id": str(GlobalID("DatasetVersion", str(resolved_version_id))),
+                "examples": examples,
             }
-        )
+        }
+    )
phoenix/server/api/routers/v1/datasets.py
@@ -13,11 +13,12 @@ from typing import (
     Awaitable,
     Callable,
     Coroutine,
-    Dict,
     FrozenSet,
     Iterator,
     List,
+    Mapping,
     Optional,
+    Sequence,
     Tuple,
     Union,
     cast,
@@ -32,8 +33,8 @@ from starlette.datastructures import FormData, UploadFile
 from starlette.requests import Request
 from starlette.responses import JSONResponse, Response
 from starlette.status import (
-    HTTP_403_FORBIDDEN,
     HTTP_404_NOT_FOUND,
+    HTTP_409_CONFLICT,
     HTTP_422_UNPROCESSABLE_ENTITY,
     HTTP_429_TOO_MANY_REQUESTS,
 )
@@ -44,6 +45,7 @@ from phoenix.db import models
 from phoenix.db.insertion.dataset import (
     DatasetAction,
     DatasetExampleAdditionEvent,
+    ExampleContent,
     add_dataset_examples,
 )
 from phoenix.server.api.types.Dataset import Dataset
@@ -231,7 +233,7 @@ async def get_dataset_by_id(request: Request) -> Response:
         "updated_at": dataset.updated_at.isoformat(),
         "example_count": example_count,
     }
-    return JSONResponse(content=output_dict)
+    return JSONResponse(content={"data": output_dict})
 
 
 async def get_dataset_versions(request: Request) -> Response:
@@ -350,7 +352,7 @@ async def get_dataset_versions(request: Request) -> Response:
 
 async def post_datasets_upload(request: Request) -> Response:
     """
-    summary: Upload CSV or PyArrow file as dataset
+    summary: Upload dataset as either JSON or file (CSV or PyArrow)
     operationId: uploadDataset
     tags:
       - datasets
@@ -362,6 +364,32 @@ async def post_datasets_upload(request: Request) -> Response:
          type: boolean
    requestBody:
      content:
+        application/json:
+          schema:
+            type: object
+            required:
+              - name
+              - inputs
+            properties:
+              action:
+                type: string
+                enum: [create, append]
+              name:
+                type: string
+              description:
+                type: string
+              inputs:
+                type: array
+                items:
+                  type: object
+              outputs:
+                type: array
+                items:
+                  type: object
+              metadata:
+                type: array
+                items:
+                  type: object
        multipart/form-data:
          schema:
            type: object
@@ -401,22 +429,18 @@ async def post_datasets_upload(request: Request) -> Response:
        description: Success
      403:
        description: Forbidden
+      409:
+        description: Dataset of the same name already exists
      422:
        description: Request body is invalid
    """
-    if request.app.state.read_only:
-        return Response(status_code=HTTP_403_FORBIDDEN)
-    async with request.form() as form:
+    request_content_type = request.headers["content-type"]
+    examples: Union[Examples, Awaitable[Examples]]
+    if request_content_type.startswith("application/json"):
        try:
-            (
-                action,
-                name,
-                description,
-                input_keys,
-                output_keys,
-                metadata_keys,
-                file,
-            ) = await _parse_form_data(form)
+            examples, action, name, description = await run_in_threadpool(
+                _process_json, await request.json()
+            )
        except ValueError as e:
            return Response(
                content=str(e),
@@ -426,24 +450,53 @@ async def post_datasets_upload(request: Request) -> Response:
            async with request.app.state.db() as session:
                if await _check_table_exists(session, name):
                    return Response(
-                        content=f"Dataset already exists: {name=}",
-                        status_code=HTTP_422_UNPROCESSABLE_ENTITY,
+                        content=f"Dataset with the same name already exists: {name=}",
+                        status_code=HTTP_409_CONFLICT,
                    )
-        content = await file.read()
-        try:
-            examples: Union[Examples, Awaitable[Examples]]
-            content_type = FileContentType(file.content_type)
-            if content_type is FileContentType.CSV:
-                encoding = FileContentEncoding(file.headers.get("content-encoding"))
-                examples, column_headers = await _process_csv(content, encoding)
-            elif content_type is FileContentType.PYARROW:
-                examples, column_headers = await _process_pyarrow(content)
-            else:
-                assert_never(content_type)
-            _check_keys_exist(column_headers, input_keys, output_keys, metadata_keys)
-        except ValueError as e:
+    elif request_content_type.startswith("multipart/form-data"):
+        async with request.form() as form:
+            try:
+                (
+                    action,
+                    name,
+                    description,
+                    input_keys,
+                    output_keys,
+                    metadata_keys,
+                    file,
+                ) = await _parse_form_data(form)
+            except ValueError as e:
+                return Response(
+                    content=str(e),
+                    status_code=HTTP_422_UNPROCESSABLE_ENTITY,
+                )
+            if action is DatasetAction.CREATE:
+                async with request.app.state.db() as session:
+                    if await _check_table_exists(session, name):
+                        return Response(
+                            content=f"Dataset with the same name already exists: {name=}",
+                            status_code=HTTP_409_CONFLICT,
+                        )
+            content = await file.read()
+            try:
+                file_content_type = FileContentType(file.content_type)
+                if file_content_type is FileContentType.CSV:
+                    encoding = FileContentEncoding(file.headers.get("content-encoding"))
+                    examples = await _process_csv(
+                        content, encoding, input_keys, output_keys, metadata_keys
+                    )
+                elif file_content_type is FileContentType.PYARROW:
+                    examples = await _process_pyarrow(content, input_keys, output_keys, metadata_keys)
+                else:
+                    assert_never(file_content_type)
+            except ValueError as e:
+                return Response(
+                    content=str(e),
+                    status_code=HTTP_422_UNPROCESSABLE_ENTITY,
+                )
+    else:
        return Response(
-            content=str(e),
+            content=str("Invalid request Content-Type"),
            status_code=HTTP_422_UNPROCESSABLE_ENTITY,
        )
    operation = cast(
@@ -454,9 +507,6 @@ async def post_datasets_upload(request: Request) -> Response:
            action=action,
            name=name,
            description=description,
-            input_keys=input_keys,
-            output_keys=output_keys,
-            metadata_keys=metadata_keys,
        ),
    )
    if request.query_params.get("sync") == "true":
@@ -505,13 +555,46 @@ InputKeys: TypeAlias = FrozenSet[str]
 OutputKeys: TypeAlias = FrozenSet[str]
 MetadataKeys: TypeAlias = FrozenSet[str]
 DatasetId: TypeAlias = int
-Examples: TypeAlias = Iterator[Dict[str, Any]]
+Examples: TypeAlias = Iterator[ExampleContent]
+
+
+def _process_json(
+    data: Mapping[str, Any],
+) -> Tuple[Examples, DatasetAction, Name, Description]:
+    name = data.get("name")
+    if not name:
+        raise ValueError("Dataset name is required")
+    description = data.get("description") or ""
+    inputs = data.get("inputs")
+    if not inputs:
+        raise ValueError("input is required")
+    if not isinstance(inputs, list) or not _is_all_dict(inputs):
+        raise ValueError("Input should be a list containing only dictionary objects")
+    outputs, metadata = data.get("outputs"), data.get("metadata")
+    for k, v in {"outputs": outputs, "metadata": metadata}.items():
+        if v and not (isinstance(v, list) and len(v) == len(inputs) and _is_all_dict(v)):
+            raise ValueError(
+                f"{k} should be a list of same length as input containing only dictionary objects"
+            )
+    examples: List[ExampleContent] = []
+    for i, obj in enumerate(inputs):
+        example = ExampleContent(
+            input=obj,
+            output=outputs[i] if outputs else {},
+            metadata=metadata[i] if metadata else {},
+        )
+        examples.append(example)
+    action = DatasetAction(cast(Optional[str], data.get("action")) or "create")
+    return iter(examples), action, name, description
 
 
 async def _process_csv(
     content: bytes,
     content_encoding: FileContentEncoding,
-) -> Tuple[Examples, FrozenSet[str]]:
+    input_keys: InputKeys,
+    output_keys: OutputKeys,
+    metadata_keys: MetadataKeys,
+) -> Examples:
     if content_encoding is FileContentEncoding.GZIP:
         content = await run_in_threadpool(gzip.decompress, content)
     elif content_encoding is FileContentEncoding.DEFLATE:
@@ -525,22 +608,39 @@ async def _process_csv(
         if freq > 1:
             raise ValueError(f"Duplicated column header in CSV file: {header}")
     column_headers = frozenset(reader.fieldnames)
-    return reader, column_headers
+    _check_keys_exist(column_headers, input_keys, output_keys, metadata_keys)
+    return (
+        ExampleContent(
+            input={k: row.get(k) for k in input_keys},
+            output={k: row.get(k) for k in output_keys},
+            metadata={k: row.get(k) for k in metadata_keys},
+        )
+        for row in iter(reader)
+    )
 
 
 async def _process_pyarrow(
     content: bytes,
-) -> Tuple[Awaitable[Examples], FrozenSet[str]]:
+    input_keys: InputKeys,
+    output_keys: OutputKeys,
+    metadata_keys: MetadataKeys,
+) -> Awaitable[Examples]:
     try:
         reader = pa.ipc.open_stream(content)
     except pa.ArrowInvalid as e:
         raise ValueError("File is not valid pyarrow") from e
     column_headers = frozenset(reader.schema.names)
+    _check_keys_exist(column_headers, input_keys, output_keys, metadata_keys)
+
+    def get_examples() -> Iterator[ExampleContent]:
+        for row in reader.read_pandas().to_dict(orient="records"):
+            yield ExampleContent(
+                input={k: row.get(k) for k in input_keys},
+                output={k: row.get(k) for k in output_keys},
+                metadata={k: row.get(k) for k in metadata_keys},
+            )
 
-    def get_examples() -> Iterator[Dict[str, Any]]:
-        yield from reader.read_pandas().to_dict(orient="records")
-
-    return run_in_threadpool(get_examples), column_headers
+    return run_in_threadpool(get_examples)
 
 
 async def _check_table_exists(session: AsyncSession, name: str) -> bool:
@@ -613,7 +713,7 @@ async def get_dataset_csv(request: Request) -> Response:
          type: string
        description: Dataset ID
      - in: query
-        name: version
+        name: version_id
        schema:
          type: string
        description: Dataset version ID. If omitted, returns the latest version.
@@ -662,7 +762,7 @@ async def get_dataset_jsonl_openai_ft(request: Request) -> Response:
          type: string
        description: Dataset ID
      - in: query
-        name: version
+        name: version_id
        schema:
          type: string
        description: Dataset version ID. If omitted, returns the latest version.
@@ -711,7 +811,7 @@ async def get_dataset_jsonl_openai_evals(request: Request) -> Response:
          type: string
        description: Dataset ID
      - in: query
-        name: version
+        name: version_id
        schema:
          type: string
        description: Dataset version ID. If omitted, returns the latest version.
@@ -815,9 +915,9 @@ async def _get_db_examples(request: Request) -> Tuple[str, List[models.DatasetEx
        raise ValueError("Missing Dataset ID")
    dataset_id = from_global_id_with_expected_type(GlobalID.from_id(id_), Dataset.__name__)
    dataset_version_id: Optional[int] = None
-    if version := request.query_params.get("version"):
+    if version_id := request.query_params.get("version_id"):
        dataset_version_id = from_global_id_with_expected_type(
-            GlobalID.from_id(version),
+            GlobalID.from_id(version_id),
            DatasetVersion.__name__,
        )
    latest_version = (
@@ -859,3 +959,7 @@
        raise ValueError("Dataset does not exist.")
    examples = [r async for r in await session.stream_scalars(stmt)]
    return dataset_name, examples
+
+
+def _is_all_dict(seq: Sequence[Any]) -> bool:
+    return all(map(lambda obj: isinstance(obj, dict), seq))
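Note: since the upload route now accepts inline JSON, here is a hedged sketch of what such a request could look like. The upload path and port are assumptions (the route definition itself is not shown in this diff), while the body keys mirror the application/json schema documented above:

    # Hypothetical client call; the /v1/datasets/upload path is assumed.
    import httpx

    payload = {
        "action": "create",
        "name": "my-dataset",
        "description": "toy example",
        "inputs": [{"question": "What is Phoenix?"}],
        "outputs": [{"answer": "An observability library."}],
        "metadata": [{"source": "docs"}],
    }
    response = httpx.post("http://localhost:6006/v1/datasets/upload?sync=true", json=payload)
    response.raise_for_status()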
phoenix/server/api/routers/v1/evaluations.py
@@ -45,13 +45,6 @@ async def post_evaluations(request: Request) -> Response:
    operationId: addEvaluations
    tags:
      - private
-    parameters:
-      - name: project-name
-        in: query
-        schema:
-          type: string
-          default: default
-        description: The project name to add the evaluation to
    requestBody:
      required: true
      content:
@@ -107,7 +100,7 @@ async def get_evaluations(request: Request) -> Response:
    tags:
      - private
    parameters:
-      - name: project-name
+      - name: project_name
        in: query
        schema:
          type: string
@@ -122,9 +115,9 @@ async def get_evaluations(request: Request) -> Response:
        description: Not found
    """
    project_name = (
-        request.query_params.get("project-name")
-        # read from headers for backwards compatibility
-        or request.headers.get("project-name")
+        request.query_params.get("project_name")
+        or request.query_params.get("project-name")  # for backward compatibility
+        or request.headers.get("project-name")  # read from headers for backwards compatibility
        or DEFAULT_PROJECT_NAME
    )