PyPI - arize-phoenix - Versions diffs - 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl - Mend

arize-phoenix 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of arize-phoenix might be problematic. Click here for more details.

Files changed (338) hide show

arize_phoenix-7.7.0.dist-info/METADATA +261 -0
arize_phoenix-7.7.0.dist-info/RECORD +345 -0
{arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/WHEEL +1 -1
arize_phoenix-7.7.0.dist-info/entry_points.txt +3 -0
phoenix/__init__.py +86 -14
phoenix/auth.py +309 -0
phoenix/config.py +675 -45
phoenix/core/model.py +32 -30
phoenix/core/model_schema.py +102 -109
phoenix/core/model_schema_adapter.py +48 -45
phoenix/datetime_utils.py +24 -3
phoenix/db/README.md +54 -0
phoenix/db/__init__.py +4 -0
phoenix/db/alembic.ini +85 -0
phoenix/db/bulk_inserter.py +294 -0
phoenix/db/engines.py +208 -0
phoenix/db/enums.py +20 -0
phoenix/db/facilitator.py +113 -0
phoenix/db/helpers.py +159 -0
phoenix/db/insertion/constants.py +2 -0
phoenix/db/insertion/dataset.py +227 -0
phoenix/db/insertion/document_annotation.py +171 -0
phoenix/db/insertion/evaluation.py +191 -0
phoenix/db/insertion/helpers.py +98 -0
phoenix/db/insertion/span.py +193 -0
phoenix/db/insertion/span_annotation.py +158 -0
phoenix/db/insertion/trace_annotation.py +158 -0
phoenix/db/insertion/types.py +256 -0
phoenix/db/migrate.py +86 -0
phoenix/db/migrations/data_migration_scripts/populate_project_sessions.py +199 -0
phoenix/db/migrations/env.py +114 -0
phoenix/db/migrations/script.py.mako +26 -0
phoenix/db/migrations/versions/10460e46d750_datasets.py +317 -0
phoenix/db/migrations/versions/3be8647b87d8_add_token_columns_to_spans_table.py +126 -0
phoenix/db/migrations/versions/4ded9e43755f_create_project_sessions_table.py +66 -0
phoenix/db/migrations/versions/cd164e83824f_users_and_tokens.py +157 -0
phoenix/db/migrations/versions/cf03bd6bae1d_init.py +280 -0
phoenix/db/models.py +807 -0
phoenix/exceptions.py +5 -1
phoenix/experiments/__init__.py +6 -0
phoenix/experiments/evaluators/__init__.py +29 -0
phoenix/experiments/evaluators/base.py +158 -0
phoenix/experiments/evaluators/code_evaluators.py +184 -0
phoenix/experiments/evaluators/llm_evaluators.py +473 -0
phoenix/experiments/evaluators/utils.py +236 -0
phoenix/experiments/functions.py +772 -0
phoenix/experiments/tracing.py +86 -0
phoenix/experiments/types.py +726 -0
phoenix/experiments/utils.py +25 -0
phoenix/inferences/__init__.py +0 -0
phoenix/{datasets → inferences}/errors.py +6 -5
phoenix/{datasets → inferences}/fixtures.py +49 -42
phoenix/{datasets/dataset.py → inferences/inferences.py} +121 -105
phoenix/{datasets → inferences}/schema.py +11 -11
phoenix/{datasets → inferences}/validation.py +13 -14
phoenix/logging/__init__.py +3 -0
phoenix/logging/_config.py +90 -0
phoenix/logging/_filter.py +6 -0
phoenix/logging/_formatter.py +69 -0
phoenix/metrics/__init__.py +5 -4
phoenix/metrics/binning.py +4 -3
phoenix/metrics/metrics.py +2 -1
phoenix/metrics/mixins.py +7 -6
phoenix/metrics/retrieval_metrics.py +2 -1
phoenix/metrics/timeseries.py +5 -4
phoenix/metrics/wrappers.py +9 -3
phoenix/pointcloud/clustering.py +5 -5
phoenix/pointcloud/pointcloud.py +7 -5
phoenix/pointcloud/projectors.py +5 -6
phoenix/pointcloud/umap_parameters.py +53 -52
phoenix/server/api/README.md +28 -0
phoenix/server/api/auth.py +44 -0
phoenix/server/api/context.py +152 -9
phoenix/server/api/dataloaders/__init__.py +91 -0
phoenix/server/api/dataloaders/annotation_summaries.py +139 -0
phoenix/server/api/dataloaders/average_experiment_run_latency.py +54 -0
phoenix/server/api/dataloaders/cache/__init__.py +3 -0
phoenix/server/api/dataloaders/cache/two_tier_cache.py +68 -0
phoenix/server/api/dataloaders/dataset_example_revisions.py +131 -0
phoenix/server/api/dataloaders/dataset_example_spans.py +38 -0
phoenix/server/api/dataloaders/document_evaluation_summaries.py +144 -0
phoenix/server/api/dataloaders/document_evaluations.py +31 -0
phoenix/server/api/dataloaders/document_retrieval_metrics.py +89 -0
phoenix/server/api/dataloaders/experiment_annotation_summaries.py +79 -0
phoenix/server/api/dataloaders/experiment_error_rates.py +58 -0
phoenix/server/api/dataloaders/experiment_run_annotations.py +36 -0
phoenix/server/api/dataloaders/experiment_run_counts.py +49 -0
phoenix/server/api/dataloaders/experiment_sequence_number.py +44 -0
phoenix/server/api/dataloaders/latency_ms_quantile.py +188 -0
phoenix/server/api/dataloaders/min_start_or_max_end_times.py +85 -0
phoenix/server/api/dataloaders/project_by_name.py +31 -0
phoenix/server/api/dataloaders/record_counts.py +116 -0
phoenix/server/api/dataloaders/session_io.py +79 -0
phoenix/server/api/dataloaders/session_num_traces.py +30 -0
phoenix/server/api/dataloaders/session_num_traces_with_error.py +32 -0
phoenix/server/api/dataloaders/session_token_usages.py +41 -0
phoenix/server/api/dataloaders/session_trace_latency_ms_quantile.py +55 -0
phoenix/server/api/dataloaders/span_annotations.py +26 -0
phoenix/server/api/dataloaders/span_dataset_examples.py +31 -0
phoenix/server/api/dataloaders/span_descendants.py +57 -0
phoenix/server/api/dataloaders/span_projects.py +33 -0
phoenix/server/api/dataloaders/token_counts.py +124 -0
phoenix/server/api/dataloaders/trace_by_trace_ids.py +25 -0
phoenix/server/api/dataloaders/trace_root_spans.py +32 -0
phoenix/server/api/dataloaders/user_roles.py +30 -0
phoenix/server/api/dataloaders/users.py +33 -0
phoenix/server/api/exceptions.py +48 -0
phoenix/server/api/helpers/__init__.py +12 -0
phoenix/server/api/helpers/dataset_helpers.py +217 -0
phoenix/server/api/helpers/experiment_run_filters.py +763 -0
phoenix/server/api/helpers/playground_clients.py +948 -0
phoenix/server/api/helpers/playground_registry.py +70 -0
phoenix/server/api/helpers/playground_spans.py +455 -0
phoenix/server/api/input_types/AddExamplesToDatasetInput.py +16 -0
phoenix/server/api/input_types/AddSpansToDatasetInput.py +14 -0
phoenix/server/api/input_types/ChatCompletionInput.py +38 -0
phoenix/server/api/input_types/ChatCompletionMessageInput.py +24 -0
phoenix/server/api/input_types/ClearProjectInput.py +15 -0
phoenix/server/api/input_types/ClusterInput.py +2 -2
phoenix/server/api/input_types/CreateDatasetInput.py +12 -0
phoenix/server/api/input_types/CreateSpanAnnotationInput.py +18 -0
phoenix/server/api/input_types/CreateTraceAnnotationInput.py +18 -0
phoenix/server/api/input_types/DataQualityMetricInput.py +5 -2
phoenix/server/api/input_types/DatasetExampleInput.py +14 -0
phoenix/server/api/input_types/DatasetSort.py +17 -0
phoenix/server/api/input_types/DatasetVersionSort.py +16 -0
phoenix/server/api/input_types/DeleteAnnotationsInput.py +7 -0
phoenix/server/api/input_types/DeleteDatasetExamplesInput.py +13 -0
phoenix/server/api/input_types/DeleteDatasetInput.py +7 -0
phoenix/server/api/input_types/DeleteExperimentsInput.py +7 -0
phoenix/server/api/input_types/DimensionFilter.py +4 -4
phoenix/server/api/input_types/GenerativeModelInput.py +17 -0
phoenix/server/api/input_types/Granularity.py +1 -1
phoenix/server/api/input_types/InvocationParameters.py +162 -0
phoenix/server/api/input_types/PatchAnnotationInput.py +19 -0
phoenix/server/api/input_types/PatchDatasetExamplesInput.py +35 -0
phoenix/server/api/input_types/PatchDatasetInput.py +14 -0
phoenix/server/api/input_types/PerformanceMetricInput.py +5 -2
phoenix/server/api/input_types/ProjectSessionSort.py +29 -0
phoenix/server/api/input_types/SpanAnnotationSort.py +17 -0
phoenix/server/api/input_types/SpanSort.py +134 -69
phoenix/server/api/input_types/TemplateOptions.py +10 -0
phoenix/server/api/input_types/TraceAnnotationSort.py +17 -0
phoenix/server/api/input_types/UserRoleInput.py +9 -0
phoenix/server/api/mutations/__init__.py +28 -0
phoenix/server/api/mutations/api_key_mutations.py +167 -0
phoenix/server/api/mutations/chat_mutations.py +593 -0
phoenix/server/api/mutations/dataset_mutations.py +591 -0
phoenix/server/api/mutations/experiment_mutations.py +75 -0
phoenix/server/api/{types/ExportEventsMutation.py → mutations/export_events_mutations.py} +21 -18
phoenix/server/api/mutations/project_mutations.py +57 -0
phoenix/server/api/mutations/span_annotations_mutations.py +128 -0
phoenix/server/api/mutations/trace_annotations_mutations.py +127 -0
phoenix/server/api/mutations/user_mutations.py +329 -0
phoenix/server/api/openapi/__init__.py +0 -0
phoenix/server/api/openapi/main.py +17 -0
phoenix/server/api/openapi/schema.py +16 -0
phoenix/server/api/queries.py +738 -0
phoenix/server/api/routers/__init__.py +11 -0
phoenix/server/api/routers/auth.py +284 -0
phoenix/server/api/routers/embeddings.py +26 -0
phoenix/server/api/routers/oauth2.py +488 -0
phoenix/server/api/routers/v1/__init__.py +64 -0
phoenix/server/api/routers/v1/datasets.py +1017 -0
phoenix/server/api/routers/v1/evaluations.py +362 -0
phoenix/server/api/routers/v1/experiment_evaluations.py +115 -0
phoenix/server/api/routers/v1/experiment_runs.py +167 -0
phoenix/server/api/routers/v1/experiments.py +308 -0
phoenix/server/api/routers/v1/pydantic_compat.py +78 -0
phoenix/server/api/routers/v1/spans.py +267 -0
phoenix/server/api/routers/v1/traces.py +208 -0
phoenix/server/api/routers/v1/utils.py +95 -0
phoenix/server/api/schema.py +44 -241
phoenix/server/api/subscriptions.py +597 -0
phoenix/server/api/types/Annotation.py +21 -0
phoenix/server/api/types/AnnotationSummary.py +55 -0
phoenix/server/api/types/AnnotatorKind.py +16 -0
phoenix/server/api/types/ApiKey.py +27 -0
phoenix/server/api/types/AuthMethod.py +9 -0
phoenix/server/api/types/ChatCompletionMessageRole.py +11 -0
phoenix/server/api/types/ChatCompletionSubscriptionPayload.py +46 -0
phoenix/server/api/types/Cluster.py +25 -24
phoenix/server/api/types/CreateDatasetPayload.py +8 -0
phoenix/server/api/types/DataQualityMetric.py +31 -13
phoenix/server/api/types/Dataset.py +288 -63
phoenix/server/api/types/DatasetExample.py +85 -0
phoenix/server/api/types/DatasetExampleRevision.py +34 -0
phoenix/server/api/types/DatasetVersion.py +14 -0
phoenix/server/api/types/Dimension.py +32 -31
phoenix/server/api/types/DocumentEvaluationSummary.py +9 -8
phoenix/server/api/types/EmbeddingDimension.py +56 -49
phoenix/server/api/types/Evaluation.py +25 -31
phoenix/server/api/types/EvaluationSummary.py +30 -50
phoenix/server/api/types/Event.py +20 -20
phoenix/server/api/types/ExampleRevisionInterface.py +14 -0
phoenix/server/api/types/Experiment.py +152 -0
phoenix/server/api/types/ExperimentAnnotationSummary.py +13 -0
phoenix/server/api/types/ExperimentComparison.py +17 -0
phoenix/server/api/types/ExperimentRun.py +119 -0
phoenix/server/api/types/ExperimentRunAnnotation.py +56 -0
phoenix/server/api/types/GenerativeModel.py +9 -0
phoenix/server/api/types/GenerativeProvider.py +85 -0
phoenix/server/api/types/Inferences.py +80 -0
phoenix/server/api/types/InferencesRole.py +23 -0
phoenix/server/api/types/LabelFraction.py +7 -0
phoenix/server/api/types/MimeType.py +2 -2
phoenix/server/api/types/Model.py +54 -54
phoenix/server/api/types/PerformanceMetric.py +8 -5
phoenix/server/api/types/Project.py +407 -142
phoenix/server/api/types/ProjectSession.py +139 -0
phoenix/server/api/types/Segments.py +4 -4
phoenix/server/api/types/Span.py +221 -176
phoenix/server/api/types/SpanAnnotation.py +43 -0
phoenix/server/api/types/SpanIOValue.py +15 -0
phoenix/server/api/types/SystemApiKey.py +9 -0
phoenix/server/api/types/TemplateLanguage.py +10 -0
phoenix/server/api/types/TimeSeries.py +19 -15
phoenix/server/api/types/TokenUsage.py +11 -0
phoenix/server/api/types/Trace.py +154 -0
phoenix/server/api/types/TraceAnnotation.py +45 -0
phoenix/server/api/types/UMAPPoints.py +7 -7
phoenix/server/api/types/User.py +60 -0
phoenix/server/api/types/UserApiKey.py +45 -0
phoenix/server/api/types/UserRole.py +15 -0
phoenix/server/api/types/node.py +4 -112
phoenix/server/api/types/pagination.py +156 -57
phoenix/server/api/utils.py +34 -0
phoenix/server/app.py +864 -115
phoenix/server/bearer_auth.py +163 -0
phoenix/server/dml_event.py +136 -0
phoenix/server/dml_event_handler.py +256 -0
phoenix/server/email/__init__.py +0 -0
phoenix/server/email/sender.py +97 -0
phoenix/server/email/templates/__init__.py +0 -0
phoenix/server/email/templates/password_reset.html +19 -0
phoenix/server/email/types.py +11 -0
phoenix/server/grpc_server.py +102 -0
phoenix/server/jwt_store.py +505 -0
phoenix/server/main.py +305 -116
phoenix/server/oauth2.py +52 -0
phoenix/server/openapi/__init__.py +0 -0
phoenix/server/prometheus.py +111 -0
phoenix/server/rate_limiters.py +188 -0
phoenix/server/static/.vite/manifest.json +87 -0
phoenix/server/static/assets/components-Cy9nwIvF.js +2125 -0
phoenix/server/static/assets/index-BKvHIxkk.js +113 -0
phoenix/server/static/assets/pages-CUi2xCVQ.js +4449 -0
phoenix/server/static/assets/vendor-DvC8cT4X.js +894 -0
phoenix/server/static/assets/vendor-DxkFTwjz.css +1 -0
phoenix/server/static/assets/vendor-arizeai-Do1793cv.js +662 -0
phoenix/server/static/assets/vendor-codemirror-BzwZPyJM.js +24 -0
phoenix/server/static/assets/vendor-recharts-_Jb7JjhG.js +59 -0
phoenix/server/static/assets/vendor-shiki-Cl9QBraO.js +5 -0
phoenix/server/static/assets/vendor-three-DwGkEfCM.js +2998 -0
phoenix/server/telemetry.py +68 -0
phoenix/server/templates/index.html +82 -23
phoenix/server/thread_server.py +3 -3
phoenix/server/types.py +275 -0
phoenix/services.py +27 -18
phoenix/session/client.py +743 -68
phoenix/session/data_extractor.py +31 -7
phoenix/session/evaluation.py +3 -9
phoenix/session/session.py +263 -219
phoenix/settings.py +22 -0
phoenix/trace/__init__.py +2 -22
phoenix/trace/attributes.py +338 -0
phoenix/trace/dsl/README.md +116 -0
phoenix/trace/dsl/filter.py +663 -213
phoenix/trace/dsl/helpers.py +73 -21
phoenix/trace/dsl/query.py +574 -201
phoenix/trace/exporter.py +24 -19
phoenix/trace/fixtures.py +368 -32
phoenix/trace/otel.py +71 -219
phoenix/trace/projects.py +3 -2
phoenix/trace/schemas.py +33 -11
phoenix/trace/span_evaluations.py +21 -16
phoenix/trace/span_json_decoder.py +6 -4
phoenix/trace/span_json_encoder.py +2 -2
phoenix/trace/trace_dataset.py +47 -32
phoenix/trace/utils.py +21 -4
phoenix/utilities/__init__.py +0 -26
phoenix/utilities/client.py +132 -0
phoenix/utilities/deprecation.py +31 -0
phoenix/utilities/error_handling.py +3 -2
phoenix/utilities/json.py +109 -0
phoenix/utilities/logging.py +8 -0
phoenix/utilities/project.py +2 -2
phoenix/utilities/re.py +49 -0
phoenix/utilities/span_store.py +0 -23
phoenix/utilities/template_formatters.py +99 -0
phoenix/version.py +1 -1
arize_phoenix-3.16.1.dist-info/METADATA +0 -495
arize_phoenix-3.16.1.dist-info/RECORD +0 -178
phoenix/core/project.py +0 -619
phoenix/core/traces.py +0 -96
phoenix/experimental/evals/__init__.py +0 -73
phoenix/experimental/evals/evaluators.py +0 -413
phoenix/experimental/evals/functions/__init__.py +0 -4
phoenix/experimental/evals/functions/classify.py +0 -453
phoenix/experimental/evals/functions/executor.py +0 -353
phoenix/experimental/evals/functions/generate.py +0 -138
phoenix/experimental/evals/functions/processing.py +0 -76
phoenix/experimental/evals/models/__init__.py +0 -14
phoenix/experimental/evals/models/anthropic.py +0 -175
phoenix/experimental/evals/models/base.py +0 -170
phoenix/experimental/evals/models/bedrock.py +0 -221
phoenix/experimental/evals/models/litellm.py +0 -134
phoenix/experimental/evals/models/openai.py +0 -448
phoenix/experimental/evals/models/rate_limiters.py +0 -246
phoenix/experimental/evals/models/vertex.py +0 -173
phoenix/experimental/evals/models/vertexai.py +0 -186
phoenix/experimental/evals/retrievals.py +0 -96
phoenix/experimental/evals/templates/__init__.py +0 -50
phoenix/experimental/evals/templates/default_templates.py +0 -472
phoenix/experimental/evals/templates/template.py +0 -195
phoenix/experimental/evals/utils/__init__.py +0 -172
phoenix/experimental/evals/utils/threads.py +0 -27
phoenix/server/api/helpers.py +0 -11
phoenix/server/api/routers/evaluation_handler.py +0 -109
phoenix/server/api/routers/span_handler.py +0 -70
phoenix/server/api/routers/trace_handler.py +0 -60
phoenix/server/api/types/DatasetRole.py +0 -23
phoenix/server/static/index.css +0 -6
phoenix/server/static/index.js +0 -7447
phoenix/storage/span_store/__init__.py +0 -23
phoenix/storage/span_store/text_file.py +0 -85
phoenix/trace/dsl/missing.py +0 -60
phoenix/trace/langchain/__init__.py +0 -3
phoenix/trace/langchain/instrumentor.py +0 -35
phoenix/trace/llama_index/__init__.py +0 -3
phoenix/trace/llama_index/callback.py +0 -102
phoenix/trace/openai/__init__.py +0 -3
phoenix/trace/openai/instrumentor.py +0 -30
{arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/licenses/IP_NOTICE +0 -0
{arize_phoenix-3.16.1.dist-info → arize_phoenix-7.7.0.dist-info}/licenses/LICENSE +0 -0
/phoenix/{datasets → db/insertion}/__init__.py +0 -0
/phoenix/{experimental → db/migrations}/__init__.py +0 -0
/phoenix/{storage → db/migrations/data_migration_scripts}/__init__.py +0 -0

phoenix/experimental/evals/functions/executor.py DELETED Viewed

@@ -1,353 +0,0 @@
-from __future__ import annotations
-import asyncio
-import logging
-import signal
-import traceback
-from typing import Any, Callable, Coroutine, List, Optional, Protocol, Sequence, Tuple, Union
-from tqdm.auto import tqdm
-from phoenix.exceptions import PhoenixException
-logger = logging.getLogger(__name__)
-class Unset:
-    """Marker type meaning "no fallback value was supplied"; it is distinct from ``None``."""
-# Module-level instance used as the default for ``fallback_return_value`` in the executors.
-_unset = Unset()
-class Executor(Protocol):
-    """Structural interface implemented by the executors defined in this module."""
-    def run(self, inputs: Sequence[Any]) -> List[Any]:
-        """Process ``inputs`` and return the collected outputs as a list."""
-        ...
-class AsyncExecutor(Executor):
-    """
-    A class that provides asynchronous execution of tasks using a producer-consumer pattern.
-    An async interface is provided by the `execute` method, which returns a coroutine, and a sync
-    interface is provided by the `run` method.
-    Args:
-        generation_fn (Callable[[Any], Coroutine[Any, Any, Any]]): A coroutine function that
-        generates tasks to be executed.
-        concurrency (int, optional): The number of concurrent consumers. Defaults to 3.
-        tqdm_bar_format (Optional[str], optional): The format string for the progress bar. Defaults
-        to None.
-        max_retries (int, optional): The maximum number of times to retry on exceptions. Defaults to
-        10.
-        exit_on_error (bool, optional): Whether to exit execution on the first encountered error.
-        Defaults to True.
-        fallback_return_value (Union[Unset, Any], optional): The fallback return value for tasks
-        that encounter errors. Defaults to _unset.
-        termination_signal (signal.Signals, optional): The signal handled to terminate the executor.
-        Defaults to signal.SIGINT.
-    """
-    def __init__(
-        self,
-        generation_fn: Callable[[Any], Coroutine[Any, Any, Any]],
-        concurrency: int = 3,
-        tqdm_bar_format: Optional[str] = None,
-        max_retries: int = 10,
-        exit_on_error: bool = True,
-        fallback_return_value: Union[Unset, Any] = _unset,
-        termination_signal: signal.Signals = signal.SIGINT,
-    ):
-        self.generate = generation_fn
-        self.fallback_return_value = fallback_return_value
-        self.concurrency = concurrency
-        self.tqdm_bar_format = tqdm_bar_format
-        self.max_retries = max_retries
-        self.exit_on_error = exit_on_error
-        # Priority of a first attempt; each retry is requeued at ``priority - 1``.
-        self.base_priority = 0
-        self.termination_signal = termination_signal
-    async def producer(
-        self,
-        inputs: Sequence[Any],
-        queue: asyncio.PriorityQueue[Tuple[int, Any]],
-        max_fill: int,
-        done_producing: asyncio.Event,
-        termination_signal: asyncio.Event,
-    ) -> None:
-        """
-        Enqueue every input as ``(base_priority, (index, input))``.
-        Stops early once ``termination_signal`` (an asyncio.Event here, not an OS signal) is set,
-        and always sets ``done_producing`` on exit so consumers know no more items will arrive.
-        """
-        try:
-            for index, item in enumerate(inputs):
-                if termination_signal.is_set():
-                    break
-                while queue.qsize() >= max_fill:
-                    # keep room in the queue for requeues
-                    await asyncio.sleep(1)
-                await queue.put((self.base_priority, (index, item)))
-        finally:
-            done_producing.set()
-    async def consumer(
-        self,
-        output: List[Any],
-        queue: asyncio.PriorityQueue[Tuple[int, Any]],
-        done_producing: asyncio.Event,
-        termination_event: asyncio.Event,
-        progress_bar: tqdm[Any],
-    ) -> None:
-        """
-        Pull items from ``queue``, run ``self.generate`` on each and store results in ``output``.
-        The loop ends when the producer is done and the queue is empty. Failed items are requeued
-        with a lower priority value until ``max_retries`` retries have been used; PhoenixException
-        is never retried. Items that exceed the 120 second wait are requeued at base priority.
-        """
-        termination_event_watcher = None
-        while True:
-            marked_done = False
-            try:
-                priority, item = await asyncio.wait_for(queue.get(), timeout=1)
-            except asyncio.TimeoutError:
-                if done_producing.is_set() and queue.empty():
-                    break
-                continue
-            if termination_event.is_set():
-                # discard any remaining items in the queue
-                queue.task_done()
-                continue
-            index, payload = item
-            try:
-                generate_task = asyncio.create_task(self.generate(payload))
-                termination_event_watcher = asyncio.create_task(termination_event.wait())
-                done, _ = await asyncio.wait(
-                    [generate_task, termination_event_watcher],
-                    timeout=120,
-                    return_when=asyncio.FIRST_COMPLETED,
-                )
-                if generate_task in done:
-                    output[index] = generate_task.result()
-                    progress_bar.update()
-                elif termination_event.is_set():
-                    # discard the pending task and remaining items in the queue
-                    if not generate_task.done():
-                        generate_task.cancel()
-                        try:
-                            # allow any cleanup to finish for the cancelled task
-                            await generate_task
-                        except asyncio.CancelledError:
-                            # Handle the cancellation exception
-                            pass
-                    queue.task_done()
-                    marked_done = True
-                    continue
-                else:
-                    # asyncio.wait does not cancel on timeout, so stop the stale attempt
-                    # explicitly; otherwise it keeps running alongside the requeued one.
-                    generate_task.cancel()
-                    tqdm.write("Worker timeout, requeuing")
-                    # task timeouts are requeued at base priority
-                    await queue.put((self.base_priority, item))
-            except Exception as exc:
-                is_phoenix_exception = isinstance(exc, PhoenixException)
-                # abs(priority) is the number of retries already used; strict "<" caps the
-                # number of retries at max_retries, matching SyncExecutor.
-                if (retry_count := abs(priority)) < self.max_retries and not is_phoenix_exception:
-                    tqdm.write(
-                        f"Exception in worker on attempt {retry_count + 1}: raised {repr(exc)}"
-                    )
-                    tqdm.write("Requeuing...")
-                    await queue.put((priority - 1, item))
-                else:
-                    tqdm.write(f"Exception in worker: {traceback.format_exc()}")
-                    if self.exit_on_error:
-                        termination_event.set()
-                    else:
-                        progress_bar.update()
-            finally:
-                if not marked_done:
-                    queue.task_done()
-                if termination_event_watcher and not termination_event_watcher.done():
-                    termination_event_watcher.cancel()
-    async def execute(self, inputs: Sequence[Any]) -> List[Any]:
-        """
-        Run ``self.generate`` over ``inputs`` with ``self.concurrency`` consumers.
-        Returns a list the same length as ``inputs``; positions that were never filled hold
-        ``self.fallback_return_value``. While running, ``self.termination_signal`` is handled to
-        request early termination; the previously installed handler is restored on exit.
-        """
-        termination_event = asyncio.Event()
-        def termination_handler(signum: int, frame: Any) -> None:
-            termination_event.set()
-            tqdm.write("Process was interrupted. The return value will be incomplete...")
-        previous_handler = signal.signal(self.termination_signal, termination_handler)
-        try:
-            outputs = [self.fallback_return_value] * len(inputs)
-            progress_bar = tqdm(total=len(inputs), bar_format=self.tqdm_bar_format)
-            max_queue_size = 5 * self.concurrency  # limit the queue to bound memory usage
-            # ensure there is always room to requeue
-            max_fill = max_queue_size - (2 * self.concurrency)
-            queue: asyncio.PriorityQueue[Tuple[int, Any]] = asyncio.PriorityQueue(
-                maxsize=max_queue_size
-            )
-            done_producing = asyncio.Event()
-            producer = asyncio.create_task(
-                self.producer(inputs, queue, max_fill, done_producing, termination_event)
-            )
-            consumers = [
-                asyncio.create_task(
-                    self.consumer(outputs, queue, done_producing, termination_event, progress_bar)
-                )
-                for _ in range(self.concurrency)
-            ]
-            await asyncio.gather(producer, *consumers)
-            join_task = asyncio.create_task(queue.join())
-            termination_event_watcher = asyncio.create_task(termination_event.wait())
-            done, _ = await asyncio.wait(
-                [join_task, termination_event_watcher], return_when=asyncio.FIRST_COMPLETED
-            )
-            if termination_event_watcher in done:
-                # Cancel all tasks
-                if not join_task.done():
-                    join_task.cancel()
-                if not producer.done():
-                    producer.cancel()
-                for task in consumers:
-                    if not task.done():
-                        task.cancel()
-            if not termination_event_watcher.done():
-                termination_event_watcher.cancel()
-            return outputs
-        finally:
-            # Restore whatever handler was active before this call. signal.signal returns None
-            # when the previous handler was not installed from Python; fall back to SIG_DFL then.
-            signal.signal(
-                self.termination_signal,
-                signal.SIG_DFL if previous_handler is None else previous_handler,
-            )
-    def run(self, inputs: Sequence[Any]) -> List[Any]:
-        """Synchronous entry point: run ``execute`` to completion with ``asyncio.run``."""
-        return asyncio.run(self.execute(inputs))
-class SyncExecutor(Executor):
-    """
-    Synchronous executor for generating outputs from inputs using a given generation function.
-    Args:
-        generation_fn (Callable[[Any], Any]): The generation function that takes an input and
-        returns an output.
-        tqdm_bar_format (Optional[str], optional): The format string for the progress bar. Defaults
-        to None.
-        max_retries (int, optional): The maximum number of times to retry on exceptions. Defaults to
-        10.
-        exit_on_error (bool, optional): Whether to exit execution on the first encountered error.
-        Defaults to True.
-        fallback_return_value (Union[Unset, Any], optional): The fallback return value for tasks
-        that encounter errors. Defaults to _unset.
-        termination_signal (signal.Signals, optional): The signal handled to terminate the executor.
-        Defaults to signal.SIGINT.
-    """
-    def __init__(
-        self,
-        generation_fn: Callable[[Any], Any],
-        tqdm_bar_format: Optional[str] = None,
-        max_retries: int = 10,
-        exit_on_error: bool = True,
-        fallback_return_value: Union[Unset, Any] = _unset,
-        termination_signal: signal.Signals = signal.SIGINT,
-    ):
-        self.generate = generation_fn
-        self.fallback_return_value = fallback_return_value
-        self.tqdm_bar_format = tqdm_bar_format
-        self.max_retries = max_retries
-        self.exit_on_error = exit_on_error
-        self.termination_signal = termination_signal
-        # Set by the signal handler; checked before every attempt in ``run``.
-        self._TERMINATE = False
-    def _signal_handler(self, signum: int, frame: Any) -> None:
-        """Signal handler installed by ``run``: flag the executor to stop before the next attempt."""
-        tqdm.write("Process was interrupted. The return value will be incomplete...")
-        self._TERMINATE = True
-    def run(self, inputs: Sequence[Any]) -> List[Any]:
-        """
-        Apply ``self.generate`` to each input in order, retrying failures up to ``max_retries``.
-        Returns a list the same length as ``inputs``; positions that were never filled hold
-        ``self.fallback_return_value``. PhoenixException is never retried. The handler that was
-        installed for ``self.termination_signal`` before the call is restored on every exit path.
-        """
-        # Clear a flag left over from an earlier interrupted run so the executor is reusable.
-        self._TERMINATE = False
-        previous_handler = signal.signal(self.termination_signal, self._signal_handler)
-        try:
-            outputs = [self.fallback_return_value] * len(inputs)
-            progress_bar = tqdm(total=len(inputs), bar_format=self.tqdm_bar_format)
-            for index, item in enumerate(inputs):
-                try:
-                    for attempt in range(self.max_retries + 1):
-                        if self._TERMINATE:
-                            return outputs
-                        try:
-                            result = self.generate(item)
-                            outputs[index] = result
-                            progress_bar.update()
-                            break
-                        except Exception as exc:
-                            is_phoenix_exception = isinstance(exc, PhoenixException)
-                            if attempt >= self.max_retries or is_phoenix_exception:
-                                # out of retries (or non-retryable): hand off to the outer handler
-                                raise
-                            tqdm.write(f"Exception in worker on attempt {attempt + 1}: {exc}")
-                            tqdm.write("Retrying...")
-                except Exception as exc:
-                    tqdm.write(f"Exception in worker: {exc}")
-                    if self.exit_on_error:
-                        return outputs
-                    progress_bar.update()
-            return outputs
-        finally:
-            # Restore whatever handler was active before this call. signal.signal returns None
-            # when the previous handler was not installed from Python; fall back to SIG_DFL then.
-            signal.signal(
-                self.termination_signal,
-                signal.SIG_DFL if previous_handler is None else previous_handler,
-            )
-def get_executor_on_sync_context(
-    sync_fn: Callable[[Any], Any],
-    async_fn: Callable[[Any], Coroutine[Any, Any, Any]],
-    run_sync: bool = False,
-    concurrency: int = 3,
-    tqdm_bar_format: Optional[str] = None,
-    exit_on_error: bool = True,
-    fallback_return_value: Union[Unset, Any] = _unset,
-) -> Executor:
-    """
-    Choose between a SyncExecutor and an AsyncExecutor for the current calling context.
-    A SyncExecutor wrapping ``sync_fn`` is returned when ``run_sync`` is True, or when an event
-    loop is already running and ``asyncio`` does not carry the ``_nest_patched`` attribute (a
-    warning is logged in that case). Otherwise an AsyncExecutor wrapping ``async_fn`` is returned.
-    """
-    def _make_sync() -> Executor:
-        return SyncExecutor(
-            sync_fn,
-            tqdm_bar_format=tqdm_bar_format,
-            exit_on_error=exit_on_error,
-            fallback_return_value=fallback_return_value,
-        )
-    if run_sync:
-        return _make_sync()
-    # An already-running loop can only be re-entered when asyncio reports being nest-patched.
-    if _running_event_loop_exists() and not getattr(asyncio, "_nest_patched", False):
-        logger.warning(
-            "🐌!! If running llm_classify inside a notebook, patching the event loop with "
-            "nest_asyncio will allow asynchronous eval submission, and is significantly "
-            "faster. To patch the event loop, run `nest_asyncio.apply()`."
-        )
-        return _make_sync()
-    return AsyncExecutor(
-        async_fn,
-        concurrency=concurrency,
-        tqdm_bar_format=tqdm_bar_format,
-        exit_on_error=exit_on_error,
-        fallback_return_value=fallback_return_value,
-    )
-def _running_event_loop_exists() -> bool:
-    """Report whether the caller is executing inside a running asyncio event loop.
-    Returns:
-        bool: True if ``asyncio.get_running_loop()`` succeeds, False if it raises RuntimeError.
-    """
-    try:
-        asyncio.get_running_loop()
-    except RuntimeError:
-        return False
-    else:
-        return True

phoenix/experimental/evals/functions/generate.py DELETED Viewed

@@ -1,138 +0,0 @@
-import logging
-from typing import Any, Callable, Dict, Optional, Tuple, Union
-import pandas as pd
-from phoenix.experimental.evals.functions.executor import (
-    get_executor_on_sync_context,
-)
-from phoenix.experimental.evals.models import BaseEvalModel, set_verbosity
-from phoenix.experimental.evals.templates import (
-    PromptTemplate,
-    map_template,
-    normalize_prompt_template,
-)
-from phoenix.experimental.evals.utils import get_tqdm_progress_bar_formatter
-logger = logging.getLogger(__name__)
-def _no_op_parser(response: str, response_index: int) -> Dict[str, str]:
-    return {"output": response}
-def llm_generate(
-    dataframe: pd.DataFrame,
-    template: Union[PromptTemplate, str],
-    model: BaseEvalModel,
-    system_instruction: Optional[str] = None,
-    verbose: bool = False,
-    output_parser: Optional[Callable[[str, int], Dict[str, Any]]] = None,
-    include_prompt: bool = False,
-    include_response: bool = False,
-    run_sync: bool = False,
-    concurrency: Optional[int] = None,
-) -> pd.DataFrame:
-    """
-    Generates a text using a template using an LLM. This function is useful
-    if you want to generate synthetic data, such as irrelevant responses
-    Args:
-        dataframe (pandas.DataFrame): A pandas dataframe in which each row
-        represents a record to be used as in input to the template. All
-        template variable names must appear as column names in the dataframe
-        (extra columns unrelated to the template are permitted).
-        template (Union[PromptTemplate, str]): The prompt template as either an
-        instance of PromptTemplate or a string. If the latter, the variable
-        names should be surrounded by curly braces so that a call to `.format`
-        can be made to substitute variable values.
-        model (BaseEvalModel): An LLM model class.
-        system_instruction (Optional[str], optional): An optional system
-        message.
-        verbose (bool, optional): If True, prints detailed information to stdout such as model
-        invocation parameters and retry info. Default False.
-        output_parser (Callable[[str, int], Dict[str, Any]], optional): An optional function
-        that takes each generated response and response index and parses it to a dictionary. The
-        keys of the dictionary should correspond to the column names of the output dataframe. If
-        None, the output dataframe will have a single column named "output". Default None.
-        include_prompt (bool, default=False): If True, includes a column named `prompt` in the
-        output dataframe containing the prompt used for each generation.
-        include_response (bool, default=False): If True, includes a column named `response` in the
-        output dataframe containing the raw response from the LLM prior to applying the output
-        parser.
-        run_sync (bool, default=False): If True, forces synchronous request submission. Otherwise
-        evaluations will be run asynchronously if possible.
-        concurrency (Optional[int], default=None): The number of concurrent evals if async
-        submission is possible. If not provided, a recommended default concurrency is set on a
-        per-model basis.
-    Returns:
-        generations_dataframe (pandas.DataFrame): A dataframe where each row
-        represents the generated output
-    """
-    concurrency = concurrency or model.default_concurrency
-    # clients need to be reloaded to ensure that async evals work properly
-    model.reload_client()
-    tqdm_bar_format = get_tqdm_progress_bar_formatter("llm_generate")
-    output_parser = output_parser or _no_op_parser
-    template = normalize_prompt_template(template)
-    logger.info(f"Template: \n{template.prompt()}\n")
-    logger.info(f"Template variables: {template.variables}")
-    prompts = map_template(dataframe, template)
-    async def _run_llm_generation_async(enumerated_prompt: Tuple[int, str]) -> Dict[str, Any]:
-        index, prompt = enumerated_prompt
-        with set_verbosity(model, verbose) as verbose_model:
-            response = await verbose_model._async_generate(
-                prompt,
-                instruction=system_instruction,
-            )
-        parsed_response = output_parser(response, index)
-        if include_prompt:
-            parsed_response["prompt"] = prompt
-        if include_response:
-            parsed_response["response"] = response
-        return parsed_response
-    def _run_llm_generation_sync(enumerated_prompt: Tuple[int, str]) -> Dict[str, Any]:
-        index, prompt = enumerated_prompt
-        with set_verbosity(model, verbose) as verbose_model:
-            response = verbose_model._generate(
-                prompt,
-                instruction=system_instruction,
-            )
-        parsed_response = output_parser(response, index)
-        if include_prompt:
-            parsed_response["prompt"] = prompt
-        if include_response:
-            parsed_response["response"] = response
-        return parsed_response
-    fallback_return_value = {
-        "output": "generation-failed",
-        **({"prompt": ""} if include_prompt else {}),
-        **({"response": ""} if include_response else {}),
-    }
-    executor = get_executor_on_sync_context(
-        _run_llm_generation_sync,
-        _run_llm_generation_async,
-        run_sync=run_sync,
-        concurrency=concurrency,
-        tqdm_bar_format=tqdm_bar_format,
-        exit_on_error=True,
-        fallback_return_value=fallback_return_value,
-    )
-    output = executor.run(list(enumerate(prompts.tolist())))
-    return pd.DataFrame(output)

phoenix/experimental/evals/functions/processing.py DELETED Viewed

@@ -1,76 +0,0 @@
-"""
-Token processing functions for supported models. This module is being deprecated.
-"""
-import logging
-import sys
-from typing import Any, List
-from ..models import BaseEvalModel
-logger = logging.getLogger(__name__)
-_DEPRECATION_WARNING = (
-    "The processing module is being deprecated. For advanced token processing, please use the "
-    "encoding approach recommended by the model provider. For example, OpenAI models can use the "
-    "`tiktoken` library to encode and decode text. For other models, please refer to the model "
-    "provider's documentation."
-)
-def truncate_text_by_model(model: BaseEvalModel, text: str, token_buffer: int = 0) -> str:
-    """Truncates text using a give model token limit.
-    Args:
-        model (BaseEvalModel): The model to use as reference.
-        text (str): The text to be truncated.
-        token_buffer (int, optional): The number of tokens to be left as buffer. For example, if the
-        `model` has a token limit of 1,000 and we want to leave a buffer of 50, the text will be
-        truncated such that the resulting text comprises 950 tokens. Defaults to 0.
-    Returns:
-        str: Truncated text
-    """
-    max_token_count = model.max_context_size - token_buffer
-    tokens = model.get_tokens_from_text(text)
-    if len(tokens) > max_token_count:
-        return model.get_text_from_tokens(tokens[:max_token_count]) + "..."
-    return text
-def concatenate_and_truncate_chunks(
-    chunks: List[str], model: BaseEvalModel, token_buffer: int
-) -> str:
-    """_summary_"""
-    """Given a list of `chunks` of text, this function will return the concatenated chunks
-    truncated to a token limit given by the `model` and `token_buffer`. See the function
-    `truncate_text_by_model` for information on the truncation process.
-    Args:
-        chunks (List[str]): A list of pieces of text.
-        model (BaseEvalModel): The model to use as reference.
-        token_buffer (int): The number of tokens to be left as buffer. For example, if the
-        `model` has a token limit of 1,000 and we want to leave a buffer of 50, the text will be
-        truncated such that the resulting text comprises 950 tokens. Defaults to 0.
-    Returns:
-        str: _description_
-    """
-    return truncate_text_by_model(model=model, text=" ".join(chunks), token_buffer=token_buffer)
-class _DEPRECATED_MODULE:
-    __all__ = ("truncate_text_by_model", "concatenate_and_truncate_chunks")
-    def __getattr__(self, name: str) -> Any:
-        if name == "truncate_text_by_model":
-            logger.warning(_DEPRECATION_WARNING)
-            return truncate_text_by_model
-        if name == "concatenate_and_truncate_chunks":
-            logger.warning(_DEPRECATION_WARNING)
-            return concatenate_and_truncate_chunks
-        raise AttributeError(f"module {__name__} has no attribute {name}")
-# See e.g. https://stackoverflow.com/a/7668273
-sys.modules[__name__] = _DEPRECATED_MODULE()  # type: ignore

phoenix/experimental/evals/models/__init__.py DELETED Viewed

@@ -1,14 +0,0 @@
-from .base import BaseEvalModel, set_verbosity
-from .bedrock import BedrockModel
-from .litellm import LiteLLMModel
-from .openai import OpenAIModel
-from .vertexai import VertexAIModel
-__all__ = [
-    "BedrockModel",
-    "BaseEvalModel",
-    "LiteLLMModel",
-    "OpenAIModel",
-    "VertexAIModel",
-    "set_verbosity",
-]

arize-phoenix 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl

Potentially problematic release.

arize-phoenix 3.16.1__py3-none-any.whl → 7.7.0__py3-none-any.whl