arize-phoenix 0.0.40__tar.gz → 0.0.41__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of arize-phoenix might be problematic. Click here for more details.
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/PKG-INFO +22 -21
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/README.md +21 -20
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/__init__.py +1 -1
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/functions/binary.py +8 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/retrievals.py +3 -1
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/index.js +357 -357
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/fixtures.py +9 -2
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/.gitignore +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/IP_NOTICE +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/LICENSE +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/pyproject.toml +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/config.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/core/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/core/embedding_dimension.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/core/model.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/core/model_schema.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/core/model_schema_adapter.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/core/traces.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datasets/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datasets/dataset.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datasets/errors.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datasets/fixtures.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datasets/schema.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datasets/validation.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/datetime_utils.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/functions/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/functions/common.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/functions/generate.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/models/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/models/base.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/models/openai.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/models/vertexai.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/templates/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/templates/default_templates.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/templates/template.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/utils/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/utils/downloads.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/utils/threads.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/utils/types.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/utils.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/README.md +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/binning.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/metrics.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/mixins.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/timeseries.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/metrics/wrappers.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/pointcloud/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/pointcloud/clustering.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/pointcloud/pointcloud.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/pointcloud/projectors.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/py.typed +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/context.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/helpers.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/ClusterInput.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/Coordinates.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/DataQualityMetricInput.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/DimensionFilter.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/DimensionInput.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/Granularity.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/PerformanceMetricInput.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/SpanSort.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/TimeRange.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/input_types/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/interceptor.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/schema.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Cluster.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DataQualityMetric.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Dataset.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DatasetInfo.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DatasetRole.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DatasetValues.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Dimension.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DimensionDataType.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DimensionShape.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DimensionType.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/DimensionWithValue.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/EmbeddingDimension.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/EmbeddingMetadata.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Event.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/EventMetadata.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/ExportEventsMutation.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/ExportedFile.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Functionality.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/MimeType.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Model.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/NumericRange.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/PerformanceMetric.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/PromptResponse.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Retrieval.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/ScalarDriftMetricEnum.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Segments.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/SortDir.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/Span.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/TimeSeries.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/UMAPPoints.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/VectorDriftMetricEnum.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/node.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/api/types/pagination.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/app.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/main.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/span_handler.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-114x114.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-120x120.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-144x144.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-152x152.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-180x180.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-72x72.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon-76x76.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/apple-touch-icon.png +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/favicon.ico +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/index.css +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/static/modernizr.js +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/templates/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/templates/index.html +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/server/thread_server.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/services.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/session/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/session/session.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/exporter.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/filter.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/langchain/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/langchain/instrumentor.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/langchain/tracer.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/llama_index/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/llama_index/callback.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/schemas.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/semantic_conventions.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/span_json_decoder.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/span_json_encoder.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/trace_dataset.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/tracer.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/utils.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/v1/__init__.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/v1/trace_pb2.py +0 -0
- {arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/trace/v1/trace_pb2.pyi +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: arize-phoenix
|
|
3
|
-
Version: 0.0.40
|
|
3
|
+
Version: 0.0.41
|
|
4
4
|
Summary: ML Observability in your notebook
|
|
5
5
|
Project-URL: Documentation, https://docs.arize.com/phoenix/
|
|
6
6
|
Project-URL: Issues, https://github.com/Arize-ai/phoenix/issues
|
|
@@ -82,28 +82,28 @@ Description-Content-Type: text/markdown
|
|
|
82
82
|
|
|
83
83
|
Phoenix provides MLOps and LLMOps insights at lightning speed with zero-config observability. Phoenix provides a notebook-first experience for monitoring your models and LLM Applications by providing:
|
|
84
84
|
|
|
85
|
-
- **LLM
|
|
85
|
+
- **LLM Traces** - Trace through the execution of your LLM Application to understand the internals of your LLM Application and to troubleshoot problems related to things like retrieval and tool execution.
|
|
86
86
|
- **LLM Evals** - Leverage the power of large language models to evaluate your generative model or application's relevance, toxicity, and more.
|
|
87
87
|
- **Embedding Analysis** - Explore embedding point-clouds and identify clusters of high drift and performance degradation.
|
|
88
|
-
- **RAG
|
|
88
|
+
- **RAG Analysis** - Visualize your generative application's search and retrieval process to improve your retrieval-augmented generation.
|
|
89
89
|
- **Structured Data Analysis** - Statistically analyze your structured data by performing A/B analysis, temporal drift analysis, and more.
|
|
90
90
|
|
|
91
91
|
**Table of Contents**
|
|
92
92
|
|
|
93
|
-
-
|
|
94
|
-
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
-
|
|
98
|
-
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
-
|
|
103
|
-
-
|
|
104
|
-
-
|
|
105
|
-
-
|
|
106
|
-
-
|
|
93
|
+
- [Installation](#installation)
|
|
94
|
+
- [LLM Traces](#llm-traces)
|
|
95
|
+
- [Tracing with LlamaIndex](#tracing-with-llamaindex)
|
|
96
|
+
- [Tracing with LangChain](#tracing-with-langchain)
|
|
97
|
+
- [LLM Evals](#llm-evals)
|
|
98
|
+
- [Embedding Analysis](#embedding-analysis)
|
|
99
|
+
- [UMAP-based Exploratory Data Analysis](#umap-based-exploratory-data-analysis)
|
|
100
|
+
- [Cluster-driven Drift and Performance Analysis](#cluster-driven-drift-and-performance-analysis)
|
|
101
|
+
- [Exportable Clusters](#exportable-clusters)
|
|
102
|
+
- [Retrieval-Augmented Generation Analysis](#retrieval-augmented-generation-analysis)
|
|
103
|
+
- [Structured Data Analysis](#structured-data-analysis)
|
|
104
|
+
- [Community](#community)
|
|
105
|
+
- [Thanks](#thanks)
|
|
106
|
+
- [Copyright, Patent, and License](#copyright-patent-and-license)
|
|
107
107
|
|
|
108
108
|
## Installation
|
|
109
109
|
|
|
@@ -119,7 +119,7 @@ Some functionality such as LLM evals are under the `experimental` subpackage.
|
|
|
119
119
|
pip install arize-phoenix[experimental]
|
|
120
120
|
```
|
|
121
121
|
|
|
122
|
-
## LLM
|
|
122
|
+
## LLM Traces
|
|
123
123
|
|
|
124
124
|

|
|
125
125
|
|
|
@@ -129,7 +129,7 @@ With the advent of powerful LLMs, it is now possible to build LLM Applications t
|
|
|
129
129
|
|
|
130
130
|
[](https://colab.research.google.com/github/Arize-ai/phoenix/blob/main/tutorials/tracing/llama_index_tracing_tutorial.ipynb) [](https://github.com/Arize-ai/phoenix/blob/main/tutorials/tracing/llama_index_tracing_tutorial.ipynb)
|
|
131
131
|
|
|
132
|
-

|
|
133
133
|
|
|
134
134
|
To extract traces from your LlamaIndex application, you will have to add Phoenix's `OpenInferenceTraceCallback` to your LlamaIndex application. A callback (in this case an OpenInference `Tracer`) is a class that automatically accumulates `spans` that trace your application as it executes. The OpenInference `Tracer` is a tracer that is specifically designed to work with Phoenix and by default exports the traces to a locally running phoenix server.
|
|
135
135
|
|
|
@@ -199,12 +199,13 @@ import pandas as pd
|
|
|
199
199
|
# Launch phoenix
|
|
200
200
|
session = px.launch_app()
|
|
201
201
|
|
|
202
|
-
# Once you have started a Phoenix server, you can start your LangChain application with the
|
|
202
|
+
# Once you have started a Phoenix server, you can start your LangChain application with the OpenInferenceTracer as a callback. To do this, you will have to instrument your LangChain application with the tracer:
|
|
203
203
|
|
|
204
|
-
from phoenix.trace.langchain import OpenInferenceTracer
|
|
204
|
+
from phoenix.trace.langchain import OpenInferenceTracer, LangChainInstrumentor
|
|
205
205
|
|
|
206
206
|
# If no exporter is specified, the tracer will export to the locally running Phoenix server
|
|
207
207
|
tracer = OpenInferenceTracer()
|
|
208
|
+
LangChainInstrumentor(tracer).instrument()
|
|
208
209
|
|
|
209
210
|
# Initialize your LangChain application
|
|
210
211
|
from langchain.chains import RetrievalQA
|
|
@@ -28,28 +28,28 @@
|
|
|
28
28
|
|
|
29
29
|
Phoenix provides MLOps and LLMOps insights at lightning speed with zero-config observability. Phoenix provides a notebook-first experience for monitoring your models and LLM Applications by providing:
|
|
30
30
|
|
|
31
|
-
- **LLM
|
|
31
|
+
- **LLM Traces** - Trace through the execution of your LLM Application to understand the internals of your LLM Application and to troubleshoot problems related to things like retrieval and tool execution.
|
|
32
32
|
- **LLM Evals** - Leverage the power of large language models to evaluate your generative model or application's relevance, toxicity, and more.
|
|
33
33
|
- **Embedding Analysis** - Explore embedding point-clouds and identify clusters of high drift and performance degradation.
|
|
34
|
-
- **RAG
|
|
34
|
+
- **RAG Analysis** - Visualize your generative application's search and retrieval process to improve your retrieval-augmented generation.
|
|
35
35
|
- **Structured Data Analysis** - Statistically analyze your structured data by performing A/B analysis, temporal drift analysis, and more.
|
|
36
36
|
|
|
37
37
|
**Table of Contents**
|
|
38
38
|
|
|
39
|
-
-
|
|
40
|
-
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
-
|
|
44
|
-
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
-
|
|
49
|
-
-
|
|
50
|
-
-
|
|
51
|
-
-
|
|
52
|
-
-
|
|
39
|
+
- [Installation](#installation)
|
|
40
|
+
- [LLM Traces](#llm-traces)
|
|
41
|
+
- [Tracing with LlamaIndex](#tracing-with-llamaindex)
|
|
42
|
+
- [Tracing with LangChain](#tracing-with-langchain)
|
|
43
|
+
- [LLM Evals](#llm-evals)
|
|
44
|
+
- [Embedding Analysis](#embedding-analysis)
|
|
45
|
+
- [UMAP-based Exploratory Data Analysis](#umap-based-exploratory-data-analysis)
|
|
46
|
+
- [Cluster-driven Drift and Performance Analysis](#cluster-driven-drift-and-performance-analysis)
|
|
47
|
+
- [Exportable Clusters](#exportable-clusters)
|
|
48
|
+
- [Retrieval-Augmented Generation Analysis](#retrieval-augmented-generation-analysis)
|
|
49
|
+
- [Structured Data Analysis](#structured-data-analysis)
|
|
50
|
+
- [Community](#community)
|
|
51
|
+
- [Thanks](#thanks)
|
|
52
|
+
- [Copyright, Patent, and License](#copyright-patent-and-license)
|
|
53
53
|
|
|
54
54
|
## Installation
|
|
55
55
|
|
|
@@ -65,7 +65,7 @@ Some functionality such as LLM evals are under the `experimental` subpackage.
|
|
|
65
65
|
pip install arize-phoenix[experimental]
|
|
66
66
|
```
|
|
67
67
|
|
|
68
|
-
## LLM
|
|
68
|
+
## LLM Traces
|
|
69
69
|
|
|
70
70
|

|
|
71
71
|
|
|
@@ -75,7 +75,7 @@ With the advent of powerful LLMs, it is now possible to build LLM Applications t
|
|
|
75
75
|
|
|
76
76
|
[](https://colab.research.google.com/github/Arize-ai/phoenix/blob/main/tutorials/tracing/llama_index_tracing_tutorial.ipynb) [](https://github.com/Arize-ai/phoenix/blob/main/tutorials/tracing/llama_index_tracing_tutorial.ipynb)
|
|
77
77
|
|
|
78
|
-

|
|
79
79
|
|
|
80
80
|
To extract traces from your LlamaIndex application, you will have to add Phoenix's `OpenInferenceTraceCallback` to your LlamaIndex application. A callback (in this case an OpenInference `Tracer`) is a class that automatically accumulates `spans` that trace your application as it executes. The OpenInference `Tracer` is a tracer that is specifically designed to work with Phoenix and by default exports the traces to a locally running phoenix server.
|
|
81
81
|
|
|
@@ -145,12 +145,13 @@ import pandas as pd
|
|
|
145
145
|
# Launch phoenix
|
|
146
146
|
session = px.launch_app()
|
|
147
147
|
|
|
148
|
-
# Once you have started a Phoenix server, you can start your LangChain application with the
|
|
148
|
+
# Once you have started a Phoenix server, you can start your LangChain application with the OpenInferenceTracer as a callback. To do this, you will have to instrument your LangChain application with the tracer:
|
|
149
149
|
|
|
150
|
-
from phoenix.trace.langchain import OpenInferenceTracer
|
|
150
|
+
from phoenix.trace.langchain import OpenInferenceTracer, LangChainInstrumentor
|
|
151
151
|
|
|
152
152
|
# If no exporter is specified, the tracer will export to the locally running Phoenix server
|
|
153
153
|
tracer = OpenInferenceTracer()
|
|
154
|
+
LangChainInstrumentor(tracer).instrument()
|
|
154
155
|
|
|
155
156
|
# Initialize your LangChain application
|
|
156
157
|
from langchain.chains import RetrievalQA
|
|
@@ -5,7 +5,7 @@ from .session.session import Session, active_session, close_app, launch_app
|
|
|
5
5
|
from .trace.fixtures import load_example_traces
|
|
6
6
|
from .trace.trace_dataset import TraceDataset
|
|
7
7
|
|
|
8
|
-
__version__ = "0.0.40"
|
|
8
|
+
__version__ = "0.0.41"
|
|
9
9
|
|
|
10
10
|
# module level doc-string
|
|
11
11
|
__doc__ = """
|
{arize_phoenix-0.0.40 → arize_phoenix-0.0.41}/src/phoenix/experimental/evals/functions/binary.py
RENAMED
|
@@ -183,8 +183,16 @@ def _extract_rail(string: str, positive_rail: str, negative_rail: str) -> Option
|
|
|
183
183
|
|
|
184
184
|
string = "regular..irregular" - contains both rails
|
|
185
185
|
Output: None
|
|
186
|
+
|
|
187
|
+
string = "Irregular"
|
|
188
|
+
Output: "irregular"
|
|
186
189
|
"""
|
|
187
190
|
|
|
191
|
+
# Convert the inputs to lowercase for case-insensitive matching
|
|
192
|
+
string = string.lower()
|
|
193
|
+
positive_rail = positive_rail.lower()
|
|
194
|
+
negative_rail = negative_rail.lower()
|
|
195
|
+
|
|
188
196
|
positive_pos, negative_pos = string.find(positive_rail), string.find(negative_rail)
|
|
189
197
|
|
|
190
198
|
# If both positive and negative rails are in the string
|
|
@@ -4,7 +4,6 @@ Helper functions for evaluating the retrieval step of retrieval-augmented genera
|
|
|
4
4
|
|
|
5
5
|
from typing import List, Optional
|
|
6
6
|
|
|
7
|
-
from openai import ChatCompletion
|
|
8
7
|
from tenacity import (
|
|
9
8
|
retry,
|
|
10
9
|
stop_after_attempt,
|
|
@@ -75,6 +74,9 @@ def classify_relevance(query: str, document: str, model_name: str) -> Optional[b
|
|
|
75
74
|
(True meaning relevant, False meaning irrelevant), or None if the LLM produces an
|
|
76
75
|
unparseable output.
|
|
77
76
|
"""
|
|
77
|
+
|
|
78
|
+
from openai import ChatCompletion
|
|
79
|
+
|
|
78
80
|
prompt = _QUERY_CONTEXT_PROMPT_TEMPLATE.format(
|
|
79
81
|
query=query,
|
|
80
82
|
reference=document,
|