PyPI - arize-phoenix - Versions diffs - 1.9.1rc2__py3-none-any.whl → 2.0.0__py3-none-any.whl - Mend

arize-phoenix 1.9.1rc2__py3-none-any.whl → 2.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of arize-phoenix might be problematic. Click here for more details.

Files changed (21) hide show

{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/METADATA +2 -2
{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/RECORD +21 -19
{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/WHEEL +1 -1
phoenix/__init__.py +1 -1
phoenix/core/traces.py +1 -1
phoenix/exceptions.py +2 -0
phoenix/experimental/evals/__init__.py +3 -2
phoenix/experimental/evals/evaluators.py +89 -46
phoenix/experimental/evals/functions/classify.py +102 -386
phoenix/experimental/evals/functions/executor.py +353 -0
phoenix/experimental/evals/functions/generate.py +76 -32
phoenix/experimental/evals/models/rate_limiters.py +25 -5
phoenix/experimental/evals/templates/__init__.py +0 -2
phoenix/experimental/evals/templates/template.py +2 -5
phoenix/experimental/evals/utils/__init__.py +66 -0
phoenix/server/app.py +3 -2
phoenix/server/main.py +3 -0
phoenix/server/static/index.js +548 -449
phoenix/trace/openai/instrumentor.py +51 -14
{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/licenses/IP_NOTICE +0 -0
{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/licenses/LICENSE +0 -0

{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: arize-phoenix
-Version: 1.9.1rc2
+Version: 2.0.0
 Summary: ML Observability in your notebook
 Project-URL: Documentation, https://docs.arize.com/phoenix/
 Project-URL: Issues, https://github.com/Arize-ai/phoenix/issues
@@ -55,7 +55,7 @@ Requires-Dist: strawberry-graphql[debug-server]==0.208.2; extra == 'dev'
 Provides-Extra: experimental
 Requires-Dist: tenacity; extra == 'experimental'
 Provides-Extra: llama-index
-Requires-Dist: llama-index>=0.9.14; extra == 'llama-index'
+Requires-Dist: llama-index==0.9.14; extra == 'llama-index'
 Description-Content-Type: text/markdown
 <p align="center">

{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/RECORD RENAMED Viewed

@@ -1,6 +1,7 @@
-phoenix/__init__.py,sha256=QB9EbwlNjt7WAQhba0vhPsnO0dyEVYbdrRbKP9ndWMw,1376
+phoenix/__init__.py,sha256=PMI2WOSvZVHGPpuhM_CPM29ejrA1b-XOHI8jJXHWHeE,1373
 phoenix/config.py,sha256=ErvGg22SSiuqPJtIX1WZE5KcM2lt6XOGZ__HwRg3JqA,2390
 phoenix/datetime_utils.py,sha256=D955QLrkgrrSdUM6NyqbCeAu2SMsjhR5rHVQEsVUdng,2773
+phoenix/exceptions.py,sha256=igIWGAg3m8jm5YwQDeCY1p8ml_60A7zaGVXJ1yZhY9s,44
 phoenix/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
 phoenix/services.py,sha256=slL4Uu___QQSKEssgD738-WAld-kzVQnpW92uKLxV4E,4886
 phoenix/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -9,7 +10,7 @@ phoenix/core/evals.py,sha256=tBHVgEEQW6zsNAAQCYIN-BbVHy5Q-hgF5UpQy1SmkwE,6538
 phoenix/core/model.py,sha256=vQ6RxpUPlncezJvur5u6xBN0Lkrk2gW0cTyb-qqaSqA,4713
 phoenix/core/model_schema.py,sha256=rR9VdhL_oXxbprDTPQJBXs5hw5sMPQmzx__m6Kwsxug,50394
 phoenix/core/model_schema_adapter.py,sha256=3GkyzqUST4fYi-Bgs8qAam5hwMCdQRZTDLjZ9Bnzdm4,8268
-phoenix/core/traces.py,sha256=unJ4x-LRBPexCzZPk3ImLcqiXT60u76-ABbgi_eXTgk,14314
+phoenix/core/traces.py,sha256=uNhtCpgXP9L0ahOoP9ZOBmLnubyUTkICiDB4XB-h5GY,14312
 phoenix/datasets/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 phoenix/datasets/dataset.py,sha256=scKVZ7zc6Dpc_ntt-pWhzY-KWqOJEwKePuyNnKSVTGE,30515
 phoenix/datasets/errors.py,sha256=cGp9vxnw4SewFoWBV3ZGMkhE0Kh73lPIv3Ppz_H_RoA,8261
@@ -17,24 +18,25 @@ phoenix/datasets/fixtures.py,sha256=0_PacL3dw49zulKpFpPdhvxJxeGmHTguqIyf2VXkBkk,
 phoenix/datasets/schema.py,sha256=bF1d2Md6NyqQZuC4Ym5A52f2_IcazkyxGFZ11HPqSg0,6668
 phoenix/datasets/validation.py,sha256=dZ9lCFUV0EY7HCkQkQBrs-GLAEIZdpOqUxwD5l4dp88,8294
 phoenix/experimental/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-phoenix/experimental/evals/__init__.py,sha256=dplCn-3MhT1EkiJd-FCPpipYnHG1jJvvikCrhVrRcS8,1446
-phoenix/experimental/evals/evaluators.py,sha256=ZLhuGRVs8S7Z6YRjgtU-7WLJ7pZKD5xTg0tuP6HCPz0,8849
+phoenix/experimental/evals/__init__.py,sha256=90k7hxxghhqDCftoAWsdOiUsJqYwNuJBXjhbpb3Na4I,1499
+phoenix/experimental/evals/evaluators.py,sha256=JEEow9CM3u9GkVey8KEora8e7cbmhJgazd5wh35_LPE,10311
 phoenix/experimental/evals/retrievals.py,sha256=o3fqrsYbYZjyGj_jWkN_9VQVyXjLkDKDw5Ws7l8bwdI,3828
 phoenix/experimental/evals/functions/__init__.py,sha256=3FMGrjmgxegXAwgDV_RpaN-73cFVyBiO8YwZvml5P9c,156
-phoenix/experimental/evals/functions/classify.py,sha256=S711OPnamxE_8hVUUU2dcY4pb5zjGIVNY2-kLBpW9_E,29326
-phoenix/experimental/evals/functions/generate.py,sha256=ju-ZbhgMWw4P7yEligYpRa7yraNsL3En8hoVao_U3X4,3555
+phoenix/experimental/evals/functions/classify.py,sha256=Q0FMOpU6WFr4m3dtBpJlNyrj2ExTYMB-XjR1EreeeXg,18731
+phoenix/experimental/evals/functions/executor.py,sha256=TSw2lVhkl6-VBYcXSlUl3E0U4OuJWnhwhed7NmFgbF8,13376
+phoenix/experimental/evals/functions/generate.py,sha256=sdr6TeXn5JLEKM0NqYtvq01Lq48Q7uatb0fsq5zQgVY,5310
 phoenix/experimental/evals/functions/processing.py,sha256=F4xtLsulLV4a8CkuLldRddsCim75dSTIShEJUYN6I6w,1823
 phoenix/experimental/evals/models/__init__.py,sha256=j1N7DhiOPbcaemtVBONcQ0miNnGQwEXz4u3P3Vwe6-4,320
 phoenix/experimental/evals/models/base.py,sha256=aSE3Al3MsLvzNKuN2e-z6O-RB5mgpisH4UQqwNQcqp0,7734
 phoenix/experimental/evals/models/bedrock.py,sha256=CRPmBuSLc_nRnKKWLHhGMxdWEISIKUJM1tzIlOQ_qWM,7927
 phoenix/experimental/evals/models/litellm.py,sha256=jrRlph22xWxMXMUabUWjIO2e-sHxQzlQwSM-SnAACFQ,4714
 phoenix/experimental/evals/models/openai.py,sha256=Kl2uES3HRcZGFqblfBQZ6D1BpDffuLZDAqVTjhrSXXQ,17101
-phoenix/experimental/evals/models/rate_limiters.py,sha256=aQkgEyeDxWS1yFAX_eagKK2eKuTY0WKD74jFDx9Hgrw,9279
+phoenix/experimental/evals/models/rate_limiters.py,sha256=5GVN0RQKt36Przg3-9jLgocRmyg-tbeO-cdbuLIx89w,10160
 phoenix/experimental/evals/models/vertexai.py,sha256=NfBpQq0l7XzP-wDEDsK27IRiQBzA1GXEdfwlAf8leX4,5609
-phoenix/experimental/evals/templates/__init__.py,sha256=5dXgCvQrHPCvYIOwKUHaEYOzQpHh6fjhe1dUMC2yi2A,1470
+phoenix/experimental/evals/templates/__init__.py,sha256=-KFIVh1xQLPcJP8Mv_tieIndxE02mg_c2QaibAuHJuE,1432
 phoenix/experimental/evals/templates/default_templates.py,sha256=8BetD8Xufc2f62CPZ9mbysyvDofnbFPalwB0u-KckuE,20614
-phoenix/experimental/evals/templates/template.py,sha256=NThw-12f0I-UkwulFJ_ER3T-W5vc2xee0T-joKWT-_U,6178
-phoenix/experimental/evals/utils/__init__.py,sha256=xdryDIwSLKLF0Ps132dxr3BFisIFAveMAgAyFBbym-c,1505
+phoenix/experimental/evals/templates/template.py,sha256=VAX_ZeV3vNWCODipMy7EtaYdQ0c7WA6H2Mx0i1axXf0,6005
+phoenix/experimental/evals/utils/__init__.py,sha256=PnCsNppI9KRFrQpsKWbLN58FNXsnUA3qqjLwNhoe_6Q,3715
 phoenix/experimental/evals/utils/threads.py,sha256=ksI-egarPnlxit0qKKjtjZ2L82qGLxqxZ6s92O0eBA4,1005
 phoenix/metrics/README.md,sha256=5gekqTU-5gGdMwvcfNp2Wlu8p1ul9kGY_jq0XXQusoI,1964
 phoenix/metrics/__init__.py,sha256=sLp7td1GIt_0Z8dPUyP4L0-_4x9c871yAaGX30oMsvg,2433
@@ -50,9 +52,9 @@ phoenix/pointcloud/pointcloud.py,sha256=ms-h1FLC0xXb3sk256zpSuZQDE2hdOAJzRNBklP0
 phoenix/pointcloud/projectors.py,sha256=zO_RrtDYSv2rqVOfIP2_9Cv11Dc8EmcZR94xhFcBYPU,1057
 phoenix/pointcloud/umap_parameters.py,sha256=lJsEOrbSuSiqI7g4Yt6xj7kgYxEqoep4ZHWLr6VWBqw,1760
 phoenix/server/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-phoenix/server/app.py,sha256=BTHd3hK1uCR8FS_EN86dQ5tdvFux6vsF47x_w5l--Z0,7070
+phoenix/server/app.py,sha256=SEKUBgiXCH6tCXelrzbuwuY_EbDFC8CD7J5W7BkZSzM,7125
 phoenix/server/evaluation_handler.py,sha256=HzaoD8Cv9HbEdd0nYSTZoakKsE8Ic5lVjeuBh0vnhoA,1554
-phoenix/server/main.py,sha256=jZipipFs3jUFPr3y_yvqdKEgtjF3TdMK7UYanYqdINQ,6650
+phoenix/server/main.py,sha256=cBJ_S_6TQBlV0Uj6N6ps3xq86VIv6nYKR49OYDcborg,6775
 phoenix/server/span_handler.py,sha256=TCwzbvtKfAc3CaI2Ao7Q5cfORWtQ56cU7j-43wgbOBc,1263
 phoenix/server/thread_server.py,sha256=a9Vnzc69ZLqJbI_FUSOY3eeuYCiCq6aprPj2gS_RB-M,2097
 phoenix/server/api/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -119,7 +121,7 @@ phoenix/server/static/apple-touch-icon-76x76.png,sha256=CT_xT12I0u2i0WU8JzBZBuOQ
 phoenix/server/static/apple-touch-icon.png,sha256=fOfpjqGpWYbJ0eAurKsyoZP1EAs6ZVooBJ_SGk2ZkDs,3801
 phoenix/server/static/favicon.ico,sha256=bY0vvCKRftemZfPShwZtE93DiiQdaYaozkPGwNFr6H8,34494
 phoenix/server/static/index.css,sha256=KKGpx4iwF91VGRm0YN-4cn8oC-oIqC6HecoPf0x3ZM8,1885
-phoenix/server/static/index.js,sha256=huKhVku8d8SJ1kbxInNmUbfwJDuWEHplVlMQE6kDIsM,3195596
+phoenix/server/static/index.js,sha256=hxV2PRT6IFyBLfCFykM1Xi537pefpFiNVeJTcU4YZyI,3216221
 phoenix/server/static/modernizr.js,sha256=mvK-XtkNqjOral-QvzoqsyOMECXIMu5BQwSVN_wcU9c,2564
 phoenix/server/templates/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 phoenix/server/templates/index.html,sha256=UKAw1N5ysyOYiFgP5Hfd4oaSqc_Y7quEtC9FGvtsIBA,1425
@@ -151,7 +153,7 @@ phoenix/trace/llama_index/callback.py,sha256=YW3qqzWZUEs9aiDx-2628Eae_rct_Yb-DDz
 phoenix/trace/llama_index/debug_callback.py,sha256=SKToD9q_QADSGTJ5lhilqRVKaUnUSRXUvURCzN4by2U,1367
 phoenix/trace/llama_index/streaming.py,sha256=5cTtr8evvcEAB88Xb4ih3WEw0xAF4x5W9PehUX9l5_0,3258
 phoenix/trace/openai/__init__.py,sha256=J3G0uqCxGdksUpaQVHds_Egv2drvh8UEqoLjiQAOveg,79
-phoenix/trace/openai/instrumentor.py,sha256=UKbLn7XnhGRDCOmpuvo91yUAXslpSOjzRVdMap3rV-U,23367
+phoenix/trace/openai/instrumentor.py,sha256=H1T2_1uqeH2lKCKeMmirEUl6PRtHQlQTXfsLR_hwDFM,24948
 phoenix/trace/v1/__init__.py,sha256=gzPW6vBuE_Z1bymL935cuiFBty1Tl9v2RCgAKY6vfPM,200
 phoenix/trace/v1/evaluation_pb2.py,sha256=8sXvv2BW_vqD30MOMbmkeE2zpmm7ncik21kl3e-HzeQ,2254
 phoenix/trace/v1/evaluation_pb2.pyi,sha256=cCbbx06gwQmaH14s3J1X25TtaARh-k1abbxQdQCXGm8,4500
@@ -161,8 +163,8 @@ phoenix/trace/v1/utils.py,sha256=j7gunL9CuSi7Xif56oWYGx0sc7KjfJhXzWcJia4ZM-8,178
 phoenix/utilities/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 phoenix/utilities/error_handling.py,sha256=7b5rpGFj9EWZ8yrZK1IHvxB89suWk3lggDayUQcvZds,1946
 phoenix/utilities/logging.py,sha256=lDXd6EGaamBNcQxL4vP1au9-i_SXe0OraUDiJOcszSw,222
-arize_phoenix-1.9.1rc2.dist-info/METADATA,sha256=2mcwsD5CIJSenW4g6OymRAoIzKHlzJbgz6O9LZw0rc4,26313
-arize_phoenix-1.9.1rc2.dist-info/WHEEL,sha256=rKV0FgtKSxe-Q3jTBlmgn27qdhTm0_K1YKwPwAPskZ0,87
-arize_phoenix-1.9.1rc2.dist-info/licenses/IP_NOTICE,sha256=JBqyyCYYxGDfzQ0TtsQgjts41IJoa-hiwDrBjCb9gHM,469
-arize_phoenix-1.9.1rc2.dist-info/licenses/LICENSE,sha256=HFkW9REuMOkvKRACuwLPT0hRydHb3zNg-fdFt94td18,3794
-arize_phoenix-1.9.1rc2.dist-info/RECORD,,
+arize_phoenix-2.0.0.dist-info/METADATA,sha256=aPHvi6tNxDcZhbOnRkeFus1Zw5dvniTbkET_ythER2c,26310
+arize_phoenix-2.0.0.dist-info/WHEEL,sha256=mRYSEL3Ih6g5a_CVMIcwiF__0Ae4_gLYh01YFNwiq1k,87
+arize_phoenix-2.0.0.dist-info/licenses/IP_NOTICE,sha256=JBqyyCYYxGDfzQ0TtsQgjts41IJoa-hiwDrBjCb9gHM,469
+arize_phoenix-2.0.0.dist-info/licenses/LICENSE,sha256=HFkW9REuMOkvKRACuwLPT0hRydHb3zNg-fdFt94td18,3794
+arize_phoenix-2.0.0.dist-info/RECORD,,

{arize_phoenix-1.9.1rc2.dist-info → arize_phoenix-2.0.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: hatchling 1.20.0
+Generator: hatchling 1.21.0
 Root-Is-Purelib: true
 Tag: py3-none-any

phoenix/__init__.py CHANGED Viewed

@@ -6,7 +6,7 @@ from .session.session import NotebookEnvironment, Session, active_session, close
 from .trace.fixtures import load_example_traces
 from .trace.trace_dataset import TraceDataset
-__version__ = "1.9.1rc2"
+__version__ = "2.0.0"
 # module level doc-string
 __doc__ = """

phoenix/core/traces.py CHANGED Viewed

@@ -169,7 +169,7 @@ class Traces:
                 if (
                     (span := self[span_id])
                     and start_time <= span.start_time < stop_time
-                    and (span.parent_id is None) == bool(root_spans_only)
+                    and (not root_spans_only or span.parent_id is None)
                 ):
                     yield span
             return

phoenix/exceptions.py ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ class PhoenixException(Exception):
2	+     pass

phoenix/experimental/evals/__init__.py CHANGED Viewed

@@ -1,3 +1,4 @@
+from .evaluators import LLMEvaluator
 from .functions import llm_classify, llm_generate, run_relevance_eval
 from .models import BedrockModel, LiteLLMModel, OpenAIModel, VertexAIModel
 from .retrievals import compute_precisions_at_k
@@ -8,7 +9,6 @@ from .templates import (
     HALLUCINATION_PROMPT_TEMPLATE,
     HUMAN_VS_AI_PROMPT_RAILS_MAP,
     HUMAN_VS_AI_PROMPT_TEMPLATE,
-    NOT_PARSABLE,
     QA_PROMPT_RAILS_MAP,
     QA_PROMPT_TEMPLATE,
     RAG_RELEVANCY_PROMPT_RAILS_MAP,
@@ -18,7 +18,7 @@ from .templates import (
     ClassificationTemplate,
     PromptTemplate,
 )
-from .utils import download_benchmark_dataset
+from .utils import NOT_PARSABLE, download_benchmark_dataset
 __all__ = [
     "compute_precisions_at_k",
@@ -29,6 +29,7 @@ __all__ = [
     "VertexAIModel",
     "BedrockModel",
     "LiteLLMModel",
+    "LLMEvaluator",
     "PromptTemplate",
     "ClassificationTemplate",
     "CODE_READABILITY_PROMPT_RAILS_MAP",

phoenix/experimental/evals/evaluators.py CHANGED Viewed

@@ -1,10 +1,11 @@
-from typing import List, Mapping, Optional
+from typing import List, Mapping, Optional, Tuple
 from phoenix.experimental.evals.models import set_verbosity
+from phoenix.experimental.evals.utils import parse_openai_function_call, snap_to_rail
 from phoenix.utilities.logging import printif
 from .models import BaseEvalModel
-from .templates import ClassificationTemplate, PromptTemplate
+from .templates import ClassificationTemplate, PromptOptions, PromptTemplate
 Record = Mapping[str, str]
@@ -20,51 +21,80 @@ class LLMEvaluator:
         self,
         model: BaseEvalModel,
         template: ClassificationTemplate,
-        name: str,
-        verbose: bool = False,
     ) -> None:
         """Initializer for LLMEvaluator.
         Args:
             model (BaseEvalModel): The LLM model to use for evaluation.
             template (ClassificationTemplate): The evaluation template.
-            name (str): The name of the evaluator.
-            verbose (bool, optional): Whether to print verbose output.
         """
         self._model = model
         self._template = template
-        self.name = name
-        self._verbose = verbose
-    def evaluate(self, record: Record) -> str:
-        """Evaluates a single record.
+    def evaluate(
+        self,
+        record: Record,
+        provide_explanation: bool = False,
+        verbose: bool = False,
+    ) -> Tuple[str, Optional[str]]:
+        """
+        Evaluates a single record.
         Args:
             record (Record): The record to evaluate.
+            provide_explanation (bool, optional): Whether to provide an
+            explanation.
+            verbose (bool, optional): Whether to print verbose output.
         Returns:
-            EvaluationResult: The result of the evaluation
+            Tuple[str, Optional[str]]: The label and explanation (if provided).
         """
-        prompt = self._template.format(record)
-        with set_verbosity(self._model, self._verbose) as verbose_model:
+        prompt = self._template.format(
+            record, options=PromptOptions(provide_explanation=provide_explanation)
+        )
+        with set_verbosity(self._model, verbose) as verbose_model:
             unparsed_output = verbose_model(prompt)
-        parsed_output = _snap_to_rail(unparsed_output, self._template.rails, self._verbose)
-        return parsed_output
-    async def aevaluate(self, record: Record) -> str:
-        """Evaluates a single record.
+        label, explanation = _extract_label_and_explanation(
+            unparsed_output=unparsed_output,
+            template=self._template,
+            use_openai_function_call=False,
+            provide_explanation=provide_explanation,
+            verbose=verbose,
+        )
+        return label, explanation
+    async def aevaluate(
+        self, record: Record, provide_explanation: bool = False, verbose: bool = False
+    ) -> Tuple[str, Optional[str]]:
+        """
+        Evaluates a single record.
         Args:
             record (Record): The record to evaluate.
+            provide_explanation (bool, optional): Whether to provide an
+            explanation.
+            verbose (bool, optional): Whether to print verbose output.
         Returns:
-            EvaluationResult: The result of the evaluation
+            Tuple[str, Optional[str]]: The label and explanation (if provided).
         """
-        prompt = self._template.format(dict(record))
-        with set_verbosity(self._model, self._verbose) as verbose_model:
+        prompt = self._template.format(
+            record, options=PromptOptions(provide_explanation=provide_explanation)
+        )
+        with set_verbosity(self._model, verbose) as verbose_model:
             unparsed_output = await verbose_model._async_generate(prompt)
-        parsed_output = _snap_to_rail(unparsed_output, self._template.rails, self._verbose)
-        return parsed_output
+        label, explanation = _extract_label_and_explanation(
+            unparsed_output=unparsed_output,
+            template=self._template,
+            use_openai_function_call=False,
+            provide_explanation=provide_explanation,
+            verbose=verbose,
+        )
+        return label, explanation
 class MapReducer:
@@ -202,33 +232,46 @@ class Refiner:
         return model(reduce_prompt)
-def _snap_to_rail(raw_string: Optional[str], rails: List[str], verbose: bool = False) -> str:
+def _extract_label_and_explanation(
+    unparsed_output: str,
+    template: ClassificationTemplate,
+    provide_explanation: bool,
+    use_openai_function_call: bool,
+    verbose: bool,
+) -> Tuple[str, Optional[str]]:
     """
-    Snaps a string to the nearest rail, or returns None if the string cannot be
-    snapped to a rail.
+    Extracts the label and explanation from the unparsed output.
     Args:
-        raw_string (str): An input to be snapped to a rail.
+        unparsed_output (str): The raw output to be parsed.
+        template (ClassificationTemplate): The template used to generate the
+        output.
-        rails (List[str]): The target set of strings to snap to.
+        provide_explanation (bool): Whether the output includes an explanation.
+        use_openai_function_call (bool): Whether the output was generated using
+        function calling.
+        verbose (bool): If True, print verbose output to stdout.
     Returns:
-        str: A string from the rails argument or "UNPARSABLE" if the input
-        string could not be snapped.
+        Tuple[str, Optional[str]]: A tuple containing the label and an
+        explanation (if one is provided).
     """
-    if not raw_string:
-        return NOT_PARSABLE
-    snap_string = raw_string.lower()
-    rails = list(set(rail.lower() for rail in rails))
-    rails.sort(key=len, reverse=True)
-    found_rails = set()
-    for rail in rails:
-        if rail in snap_string:
-            found_rails.add(rail)
-            snap_string = snap_string.replace(rail, "")
-    if len(found_rails) != 1:
-        printif(verbose, f"- Cannot snap {repr(raw_string)} to rails")
-        return NOT_PARSABLE
-    rail = list(found_rails)[0]
-    printif(verbose, f"- Snapped {repr(raw_string)} to rail: {rail}")
-    return rail
+    if not use_openai_function_call:
+        if provide_explanation:
+            unrailed_label, explanation = (
+                template.extract_label_from_explanation(unparsed_output),
+                unparsed_output,
+            )
+            printif(
+                verbose and unrailed_label == NOT_PARSABLE,
+                f"- Could not parse {repr(unparsed_output)}",
+            )
+        else:
+            unrailed_label = unparsed_output
+            explanation = None
+    else:
+        unrailed_label, explanation = parse_openai_function_call(unparsed_output)
+    return snap_to_rail(unrailed_label, template.rails, verbose=verbose), explanation

arize-phoenix 1.9.1rc2__py3-none-any.whl → 2.0.0__py3-none-any.whl

Potentially problematic release.

arize-phoenix 1.9.1rc2__py3-none-any.whl → 2.0.0__py3-none-any.whl