@arizeai/phoenix-evals 0.7.0 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
- package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
- package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js +33 -0
- package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
- package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
- package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
- package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js +30 -0
- package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
- package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
- package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
- package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js +86 -0
- package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
- package/dist/esm/__generated__/default_templates/index.d.ts +3 -0
- package/dist/esm/__generated__/default_templates/index.d.ts.map +1 -1
- package/dist/esm/__generated__/default_templates/index.js +3 -0
- package/dist/esm/__generated__/default_templates/index.js.map +1 -1
- package/dist/esm/core/EvaluatorBase.d.ts.map +1 -1
- package/dist/esm/llm/createCorrectnessEvaluator.d.ts.map +1 -1
- package/dist/esm/llm/createDocumentRelevanceEvaluator.d.ts.map +1 -1
- package/dist/esm/llm/createDocumentRelevanceEvaluator.js.map +1 -1
- package/dist/esm/llm/createFaithfulnessEvaluator.d.ts +24 -0
- package/dist/esm/llm/createFaithfulnessEvaluator.d.ts.map +1 -0
- package/dist/esm/llm/createFaithfulnessEvaluator.js +19 -0
- package/dist/esm/llm/createFaithfulnessEvaluator.js.map +1 -0
- package/dist/esm/llm/createHallucinationEvaluator.d.ts +12 -0
- package/dist/esm/llm/createHallucinationEvaluator.d.ts.map +1 -1
- package/dist/esm/llm/createHallucinationEvaluator.js +17 -0
- package/dist/esm/llm/createHallucinationEvaluator.js.map +1 -1
- package/dist/esm/llm/createToolInvocationEvaluator.d.ts +74 -0
- package/dist/esm/llm/createToolInvocationEvaluator.d.ts.map +1 -0
- package/dist/esm/llm/createToolInvocationEvaluator.js +60 -0
- package/dist/esm/llm/createToolInvocationEvaluator.js.map +1 -0
- package/dist/esm/llm/createToolResponseHandlingEvaluator.d.ts +78 -0
- package/dist/esm/llm/createToolResponseHandlingEvaluator.d.ts.map +1 -0
- package/dist/esm/llm/createToolResponseHandlingEvaluator.js +59 -0
- package/dist/esm/llm/createToolResponseHandlingEvaluator.js.map +1 -0
- package/dist/esm/llm/createToolSelectionEvaluator.d.ts +64 -0
- package/dist/esm/llm/createToolSelectionEvaluator.d.ts.map +1 -0
- package/dist/esm/llm/createToolSelectionEvaluator.js +50 -0
- package/dist/esm/llm/createToolSelectionEvaluator.js.map +1 -0
- package/dist/esm/llm/index.d.ts +9 -5
- package/dist/esm/llm/index.d.ts.map +1 -1
- package/dist/esm/llm/index.js +9 -5
- package/dist/esm/llm/index.js.map +1 -1
- package/dist/esm/tsconfig.esm.tsbuildinfo +1 -1
- package/dist/esm/types/evals.d.ts.map +1 -1
- package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
- package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
- package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js +36 -0
- package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
- package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
- package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
- package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js +33 -0
- package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
- package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
- package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
- package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js +89 -0
- package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
- package/dist/src/__generated__/default_templates/index.d.ts +3 -0
- package/dist/src/__generated__/default_templates/index.d.ts.map +1 -1
- package/dist/src/__generated__/default_templates/index.js +7 -1
- package/dist/src/__generated__/default_templates/index.js.map +1 -1
- package/dist/src/core/EvaluatorBase.d.ts.map +1 -1
- package/dist/src/llm/createCorrectnessEvaluator.d.ts.map +1 -1
- package/dist/src/llm/createDocumentRelevanceEvaluator.d.ts.map +1 -1
- package/dist/src/llm/createDocumentRelevanceEvaluator.js.map +1 -1
- package/dist/src/llm/createFaithfulnessEvaluator.d.ts +24 -0
- package/dist/src/llm/createFaithfulnessEvaluator.d.ts.map +1 -0
- package/dist/src/llm/createFaithfulnessEvaluator.js +30 -0
- package/dist/src/llm/createFaithfulnessEvaluator.js.map +1 -0
- package/dist/src/llm/createHallucinationEvaluator.d.ts +12 -0
- package/dist/src/llm/createHallucinationEvaluator.d.ts.map +1 -1
- package/dist/src/llm/createHallucinationEvaluator.js +17 -0
- package/dist/src/llm/createHallucinationEvaluator.js.map +1 -1
- package/dist/src/llm/createToolInvocationEvaluator.d.ts +74 -0
- package/dist/src/llm/createToolInvocationEvaluator.d.ts.map +1 -0
- package/dist/src/llm/createToolInvocationEvaluator.js +71 -0
- package/dist/src/llm/createToolInvocationEvaluator.js.map +1 -0
- package/dist/src/llm/createToolResponseHandlingEvaluator.d.ts +78 -0
- package/dist/src/llm/createToolResponseHandlingEvaluator.d.ts.map +1 -0
- package/dist/src/llm/createToolResponseHandlingEvaluator.js +70 -0
- package/dist/src/llm/createToolResponseHandlingEvaluator.js.map +1 -0
- package/dist/src/llm/createToolSelectionEvaluator.d.ts +64 -0
- package/dist/src/llm/createToolSelectionEvaluator.d.ts.map +1 -0
- package/dist/src/llm/createToolSelectionEvaluator.js +61 -0
- package/dist/src/llm/createToolSelectionEvaluator.js.map +1 -0
- package/dist/src/llm/index.d.ts +9 -5
- package/dist/src/llm/index.d.ts.map +1 -1
- package/dist/src/llm/index.js +9 -5
- package/dist/src/llm/index.js.map +1 -1
- package/dist/src/types/evals.d.ts.map +1 -1
- package/dist/tsconfig.tsbuildinfo +1 -1
- package/package.json +1 -1
- package/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.ts +35 -0
- package/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.ts +32 -0
- package/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.ts +88 -0
- package/src/__generated__/default_templates/index.ts +3 -0
- package/src/core/EvaluatorBase.ts +3 -3
- package/src/llm/createCorrectnessEvaluator.ts +3 -3
- package/src/llm/createDocumentRelevanceEvaluator.ts +7 -11
- package/src/llm/createFaithfulnessEvaluator.ts +52 -0
- package/src/llm/createHallucinationEvaluator.ts +25 -3
- package/src/llm/createToolInvocationEvaluator.ts +103 -0
- package/src/llm/createToolResponseHandlingEvaluator.ts +109 -0
- package/src/llm/createToolSelectionEvaluator.ts +93 -0
- package/src/llm/index.ts +9 -5
- package/src/types/evals.ts +5 -4
package/src/types/evals.ts
CHANGED
|
@@ -110,8 +110,8 @@ export type CreateLLMEvaluatorArgs<RecordType extends Record<string, unknown>> =
|
|
|
110
110
|
|
|
111
111
|
export interface CreateClassificationEvaluatorArgs<
|
|
112
112
|
RecordType extends Record<string, unknown>,
|
|
113
|
-
>
|
|
114
|
-
|
|
113
|
+
>
|
|
114
|
+
extends CreateClassifierArgs, CreateLLMEvaluatorArgs<RecordType> {
|
|
115
115
|
/**
|
|
116
116
|
* The prompt template to use for classification
|
|
117
117
|
*/
|
|
@@ -156,8 +156,9 @@ interface EvaluatorDescription {
|
|
|
156
156
|
* The Base Evaluator interface
|
|
157
157
|
* This is the interface that all evaluators must implement
|
|
158
158
|
*/
|
|
159
|
-
export interface EvaluatorInterface<
|
|
160
|
-
extends
|
|
159
|
+
export interface EvaluatorInterface<
|
|
160
|
+
ExampleType extends Record<string, unknown>,
|
|
161
|
+
> extends EvaluatorDescription {
|
|
161
162
|
/**
|
|
162
163
|
* The function that evaluates the example
|
|
163
164
|
*/
|