@arizeai/phoenix-evals 0.7.0 → 0.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (107)
  1. package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
  2. package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
  3. package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js +33 -0
  4. package/dist/esm/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
  5. package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
  6. package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
  7. package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js +30 -0
  8. package/dist/esm/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
  9. package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
  10. package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
  11. package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js +86 -0
  12. package/dist/esm/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
  13. package/dist/esm/__generated__/default_templates/index.d.ts +3 -0
  14. package/dist/esm/__generated__/default_templates/index.d.ts.map +1 -1
  15. package/dist/esm/__generated__/default_templates/index.js +3 -0
  16. package/dist/esm/__generated__/default_templates/index.js.map +1 -1
  17. package/dist/esm/core/EvaluatorBase.d.ts.map +1 -1
  18. package/dist/esm/llm/createCorrectnessEvaluator.d.ts.map +1 -1
  19. package/dist/esm/llm/createDocumentRelevanceEvaluator.d.ts.map +1 -1
  20. package/dist/esm/llm/createDocumentRelevanceEvaluator.js.map +1 -1
  21. package/dist/esm/llm/createFaithfulnessEvaluator.d.ts +24 -0
  22. package/dist/esm/llm/createFaithfulnessEvaluator.d.ts.map +1 -0
  23. package/dist/esm/llm/createFaithfulnessEvaluator.js +19 -0
  24. package/dist/esm/llm/createFaithfulnessEvaluator.js.map +1 -0
  25. package/dist/esm/llm/createHallucinationEvaluator.d.ts +12 -0
  26. package/dist/esm/llm/createHallucinationEvaluator.d.ts.map +1 -1
  27. package/dist/esm/llm/createHallucinationEvaluator.js +17 -0
  28. package/dist/esm/llm/createHallucinationEvaluator.js.map +1 -1
  29. package/dist/esm/llm/createToolInvocationEvaluator.d.ts +74 -0
  30. package/dist/esm/llm/createToolInvocationEvaluator.d.ts.map +1 -0
  31. package/dist/esm/llm/createToolInvocationEvaluator.js +60 -0
  32. package/dist/esm/llm/createToolInvocationEvaluator.js.map +1 -0
  33. package/dist/esm/llm/createToolResponseHandlingEvaluator.d.ts +78 -0
  34. package/dist/esm/llm/createToolResponseHandlingEvaluator.d.ts.map +1 -0
  35. package/dist/esm/llm/createToolResponseHandlingEvaluator.js +59 -0
  36. package/dist/esm/llm/createToolResponseHandlingEvaluator.js.map +1 -0
  37. package/dist/esm/llm/createToolSelectionEvaluator.d.ts +64 -0
  38. package/dist/esm/llm/createToolSelectionEvaluator.d.ts.map +1 -0
  39. package/dist/esm/llm/createToolSelectionEvaluator.js +50 -0
  40. package/dist/esm/llm/createToolSelectionEvaluator.js.map +1 -0
  41. package/dist/esm/llm/index.d.ts +9 -5
  42. package/dist/esm/llm/index.d.ts.map +1 -1
  43. package/dist/esm/llm/index.js +9 -5
  44. package/dist/esm/llm/index.js.map +1 -1
  45. package/dist/esm/tsconfig.esm.tsbuildinfo +1 -1
  46. package/dist/esm/types/evals.d.ts.map +1 -1
  47. package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
  48. package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
  49. package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js +36 -0
  50. package/dist/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
  51. package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
  52. package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
  53. package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js +33 -0
  54. package/dist/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
  55. package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts +3 -0
  56. package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.d.ts.map +1 -0
  57. package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js +89 -0
  58. package/dist/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.js.map +1 -0
  59. package/dist/src/__generated__/default_templates/index.d.ts +3 -0
  60. package/dist/src/__generated__/default_templates/index.d.ts.map +1 -1
  61. package/dist/src/__generated__/default_templates/index.js +7 -1
  62. package/dist/src/__generated__/default_templates/index.js.map +1 -1
  63. package/dist/src/core/EvaluatorBase.d.ts.map +1 -1
  64. package/dist/src/llm/createCorrectnessEvaluator.d.ts.map +1 -1
  65. package/dist/src/llm/createDocumentRelevanceEvaluator.d.ts.map +1 -1
  66. package/dist/src/llm/createDocumentRelevanceEvaluator.js.map +1 -1
  67. package/dist/src/llm/createFaithfulnessEvaluator.d.ts +24 -0
  68. package/dist/src/llm/createFaithfulnessEvaluator.d.ts.map +1 -0
  69. package/dist/src/llm/createFaithfulnessEvaluator.js +30 -0
  70. package/dist/src/llm/createFaithfulnessEvaluator.js.map +1 -0
  71. package/dist/src/llm/createHallucinationEvaluator.d.ts +12 -0
  72. package/dist/src/llm/createHallucinationEvaluator.d.ts.map +1 -1
  73. package/dist/src/llm/createHallucinationEvaluator.js +17 -0
  74. package/dist/src/llm/createHallucinationEvaluator.js.map +1 -1
  75. package/dist/src/llm/createToolInvocationEvaluator.d.ts +74 -0
  76. package/dist/src/llm/createToolInvocationEvaluator.d.ts.map +1 -0
  77. package/dist/src/llm/createToolInvocationEvaluator.js +71 -0
  78. package/dist/src/llm/createToolInvocationEvaluator.js.map +1 -0
  79. package/dist/src/llm/createToolResponseHandlingEvaluator.d.ts +78 -0
  80. package/dist/src/llm/createToolResponseHandlingEvaluator.d.ts.map +1 -0
  81. package/dist/src/llm/createToolResponseHandlingEvaluator.js +70 -0
  82. package/dist/src/llm/createToolResponseHandlingEvaluator.js.map +1 -0
  83. package/dist/src/llm/createToolSelectionEvaluator.d.ts +64 -0
  84. package/dist/src/llm/createToolSelectionEvaluator.d.ts.map +1 -0
  85. package/dist/src/llm/createToolSelectionEvaluator.js +61 -0
  86. package/dist/src/llm/createToolSelectionEvaluator.js.map +1 -0
  87. package/dist/src/llm/index.d.ts +9 -5
  88. package/dist/src/llm/index.d.ts.map +1 -1
  89. package/dist/src/llm/index.js +9 -5
  90. package/dist/src/llm/index.js.map +1 -1
  91. package/dist/src/types/evals.d.ts.map +1 -1
  92. package/dist/tsconfig.tsbuildinfo +1 -1
  93. package/package.json +1 -1
  94. package/src/__generated__/default_templates/FAITHFULNESS_CLASSIFICATION_EVALUATOR_CONFIG.ts +35 -0
  95. package/src/__generated__/default_templates/TOOL_INVOCATION_CLASSIFICATION_EVALUATOR_CONFIG.ts +32 -0
  96. package/src/__generated__/default_templates/TOOL_RESPONSE_HANDLING_CLASSIFICATION_EVALUATOR_CONFIG.ts +88 -0
  97. package/src/__generated__/default_templates/index.ts +3 -0
  98. package/src/core/EvaluatorBase.ts +3 -3
  99. package/src/llm/createCorrectnessEvaluator.ts +3 -3
  100. package/src/llm/createDocumentRelevanceEvaluator.ts +7 -11
  101. package/src/llm/createFaithfulnessEvaluator.ts +52 -0
  102. package/src/llm/createHallucinationEvaluator.ts +25 -3
  103. package/src/llm/createToolInvocationEvaluator.ts +103 -0
  104. package/src/llm/createToolResponseHandlingEvaluator.ts +109 -0
  105. package/src/llm/createToolSelectionEvaluator.ts +93 -0
  106. package/src/llm/index.ts +9 -5
  107. package/src/types/evals.ts +5 -4
@@ -110,8 +110,8 @@ export type CreateLLMEvaluatorArgs<RecordType extends Record<string, unknown>> =
110
110
 
111
111
  export interface CreateClassificationEvaluatorArgs<
112
112
  RecordType extends Record<string, unknown>,
113
- > extends CreateClassifierArgs,
114
- CreateLLMEvaluatorArgs<RecordType> {
113
+ >
114
+ extends CreateClassifierArgs, CreateLLMEvaluatorArgs<RecordType> {
115
115
  /**
116
116
  * The prompt template to use for classification
117
117
  */
@@ -156,8 +156,9 @@ interface EvaluatorDescription {
156
156
  * The Base Evaluator interface
157
157
  * This is the interface that all evaluators must implement
158
158
  */
159
- export interface EvaluatorInterface<ExampleType extends Record<string, unknown>>
160
- extends EvaluatorDescription {
159
+ export interface EvaluatorInterface<
160
+ ExampleType extends Record<string, unknown>,
161
+ > extends EvaluatorDescription {
161
162
  /**
162
163
  * The function that evaluates the example
163
164
  */