vitest-evals 0.1.4 → 0.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +16 -11
- package/dist/compatibility.test.d.mts +2 -0
- package/dist/compatibility.test.d.ts +2 -0
- package/dist/compatibility.test.js +45009 -0
- package/dist/compatibility.test.js.map +1 -0
- package/dist/compatibility.test.mjs +45864 -0
- package/dist/compatibility.test.mjs.map +1 -0
- package/dist/formatScores.test.d.mts +2 -0
- package/dist/formatScores.test.d.ts +2 -0
- package/dist/formatScores.test.js +195 -0
- package/dist/formatScores.test.js.map +1 -0
- package/dist/formatScores.test.mjs +194 -0
- package/dist/formatScores.test.mjs.map +1 -0
- package/dist/index.d.mts +9 -1
- package/dist/index.d.ts +9 -1
- package/dist/index.js +18 -13
- package/dist/index.js.map +1 -1
- package/dist/index.mjs +18 -13
- package/dist/index.mjs.map +1 -1
- package/dist/reporter.d.mts +7 -0
- package/dist/reporter.d.ts +7 -0
- package/dist/reporter.js +53 -0
- package/dist/reporter.js.map +1 -0
- package/dist/reporter.mjs +22 -0
- package/dist/reporter.mjs.map +1 -0
- package/dist/wrapText.test.d.mts +2 -0
- package/dist/wrapText.test.d.ts +2 -0
- package/dist/wrapText.test.js +162 -0
- package/dist/wrapText.test.js.map +1 -0
- package/dist/wrapText.test.mjs +161 -0
- package/dist/wrapText.test.mjs.map +1 -0
- package/package.json +27 -14
package/README.md
CHANGED
|
@@ -18,7 +18,7 @@ async function answerQuestion(prompt: string) {
|
|
|
18
18
|
const { text } = await generateText({
|
|
19
19
|
model,
|
|
20
20
|
prompt,
|
|
21
|
-
})
|
|
21
|
+
});
|
|
22
22
|
return text;
|
|
23
23
|
}
|
|
24
24
|
```
|
|
@@ -52,7 +52,7 @@ describeEval("my evals", {
|
|
|
52
52
|
|
|
53
53
|
// The timeout for each test. Defaults to 10s. You may need to increase this if your model
|
|
54
54
|
// provider has high latency or you're using a large number of scorers.
|
|
55
|
-
// timeout:
|
|
55
|
+
// timeout: 60000,
|
|
56
56
|
|
|
57
57
|
// A check to determine if these tests should run. This is helpful to control tests so they only
|
|
58
58
|
// run in certain situations, for example if a model provider's API key is defined.
|
|
@@ -70,7 +70,12 @@ import { Factuality } from "autoevals";
|
|
|
70
70
|
|
|
71
71
|
describe("my test suite", () => {
|
|
72
72
|
it("kind of works", () => {
|
|
73
|
-
expect("What is the capital of France?").toEval(
|
|
73
|
+
expect("What is the capital of France?").toEval(
|
|
74
|
+
"Paris",
|
|
75
|
+
answerQuestion,
|
|
76
|
+
Factuality,
|
|
77
|
+
0.8
|
|
78
|
+
);
|
|
74
79
|
});
|
|
75
80
|
});
|
|
76
81
|
```
|
|
@@ -81,28 +86,28 @@ Scorers are compatible with the `autoevals` interface, but are also simple to im
|
|
|
81
86
|
|
|
82
87
|
```javascript
|
|
83
88
|
export const Contains = async (opts: {
|
|
84
|
-
input: string
|
|
85
|
-
expected: string
|
|
86
|
-
output: string
|
|
89
|
+
input: string,
|
|
90
|
+
expected: string,
|
|
91
|
+
output: string,
|
|
87
92
|
}) => {
|
|
88
93
|
return {
|
|
89
94
|
score: output.indexOf(expected) !== -1 ? 1.0 : 0.0,
|
|
90
95
|
};
|
|
91
|
-
}
|
|
96
|
+
};
|
|
92
97
|
```
|
|
93
98
|
|
|
94
99
|
For something more realistic, here's a reimplementation of the Factuality scorer from `autoevals`, with some flexibility
|
|
95
100
|
on the model, enabling you to evaluate against multiple models:
|
|
96
101
|
|
|
97
|
-
|
|
102
|
+
````javascript
|
|
98
103
|
import { generateObject, type LanguageModel } from "ai";
|
|
99
104
|
import { z } from "zod";
|
|
100
105
|
|
|
101
106
|
/**
|
|
102
107
|
* A Factuality checker utilizing the `ai` SDK based on the implementation in `autoevals`.
|
|
103
|
-
*
|
|
108
|
+
*
|
|
104
109
|
* @param model - The language model to utilize (via `ai`).
|
|
105
|
-
*
|
|
110
|
+
*
|
|
106
111
|
* @example
|
|
107
112
|
* ```javascript
|
|
108
113
|
* import { openai } from "@ai-sdk/openai";
|
|
@@ -167,7 +172,7 @@ export function Factuality(model: LanguageModel) {
|
|
|
167
172
|
};
|
|
168
173
|
};
|
|
169
174
|
}
|
|
170
|
-
|
|
175
|
+
````
|
|
171
176
|
|
|
172
177
|
### Separating Evals
|
|
173
178
|
|