npm - @huggingface/tasks - Versions diffs - 0.20.7 → 0.20.8 - Mend

@huggingface/tasks 0.20.7 → 0.20.8

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (8)

package/dist/commonjs/eval.d.ts +5 -0
package/dist/commonjs/eval.d.ts.map +1 -1
package/dist/commonjs/eval.js +5 -0
package/dist/esm/eval.d.ts +5 -0
package/dist/esm/eval.d.ts.map +1 -1
package/dist/esm/eval.js +5 -0
package/package.json +1 -1
package/src/eval.ts +6 -0

package/dist/commonjs/eval.d.ts CHANGED Viewed

@@ -52,5 +52,10 @@ export declare const EVALUATION_FRAMEWORKS: {
         readonly description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.";
         readonly url: "https://github.com/NVIDIA-NeMo/Evaluator";
     };
+    readonly "yc-bench": {
+        readonly name: "yc-bench";
+        readonly description: "YC Bench is a long-horizon deterministic benchmark for LLM agents. The agent plays CEO of an AI startup over a simulated 1–3 year run.";
+        readonly url: "https://github.com/collinear-ai/yc-bench";
+    };
 };
 //# sourceMappingURL=eval.d.ts.map

package/dist/commonjs/eval.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB~~;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAsDxB~~,CAAC"}
1	+ {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA4DxB,CAAC"}

package/dist/commonjs/eval.js CHANGED Viewed

@@ -55,4 +55,9 @@ exports.EVALUATION_FRAMEWORKS = {
         description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.",
         url: "https://github.com/NVIDIA-NeMo/Evaluator",
     },
+    "yc-bench": {
+        name: "yc-bench",
+        description: "YC Bench is a long-horizon deterministic benchmark for LLM agents. The agent plays CEO of an AI startup over a simulated 1–3 year run.",
+        url: "https://github.com/collinear-ai/yc-bench",
+    },
 };

package/dist/esm/eval.d.ts CHANGED Viewed

@@ -52,5 +52,10 @@ export declare const EVALUATION_FRAMEWORKS: {
         readonly description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.";
         readonly url: "https://github.com/NVIDIA-NeMo/Evaluator";
     };
+    readonly "yc-bench": {
+        readonly name: "yc-bench";
+        readonly description: "YC Bench is a long-horizon deterministic benchmark for LLM agents. The agent plays CEO of an AI startup over a simulated 1–3 year run.";
+        readonly url: "https://github.com/collinear-ai/yc-bench";
+    };
 };
 //# sourceMappingURL=eval.d.ts.map

package/dist/esm/eval.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB~~;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAsDxB~~,CAAC"}
1	+ {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA4DxB,CAAC"}

package/dist/esm/eval.js CHANGED Viewed

@@ -52,4 +52,9 @@ export const EVALUATION_FRAMEWORKS = {
         description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.",
         url: "https://github.com/NVIDIA-NeMo/Evaluator",
     },
+    "yc-bench": {
+        name: "yc-bench",
+        description: "YC Bench is a long-horizon deterministic benchmark for LLM agents. The agent plays CEO of an AI startup over a simulated 1–3 year run.",
+        url: "https://github.com/collinear-ai/yc-bench",
+    },
 };

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@huggingface/tasks",
-  "version": "0.20.7",
+  "version": "0.20.8",
   "description": "List of ML tasks for huggingface.co/tasks",
   "keywords": [
     "hub",

package/src/eval.ts CHANGED Viewed

@@ -55,4 +55,10 @@ export const EVALUATION_FRAMEWORKS = {
 			"NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.",
 		url: "https://github.com/NVIDIA-NeMo/Evaluator",
 	},
+	"yc-bench": {
+		name: "yc-bench",
+		description:
+			"YC Bench is a long-horizon deterministic benchmark for LLM agents. The agent plays CEO of an AI startup over a simulated 1–3 year run.",
+		url: "https://github.com/collinear-ai/yc-bench",
+	},
 } as const;