npm - @huggingface/tasks - Versions diffs - 0.19.89 → 0.19.90 - Mend

@huggingface/tasks 0.19.89 → 0.19.90

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/dist/commonjs/eval.d.ts +7 -2
package/dist/commonjs/eval.d.ts.map +1 -1
package/dist/commonjs/eval.js +7 -2
package/dist/esm/eval.d.ts +7 -2
package/dist/esm/eval.d.ts.map +1 -1
package/dist/esm/eval.js +7 -2
package/package.json +1 -1
package/src/eval.ts +8 -2

package/dist/commonjs/eval.d.ts CHANGED Viewed

@@ -17,8 +17,8 @@ export declare const EVALUATION_FRAMEWORKS: {
         readonly description: "Multimodal toolbox for evaluating embeddings and retrieval systems.";
         readonly url: "https://github.com/embeddings-benchmark/mteb";
     };
-    readonly "olmo-bench": {
-        readonly name: "olmo-bench";
+    readonly "olmocr-bench": {
+        readonly name: "olmocr-bench";
         readonly description: "olmOCR-Bench is a framework for evaluating document-level OCR of various tools.";
         readonly url: "https://github.com/allenai/olmocr/tree/main/olmocr/bench";
     };
@@ -42,5 +42,10 @@ export declare const EVALUATION_FRAMEWORKS: {
         readonly description: "SWE-Bench Pro is a challenging benchmark evaluating LLMs/Agents on long-horizon software engineering tasks.";
         readonly url: "https://github.com/scaleapi/SWE-bench_Pro-os";
     };
+    readonly "nemo-evaluator": {
+        readonly name: "nemo-evaluator";
+        readonly description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.";
+        readonly url: "https://github.com/NVIDIA-NeMo/Evaluator";
+    };
 };
 //# sourceMappingURL=eval.d.ts.map

package/dist/commonjs/eval.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA0CxB,CAAC"}
1	+ {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAgDxB,CAAC"}

package/dist/commonjs/eval.js CHANGED Viewed

@@ -20,8 +20,8 @@ exports.EVALUATION_FRAMEWORKS = {
         description: "Multimodal toolbox for evaluating embeddings and retrieval systems.",
         url: "https://github.com/embeddings-benchmark/mteb",
     },
-    "olmo-bench": {
-        name: "olmo-bench",
+    "olmocr-bench": {
+        name: "olmocr-bench",
         description: "olmOCR-Bench is a framework for evaluating document-level OCR of various tools.",
         url: "https://github.com/allenai/olmocr/tree/main/olmocr/bench",
     },
@@ -45,4 +45,9 @@ exports.EVALUATION_FRAMEWORKS = {
         description: "SWE-Bench Pro is a challenging benchmark evaluating LLMs/Agents on long-horizon software engineering tasks.",
         url: "https://github.com/scaleapi/SWE-bench_Pro-os",
     },
+    "nemo-evaluator": {
+        name: "nemo-evaluator",
+        description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.",
+        url: "https://github.com/NVIDIA-NeMo/Evaluator",
+    },
 };

package/dist/esm/eval.d.ts CHANGED Viewed

@@ -17,8 +17,8 @@ export declare const EVALUATION_FRAMEWORKS: {
         readonly description: "Multimodal toolbox for evaluating embeddings and retrieval systems.";
         readonly url: "https://github.com/embeddings-benchmark/mteb";
     };
-    readonly "olmo-bench": {
-        readonly name: "olmo-bench";
+    readonly "olmocr-bench": {
+        readonly name: "olmocr-bench";
         readonly description: "olmOCR-Bench is a framework for evaluating document-level OCR of various tools.";
         readonly url: "https://github.com/allenai/olmocr/tree/main/olmocr/bench";
     };
@@ -42,5 +42,10 @@ export declare const EVALUATION_FRAMEWORKS: {
         readonly description: "SWE-Bench Pro is a challenging benchmark evaluating LLMs/Agents on long-horizon software engineering tasks.";
         readonly url: "https://github.com/scaleapi/SWE-bench_Pro-os";
     };
+    readonly "nemo-evaluator": {
+        readonly name: "nemo-evaluator";
+        readonly description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.";
+        readonly url: "https://github.com/NVIDIA-NeMo/Evaluator";
+    };
 };
 //# sourceMappingURL=eval.d.ts.map

package/dist/esm/eval.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA0CxB,CAAC"}
1	+ {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../src/eval.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,eAAO,MAAM,qBAAqB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAgDxB,CAAC"}

package/dist/esm/eval.js CHANGED Viewed

@@ -17,8 +17,8 @@ export const EVALUATION_FRAMEWORKS = {
         description: "Multimodal toolbox for evaluating embeddings and retrieval systems.",
         url: "https://github.com/embeddings-benchmark/mteb",
     },
-    "olmo-bench": {
-        name: "olmo-bench",
+    "olmocr-bench": {
+        name: "olmocr-bench",
         description: "olmOCR-Bench is a framework for evaluating document-level OCR of various tools.",
         url: "https://github.com/allenai/olmocr/tree/main/olmocr/bench",
     },
@@ -42,4 +42,9 @@ export const EVALUATION_FRAMEWORKS = {
         description: "SWE-Bench Pro is a challenging benchmark evaluating LLMs/Agents on long-horizon software engineering tasks.",
         url: "https://github.com/scaleapi/SWE-bench_Pro-os",
     },
+    "nemo-evaluator": {
+        name: "nemo-evaluator",
+        description: "NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.",
+        url: "https://github.com/NVIDIA-NeMo/Evaluator",
+    },
 };

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@huggingface/tasks",
-  "version": "0.19.89",
+  "version": "0.19.90",
   "description": "List of ML tasks for huggingface.co/tasks",
   "keywords": [
     "hub",

package/src/eval.ts CHANGED Viewed

@@ -17,8 +17,8 @@ export const EVALUATION_FRAMEWORKS = {
 		description: "Multimodal toolbox for evaluating embeddings and retrieval systems.",
 		url: "https://github.com/embeddings-benchmark/mteb",
 	},
-	"olmo-bench": {
-		name: "olmo-bench",
+	"olmocr-bench": {
+		name: "olmocr-bench",
 		description: "olmOCR-Bench is a framework for evaluating document-level OCR of various tools.",
 		url: "https://github.com/allenai/olmocr/tree/main/olmocr/bench",
 	},
@@ -43,4 +43,10 @@ export const EVALUATION_FRAMEWORKS = {
 			"SWE-Bench Pro is a challenging benchmark evaluating LLMs/Agents on long-horizon software engineering tasks.",
 		url: "https://github.com/scaleapi/SWE-bench_Pro-os",
 	},
+	"nemo-evaluator": {
+		name: "nemo-evaluator",
+		description:
+			"NeMo Evaluator is an open-source platform for robust, reproducible, and scalable evaluation of Large Language Models across 100+ benchmarks.",
+		url: "https://github.com/NVIDIA-NeMo/Evaluator",
+	},
 } as const;