@learning-commons/evaluators 0.5.0 → 0.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +8 -0
- package/README.md +12 -0
- package/dist/batch/cli.js +39 -17
- package/dist/batch/cli.js.map +1 -1
- package/dist/batch/index.cjs +21 -8
- package/dist/batch/index.cjs.map +1 -1
- package/dist/batch/index.d.cts +1 -0
- package/dist/batch/index.d.ts +1 -0
- package/dist/batch/index.js +21 -8
- package/dist/batch/index.js.map +1 -1
- package/dist/index.cjs +18 -6
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.cts +2 -0
- package/dist/index.d.ts +2 -0
- package/dist/index.js +18 -6
- package/dist/index.js.map +1 -1
- package/package.json +6 -2
- package/src/batch/README.md +14 -1
package/dist/batch/index.cjs
CHANGED
|
@@ -1304,7 +1304,9 @@ var VocabularyEvaluator = class _VocabularyEvaluator extends BaseEvaluator {
|
|
|
1304
1304
|
reasoning: complexityResponse.data.reasoning,
|
|
1305
1305
|
metadata: {
|
|
1306
1306
|
model: modelLabel,
|
|
1307
|
-
processingTimeMs: latencyMs
|
|
1307
|
+
processingTimeMs: latencyMs,
|
|
1308
|
+
inputTokens: totalTokenUsage.input_tokens,
|
|
1309
|
+
outputTokens: totalTokenUsage.output_tokens
|
|
1308
1310
|
},
|
|
1309
1311
|
_internal: complexityResponse.data
|
|
1310
1312
|
};
|
|
@@ -1634,7 +1636,9 @@ var SentenceStructureEvaluator = class _SentenceStructureEvaluator extends BaseE
|
|
|
1634
1636
|
reasoning: complexityResponse.data.reasoning,
|
|
1635
1637
|
metadata: {
|
|
1636
1638
|
model: this.provider.label,
|
|
1637
|
-
processingTimeMs: latencyMs
|
|
1639
|
+
processingTimeMs: latencyMs,
|
|
1640
|
+
inputTokens: totalTokenUsage.input_tokens,
|
|
1641
|
+
outputTokens: totalTokenUsage.output_tokens
|
|
1638
1642
|
},
|
|
1639
1643
|
_internal: {
|
|
1640
1644
|
sentenceAnalysis: analysisResponse.data,
|
|
@@ -1840,7 +1844,9 @@ var GradeLevelAppropriatenessEvaluator = class extends BaseEvaluator {
|
|
|
1840
1844
|
reasoning: response.data.reasoning,
|
|
1841
1845
|
metadata: {
|
|
1842
1846
|
model: this.provider.label,
|
|
1843
|
-
processingTimeMs: latencyMs
|
|
1847
|
+
processingTimeMs: latencyMs,
|
|
1848
|
+
inputTokens: tokenUsage.input_tokens,
|
|
1849
|
+
outputTokens: tokenUsage.output_tokens
|
|
1844
1850
|
},
|
|
1845
1851
|
_internal: response.data
|
|
1846
1852
|
};
|
|
@@ -2042,7 +2048,9 @@ var SmkEvaluator = class _SmkEvaluator extends BaseEvaluator {
|
|
|
2042
2048
|
reasoning: response.data.reasoning,
|
|
2043
2049
|
metadata: {
|
|
2044
2050
|
model: this.provider.label,
|
|
2045
|
-
processingTimeMs: latencyMs
|
|
2051
|
+
processingTimeMs: latencyMs,
|
|
2052
|
+
inputTokens: totalTokenUsage.input_tokens,
|
|
2053
|
+
outputTokens: totalTokenUsage.output_tokens
|
|
2046
2054
|
},
|
|
2047
2055
|
_internal: response.data
|
|
2048
2056
|
};
|
|
@@ -2248,7 +2256,9 @@ var ConventionalityEvaluator = class _ConventionalityEvaluator extends BaseEvalu
|
|
|
2248
2256
|
reasoning: response.data.reasoning,
|
|
2249
2257
|
metadata: {
|
|
2250
2258
|
model: this.provider.label,
|
|
2251
|
-
processingTimeMs: latencyMs
|
|
2259
|
+
processingTimeMs: latencyMs,
|
|
2260
|
+
inputTokens: totalTokenUsage.input_tokens,
|
|
2261
|
+
outputTokens: totalTokenUsage.output_tokens
|
|
2252
2262
|
},
|
|
2253
2263
|
_internal: response.data
|
|
2254
2264
|
};
|
|
@@ -2523,7 +2533,9 @@ var PurposeEvaluator = class _PurposeEvaluator extends BaseEvaluator {
|
|
|
2523
2533
|
reasoning: response.data.reasoning,
|
|
2524
2534
|
metadata: {
|
|
2525
2535
|
model: this.provider.label,
|
|
2526
|
-
processingTimeMs: latencyMs
|
|
2536
|
+
processingTimeMs: latencyMs,
|
|
2537
|
+
inputTokens: tokenUsage.input_tokens,
|
|
2538
|
+
outputTokens: tokenUsage.output_tokens
|
|
2527
2539
|
},
|
|
2528
2540
|
_internal: response.data
|
|
2529
2541
|
};
|
|
@@ -2636,6 +2648,7 @@ var BatchEvaluator = class {
|
|
|
2636
2648
|
concurrency: 3,
|
|
2637
2649
|
maxRetries: 2,
|
|
2638
2650
|
telemetry: false,
|
|
2651
|
+
bypassRowLimit: false,
|
|
2639
2652
|
...config
|
|
2640
2653
|
};
|
|
2641
2654
|
this.limit = pLimit__default.default(this.config.concurrency);
|
|
@@ -2789,9 +2802,9 @@ var BatchEvaluator = class {
|
|
|
2789
2802
|
`Unknown evaluator group: "${groupId}". Available: ${EVALUATOR_GROUPS.map((g) => g.id).join(", ")}`
|
|
2790
2803
|
);
|
|
2791
2804
|
}
|
|
2792
|
-
if (inputs.length > group.maxInputRows) {
|
|
2805
|
+
if (!this.config.bypassRowLimit && inputs.length > group.maxInputRows) {
|
|
2793
2806
|
throw new Error(
|
|
2794
|
-
`Input exceeds limit for "${group.id}": ${inputs.length} rows (max ${group.maxInputRows}). Split into smaller batches.`
|
|
2807
|
+
`Input exceeds limit for "${group.id}": ${inputs.length} rows (max ${group.maxInputRows}). Split into smaller batches, or pass { bypassRowLimit: true } in BatchConfig to bypass (use --bypass-row-limit on the CLI).`
|
|
2795
2808
|
);
|
|
2796
2809
|
}
|
|
2797
2810
|
this.isCancelled = false;
|