@swarmtools/evals 0.2.15 → 0.2.18
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Test cases for strategy selection quality
|
|
3
|
+
*
|
|
4
|
+
* Each case includes:
|
|
5
|
+
* - input: task description to classify
|
|
6
|
+
* - expected: strategy that should be selected
|
|
7
|
+
*/
|
|
8
|
+
export interface StrategySelectionTestCase {
|
|
9
|
+
input: {
|
|
10
|
+
task: string;
|
|
11
|
+
context?: string;
|
|
12
|
+
};
|
|
13
|
+
expected: {
|
|
14
|
+
strategy: "file-based" | "feature-based" | "risk-based" | "research-based";
|
|
15
|
+
reasoning?: string;
|
|
16
|
+
};
|
|
17
|
+
}
|
|
18
|
+
export declare const strategySelectionCases: StrategySelectionTestCase[];
|
|
19
|
+
//# sourceMappingURL=strategy-selection.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"strategy-selection.d.ts","sourceRoot":"","sources":["../../src/fixtures/strategy-selection.ts"],"names":[],"mappings":"AAAA;;;;;;GAMG;AAEH,MAAM,WAAW,yBAAyB;IACxC,KAAK,EAAE;QACL,IAAI,EAAE,MAAM,CAAC;QACb,OAAO,CAAC,EAAE,MAAM,CAAC;KAClB,CAAC;IACF,QAAQ,EAAE;QACR,QAAQ,EAAE,YAAY,GAAG,eAAe,GAAG,YAAY,GAAG,gBAAgB,CAAC;QAC3E,SAAS,CAAC,EAAE,MAAM,CAAC;KACpB,CAAC;CACH;AAED,eAAO,MAAM,sBAAsB,EAAE,yBAAyB,EAsN7D,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"strategy-selection.eval.d.ts","sourceRoot":"","sources":["../src/strategy-selection.eval.ts"],"names":[],"mappings":""}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@swarmtools/evals",
|
|
3
|
-
"version": "0.2.
|
|
3
|
+
"version": "0.2.18",
|
|
4
4
|
"description": "Evaluation suite for swarm-tools multi-agent coordination",
|
|
5
5
|
"type": "module",
|
|
6
6
|
"main": "./dist/index.js",
|
|
@@ -33,8 +33,8 @@
|
|
|
33
33
|
"dependencies": {
|
|
34
34
|
"evalite": "^1.0.0-beta.10",
|
|
35
35
|
"ai": "6.0.0-beta.150",
|
|
36
|
-
"opencode-swarm-plugin": "0.
|
|
37
|
-
"swarm-mail": "1.
|
|
36
|
+
"opencode-swarm-plugin": "0.53.0",
|
|
37
|
+
"swarm-mail": "1.9.0"
|
|
38
38
|
},
|
|
39
39
|
"devDependencies": {
|
|
40
40
|
"@types/node": "^22.19.3",
|