@wayai/cli 0.2.45 → 0.2.46
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.
|
@@ -82,7 +82,7 @@ async function findLatestSessionForEval(client, hubId, evalName) {
|
|
|
82
82
|
// Sessions are ordered by created_at desc, so first match is the latest
|
|
83
83
|
for (const session of completedSessions) {
|
|
84
84
|
const details = await client.getEvalSessionDetails(session.eval_session_id);
|
|
85
|
-
const hasEval = details.data.results.some((r) => r.
|
|
85
|
+
const hasEval = details.data.results.some((r) => r.eval_id === matchingEval.eval_id);
|
|
86
86
|
if (hasEval) {
|
|
87
87
|
return session.eval_session_id;
|
|
88
88
|
}
|
|
@@ -117,7 +117,7 @@ async function showRunDetails(client, sessionId, evalNameFilter, jsonOutput) {
|
|
|
117
117
|
if (evalNameFilter) {
|
|
118
118
|
const matchingResult = details.data.results.find((r) => r.eval?.eval_name?.toLowerCase() === evalNameFilter.toLowerCase());
|
|
119
119
|
if (matchingResult) {
|
|
120
|
-
evalId = matchingResult.
|
|
120
|
+
evalId = matchingResult.eval_id;
|
|
121
121
|
}
|
|
122
122
|
}
|
|
123
123
|
const runsResult = await client.getEvalSessionRuns(sessionId, { evalId });
|
|
@@ -131,7 +131,7 @@ async function showRunDetails(client, sessionId, evalNameFilter, jsonOutput) {
|
|
|
131
131
|
return;
|
|
132
132
|
}
|
|
133
133
|
for (const run of runsResult.data.runs) {
|
|
134
|
-
const evalName = run.eval?.eval_name || run.
|
|
134
|
+
const evalName = run.eval?.eval_name || run.eval_id.slice(0, 8);
|
|
135
135
|
const status = run.response_match === true ? 'PASS' : run.response_match === false ? 'FAIL' : 'PENDING';
|
|
136
136
|
const time = run.execution_time_ms != null ? `(${(run.execution_time_ms / 1000).toFixed(1)}s)` : '';
|
|
137
137
|
console.log(`${evalName} — Run #${run.run_number} [${status}] ${time}`);
|
package/dist/lib/api-client.d.ts
CHANGED
|
@@ -75,8 +75,8 @@ export declare class ApiClient {
|
|
|
75
75
|
eval_name: string;
|
|
76
76
|
enabled: boolean;
|
|
77
77
|
number_of_runs: number;
|
|
78
|
-
|
|
79
|
-
|
|
78
|
+
responder_agent_id: string;
|
|
79
|
+
hub_id: string;
|
|
80
80
|
agent?: {
|
|
81
81
|
agent_id: string;
|
|
82
82
|
agent_name: string;
|
|
@@ -95,7 +95,7 @@ export declare class ApiClient {
|
|
|
95
95
|
eval_session_id: string;
|
|
96
96
|
session_name: string;
|
|
97
97
|
session_status: string;
|
|
98
|
-
|
|
98
|
+
hub_id: string;
|
|
99
99
|
total_evals: number;
|
|
100
100
|
total_runs: number;
|
|
101
101
|
successful_runs: number;
|
|
@@ -114,7 +114,7 @@ export declare class ApiClient {
|
|
|
114
114
|
eval_session_id: string;
|
|
115
115
|
session_name: string;
|
|
116
116
|
session_status: string;
|
|
117
|
-
|
|
117
|
+
hub_id: string;
|
|
118
118
|
};
|
|
119
119
|
};
|
|
120
120
|
message: string;
|
|
@@ -141,7 +141,7 @@ export declare class ApiClient {
|
|
|
141
141
|
};
|
|
142
142
|
results: Array<{
|
|
143
143
|
eval_session_result_id: string;
|
|
144
|
-
|
|
144
|
+
eval_id: string;
|
|
145
145
|
total_runs: number;
|
|
146
146
|
successful_runs: number;
|
|
147
147
|
failed_runs: number;
|
|
@@ -158,7 +158,7 @@ export declare class ApiClient {
|
|
|
158
158
|
eval?: {
|
|
159
159
|
eval_id: string;
|
|
160
160
|
eval_name: string;
|
|
161
|
-
|
|
161
|
+
responder_agent_id: string;
|
|
162
162
|
} | null;
|
|
163
163
|
}>;
|
|
164
164
|
};
|
|
@@ -171,7 +171,7 @@ export declare class ApiClient {
|
|
|
171
171
|
data: {
|
|
172
172
|
runs: Array<{
|
|
173
173
|
eval_session_run_id: string;
|
|
174
|
-
|
|
174
|
+
eval_id: string;
|
|
175
175
|
run_number: number;
|
|
176
176
|
eval_response: {
|
|
177
177
|
role: string;
|
|
@@ -185,7 +185,7 @@ export declare class ApiClient {
|
|
|
185
185
|
eval?: {
|
|
186
186
|
eval_id: string;
|
|
187
187
|
eval_name: string;
|
|
188
|
-
|
|
188
|
+
responder_agent_id: string;
|
|
189
189
|
} | null;
|
|
190
190
|
}>;
|
|
191
191
|
total_count: number;
|
|
@@ -333,7 +333,7 @@ export declare class ApiClient {
|
|
|
333
333
|
data: Array<{
|
|
334
334
|
project_id: string;
|
|
335
335
|
project_name: string;
|
|
336
|
-
|
|
336
|
+
organization_id: string;
|
|
337
337
|
created_at: string;
|
|
338
338
|
}>;
|
|
339
339
|
}>;
|
|
@@ -342,7 +342,7 @@ export declare class ApiClient {
|
|
|
342
342
|
hub_id: string;
|
|
343
343
|
hub_name: string;
|
|
344
344
|
hub_environment: string;
|
|
345
|
-
|
|
345
|
+
project_id: string;
|
|
346
346
|
hub_type: string;
|
|
347
347
|
[key: string]: unknown;
|
|
348
348
|
}>;
|
|
@@ -351,7 +351,7 @@ export declare class ApiClient {
|
|
|
351
351
|
data: Array<{
|
|
352
352
|
project_id: string;
|
|
353
353
|
project_name: string;
|
|
354
|
-
|
|
354
|
+
organization_id: string;
|
|
355
355
|
created_at: string;
|
|
356
356
|
}>;
|
|
357
357
|
}>;
|
package/dist/lib/api-client.js
CHANGED
|
@@ -63,7 +63,7 @@ export class ApiClient {
|
|
|
63
63
|
}
|
|
64
64
|
async syncSkills(hubId, connectionId) {
|
|
65
65
|
return this.request('POST', '/api/setup/resources/sync-skills', {
|
|
66
|
-
|
|
66
|
+
hub_id: hubId,
|
|
67
67
|
...(connectionId && { connection_id: connectionId }),
|
|
68
68
|
});
|
|
69
69
|
}
|
|
@@ -113,7 +113,7 @@ export class ApiClient {
|
|
|
113
113
|
}
|
|
114
114
|
async createEvalSession(hubId, sessionName) {
|
|
115
115
|
return this.request('POST', '/api/evals/sessions', {
|
|
116
|
-
session: {
|
|
116
|
+
session: { hub_id: hubId, session_name: sessionName },
|
|
117
117
|
});
|
|
118
118
|
}
|
|
119
119
|
async runEvalSession(sessionId) {
|
|
@@ -159,13 +159,13 @@ export class ApiClient {
|
|
|
159
159
|
}
|
|
160
160
|
async createProject(organizationId, projectName) {
|
|
161
161
|
return this.request('POST', '/api/setup/projects', {
|
|
162
|
-
|
|
162
|
+
organization_id: organizationId,
|
|
163
163
|
project_name: projectName,
|
|
164
164
|
});
|
|
165
165
|
}
|
|
166
166
|
async createHub(projectId, hubName, hubType, hubDescription) {
|
|
167
167
|
return this.request('POST', '/api/setup/hubs', {
|
|
168
|
-
|
|
168
|
+
project_id: projectId,
|
|
169
169
|
hub_name: hubName,
|
|
170
170
|
...(hubType && { hub_type: hubType }),
|
|
171
171
|
...(hubDescription && { hub_description: hubDescription }),
|
package/dist/lib/eval-format.js
CHANGED
|
@@ -11,7 +11,7 @@ export function printResultsTable(results, mode) {
|
|
|
11
11
|
let totalPassed = 0;
|
|
12
12
|
let totalRuns = 0;
|
|
13
13
|
for (const r of results) {
|
|
14
|
-
const evalName = r.eval?.eval_name || r.
|
|
14
|
+
const evalName = r.eval?.eval_name || r.eval_id.slice(0, 8);
|
|
15
15
|
const passed = `${r.successful_runs}/${r.total_runs} passed`;
|
|
16
16
|
const avgTime = r.avg_execution_time_ms != null ? `avg ${(r.avg_execution_time_ms / 1000).toFixed(1)}s` : '';
|
|
17
17
|
let scoresStr = '';
|