@wix/evalforge-evaluator 0.144.0 → 0.145.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +1 -71
- package/build/index.js.map +2 -2
- package/build/index.mjs +1 -71
- package/build/index.mjs.map +2 -2
- package/build/types/api-client.d.ts +1 -7
- package/package.json +5 -5
package/build/index.js
CHANGED
|
@@ -155,34 +155,12 @@ function createApiClient(serverUrl, options = "") {
|
|
|
155
155
|
getScenario(projectId2, id) {
|
|
156
156
|
return fetchJson(`/projects/${projectId2}/test-scenarios/${id}`);
|
|
157
157
|
},
|
|
158
|
-
getSkill(projectId2, id) {
|
|
159
|
-
return fetchJson(`/projects/${projectId2}/skills/${id}`);
|
|
160
|
-
},
|
|
161
|
-
getSkillVersion(projectId2, skillId, versionId) {
|
|
162
|
-
return fetchJson(
|
|
163
|
-
`/projects/${projectId2}/skills/${skillId}/versions/${versionId}`
|
|
164
|
-
);
|
|
165
|
-
},
|
|
166
|
-
getLatestSkillVersion(projectId2, skillId) {
|
|
167
|
-
return fetchJson(
|
|
168
|
-
`/projects/${projectId2}/skills/${skillId}/versions/latest`
|
|
169
|
-
);
|
|
170
|
-
},
|
|
171
158
|
getAgent(projectId2, id) {
|
|
172
159
|
return fetchJson(`/projects/${projectId2}/agents/${id}`);
|
|
173
160
|
},
|
|
174
161
|
getTemplate(projectId2, id) {
|
|
175
162
|
return fetchJson(`/projects/${projectId2}/templates/${id}`);
|
|
176
163
|
},
|
|
177
|
-
getMcp(projectId2, id) {
|
|
178
|
-
return fetchJson(`/projects/${projectId2}/mcps/${id}`);
|
|
179
|
-
},
|
|
180
|
-
getSubAgent(projectId2, id) {
|
|
181
|
-
return fetchJson(`/projects/${projectId2}/sub-agents/${id}`);
|
|
182
|
-
},
|
|
183
|
-
getRule(projectId2, id) {
|
|
184
|
-
return fetchJson(`/projects/${projectId2}/rules/${id}`);
|
|
185
|
-
},
|
|
186
164
|
getPreset(projectId2, id) {
|
|
187
165
|
return fetchJson(`/projects/${projectId2}/presets/${id}`);
|
|
188
166
|
},
|
|
@@ -397,54 +375,6 @@ async function fetchEvaluationData(api, projectId2, evalRunId2) {
|
|
|
397
375
|
break;
|
|
398
376
|
}
|
|
399
377
|
}
|
|
400
|
-
} else {
|
|
401
|
-
const resolvedSkillIds = evalRun.skillIds ?? [];
|
|
402
|
-
if (resolvedSkillIds.length > 0) {
|
|
403
|
-
const fetchResults = await Promise.allSettled(
|
|
404
|
-
resolvedSkillIds.map((id) => api.getSkill(projectId2, id))
|
|
405
|
-
);
|
|
406
|
-
skills = fetchResults.filter(
|
|
407
|
-
(r) => r.status === "fulfilled"
|
|
408
|
-
).map((r) => r.value).filter((s) => !s.deleted);
|
|
409
|
-
if (evalRun.skillVersions && Object.keys(evalRun.skillVersions).length > 0) {
|
|
410
|
-
skills = await Promise.all(
|
|
411
|
-
skills.map(async (skill) => {
|
|
412
|
-
const versionId = evalRun.skillVersions?.[skill.id];
|
|
413
|
-
if (versionId) {
|
|
414
|
-
const version = await api.getSkillVersion(
|
|
415
|
-
projectId2,
|
|
416
|
-
skill.id,
|
|
417
|
-
versionId
|
|
418
|
-
);
|
|
419
|
-
return { ...skill, latestVersion: version };
|
|
420
|
-
}
|
|
421
|
-
return skill;
|
|
422
|
-
})
|
|
423
|
-
);
|
|
424
|
-
}
|
|
425
|
-
skills = skills.map((skill) => {
|
|
426
|
-
const hasPinnedVersion = evalRun.skillVersions?.[skill.id];
|
|
427
|
-
if (!hasPinnedVersion && skill.source) {
|
|
428
|
-
return { ...skill, latestVersion: void 0 };
|
|
429
|
-
}
|
|
430
|
-
return skill;
|
|
431
|
-
});
|
|
432
|
-
}
|
|
433
|
-
if (evalRun.mcpIds && evalRun.mcpIds.length > 0) {
|
|
434
|
-
mcps = await Promise.all(
|
|
435
|
-
evalRun.mcpIds.map((id) => api.getMcp(projectId2, id))
|
|
436
|
-
);
|
|
437
|
-
}
|
|
438
|
-
if (evalRun.subAgentIds && evalRun.subAgentIds.length > 0) {
|
|
439
|
-
subAgents = await Promise.all(
|
|
440
|
-
evalRun.subAgentIds.map((id) => api.getSubAgent(projectId2, id))
|
|
441
|
-
);
|
|
442
|
-
}
|
|
443
|
-
if (evalRun.ruleIds && evalRun.ruleIds.length > 0) {
|
|
444
|
-
rules = await Promise.all(
|
|
445
|
-
evalRun.ruleIds.map((id) => api.getRule(projectId2, id))
|
|
446
|
-
);
|
|
447
|
-
}
|
|
448
378
|
}
|
|
449
379
|
const templateIds = [
|
|
450
380
|
...new Set(
|
|
@@ -5029,7 +4959,7 @@ async function runEvaluation(projectId2, evalRunId2) {
|
|
|
5029
4959
|
hasAgent: !!agent,
|
|
5030
4960
|
agentId: evalData.evalRun.agentId,
|
|
5031
4961
|
presetId: evalData.evalRun.presetId,
|
|
5032
|
-
|
|
4962
|
+
capabilityIds: evalData.evalRun.capabilityIds
|
|
5033
4963
|
};
|
|
5034
4964
|
if (scenarioItems.length > 0 && !agent) {
|
|
5035
4965
|
throw new Error(
|