@wix/evalforge-evaluator 0.75.0 → 0.77.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +6 -2
- package/build/index.js.map +2 -2
- package/build/index.mjs +6 -2
- package/build/index.mjs.map +2 -2
- package/package.json +2 -2
package/build/index.js
CHANGED
|
@@ -300,9 +300,12 @@ async function fetchEvaluationData(api, projectId2, evalRunId2) {
|
|
|
300
300
|
if (evalRun.skillsGroupId) {
|
|
301
301
|
skillsGroup = await api.getSkillsGroup(projectId2, evalRun.skillsGroupId);
|
|
302
302
|
if (skillsGroup.skillIds.length > 0) {
|
|
303
|
-
|
|
303
|
+
const fetchResults = await Promise.allSettled(
|
|
304
304
|
skillsGroup.skillIds.map((id) => api.getSkill(projectId2, id))
|
|
305
305
|
);
|
|
306
|
+
skills = fetchResults.filter(
|
|
307
|
+
(r) => r.status === "fulfilled"
|
|
308
|
+
).map((r) => r.value).filter((s) => !s.deleted);
|
|
306
309
|
}
|
|
307
310
|
if (evalRun.skillVersions && Object.keys(evalRun.skillVersions).length > 0) {
|
|
308
311
|
skills = await Promise.all(
|
|
@@ -1140,7 +1143,8 @@ IMPORTANT: This is an automated evaluation run. Follow these guidelines:
|
|
|
1140
1143
|
3. Do NOT use the Task tool to delegate simple operations - do them directly yourself.
|
|
1141
1144
|
4. Keep your approach simple and direct - avoid excessive planning.
|
|
1142
1145
|
5. Make targeted edits using Read and Edit tools rather than exploring the entire codebase.
|
|
1143
|
-
6. If you encounter an error, fix it directly rather than starting over
|
|
1146
|
+
6. If you encounter an error, fix it directly rather than starting over.
|
|
1147
|
+
7. Your project root is the current working directory. Always create and modify source code files relative to the project root, NOT inside .claude/skills/ directories.`;
|
|
1144
1148
|
const fullPrompt = scenario.triggerPrompt + evaluatorPromptSuffix;
|
|
1145
1149
|
for await (const message of query({
|
|
1146
1150
|
prompt: fullPrompt,
|