@wix/evalforge-evaluator 0.75.0 → 0.77.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/build/index.js CHANGED
@@ -300,9 +300,12 @@ async function fetchEvaluationData(api, projectId2, evalRunId2) {
300
300
  if (evalRun.skillsGroupId) {
301
301
  skillsGroup = await api.getSkillsGroup(projectId2, evalRun.skillsGroupId);
302
302
  if (skillsGroup.skillIds.length > 0) {
303
- skills = await Promise.all(
303
+ const fetchResults = await Promise.allSettled(
304
304
  skillsGroup.skillIds.map((id) => api.getSkill(projectId2, id))
305
305
  );
306
+ skills = fetchResults.filter(
307
+ (r) => r.status === "fulfilled"
308
+ ).map((r) => r.value).filter((s) => !s.deleted);
306
309
  }
307
310
  if (evalRun.skillVersions && Object.keys(evalRun.skillVersions).length > 0) {
308
311
  skills = await Promise.all(
@@ -1140,7 +1143,8 @@ IMPORTANT: This is an automated evaluation run. Follow these guidelines:
1140
1143
  3. Do NOT use the Task tool to delegate simple operations - do them directly yourself.
1141
1144
  4. Keep your approach simple and direct - avoid excessive planning.
1142
1145
  5. Make targeted edits using Read and Edit tools rather than exploring the entire codebase.
1143
- 6. If you encounter an error, fix it directly rather than starting over.`;
1146
+ 6. If you encounter an error, fix it directly rather than starting over.
1147
+ 7. Your project root is the current working directory. Always create and modify source code files relative to the project root, NOT inside .claude/skills/ directories.`;
1144
1148
  const fullPrompt = scenario.triggerPrompt + evaluatorPromptSuffix;
1145
1149
  for await (const message of query({
1146
1150
  prompt: fullPrompt,