npm - @wix/evalforge-evaluator - Versions diffs - 0.75.0 → 0.77.0 - Mend

@wix/evalforge-evaluator 0.75.0 → 0.77.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (5)

package/build/index.js (changed)

@@ -300,9 +300,12 @@ async function fetchEvaluationData(api, projectId2, evalRunId2) {
   if (evalRun.skillsGroupId) {
     skillsGroup = await api.getSkillsGroup(projectId2, evalRun.skillsGroupId);
     if (skillsGroup.skillIds.length > 0) {
-      skills = await Promise.all(
+      const fetchResults = await Promise.allSettled(
         skillsGroup.skillIds.map((id) => api.getSkill(projectId2, id))
       );
+      skills = fetchResults.filter(
+        (r) => r.status === "fulfilled"
+      ).map((r) => r.value).filter((s) => !s.deleted);
     }
     if (evalRun.skillVersions && Object.keys(evalRun.skillVersions).length > 0) {
       skills = await Promise.all(
@@ -1140,7 +1143,8 @@ IMPORTANT: This is an automated evaluation run. Follow these guidelines:
 3. Do NOT use the Task tool to delegate simple operations - do them directly yourself.
 4. Keep your approach simple and direct - avoid excessive planning.
 5. Make targeted edits using Read and Edit tools rather than exploring the entire codebase.
-6. If you encounter an error, fix it directly rather than starting over.`;
+6. If you encounter an error, fix it directly rather than starting over.
+7. Your project root is the current working directory. Always create and modify source code files relative to the project root, NOT inside .claude/skills/ directories.`;
       const fullPrompt = scenario.triggerPrompt + evaluatorPromptSuffix;
       for await (const message of query({
         prompt: fullPrompt,