npm - @wix/evalforge-types - Versions diffs - 0.41.0 → 0.43.0 - Mend

@wix/evalforge-types 0.41.0 → 0.43.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

package/build/index.js +48 -5
package/build/index.js.map +2 -2
package/build/index.mjs +42 -5
package/build/index.mjs.map +3 -3
package/build/types/agent/adapter.d.ts +20 -7
package/build/types/common/models.d.ts +4 -0
package/build/types/index.d.ts +1 -1
package/build/types/target/agent.d.ts +45 -8
package/package.json +2 -2

package/build/index.js CHANGED

@@ -20,6 +20,8 @@ var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: tru
 // src/index.ts
 var index_exports = {};
 __export(index_exports, {
+  AGENT_TYPE_LABELS: () => AGENT_TYPE_LABELS,
+  ALL_AVAILABLE_MODEL_IDS: () => ALL_AVAILABLE_MODEL_IDS,
   AVAILABLE_MODEL_IDS: () => AVAILABLE_MODEL_IDS,
   AVAILABLE_OPENAI_MODEL_IDS: () => AVAILABLE_OPENAI_MODEL_IDS,
   AVAILABLE_RUN_COMMANDS: () => AVAILABLE_RUN_COMMANDS,
@@ -27,7 +29,10 @@ __export(index_exports, {
   AgentRunCommand: () => AgentRunCommand,
   AgentRunCommandSchema: () => AgentRunCommandSchema,
   AgentSchema: () => AgentSchema,
+  AgentType: () => AgentType,
+  AgentTypeSchema: () => AgentTypeSchema,
   AllowedCommands: () => AllowedCommands,
+  AnyModelSchema: () => AnyModelSchema,
   ApiCallSchema: () => ApiCallSchema,
   AssertionConfigSchema: () => AssertionConfigSchema,
   AssertionParameterSchema: () => AssertionParameterSchema,
@@ -61,6 +66,7 @@ __export(index_exports, {
   CreateTestScenarioInputSchema: () => CreateTestScenarioInputSchema,
   CreateTestSuiteInputSchema: () => CreateTestSuiteInputSchema,
   CustomAssertionSchema: () => CustomAssertionSchema,
+  DEFAULT_EVALUATOR_SYSTEM_PROMPT: () => DEFAULT_EVALUATOR_SYSTEM_PROMPT,
   DEFAULT_JUDGE_MODEL: () => DEFAULT_JUDGE_MODEL,
   DiffContentSchema: () => DiffContentSchema,
   DiffLineSchema: () => DiffLineSchema,
@@ -1125,9 +1131,16 @@ var AVAILABLE_OPENAI_MODEL_IDS = Object.values(
 var OpenAIModelSchema = import_zod4.z.enum(
   AVAILABLE_OPENAI_MODEL_IDS
 );
+var ALL_AVAILABLE_MODEL_IDS = [
+  ...AVAILABLE_MODEL_IDS,
+  ...AVAILABLE_OPENAI_MODEL_IDS
+];
+var AnyModelSchema = import_zod4.z.enum(
+  ALL_AVAILABLE_MODEL_IDS
+);
 var nullToUndefined = (val) => val === null ? void 0 : val;
 var ModelConfigSchema = import_zod4.z.object({
-  model: ClaudeModelSchema,
+  model: AnyModelSchema,
   temperature: import_zod4.z.preprocess(
     nullToUndefined,
     import_zod4.z.number().min(0).max(1).optional()
@@ -1170,6 +1183,24 @@ var TargetSchema = TenantEntitySchema.extend({
 // src/target/agent.ts
 var import_zod6 = require("zod");
+var DEFAULT_EVALUATOR_SYSTEM_PROMPT = `IMPORTANT: This is an automated evaluation run. Follow these guidelines:
+1. Execute the requested changes immediately without asking for confirmation.
+2. Do NOT ask "would you like me to proceed?" or similar questions.
+3. Do NOT use the Task tool to delegate simple operations - do them directly yourself.
+4. Keep your approach simple and direct - avoid excessive planning.
+5. Make targeted edits using Read and Edit tools rather than exploring the entire codebase.
+6. If you encounter an error, fix it directly rather than starting over.
+7. Your project root is the current working directory. Always create and modify source code files relative to the project root, NOT inside .claude/skills/ directories.
+8. Before finishing, run the project's package manager install command (e.g. \`npm install\`, \`yarn install\`, or \`pnpm install\` depending on the lockfile present) to ensure all dependencies are installed and the project is ready to build.`;
+var AgentType = {
+  CLI: "cli",
+  SDK: "sdk"
+};
+var AgentTypeSchema = import_zod6.z.enum([AgentType.CLI, AgentType.SDK]);
+var AGENT_TYPE_LABELS = {
+  [AgentType.CLI]: "CLI Agent",
+  [AgentType.SDK]: "Simple Agent"
+};
 var AgentRunCommand = /* @__PURE__ */ ((AgentRunCommand2) => {
   AgentRunCommand2["CLAUDE"] = "claude";
   return AgentRunCommand2;
@@ -1180,10 +1211,15 @@ var RUN_COMMAND_LABELS = {
 };
 var AgentRunCommandSchema = import_zod6.z.nativeEnum(AgentRunCommand);
 var AgentSchema = TargetSchema.extend({
-  /** Command to run the agent */
-  runCommand: AgentRunCommandSchema,
+  /** Agent type: 'cli' for external CLI tools, 'sdk' for in-process SDK agents */
+  agentType: AgentTypeSchema.default(AgentType.CLI),
+  /** Command to run the agent (required for CLI agents, absent for SDK agents) */
+  runCommand: AgentRunCommandSchema.optional(),
   /** Optional model configuration override */
-  modelConfig: ModelConfigSchema.optional()
+  modelConfig: ModelConfigSchema.optional(),
+  systemPrompt: import_zod6.z.string().nullish().describe(
+    "Override for eval runs. undefined=default instructions, null=raw agent, string=append to claude_code preset. See https://docs.anthropic.com/en/docs/claude-code/sdk/modifying-system-prompts"
+  )
 });
 var CreateAgentInputSchema = AgentSchema.omit({
   id: true,
@@ -1192,7 +1228,8 @@ var CreateAgentInputSchema = AgentSchema.omit({
   deleted: true
 });
 var UpdateAgentInputSchema = CreateAgentInputSchema.partial().extend({
-  modelConfig: ModelConfigSchema.optional().nullable()
+  modelConfig: ModelConfigSchema.optional().nullable(),
+  systemPrompt: import_zod6.z.string().optional().nullable()
 });
 // src/target/skill.ts
@@ -2358,6 +2395,8 @@ function getSystemAssertion(id) {
 }
 // Annotate the CommonJS export names for ESM import in node:
 0 && (module.exports = {
+  AGENT_TYPE_LABELS,
+  ALL_AVAILABLE_MODEL_IDS,
   AVAILABLE_MODEL_IDS,
   AVAILABLE_OPENAI_MODEL_IDS,
   AVAILABLE_RUN_COMMANDS,
@@ -2365,7 +2404,10 @@ function getSystemAssertion(id) {
   AgentRunCommand,
   AgentRunCommandSchema,
   AgentSchema,
+  AgentType,
+  AgentTypeSchema,
   AllowedCommands,
+  AnyModelSchema,
   ApiCallSchema,
   AssertionConfigSchema,
   AssertionParameterSchema,
@@ -2399,6 +2441,7 @@ function getSystemAssertion(id) {
   CreateTestScenarioInputSchema,
   CreateTestSuiteInputSchema,
   CustomAssertionSchema,
+  DEFAULT_EVALUATOR_SYSTEM_PROMPT,
   DEFAULT_JUDGE_MODEL,
   DiffContentSchema,
   DiffLineSchema,