@wix/evalforge-types 0.40.0 → 0.42.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +918 -900
- package/build/index.js.map +4 -4
- package/build/index.mjs +914 -914
- package/build/index.mjs.map +4 -4
- package/build/types/agent/adapter.d.ts +7 -0
- package/build/types/common/models.d.ts +6 -2
- package/build/types/index.d.ts +1 -1
- package/build/types/target/agent.d.ts +10 -1
- package/package.json +3 -3
package/build/types/agent/adapter.d.ts
CHANGED
|
@@ -60,6 +60,13 @@ export interface AgentExecutionContext {
|
|
|
60
60
|
subAgents?: SubAgent[];
|
|
61
61
|
/** Rules to write (CLAUDE.md, AGENTS.md, .cursor/rules/*.md based on ruleType) */
|
|
62
62
|
rules?: Rule[];
|
|
63
|
+
/**
|
|
64
|
+
* System prompt override for evaluation runs.
|
|
65
|
+
* - undefined: use default evaluator behavioral instructions
|
|
66
|
+
* - null: no system prompt (raw agent behavior)
|
|
67
|
+
* - string: custom system prompt text
|
|
68
|
+
*/
|
|
69
|
+
systemPrompt?: string | null;
|
|
63
70
|
}
|
|
64
71
|
/**
|
|
65
72
|
* Token usage statistics from agent execution.
|
package/build/types/common/models.d.ts
CHANGED
|
@@ -1,11 +1,15 @@
|
|
|
1
1
|
import { z } from 'zod';
|
|
2
|
-
import { ClaudeModel } from '@wix/ambassador-ds-wix-ai-gateway-v1-prompt/types';
|
|
3
|
-
export { ClaudeModel };
|
|
2
|
+
import { ClaudeModel, Model as OpenAIModel } from '@wix/ambassador-ds-wix-ai-gateway-v1-prompt/types';
|
|
3
|
+
export { ClaudeModel, OpenAIModel };
|
|
4
4
|
export declare const AVAILABLE_MODEL_IDS: ClaudeModel[];
|
|
5
5
|
export declare const DEFAULT_JUDGE_MODEL: string;
|
|
6
6
|
export declare const ClaudeModelSchema: z.ZodEnum<{
|
|
7
7
|
[x: string]: string;
|
|
8
8
|
}>;
|
|
9
|
+
export declare const AVAILABLE_OPENAI_MODEL_IDS: OpenAIModel[];
|
|
10
|
+
export declare const OpenAIModelSchema: z.ZodEnum<{
|
|
11
|
+
[x: string]: string;
|
|
12
|
+
}>;
|
|
9
13
|
export declare const ModelConfigSchema: z.ZodObject<{
|
|
10
14
|
model: z.ZodEnum<{
|
|
11
15
|
[x: string]: string;
|
package/build/types/index.d.ts
CHANGED
|
@@ -7,7 +7,7 @@
|
|
|
7
7
|
* - BaseEntity: id, name, description, dates
|
|
8
8
|
* - TenantEntity: extends BaseEntity with projectId
|
|
9
9
|
* - Target: extends TenantEntity (base for testable entities)
|
|
10
|
-
* - Agent: CLI-based agent (runCommand, modelConfig)
|
|
10
|
+
* - Agent: CLI-based agent (runCommand, modelConfig, systemPrompt)
|
|
11
11
|
* - Skill: SKILL.md-based capability
|
|
12
12
|
*
|
|
13
13
|
* Test Types (9 total):
|
package/build/types/target/agent.d.ts
CHANGED
|
@@ -1,4 +1,10 @@
|
|
|
1
1
|
import { z } from 'zod';
|
|
2
|
+
/**
|
|
3
|
+
* Default behavioral instructions appended to the Claude Code system prompt
|
|
4
|
+
* during evaluation runs. These ensure the agent executes autonomously without
|
|
5
|
+
* waiting for human confirmation.
|
|
6
|
+
*/
|
|
7
|
+
export declare const DEFAULT_EVALUATOR_SYSTEM_PROMPT = "IMPORTANT: This is an automated evaluation run. Follow these guidelines:\n1. Execute the requested changes immediately without asking for confirmation.\n2. Do NOT ask \"would you like me to proceed?\" or similar questions.\n3. Do NOT use the Task tool to delegate simple operations - do them directly yourself.\n4. Keep your approach simple and direct - avoid excessive planning.\n5. Make targeted edits using Read and Edit tools rather than exploring the entire codebase.\n6. If you encounter an error, fix it directly rather than starting over.\n7. Your project root is the current working directory. Always create and modify source code files relative to the project root, NOT inside .claude/skills/ directories.\n8. Before finishing, run the project's package manager install command (e.g. `npm install`, `yarn install`, or `pnpm install` depending on the lockfile present) to ensure all dependencies are installed and the project is ready to build.";
|
|
2
8
|
/**
|
|
3
9
|
* Supported agent CLI commands.
|
|
4
10
|
*
|
|
@@ -35,6 +41,7 @@ export declare const AgentSchema: z.ZodObject<{
|
|
|
35
41
|
temperature: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
|
|
36
42
|
maxTokens: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
|
|
37
43
|
}, z.core.$strip>>;
|
|
44
|
+
systemPrompt: z.ZodOptional<z.ZodNullable<z.ZodString>>;
|
|
38
45
|
}, z.core.$strip>;
|
|
39
46
|
export type Agent = z.infer<typeof AgentSchema>;
|
|
40
47
|
/**
|
|
@@ -52,11 +59,12 @@ export declare const CreateAgentInputSchema: z.ZodObject<{
|
|
|
52
59
|
temperature: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
|
|
53
60
|
maxTokens: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
|
|
54
61
|
}, z.core.$strip>>;
|
|
62
|
+
systemPrompt: z.ZodOptional<z.ZodNullable<z.ZodString>>;
|
|
55
63
|
}, z.core.$strip>;
|
|
56
64
|
export type CreateAgentInput = z.infer<typeof CreateAgentInputSchema>;
|
|
57
65
|
/**
|
|
58
66
|
* Input schema for updating an Agent.
|
|
59
|
-
* modelConfig can be null to explicitly clear
|
|
67
|
+
* modelConfig and systemPrompt can be null to explicitly clear (vs undefined = keep existing).
|
|
60
68
|
*/
|
|
61
69
|
export declare const UpdateAgentInputSchema: z.ZodObject<{
|
|
62
70
|
name: z.ZodOptional<z.ZodString>;
|
|
@@ -70,5 +78,6 @@ export declare const UpdateAgentInputSchema: z.ZodObject<{
|
|
|
70
78
|
temperature: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
|
|
71
79
|
maxTokens: z.ZodPipe<z.ZodTransform<{} | undefined, unknown>, z.ZodOptional<z.ZodNumber>>;
|
|
72
80
|
}, z.core.$strip>>>;
|
|
81
|
+
systemPrompt: z.ZodNullable<z.ZodOptional<z.ZodString>>;
|
|
73
82
|
}, z.core.$strip>;
|
|
74
83
|
export type UpdateAgentInput = z.infer<typeof UpdateAgentInputSchema>;
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@wix/evalforge-types",
|
|
3
|
-
"version": "0.40.0",
|
|
3
|
+
"version": "0.42.0",
|
|
4
4
|
"description": "Unified types for EvalForge agent evaluation system",
|
|
5
5
|
"files": [
|
|
6
6
|
"build"
|
|
@@ -20,7 +20,7 @@
|
|
|
20
20
|
"devDependencies": {
|
|
21
21
|
"@eslint/js": "^9.39.2",
|
|
22
22
|
"@types/node": "^22.19.3",
|
|
23
|
-
"@wix/ambassador-ds-wix-ai-gateway-v1-prompt": "^1.0.
|
|
23
|
+
"@wix/ambassador-ds-wix-ai-gateway-v1-prompt": "^1.0.309",
|
|
24
24
|
"esbuild": "^0.27.2",
|
|
25
25
|
"eslint": "^9.39.2",
|
|
26
26
|
"eslint-config-prettier": "^10.1.8",
|
|
@@ -47,5 +47,5 @@
|
|
|
47
47
|
"artifactId": "evalforge-types"
|
|
48
48
|
}
|
|
49
49
|
},
|
|
50
|
-
"falconPackageHash": "
|
|
50
|
+
"falconPackageHash": "a1c04ff67ad300ec0b1e9ca64caea1018dbc5cea4058a42831f8fcbc"
|
|
51
51
|
}
|