@tyvm/knowhow 0.0.21 → 0.0.23
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +3 -1
- package/src/agents/base/base.ts +16 -7
- package/src/agents/configurable/ConfigAgent.ts +5 -3
- package/src/agents/developer/developer.ts +3 -4
- package/src/agents/index.ts +26 -2
- package/src/agents/patcher/patcher.ts +3 -5
- package/src/agents/researcher/researcher.ts +3 -4
- package/src/agents/tools/agentCall.ts +5 -2
- package/src/agents/tools/executeScript/README.md +78 -0
- package/src/agents/tools/executeScript/definition.ts +73 -0
- package/src/agents/tools/executeScript/examples/dependency-injection-validation.ts +272 -0
- package/src/agents/tools/executeScript/examples/quick-test.ts +74 -0
- package/src/agents/tools/executeScript/examples/serialization-test.ts +321 -0
- package/src/agents/tools/executeScript/examples/test-runner.ts +197 -0
- package/src/agents/tools/executeScript/index.ts +93 -0
- package/src/agents/tools/index.ts +1 -0
- package/src/agents/tools/list.ts +2 -1
- package/src/agents/vim/vim.ts +3 -4
- package/src/ai.ts +2 -1
- package/src/chat.ts +4 -2
- package/src/cli.ts +7 -15
- package/src/clients/index.ts +23 -9
- package/src/dataset/diffs/test.ts +2 -1
- package/src/index.ts +3 -3
- package/src/services/AgentService.ts +9 -10
- package/src/services/EventService.ts +0 -2
- package/src/services/GitHub.ts +0 -1
- package/src/services/KnowhowClient.ts +0 -3
- package/src/services/Mcp.ts +0 -2
- package/src/services/S3.ts +0 -1
- package/src/services/Tools.ts +63 -8
- package/src/services/flags.ts +0 -1
- package/src/services/index.ts +56 -0
- package/src/services/modules/index.ts +53 -0
- package/src/{modules → services/modules}/types.ts +16 -5
- package/src/services/script-execution/SandboxContext.ts +278 -0
- package/src/services/script-execution/ScriptExecutor.ts +339 -0
- package/src/services/script-execution/ScriptPolicy.ts +236 -0
- package/src/services/script-execution/ScriptTracer.ts +249 -0
- package/src/services/script-execution/types.ts +134 -0
- package/src/worker.ts +3 -3
- package/tests/integration/fileblocks/readwrite.test.ts +2 -1
- package/tests/integration/patching.test.ts +5 -5
- package/ts_build/src/agents/base/base.d.ts +9 -4
- package/ts_build/src/agents/base/base.js +7 -10
- package/ts_build/src/agents/base/base.js.map +1 -1
- package/ts_build/src/agents/configurable/ConfigAgent.d.ts +2 -2
- package/ts_build/src/agents/configurable/ConfigAgent.js +2 -2
- package/ts_build/src/agents/configurable/ConfigAgent.js.map +1 -1
- package/ts_build/src/agents/developer/developer.d.ts +2 -3
- package/ts_build/src/agents/developer/developer.js +3 -4
- package/ts_build/src/agents/developer/developer.js.map +1 -1
- package/ts_build/src/agents/index.d.ts +11 -2
- package/ts_build/src/agents/index.js +19 -3
- package/ts_build/src/agents/index.js.map +1 -1
- package/ts_build/src/agents/patcher/patcher.d.ts +2 -3
- package/ts_build/src/agents/patcher/patcher.js +3 -4
- package/ts_build/src/agents/patcher/patcher.js.map +1 -1
- package/ts_build/src/agents/researcher/researcher.d.ts +2 -3
- package/ts_build/src/agents/researcher/researcher.js +3 -4
- package/ts_build/src/agents/researcher/researcher.js.map +1 -1
- package/ts_build/src/agents/tools/agentCall.js +4 -4
- package/ts_build/src/agents/tools/agentCall.js.map +1 -1
- package/ts_build/src/agents/tools/executeScript/definition.d.ts +2 -0
- package/ts_build/src/agents/tools/executeScript/definition.js +70 -0
- package/ts_build/src/agents/tools/executeScript/definition.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/examples/dependency-injection-validation.d.ts +18 -0
- package/ts_build/src/agents/tools/executeScript/examples/dependency-injection-validation.js +192 -0
- package/ts_build/src/agents/tools/executeScript/examples/dependency-injection-validation.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/examples/quick-test.d.ts +3 -0
- package/ts_build/src/agents/tools/executeScript/examples/quick-test.js +65 -0
- package/ts_build/src/agents/tools/executeScript/examples/quick-test.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/examples/serialization-test.d.ts +15 -0
- package/ts_build/src/agents/tools/executeScript/examples/serialization-test.js +266 -0
- package/ts_build/src/agents/tools/executeScript/examples/serialization-test.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/examples/simple-example.d.ts +20 -0
- package/ts_build/src/agents/tools/executeScript/examples/simple-example.js +35 -0
- package/ts_build/src/agents/tools/executeScript/examples/simple-example.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/examples/test-runner.d.ts +4 -0
- package/ts_build/src/agents/tools/executeScript/examples/test-runner.js +198 -0
- package/ts_build/src/agents/tools/executeScript/examples/test-runner.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/handler.d.ts +27 -0
- package/ts_build/src/agents/tools/executeScript/handler.js +64 -0
- package/ts_build/src/agents/tools/executeScript/handler.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript/index.d.ts +27 -0
- package/ts_build/src/agents/tools/executeScript/index.js +70 -0
- package/ts_build/src/agents/tools/executeScript/index.js.map +1 -0
- package/ts_build/src/agents/tools/executeScript.d.ts +29 -0
- package/ts_build/src/agents/tools/executeScript.js +124 -0
- package/ts_build/src/agents/tools/executeScript.js.map +1 -0
- package/ts_build/src/agents/tools/index.d.ts +1 -0
- package/ts_build/src/agents/tools/index.js +1 -0
- package/ts_build/src/agents/tools/index.js.map +1 -1
- package/ts_build/src/agents/tools/list.js +2 -0
- package/ts_build/src/agents/tools/list.js.map +1 -1
- package/ts_build/src/agents/vim/vim.d.ts +2 -3
- package/ts_build/src/agents/vim/vim.js +3 -4
- package/ts_build/src/agents/vim/vim.js.map +1 -1
- package/ts_build/src/ai.js +2 -1
- package/ts_build/src/ai.js.map +1 -1
- package/ts_build/src/chat.js +10 -9
- package/ts_build/src/chat.js.map +1 -1
- package/ts_build/src/cli.js +12 -19
- package/ts_build/src/cli.js.map +1 -1
- package/ts_build/src/clients/index.d.ts +9 -2
- package/ts_build/src/clients/index.js +17 -4
- package/ts_build/src/clients/index.js.map +1 -1
- package/ts_build/src/dataset/diffs/test.js +2 -1
- package/ts_build/src/dataset/diffs/test.js.map +1 -1
- package/ts_build/src/index.js +10 -10
- package/ts_build/src/index.js.map +1 -1
- package/ts_build/src/services/AgentService.d.ts +7 -3
- package/ts_build/src/services/AgentService.js +11 -10
- package/ts_build/src/services/AgentService.js.map +1 -1
- package/ts_build/src/services/EventService.d.ts +0 -1
- package/ts_build/src/services/EventService.js +1 -2
- package/ts_build/src/services/EventService.js.map +1 -1
- package/ts_build/src/services/GitHub.d.ts +0 -1
- package/ts_build/src/services/GitHub.js +1 -2
- package/ts_build/src/services/GitHub.js.map +1 -1
- package/ts_build/src/services/KnowhowClient.d.ts +0 -1
- package/ts_build/src/services/KnowhowClient.js +1 -2
- package/ts_build/src/services/KnowhowClient.js.map +1 -1
- package/ts_build/src/services/Mcp.d.ts +0 -1
- package/ts_build/src/services/Mcp.js +1 -2
- package/ts_build/src/services/Mcp.js.map +1 -1
- package/ts_build/src/services/S3.d.ts +0 -1
- package/ts_build/src/services/S3.js +1 -2
- package/ts_build/src/services/S3.js.map +1 -1
- package/ts_build/src/services/Tools.d.ts +22 -1
- package/ts_build/src/services/Tools.js +32 -6
- package/ts_build/src/services/Tools.js.map +1 -1
- package/ts_build/src/services/flags.d.ts +0 -1
- package/ts_build/src/services/flags.js +1 -2
- package/ts_build/src/services/flags.js.map +1 -1
- package/ts_build/src/services/index.d.ts +25 -0
- package/ts_build/src/services/index.js +42 -1
- package/ts_build/src/services/index.js.map +1 -1
- package/ts_build/src/services/modules/example-usage.d.ts +11 -0
- package/ts_build/src/services/modules/example-usage.js +43 -0
- package/ts_build/src/services/modules/example-usage.js.map +1 -0
- package/ts_build/src/services/modules/index.d.ts +4 -0
- package/ts_build/src/services/modules/index.js +44 -0
- package/ts_build/src/services/modules/index.js.map +1 -0
- package/ts_build/src/services/modules/types.d.ts +47 -0
- package/ts_build/src/services/modules/types.js +3 -0
- package/ts_build/src/services/modules/types.js.map +1 -0
- package/ts_build/src/services/script-execution/SandboxContext.d.ts +34 -0
- package/ts_build/src/services/script-execution/SandboxContext.js +186 -0
- package/ts_build/src/services/script-execution/SandboxContext.js.map +1 -0
- package/ts_build/src/services/script-execution/ScriptExecutor.d.ts +17 -0
- package/ts_build/src/services/script-execution/ScriptExecutor.js +211 -0
- package/ts_build/src/services/script-execution/ScriptExecutor.js.map +1 -0
- package/ts_build/src/services/script-execution/ScriptPolicy.d.ts +27 -0
- package/ts_build/src/services/script-execution/ScriptPolicy.js +150 -0
- package/ts_build/src/services/script-execution/ScriptPolicy.js.map +1 -0
- package/ts_build/src/services/script-execution/ScriptTracer.d.ts +19 -0
- package/ts_build/src/services/script-execution/ScriptTracer.js +186 -0
- package/ts_build/src/services/script-execution/ScriptTracer.js.map +1 -0
- package/ts_build/src/services/script-execution/types.d.ts +108 -0
- package/ts_build/src/services/script-execution/types.js +3 -0
- package/ts_build/src/services/script-execution/types.js.map +1 -0
- package/ts_build/src/services/singletons.d.ts +17 -0
- package/ts_build/src/services/singletons.js +28 -0
- package/ts_build/src/services/singletons.js.map +1 -0
- package/ts_build/src/worker.js +4 -3
- package/ts_build/src/worker.js.map +1 -1
- package/ts_build/tests/integration/fileblocks/readwrite.test.js +10 -9
- package/ts_build/tests/integration/fileblocks/readwrite.test.js.map +1 -1
- package/ts_build/tests/integration/patching.test.js +9 -10
- package/ts_build/tests/integration/patching.test.js.map +1 -1
- package/src/modules/index.ts +0 -37
|
@@ -0,0 +1,74 @@
|
|
|
1
|
+
#!/usr/bin/env ts-node
|
|
2
|
+
/**
|
|
3
|
+
* Quick test for executeScript - minimal example
|
|
4
|
+
* Usage: npx ts-node src/agents/tools/executeScript/examples/quick-test.ts
|
|
5
|
+
*/
|
|
6
|
+
|
|
7
|
+
import { executeScript } from "../../executeScript";
|
|
8
|
+
import { services } from "../../../../services";
|
|
9
|
+
|
|
10
|
+
// Simple test script
|
|
11
|
+
const simpleScript = `
|
|
12
|
+
console.log("Hello from executeScript!");
|
|
13
|
+
|
|
14
|
+
async function main() {
|
|
15
|
+
// Test basic functionality
|
|
16
|
+
console.log("Running simple test...");
|
|
17
|
+
|
|
18
|
+
// Try a simple tool call
|
|
19
|
+
const files = await callTool("fileSearch", { searchTerm: "*.ts" });
|
|
20
|
+
console.log("Found", files?.length || 0, "TypeScript files");
|
|
21
|
+
|
|
22
|
+
return {
|
|
23
|
+
message: "Simple test completed!",
|
|
24
|
+
filesFound: files?.length || 0,
|
|
25
|
+
timestamp: new Date().toISOString()
|
|
26
|
+
};
|
|
27
|
+
}
|
|
28
|
+
|
|
29
|
+
await main().then(result => {
|
|
30
|
+
console.log("Result:", result);
|
|
31
|
+
}).catch(error => {
|
|
32
|
+
console.error("Error:", error);
|
|
33
|
+
});
|
|
34
|
+
`;
|
|
35
|
+
|
|
36
|
+
/**
 * Minimal smoke test: runs `simpleScript` through `executeScript` with small
 * quotas and prints a short report (success flag, result, tool-call count,
 * cost, captured console output and, on failure, the error).
 *
 * Anything thrown inside the run is logged via `console.error` rather than
 * rethrown.
 */
async function quickTest() {
  console.log("🧪 Quick executeScript test\n");

  try {
    // Neither binding is used below; the call is kept as-is because
    // `services()` may initialise shared state — TODO confirm before removing.
    const { Tools, Clients } = services();

    const outcome = await executeScript({
      script: simpleScript,
      maxToolCalls: 5,
      maxTokens: 100,
      maxExecutionTimeMs: 10000,
      maxCostUsd: 0.1,
    });

    console.log("\n📊 QUICK TEST RESULT:");
    console.log("Success:", outcome.success);
    console.log("Result:", outcome.result);
    console.log("Tool calls:", outcome.quotaUsage.toolCalls);
    console.log("Cost: $" + outcome.quotaUsage.costUsd.toFixed(4));

    // Replay whatever the script wrote to its captured console.
    const captured = outcome.consoleOutput;
    if (captured.length > 0) {
      console.log("\n📝 Console Output:");
      for (const line of captured) {
        console.log(` ${line}`);
      }
    }

    if (!outcome.success) {
      console.log("❌ Error:", outcome.error);
    }
  } catch (failure) {
    console.error("💥 Test failed:", failure);
  }
}
|
|
69
|
+
|
|
70
|
+
if (require.main === module) {
|
|
71
|
+
quickTest();
|
|
72
|
+
}
|
|
73
|
+
|
|
74
|
+
export { quickTest };
|
|
@@ -0,0 +1,321 @@
|
|
|
1
|
+
#!/usr/bin/env ts-node
|
|
2
|
+
/**
|
|
3
|
+
* Serialization Test for executeScript - demonstrates transfer issues
|
|
4
|
+
* Usage: npx ts-node src/agents/tools/executeScript/examples/serialization-test.ts
|
|
5
|
+
*
|
|
6
|
+
* This test demonstrates the "A non-transferable value was passed" errors
|
|
7
|
+
* that occur when trying to return complex objects from executeScript.
|
|
8
|
+
*/
|
|
9
|
+
|
|
10
|
+
import { executeScript } from "../../executeScript";
|
|
11
|
+
import { services } from "../../../../services";
|
|
12
|
+
|
|
13
|
+
/** One serialization scenario fed to `executeScript`. */
interface TestCase {
  /** Short identifier printed in the per-case and summary output. */
  name: string;
  /** Human-readable explanation printed before the case runs. */
  description: string;
  /** Whether the script is expected to report `success: true`. */
  expectedToWork: boolean;
  /** Script source handed to `executeScript` as its `script` argument. */
  script: string;
}
|
|
19
|
+
|
|
20
|
+
const testCases: TestCase[] = [
|
|
21
|
+
{
|
|
22
|
+
name: "primitive-string",
|
|
23
|
+
expectedToWork: true,
|
|
24
|
+
description: "Simple string return - should work",
|
|
25
|
+
script: `
|
|
26
|
+
console.log("Testing primitive string return");
|
|
27
|
+
return "Hello World";
|
|
28
|
+
`,
|
|
29
|
+
},
|
|
30
|
+
|
|
31
|
+
{
|
|
32
|
+
name: "primitive-number",
|
|
33
|
+
expectedToWork: true,
|
|
34
|
+
description: "Simple number return - should work",
|
|
35
|
+
script: `
|
|
36
|
+
console.log("Testing primitive number return");
|
|
37
|
+
return 42;
|
|
38
|
+
`,
|
|
39
|
+
},
|
|
40
|
+
|
|
41
|
+
{
|
|
42
|
+
name: "primitive-boolean",
|
|
43
|
+
expectedToWork: true,
|
|
44
|
+
description: "Simple boolean return - should work",
|
|
45
|
+
script: `
|
|
46
|
+
console.log("Testing primitive boolean return");
|
|
47
|
+
return true;
|
|
48
|
+
`,
|
|
49
|
+
},
|
|
50
|
+
|
|
51
|
+
{
|
|
52
|
+
name: "simple-array",
|
|
53
|
+
expectedToWork: true, // You mentioned this works
|
|
54
|
+
description: "Simple array return - you said this works",
|
|
55
|
+
script: `
|
|
56
|
+
console.log("Testing simple array return");
|
|
57
|
+
return [1, 2, 3, "hello"];
|
|
58
|
+
`,
|
|
59
|
+
},
|
|
60
|
+
|
|
61
|
+
{
|
|
62
|
+
name: "simple-object",
|
|
63
|
+
expectedToWork: false, // This is where I got errors
|
|
64
|
+
description:
|
|
65
|
+
"Simple object return - expected to fail with transferable error",
|
|
66
|
+
script: `
|
|
67
|
+
console.log("Testing simple object return");
|
|
68
|
+
return {
|
|
69
|
+
message: "Hello",
|
|
70
|
+
count: 42,
|
|
71
|
+
success: true
|
|
72
|
+
};
|
|
73
|
+
`,
|
|
74
|
+
},
|
|
75
|
+
|
|
76
|
+
{
|
|
77
|
+
name: "nested-object",
|
|
78
|
+
expectedToWork: false,
|
|
79
|
+
description: "Nested object return - expected to fail",
|
|
80
|
+
script: `
|
|
81
|
+
console.log("Testing nested object return");
|
|
82
|
+
return {
|
|
83
|
+
data: {
|
|
84
|
+
items: [1, 2, 3],
|
|
85
|
+
metadata: { timestamp: new Date().toISOString() }
|
|
86
|
+
},
|
|
87
|
+
status: "success"
|
|
88
|
+
};
|
|
89
|
+
`,
|
|
90
|
+
},
|
|
91
|
+
|
|
92
|
+
{
|
|
93
|
+
name: "object-with-functions",
|
|
94
|
+
expectedToWork: false,
|
|
95
|
+
description: "Object with functions - definitely should fail",
|
|
96
|
+
script: `
|
|
97
|
+
console.log("Testing object with functions");
|
|
98
|
+
return {
|
|
99
|
+
data: [1, 2, 3],
|
|
100
|
+
transform: function(x) { return x * 2; },
|
|
101
|
+
helper: () => "test"
|
|
102
|
+
};
|
|
103
|
+
`,
|
|
104
|
+
},
|
|
105
|
+
|
|
106
|
+
{
|
|
107
|
+
name: "array-of-objects",
|
|
108
|
+
expectedToWork: false, // Based on my experience
|
|
109
|
+
description: "Array containing objects - expected to fail",
|
|
110
|
+
script: `
|
|
111
|
+
console.log("Testing array of objects");
|
|
112
|
+
return [
|
|
113
|
+
{ id: 1, name: "Alice" },
|
|
114
|
+
{ id: 2, name: "Bob" },
|
|
115
|
+
{ id: 3, name: "Charlie" }
|
|
116
|
+
];
|
|
117
|
+
`,
|
|
118
|
+
},
|
|
119
|
+
|
|
120
|
+
{
|
|
121
|
+
name: "json-stringify-workaround",
|
|
122
|
+
expectedToWork: true,
|
|
123
|
+
description: "Using JSON.stringify as workaround - should work",
|
|
124
|
+
script: `
|
|
125
|
+
console.log("Testing JSON.stringify workaround");
|
|
126
|
+
const data = {
|
|
127
|
+
message: "Hello",
|
|
128
|
+
items: [1, 2, 3],
|
|
129
|
+
nested: { key: "value" }
|
|
130
|
+
};
|
|
131
|
+
return JSON.stringify(data);
|
|
132
|
+
`,
|
|
133
|
+
},
|
|
134
|
+
|
|
135
|
+
{
|
|
136
|
+
name: "tool-call-result",
|
|
137
|
+
expectedToWork: false, // Based on my experience with news aggregation
|
|
138
|
+
description: "Tool call result object - expected to fail",
|
|
139
|
+
script: `
|
|
140
|
+
console.log("Testing tool call result return");
|
|
141
|
+
|
|
142
|
+
try {
|
|
143
|
+
const searchResult = await callTool("fileSearch", { searchTerm: "package.json" });
|
|
144
|
+
|
|
145
|
+
// Try to return a structured response with the tool result
|
|
146
|
+
return {
|
|
147
|
+
success: true,
|
|
148
|
+
toolResult: searchResult,
|
|
149
|
+
timestamp: new Date().toISOString()
|
|
150
|
+
};
|
|
151
|
+
} catch (error) {
|
|
152
|
+
return {
|
|
153
|
+
success: false,
|
|
154
|
+
error: error.message
|
|
155
|
+
};
|
|
156
|
+
}
|
|
157
|
+
`,
|
|
158
|
+
},
|
|
159
|
+
|
|
160
|
+
{
|
|
161
|
+
name: "date-object",
|
|
162
|
+
expectedToWork: false,
|
|
163
|
+
description: "Date object return - expected to fail",
|
|
164
|
+
script: `
|
|
165
|
+
console.log("Testing Date object return");
|
|
166
|
+
return new Date();
|
|
167
|
+
`,
|
|
168
|
+
},
|
|
169
|
+
|
|
170
|
+
{
|
|
171
|
+
name: "map-object",
|
|
172
|
+
expectedToWork: false,
|
|
173
|
+
description: "Map object return - expected to fail",
|
|
174
|
+
script: `
|
|
175
|
+
console.log("Testing Map object return");
|
|
176
|
+
const map = new Map();
|
|
177
|
+
map.set("key1", "value1");
|
|
178
|
+
map.set("key2", "value2");
|
|
179
|
+
return map;
|
|
180
|
+
`,
|
|
181
|
+
},
|
|
182
|
+
];
|
|
183
|
+
|
|
184
|
+
/**
 * Runs every entry of `testCases` through `executeScript` and reports whether
 * each script succeeded or failed the way its `expectedToWork` flag predicted.
 *
 * For each case the outcome is logged and recorded in `details`; afterwards a
 * summary, the list of unexpected outcomes, the working/failing case names and
 * a fixed set of recommendations are printed.
 *
 * @returns Counters plus per-case details:
 *   - `passed`: cases whose outcome matched `expectedToWork`
 *   - `unexpected`: cases whose outcome differed from `expectedToWork`
 *   - `failed`: cases where running the case itself threw
 *   - `details`: one record per case (name, expected, actual, matches,
 *     result, error, consoleOutput)
 */
async function runSerializationTests() {
  console.log("🧪 Running executeScript Serialization Tests\n");
  console.log("=".repeat(80));

  const results = {
    passed: 0,
    failed: 0,
    unexpected: 0,
    details: [] as any[],
  };

  for (const testCase of testCases) {
    console.log(`\n📋 Testing: ${testCase.name}`);
    console.log(`📝 Description: ${testCase.description}`);
    console.log(`🎯 Expected to work: ${testCase.expectedToWork}`);

    try {
      const result = await executeScript({
        script: testCase.script,
        maxToolCalls: 5,
        maxTokens: 500,
        maxExecutionTimeMs: 10000,
        maxCostUsd: 0.1,
      });

      const actualWorked = result.success;
      const matchesExpectation = actualWorked === testCase.expectedToWork;

      if (matchesExpectation) {
        results.passed++;
        console.log(`✅ PASS - Behaved as expected`);
      } else {
        results.unexpected++;
        console.log(
          `⚠️ UNEXPECTED - Expected ${
            testCase.expectedToWork ? "success" : "failure"
          }, got ${actualWorked ? "success" : "failure"}`
        );
      }

      results.details.push({
        name: testCase.name,
        expected: testCase.expectedToWork,
        actual: actualWorked,
        matches: matchesExpectation,
        result: actualWorked ? result.result : null,
        error: actualWorked ? null : result.error,
        consoleOutput: result.consoleOutput,
      });

      if (actualWorked) {
        // JSON.stringify yields `undefined` (not a string) for values such as
        // `undefined` or a bare function; fall back to String() so building
        // the preview cannot throw and misreport the case as a framework error.
        const serialized =
          JSON.stringify(result.result) ?? String(result.result);
        const preview =
          serialized.length > 200
            ? `${serialized.substring(0, 200)}...`
            : serialized;

        console.log(`📊 Result type: ${typeof result.result}`);
        console.log(`📊 Result: ${preview}`);
      } else {
        console.log(`❌ Error: ${result.error}`);
      }

      if (result.consoleOutput.length > 0) {
        console.log(`📝 Console: ${result.consoleOutput.join(", ")}`);
      }
    } catch (error) {
      // Anything can be thrown, so narrow before reading `.message`.
      const message = error instanceof Error ? error.message : String(error);

      results.failed++;
      console.log(`💥 TEST FRAMEWORK ERROR: ${message}`);

      results.details.push({
        name: testCase.name,
        expected: testCase.expectedToWork,
        actual: false,
        matches: !testCase.expectedToWork,
        result: null,
        error: message,
        consoleOutput: [],
      });
    }
  }

  // Print summary
  console.log("\n" + "=".repeat(80));
  console.log("📊 SERIALIZATION TEST SUMMARY");
  console.log("=".repeat(80));
  console.log(`✅ Tests matching expectations: ${results.passed}`);
  console.log(`⚠️ Unexpected behaviors: ${results.unexpected}`);
  console.log(`💥 Framework failures: ${results.failed}`);
  console.log(`📋 Total tests: ${testCases.length}`);

  if (results.unexpected > 0) {
    console.log("\n🔍 UNEXPECTED RESULTS:");
    results.details
      .filter((d) => !d.matches)
      .forEach((detail) => {
        console.log(
          ` - ${detail.name}: Expected ${
            detail.expected ? "success" : "failure"
          }, got ${detail.actual ? "success" : "failure"}`
        );
        if (detail.error) {
          console.log(` Error: ${detail.error}`);
        }
      });
  }

  // Analysis and recommendations
  console.log("\n🔬 ANALYSIS:");

  const workingTypes = results.details
    .filter((d) => d.actual)
    .map((d) => d.name);
  const failingTypes = results.details
    .filter((d) => !d.actual)
    .map((d) => d.name);

  console.log("\n✅ Types that work:");
  workingTypes.forEach((name) => console.log(` - ${name}`));

  console.log("\n❌ Types that fail:");
  failingTypes.forEach((name) => console.log(` - ${name}`));

  console.log("\n💡 RECOMMENDATIONS:");
  console.log(" 1. Use JSON.stringify() for complex objects");
  console.log(" 2. Return primitive values when possible");
  console.log(" 3. Consider createArtifact() for structured data");
  console.log(" 4. Test your return types with this suite");

  return results;
}
|
|
313
|
+
|
|
314
|
+
if (require.main === module) {
|
|
315
|
+
runSerializationTests().catch((error) => {
|
|
316
|
+
console.error("Test suite failed:", error);
|
|
317
|
+
process.exit(1);
|
|
318
|
+
});
|
|
319
|
+
}
|
|
320
|
+
|
|
321
|
+
export { runSerializationTests, testCases };
|
|
@@ -0,0 +1,197 @@
|
|
|
1
|
+
#!/usr/bin/env ts-node
|
|
2
|
+
/**
|
|
3
|
+
* Test runner for the executeScript tool
|
|
4
|
+
* Usage: npx ts-node src/agents/tools/executeScript/examples/test-runner.ts
|
|
5
|
+
*/
|
|
6
|
+
|
|
7
|
+
import { executeScript } from "../../executeScript";
|
|
8
|
+
import { services } from "../../../../services";
|
|
9
|
+
import { Clients } from "../../../../clients";
|
|
10
|
+
import { includedTools } from "../../../tools/list";
|
|
11
|
+
import * as allTools from "../../../tools";
|
|
12
|
+
|
|
13
|
+
// Sample script to test with
|
|
14
|
+
const testScript = `
|
|
15
|
+
// Test script that demonstrates various executeScript capabilities
|
|
16
|
+
console.log("Starting test script execution...");
|
|
17
|
+
|
|
18
|
+
async function main() {
|
|
19
|
+
// Test 1: Simple console output
|
|
20
|
+
console.log("Test 1: Basic logging works");
|
|
21
|
+
|
|
22
|
+
// Test 2: Call a tool (file search)
|
|
23
|
+
try {
|
|
24
|
+
console.log("Test 2: Calling fileSearch tool...");
|
|
25
|
+
const searchResult = await callTool("fileSearch", {
|
|
26
|
+
searchTerm: "package.json"
|
|
27
|
+
});
|
|
28
|
+
console.log("File search result:", searchResult);
|
|
29
|
+
} catch (error) {
|
|
30
|
+
console.error("Tool call failed:", error.message);
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
// Test 3: Call another tool (text search)
|
|
34
|
+
try {
|
|
35
|
+
console.log("Test 3: Calling textSearch tool...");
|
|
36
|
+
const textResult = await callTool("textSearch", {
|
|
37
|
+
searchTerm: "executeScript"
|
|
38
|
+
});
|
|
39
|
+
console.log("Text search found", textResult?.length || 0, "matches");
|
|
40
|
+
} catch (error) {
|
|
41
|
+
console.error("Text search failed:", error.message);
|
|
42
|
+
}
|
|
43
|
+
|
|
44
|
+
// Test 4: Make an LLM call
|
|
45
|
+
try {
|
|
46
|
+
console.log("Test 4: Making LLM call...");
|
|
47
|
+
const llmResponse = await llm([
|
|
48
|
+
{
|
|
49
|
+
role: "system",
|
|
50
|
+
content: "You are a helpful assistant. Respond with exactly one sentence."
|
|
51
|
+
},
|
|
52
|
+
{
|
|
53
|
+
role: "user",
|
|
54
|
+
content: "What is 2+2? Just give the answer briefly."
|
|
55
|
+
}
|
|
56
|
+
], {
|
|
57
|
+
model: "gpt-4o-mini",
|
|
58
|
+
max_tokens: 50
|
|
59
|
+
});
|
|
60
|
+
|
|
61
|
+
console.log("LLM Response:", llmResponse.choices[0].message.content);
|
|
62
|
+
} catch (error) {
|
|
63
|
+
console.error("LLM call failed:", error.message);
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
// Test 5: Create an artifact
|
|
67
|
+
try {
|
|
68
|
+
console.log("Test 5: Creating artifact...");
|
|
69
|
+
createArtifact("test-results.md", \`# Test Results
|
|
70
|
+
|
|
71
|
+
Script executed successfully at: \${new Date().toISOString()}
|
|
72
|
+
|
|
73
|
+
This is a test artifact created by the executeScript tool.
|
|
74
|
+
|
|
75
|
+
## Test Summary
|
|
76
|
+
- Console logging: ✓
|
|
77
|
+
- Tool calls: ✓
|
|
78
|
+
- LLM calls: ✓
|
|
79
|
+
- Artifact creation: ✓
|
|
80
|
+
\`, "markdown");
|
|
81
|
+
console.log("Artifact created successfully");
|
|
82
|
+
} catch (error) {
|
|
83
|
+
console.error("Artifact creation failed:", error.message);
|
|
84
|
+
}
|
|
85
|
+
|
|
86
|
+
// Return final result
|
|
87
|
+
return {
|
|
88
|
+
success: true,
|
|
89
|
+
message: "All tests completed successfully",
|
|
90
|
+
timestamp: new Date().toISOString(),
|
|
91
|
+
testsRun: 5
|
|
92
|
+
};
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
// Execute the main function
|
|
96
|
+
await main().then(result => {
|
|
97
|
+
console.log("=== SCRIPT COMPLETED ===");
|
|
98
|
+
console.log("Final result:", JSON.stringify(result, null, 2));
|
|
99
|
+
}).catch(error => {
|
|
100
|
+
console.error("=== SCRIPT FAILED ===");
|
|
101
|
+
console.error("Error:", error);
|
|
102
|
+
throw error;
|
|
103
|
+
});
|
|
104
|
+
`;
|
|
105
|
+
|
|
106
|
+
/**
 * Registers the bundled tools on the shared `Tools` service, runs
 * `testScript` through `executeScript` and prints a report: timing, result,
 * quota usage, artifacts, captured console output and policy violations on
 * success, or the error and the console output captured so far on failure.
 *
 * Exit status: a failed script run sets `process.exitCode = 1` so shell/CI
 * callers can detect it; an exception raised while running the test itself
 * terminates the process immediately with status 1.
 */
async function runTest() {
  console.log("🚀 Starting executeScript test...\n");
  const { Tools } = services();

  try {
    Tools.defineTools(includedTools, allTools);

    console.log("📋 Test Parameters:");
    console.log("- Max Tool Calls: 10");
    console.log("- Max Tokens: 1000");
    console.log("- Max Execution Time: 60s");
    console.log("- Max Cost: $0.50\n");

    const startTime = Date.now();

    // Execute the test script
    const result = await executeScript({
      script: testScript,
      maxToolCalls: 10,
      maxTokens: 1000,
      maxExecutionTimeMs: 60000,
      maxCostUsd: 0.5,
    });

    const executionTime = Date.now() - startTime;

    console.log("\n" + "=".repeat(60));
    console.log("🎯 TEST RESULTS");
    console.log("=".repeat(60));
    console.log(`⏱️ Execution Time: ${executionTime}ms`);
    console.log(`✅ Success: ${result.success}`);

    if (result.success) {
      console.log(`📊 Result:`, result.result);
      console.log(`🔧 Tool Calls Made: ${result.quotaUsage.toolCalls}`);
      console.log(`🎯 Tokens Used: ${result.quotaUsage.tokens}`);
      console.log(`💰 Cost: $${result.quotaUsage.costUsd.toFixed(4)}`);

      if (result.artifacts.length > 0) {
        console.log(`📁 Artifacts Created: ${result.artifacts.length}`);
        result.artifacts.forEach((artifact) => {
          console.log(
            ` - ${artifact.name} (${artifact.type}, ${artifact.contentLength} bytes)`
          );
        });
      }

      if (result.consoleOutput.length > 0) {
        console.log(
          `\n📝 Console Output (${result.consoleOutput.length} entries):`
        );
        result.consoleOutput.forEach((entry) => {
          console.log(` ${entry}`);
        });
      }

      if (result.violations.length > 0) {
        console.log(`\n⚠️ Policy Violations: ${result.violations.length}`);
        result.violations.forEach((violation) => {
          console.log(` - ${JSON.stringify(violation)}`);
        });
      }
    } else {
      console.log(`❌ Error: ${result.error}`);

      if (result.consoleOutput.length > 0) {
        console.log(`\n📝 Console Output Before Failure:`);
        result.consoleOutput.forEach((entry) => {
          console.log(` ${entry}`);
        });
      }
    }

    console.log("\n" + "=".repeat(60));
    console.log(result.success ? "🎉 TEST PASSED!" : "💥 TEST FAILED!");
    console.log("=".repeat(60));

    if (!result.success) {
      // Report the failure through the exit status without cutting off any
      // pending output; previously a failed run still exited with status 0.
      process.exitCode = 1;
    }
  } catch (error) {
    console.error("\n💥 TEST RUNNER ERROR:");
    console.error(error);
    process.exit(1);
  }
}
|
|
188
|
+
|
|
189
|
+
// Run the test if this file is executed directly
|
|
190
|
+
if (require.main === module) {
|
|
191
|
+
runTest().catch((error) => {
|
|
192
|
+
console.error("Unhandled error:", error);
|
|
193
|
+
process.exit(1);
|
|
194
|
+
});
|
|
195
|
+
}
|
|
196
|
+
|
|
197
|
+
export { runTest, testScript };
|
|
@@ -0,0 +1,93 @@
|
|
|
1
|
+
import { ScriptExecutor } from "../../../services/script-execution/ScriptExecutor";
|
|
2
|
+
import { ToolsService } from "../../../services/Tools";
|
|
3
|
+
import {
|
|
4
|
+
ExecutionRequest,
|
|
5
|
+
ExecutionResult,
|
|
6
|
+
} from "../../../services/script-execution/types";
|
|
7
|
+
import { services } from "src/services";
|
|
8
|
+
|
|
9
|
+
/**
 * Tool handler that runs a script through `ScriptExecutor` and flattens the
 * execution result into a plain summary object.
 *
 * When invoked with a `ToolsService` as `this`, that service's context is
 * used; otherwise the shared `services().Tools` instance is used.
 *
 * @param script - Source of the script to execute.
 * @param maxToolCalls - Tool-call quota; defaults to 50 when omitted.
 * @param maxTokens - Token quota; defaults to 10000 when omitted.
 * @param maxExecutionTimeMs - Time quota in milliseconds; defaults to 30000
 *   when omitted.
 * @param maxCostUsd - Cost quota in USD; defaults to 1.0 when omitted.
 * @returns A summary with `success`, `result`, `error`, artifact metadata
 *   (content replaced by its length), `consoleOutput`, `metrics`,
 *   `violations`, `executionTimeMs` and `quotaUsage`. Errors thrown while
 *   setting up or running the executor are not rethrown: they produce a
 *   `success: false` summary with zeroed usage and the error message.
 */
export async function executeScript(
  // Type-only declaration (erased at compile time) so the `this` check below
  // is explicit instead of relying on an implicit `any`.
  this: unknown,
  {
    script,
    maxToolCalls,
    maxTokens,
    maxExecutionTimeMs,
    maxCostUsd,
  }: {
    script: string;
    maxToolCalls?: number;
    maxTokens?: number;
    maxExecutionTimeMs?: number;
    maxCostUsd?: number;
  }
) {
  try {
    // Get context from bound ToolsService
    const toolService = (
      this instanceof ToolsService ? this : services().Tools
    ) as ToolsService;
    const toolContext = toolService.getContext();
    const { Clients, Tools } = toolContext;

    if (!Clients) {
      throw new Error("Clients not available in tool context");
    }

    // Create script executor with access to tools and clients
    const executor = new ScriptExecutor(Tools, Clients);

    // Execute the script. `??` (not `||`) so an explicit 0 quota, e.g.
    // "no tool calls allowed", is honoured instead of being replaced by the
    // default.
    const result = await executor.execute({
      script,
      quotas: {
        maxToolCalls: maxToolCalls ?? 50,
        maxTokens: maxTokens ?? 10000,
        maxExecutionTimeMs: maxExecutionTimeMs ?? 30000,
        maxCostUsd: maxCostUsd ?? 1.0,
        maxMemoryMb: 100,
      },
    });

    // Surface the payload of every trace event whose type mentions a
    // violation or an error.
    const violations = result.trace.events
      .filter((e) => e.type.includes("violation") || e.type.includes("error"))
      .map((e) => e.data);

    // Format the response
    return {
      success: result.success,
      result: result.result,
      error: result.error,
      // Report artifact metadata only; content is summarised by its length.
      artifacts: result.artifacts.map((a) => ({
        id: a.id,
        name: a.name,
        type: a.type,
        contentLength: a.content.length,
        createdAt: a.createdAt,
      })),
      consoleOutput: result.consoleOutput,
      metrics: result.trace.metrics,
      violations,
      executionTimeMs: result.trace.endTime - result.trace.startTime,
      quotaUsage: {
        toolCalls: result.trace.metrics.toolCallCount,
        tokens: result.trace.metrics.tokenUsage.total,
        costUsd: result.trace.metrics.costUsd,
      },
    };
  } catch (error) {
    // Report failures in the same shape as a completed run so callers can
    // read `success`, `consoleOutput` and `quotaUsage` unconditionally.
    return {
      success: false,
      error: error instanceof Error ? error.message : String(error),
      result: null,
      artifacts: [],
      consoleOutput: [],
      metrics: null,
      violations: [],
      executionTimeMs: 0,
      quotaUsage: {
        toolCalls: 0,
        tokens: 0,
        costUsd: 0,
      },
    };
  }
}
|
package/src/agents/tools/list.ts
CHANGED
|
@@ -7,6 +7,7 @@ import * as github from "./github/definitions";
|
|
|
7
7
|
import * as asana from "./asana/definitions";
|
|
8
8
|
import * as language from "./language/definitions";
|
|
9
9
|
import { googleSearchDefinition } from "./googleSearch";
|
|
10
|
+
import { executeScriptDefinition } from "./executeScript/definition";
|
|
10
11
|
|
|
11
12
|
export const includedTools = [
|
|
12
13
|
{
|
|
@@ -552,7 +553,7 @@ export const includedTools = [
|
|
|
552
553
|
},
|
|
553
554
|
},
|
|
554
555
|
},
|
|
555
|
-
|
|
556
|
+
executeScriptDefinition,
|
|
556
557
|
googleSearchDefinition,
|
|
557
558
|
...asana.definitions,
|
|
558
559
|
...github.definitions,
|