erosolar-cli 1.7.334 → 1.7.336
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +24 -148
- package/dist/bin/erosolar.js +5 -21
- package/dist/bin/erosolar.js.map +1 -1
- package/dist/capabilities/agentSpawningCapability.d.ts.map +1 -1
- package/dist/capabilities/agentSpawningCapability.js +56 -31
- package/dist/capabilities/agentSpawningCapability.js.map +1 -1
- package/dist/contracts/agent-schemas.json +0 -15
- package/dist/contracts/tools.schema.json +0 -9
- package/dist/core/agent.d.ts +2 -2
- package/dist/core/agent.d.ts.map +1 -1
- package/dist/core/agent.js.map +1 -1
- package/dist/core/customCommands.d.ts +1 -0
- package/dist/core/customCommands.d.ts.map +1 -1
- package/dist/core/customCommands.js +3 -0
- package/dist/core/customCommands.js.map +1 -1
- package/dist/core/hooks.d.ts +113 -0
- package/dist/core/hooks.d.ts.map +1 -0
- package/dist/core/hooks.js +267 -0
- package/dist/core/hooks.js.map +1 -0
- package/dist/core/metricsTracker.d.ts +122 -0
- package/dist/core/metricsTracker.d.ts.map +1 -0
- package/dist/{alpha-zero → core}/metricsTracker.js +2 -5
- package/dist/core/metricsTracker.js.map +1 -0
- package/dist/core/securityAssessment.d.ts +91 -0
- package/dist/core/securityAssessment.d.ts.map +1 -0
- package/dist/core/securityAssessment.js +580 -0
- package/dist/core/securityAssessment.js.map +1 -0
- package/dist/core/toolPreconditions.d.ts.map +1 -1
- package/dist/core/toolPreconditions.js +0 -14
- package/dist/core/toolPreconditions.js.map +1 -1
- package/dist/core/toolRuntime.d.ts +22 -1
- package/dist/core/toolRuntime.d.ts.map +1 -1
- package/dist/core/toolRuntime.js +0 -5
- package/dist/core/toolRuntime.js.map +1 -1
- package/dist/core/toolValidation.d.ts.map +1 -1
- package/dist/core/toolValidation.js +14 -3
- package/dist/core/toolValidation.js.map +1 -1
- package/dist/core/validationRunner.d.ts +1 -3
- package/dist/core/validationRunner.d.ts.map +1 -1
- package/dist/core/validationRunner.js.map +1 -1
- package/dist/core/verification.d.ts +137 -0
- package/dist/core/verification.d.ts.map +1 -0
- package/dist/core/verification.js +323 -0
- package/dist/core/verification.js.map +1 -0
- package/dist/headless/headlessApp.d.ts.map +1 -1
- package/dist/headless/headlessApp.js +21 -0
- package/dist/headless/headlessApp.js.map +1 -1
- package/dist/mcp/sseClient.d.ts.map +1 -1
- package/dist/mcp/sseClient.js +9 -18
- package/dist/mcp/sseClient.js.map +1 -1
- package/dist/plugins/tools/build/buildPlugin.d.ts +0 -6
- package/dist/plugins/tools/build/buildPlugin.d.ts.map +1 -1
- package/dist/plugins/tools/build/buildPlugin.js +4 -10
- package/dist/plugins/tools/build/buildPlugin.js.map +1 -1
- package/dist/plugins/tools/nodeDefaults.d.ts.map +1 -1
- package/dist/plugins/tools/nodeDefaults.js +0 -2
- package/dist/plugins/tools/nodeDefaults.js.map +1 -1
- package/dist/runtime/agentSession.d.ts +2 -2
- package/dist/runtime/agentSession.d.ts.map +1 -1
- package/dist/runtime/agentSession.js +2 -2
- package/dist/runtime/agentSession.js.map +1 -1
- package/dist/shell/interactiveShell.d.ts +16 -7
- package/dist/shell/interactiveShell.d.ts.map +1 -1
- package/dist/shell/interactiveShell.js +235 -166
- package/dist/shell/interactiveShell.js.map +1 -1
- package/dist/shell/shellApp.d.ts +2 -0
- package/dist/shell/shellApp.d.ts.map +1 -1
- package/dist/shell/shellApp.js +40 -9
- package/dist/shell/shellApp.js.map +1 -1
- package/dist/shell/systemPrompt.d.ts.map +1 -1
- package/dist/shell/systemPrompt.js +1 -4
- package/dist/shell/systemPrompt.js.map +1 -1
- package/dist/shell/terminalInput.d.ts +149 -118
- package/dist/shell/terminalInput.d.ts.map +1 -1
- package/dist/shell/terminalInput.js +638 -532
- package/dist/shell/terminalInput.js.map +1 -1
- package/dist/shell/terminalInputAdapter.d.ts +79 -21
- package/dist/shell/terminalInputAdapter.d.ts.map +1 -1
- package/dist/shell/terminalInputAdapter.js +99 -30
- package/dist/shell/terminalInputAdapter.js.map +1 -1
- package/dist/subagents/agentConfig.d.ts +27 -0
- package/dist/subagents/agentConfig.d.ts.map +1 -0
- package/dist/subagents/agentConfig.js +89 -0
- package/dist/subagents/agentConfig.js.map +1 -0
- package/dist/subagents/agentRegistry.d.ts +33 -0
- package/dist/subagents/agentRegistry.d.ts.map +1 -0
- package/dist/subagents/agentRegistry.js +162 -0
- package/dist/subagents/agentRegistry.js.map +1 -0
- package/dist/subagents/taskRunner.d.ts +7 -1
- package/dist/subagents/taskRunner.d.ts.map +1 -1
- package/dist/subagents/taskRunner.js +180 -47
- package/dist/subagents/taskRunner.js.map +1 -1
- package/dist/ui/ShellUIAdapter.d.ts.map +1 -1
- package/dist/ui/ShellUIAdapter.js +13 -12
- package/dist/ui/ShellUIAdapter.js.map +1 -1
- package/dist/ui/display.d.ts +24 -45
- package/dist/ui/display.d.ts.map +1 -1
- package/dist/ui/display.js +140 -259
- package/dist/ui/display.js.map +1 -1
- package/dist/ui/theme.d.ts.map +1 -1
- package/dist/ui/theme.js +6 -8
- package/dist/ui/theme.js.map +1 -1
- package/dist/ui/toolDisplay.d.ts +0 -158
- package/dist/ui/toolDisplay.d.ts.map +1 -1
- package/dist/ui/toolDisplay.js +0 -348
- package/dist/ui/toolDisplay.js.map +1 -1
- package/dist/ui/unified/layout.d.ts +1 -0
- package/dist/ui/unified/layout.d.ts.map +1 -1
- package/dist/ui/unified/layout.js +15 -25
- package/dist/ui/unified/layout.js.map +1 -1
- package/dist/utils/frontmatter.d.ts +10 -0
- package/dist/utils/frontmatter.d.ts.map +1 -0
- package/dist/utils/frontmatter.js +78 -0
- package/dist/utils/frontmatter.js.map +1 -0
- package/package.json +4 -4
- package/dist/alpha-zero/agentWrapper.d.ts +0 -84
- package/dist/alpha-zero/agentWrapper.d.ts.map +0 -1
- package/dist/alpha-zero/agentWrapper.js +0 -171
- package/dist/alpha-zero/agentWrapper.js.map +0 -1
- package/dist/alpha-zero/codeEvaluator.d.ts +0 -25
- package/dist/alpha-zero/codeEvaluator.d.ts.map +0 -1
- package/dist/alpha-zero/codeEvaluator.js +0 -273
- package/dist/alpha-zero/codeEvaluator.js.map +0 -1
- package/dist/alpha-zero/competitiveRunner.d.ts +0 -66
- package/dist/alpha-zero/competitiveRunner.d.ts.map +0 -1
- package/dist/alpha-zero/competitiveRunner.js +0 -224
- package/dist/alpha-zero/competitiveRunner.js.map +0 -1
- package/dist/alpha-zero/index.d.ts +0 -67
- package/dist/alpha-zero/index.d.ts.map +0 -1
- package/dist/alpha-zero/index.js +0 -99
- package/dist/alpha-zero/index.js.map +0 -1
- package/dist/alpha-zero/introspection.d.ts +0 -128
- package/dist/alpha-zero/introspection.d.ts.map +0 -1
- package/dist/alpha-zero/introspection.js +0 -300
- package/dist/alpha-zero/introspection.js.map +0 -1
- package/dist/alpha-zero/metricsTracker.d.ts +0 -71
- package/dist/alpha-zero/metricsTracker.d.ts.map +0 -1
- package/dist/alpha-zero/metricsTracker.js.map +0 -1
- package/dist/alpha-zero/security/core.d.ts +0 -125
- package/dist/alpha-zero/security/core.d.ts.map +0 -1
- package/dist/alpha-zero/security/core.js +0 -271
- package/dist/alpha-zero/security/core.js.map +0 -1
- package/dist/alpha-zero/security/google.d.ts +0 -125
- package/dist/alpha-zero/security/google.d.ts.map +0 -1
- package/dist/alpha-zero/security/google.js +0 -311
- package/dist/alpha-zero/security/google.js.map +0 -1
- package/dist/alpha-zero/security/googleLoader.d.ts +0 -17
- package/dist/alpha-zero/security/googleLoader.d.ts.map +0 -1
- package/dist/alpha-zero/security/googleLoader.js +0 -41
- package/dist/alpha-zero/security/googleLoader.js.map +0 -1
- package/dist/alpha-zero/security/index.d.ts +0 -29
- package/dist/alpha-zero/security/index.d.ts.map +0 -1
- package/dist/alpha-zero/security/index.js +0 -32
- package/dist/alpha-zero/security/index.js.map +0 -1
- package/dist/alpha-zero/security/simulation.d.ts +0 -124
- package/dist/alpha-zero/security/simulation.d.ts.map +0 -1
- package/dist/alpha-zero/security/simulation.js +0 -277
- package/dist/alpha-zero/security/simulation.js.map +0 -1
- package/dist/alpha-zero/selfModification.d.ts +0 -109
- package/dist/alpha-zero/selfModification.d.ts.map +0 -1
- package/dist/alpha-zero/selfModification.js +0 -233
- package/dist/alpha-zero/selfModification.js.map +0 -1
- package/dist/alpha-zero/types.d.ts +0 -170
- package/dist/alpha-zero/types.d.ts.map +0 -1
- package/dist/alpha-zero/types.js +0 -31
- package/dist/alpha-zero/types.js.map +0 -1
- package/dist/capabilities/securityTestingCapability.d.ts +0 -13
- package/dist/capabilities/securityTestingCapability.d.ts.map +0 -1
- package/dist/capabilities/securityTestingCapability.js +0 -25
- package/dist/capabilities/securityTestingCapability.js.map +0 -1
- package/dist/core/aiFlowOptimizer.d.ts +0 -26
- package/dist/core/aiFlowOptimizer.d.ts.map +0 -1
- package/dist/core/aiFlowOptimizer.js +0 -31
- package/dist/core/aiFlowOptimizer.js.map +0 -1
- package/dist/core/aiOptimizationEngine.d.ts +0 -158
- package/dist/core/aiOptimizationEngine.d.ts.map +0 -1
- package/dist/core/aiOptimizationEngine.js +0 -428
- package/dist/core/aiOptimizationEngine.js.map +0 -1
- package/dist/core/aiOptimizationIntegration.d.ts +0 -93
- package/dist/core/aiOptimizationIntegration.d.ts.map +0 -1
- package/dist/core/aiOptimizationIntegration.js +0 -250
- package/dist/core/aiOptimizationIntegration.js.map +0 -1
- package/dist/core/enhancedErrorRecovery.d.ts +0 -100
- package/dist/core/enhancedErrorRecovery.d.ts.map +0 -1
- package/dist/core/enhancedErrorRecovery.js +0 -345
- package/dist/core/enhancedErrorRecovery.js.map +0 -1
- package/dist/core/hooksSystem.d.ts +0 -65
- package/dist/core/hooksSystem.d.ts.map +0 -1
- package/dist/core/hooksSystem.js +0 -273
- package/dist/core/hooksSystem.js.map +0 -1
- package/dist/core/memorySystem.d.ts +0 -48
- package/dist/core/memorySystem.d.ts.map +0 -1
- package/dist/core/memorySystem.js +0 -271
- package/dist/core/memorySystem.js.map +0 -1
- package/dist/core/unified/errors.d.ts +0 -189
- package/dist/core/unified/errors.d.ts.map +0 -1
- package/dist/core/unified/errors.js +0 -497
- package/dist/core/unified/errors.js.map +0 -1
- package/dist/core/unified/index.d.ts +0 -19
- package/dist/core/unified/index.d.ts.map +0 -1
- package/dist/core/unified/index.js +0 -68
- package/dist/core/unified/index.js.map +0 -1
- package/dist/core/unified/schema.d.ts +0 -101
- package/dist/core/unified/schema.d.ts.map +0 -1
- package/dist/core/unified/schema.js +0 -350
- package/dist/core/unified/schema.js.map +0 -1
- package/dist/core/unified/toolRuntime.d.ts +0 -179
- package/dist/core/unified/toolRuntime.d.ts.map +0 -1
- package/dist/core/unified/toolRuntime.js +0 -517
- package/dist/core/unified/toolRuntime.js.map +0 -1
- package/dist/core/unified/tools.d.ts +0 -127
- package/dist/core/unified/tools.d.ts.map +0 -1
- package/dist/core/unified/tools.js +0 -1333
- package/dist/core/unified/tools.js.map +0 -1
- package/dist/core/unified/types.d.ts +0 -352
- package/dist/core/unified/types.d.ts.map +0 -1
- package/dist/core/unified/types.js +0 -12
- package/dist/core/unified/types.js.map +0 -1
- package/dist/core/unified/version.d.ts +0 -209
- package/dist/core/unified/version.d.ts.map +0 -1
- package/dist/core/unified/version.js +0 -454
- package/dist/core/unified/version.js.map +0 -1
- package/dist/plugins/tools/security/securityPlugin.d.ts +0 -3
- package/dist/plugins/tools/security/securityPlugin.d.ts.map +0 -1
- package/dist/plugins/tools/security/securityPlugin.js +0 -12
- package/dist/plugins/tools/security/securityPlugin.js.map +0 -1
- package/dist/security/active-stack-security.d.ts +0 -112
- package/dist/security/active-stack-security.d.ts.map +0 -1
- package/dist/security/active-stack-security.js +0 -296
- package/dist/security/active-stack-security.js.map +0 -1
- package/dist/security/advanced-persistence-research.d.ts +0 -92
- package/dist/security/advanced-persistence-research.d.ts.map +0 -1
- package/dist/security/advanced-persistence-research.js +0 -195
- package/dist/security/advanced-persistence-research.js.map +0 -1
- package/dist/security/advanced-targeting.d.ts +0 -119
- package/dist/security/advanced-targeting.d.ts.map +0 -1
- package/dist/security/advanced-targeting.js +0 -233
- package/dist/security/advanced-targeting.js.map +0 -1
- package/dist/security/assessment/vulnerabilityAssessment.d.ts +0 -104
- package/dist/security/assessment/vulnerabilityAssessment.d.ts.map +0 -1
- package/dist/security/assessment/vulnerabilityAssessment.js +0 -315
- package/dist/security/assessment/vulnerabilityAssessment.js.map +0 -1
- package/dist/security/authorization/securityAuthorization.d.ts +0 -88
- package/dist/security/authorization/securityAuthorization.d.ts.map +0 -1
- package/dist/security/authorization/securityAuthorization.js +0 -172
- package/dist/security/authorization/securityAuthorization.js.map +0 -1
- package/dist/security/comprehensive-targeting.d.ts +0 -85
- package/dist/security/comprehensive-targeting.d.ts.map +0 -1
- package/dist/security/comprehensive-targeting.js +0 -438
- package/dist/security/comprehensive-targeting.js.map +0 -1
- package/dist/security/global-security-integration.d.ts +0 -91
- package/dist/security/global-security-integration.d.ts.map +0 -1
- package/dist/security/global-security-integration.js +0 -218
- package/dist/security/global-security-integration.js.map +0 -1
- package/dist/security/index.d.ts +0 -38
- package/dist/security/index.d.ts.map +0 -1
- package/dist/security/index.js +0 -47
- package/dist/security/index.js.map +0 -1
- package/dist/security/persistence-analyzer.d.ts +0 -56
- package/dist/security/persistence-analyzer.d.ts.map +0 -1
- package/dist/security/persistence-analyzer.js +0 -187
- package/dist/security/persistence-analyzer.js.map +0 -1
- package/dist/security/persistence-cli.d.ts +0 -36
- package/dist/security/persistence-cli.d.ts.map +0 -1
- package/dist/security/persistence-cli.js +0 -160
- package/dist/security/persistence-cli.js.map +0 -1
- package/dist/security/persistence-research.d.ts +0 -92
- package/dist/security/persistence-research.d.ts.map +0 -1
- package/dist/security/persistence-research.js +0 -364
- package/dist/security/persistence-research.js.map +0 -1
- package/dist/security/research/persistenceResearch.d.ts +0 -97
- package/dist/security/research/persistenceResearch.d.ts.map +0 -1
- package/dist/security/research/persistenceResearch.js +0 -282
- package/dist/security/research/persistenceResearch.js.map +0 -1
- package/dist/security/security-integration.d.ts +0 -74
- package/dist/security/security-integration.d.ts.map +0 -1
- package/dist/security/security-integration.js +0 -137
- package/dist/security/security-integration.js.map +0 -1
- package/dist/security/security-testing-framework.d.ts +0 -112
- package/dist/security/security-testing-framework.d.ts.map +0 -1
- package/dist/security/security-testing-framework.js +0 -364
- package/dist/security/security-testing-framework.js.map +0 -1
- package/dist/security/simulation/attackSimulation.d.ts +0 -93
- package/dist/security/simulation/attackSimulation.d.ts.map +0 -1
- package/dist/security/simulation/attackSimulation.js +0 -341
- package/dist/security/simulation/attackSimulation.js.map +0 -1
- package/dist/security/strategic-operations.d.ts +0 -100
- package/dist/security/strategic-operations.d.ts.map +0 -1
- package/dist/security/strategic-operations.js +0 -276
- package/dist/security/strategic-operations.js.map +0 -1
- package/dist/security/tool-security-wrapper.d.ts +0 -58
- package/dist/security/tool-security-wrapper.d.ts.map +0 -1
- package/dist/security/tool-security-wrapper.js +0 -156
- package/dist/security/tool-security-wrapper.js.map +0 -1
- package/dist/shell/claudeCodeStreamHandler.d.ts +0 -145
- package/dist/shell/claudeCodeStreamHandler.d.ts.map +0 -1
- package/dist/shell/claudeCodeStreamHandler.js +0 -322
- package/dist/shell/claudeCodeStreamHandler.js.map +0 -1
- package/dist/shell/inputQueueManager.d.ts +0 -144
- package/dist/shell/inputQueueManager.d.ts.map +0 -1
- package/dist/shell/inputQueueManager.js +0 -290
- package/dist/shell/inputQueueManager.js.map +0 -1
- package/dist/shell/metricsTracker.d.ts +0 -60
- package/dist/shell/metricsTracker.d.ts.map +0 -1
- package/dist/shell/metricsTracker.js +0 -119
- package/dist/shell/metricsTracker.js.map +0 -1
- package/dist/shell/streamingOutputManager.d.ts +0 -115
- package/dist/shell/streamingOutputManager.d.ts.map +0 -1
- package/dist/shell/streamingOutputManager.js +0 -225
- package/dist/shell/streamingOutputManager.js.map +0 -1
- package/dist/tools/securityTools.d.ts +0 -22
- package/dist/tools/securityTools.d.ts.map +0 -1
- package/dist/tools/securityTools.js +0 -448
- package/dist/tools/securityTools.js.map +0 -1
- package/dist/ui/persistentPrompt.d.ts +0 -50
- package/dist/ui/persistentPrompt.d.ts.map +0 -1
- package/dist/ui/persistentPrompt.js +0 -92
- package/dist/ui/persistentPrompt.js.map +0 -1
- package/dist/ui/terminalUISchema.d.ts +0 -195
- package/dist/ui/terminalUISchema.d.ts.map +0 -1
- package/dist/ui/terminalUISchema.js +0 -113
- package/dist/ui/terminalUISchema.js.map +0 -1
- package/scripts/deploy-security-capabilities.js +0 -178
|
@@ -1,273 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Code Evaluator
|
|
3
|
-
*
|
|
4
|
-
* AST-based code quality evaluation for generated code.
|
|
5
|
-
*
|
|
6
|
-
* Principal Investigator: Bo Shang
|
|
7
|
-
* Framework: erosolar-cli
|
|
8
|
-
*/
|
|
9
|
-
/**
|
|
10
|
-
* Extract code blocks from a response string.
|
|
11
|
-
*/
|
|
12
|
-
export function extractCodeBlocks(response) {
|
|
13
|
-
const codeBlockRegex = /```(?:\w+)?\n([\s\S]*?)```/g;
|
|
14
|
-
const blocks = [];
|
|
15
|
-
let match;
|
|
16
|
-
while ((match = codeBlockRegex.exec(response)) !== null) {
|
|
17
|
-
const code = match[1]?.trim();
|
|
18
|
-
if (code && code.length > 0) {
|
|
19
|
-
blocks.push(code);
|
|
20
|
-
}
|
|
21
|
-
}
|
|
22
|
-
return blocks;
|
|
23
|
-
}
|
|
24
|
-
/**
|
|
25
|
-
* Evaluate code quality metrics.
|
|
26
|
-
*
|
|
27
|
-
* This is a heuristic-based evaluation that analyzes code patterns.
|
|
28
|
-
* For production use, consider integrating actual AST parsers.
|
|
29
|
-
*/
|
|
30
|
-
export function evaluateCodeQuality(code) {
|
|
31
|
-
const lines = code.split('\n');
|
|
32
|
-
const totalLines = lines.length;
|
|
33
|
-
// Calculate individual scores
|
|
34
|
-
const codeQualityScore = calculateCodeQualityScore(code, lines);
|
|
35
|
-
const algorithmEfficiency = calculateEfficiencyScore(code, lines);
|
|
36
|
-
const errorHandlingScore = calculateErrorHandlingScore(code);
|
|
37
|
-
const documentationScore = calculateDocumentationScore(code, lines);
|
|
38
|
-
const maintainabilityScore = calculateMaintainabilityScore(code, lines, totalLines);
|
|
39
|
-
const securityScore = calculateSecurityScore(code);
|
|
40
|
-
return {
|
|
41
|
-
codeQualityScore,
|
|
42
|
-
algorithmEfficiency,
|
|
43
|
-
errorHandlingScore,
|
|
44
|
-
documentationScore,
|
|
45
|
-
maintainabilityScore,
|
|
46
|
-
securityScore,
|
|
47
|
-
};
|
|
48
|
-
}
|
|
49
|
-
/**
|
|
50
|
-
* Calculate overall code quality score.
|
|
51
|
-
*/
|
|
52
|
-
function calculateCodeQualityScore(code, lines) {
|
|
53
|
-
let score = 0.5; // Base score
|
|
54
|
-
// Check for consistent indentation
|
|
55
|
-
const indentationConsistent = checkIndentationConsistency(lines);
|
|
56
|
-
if (indentationConsistent) {
|
|
57
|
-
score += 0.1;
|
|
58
|
-
}
|
|
59
|
-
// Check for reasonable line lengths
|
|
60
|
-
const longLines = lines.filter((line) => line.length > 120).length;
|
|
61
|
-
if (longLines / lines.length < 0.1) {
|
|
62
|
-
score += 0.1;
|
|
63
|
-
}
|
|
64
|
-
// Check for naming conventions (camelCase or snake_case)
|
|
65
|
-
if (/[a-z][A-Z]/.test(code) || /_[a-z]/.test(code)) {
|
|
66
|
-
score += 0.1;
|
|
67
|
-
}
|
|
68
|
-
// Check for modular structure (functions/classes)
|
|
69
|
-
if (/(?:function|def|class|const\s+\w+\s*=\s*(?:async\s*)?\()/.test(code)) {
|
|
70
|
-
score += 0.1;
|
|
71
|
-
}
|
|
72
|
-
// Penalize magic numbers
|
|
73
|
-
const magicNumbers = code.match(/(?<![.\w])[2-9]\d*(?![.\w])/g) || [];
|
|
74
|
-
if (magicNumbers.length > 5) {
|
|
75
|
-
score -= 0.1;
|
|
76
|
-
}
|
|
77
|
-
return Math.max(0, Math.min(1, score));
|
|
78
|
-
}
|
|
79
|
-
/**
|
|
80
|
-
* Calculate algorithm efficiency score.
|
|
81
|
-
*/
|
|
82
|
-
function calculateEfficiencyScore(code, _lines) {
|
|
83
|
-
let score = 0.5;
|
|
84
|
-
// Check for efficient data structures
|
|
85
|
-
if (/(?:Map|Set|WeakMap|WeakSet|dict|set)\s*\(/.test(code)) {
|
|
86
|
-
score += 0.15;
|
|
87
|
-
}
|
|
88
|
-
// Penalize nested loops (potential O(n^2) or worse)
|
|
89
|
-
const nestedLoops = code.match(/(?:for|while)[\s\S]*?(?:for|while)/g)?.length || 0;
|
|
90
|
-
if (nestedLoops > 2) {
|
|
91
|
-
score -= 0.2;
|
|
92
|
-
}
|
|
93
|
-
// Check for early returns (efficient control flow)
|
|
94
|
-
if (/return\s+(?!undefined|null)/.test(code)) {
|
|
95
|
-
score += 0.1;
|
|
96
|
-
}
|
|
97
|
-
// Check for caching/memoization patterns
|
|
98
|
-
if (/(?:cache|memo|stored|cached)/i.test(code)) {
|
|
99
|
-
score += 0.15;
|
|
100
|
-
}
|
|
101
|
-
// Penalize string concatenation in loops
|
|
102
|
-
if (/(?:for|while)[\s\S]*?\+\s*=\s*['"`]/.test(code)) {
|
|
103
|
-
score -= 0.1;
|
|
104
|
-
}
|
|
105
|
-
return Math.max(0, Math.min(1, score));
|
|
106
|
-
}
|
|
107
|
-
/**
|
|
108
|
-
* Calculate error handling score.
|
|
109
|
-
*/
|
|
110
|
-
function calculateErrorHandlingScore(code) {
|
|
111
|
-
let score = 0.3;
|
|
112
|
-
// Check for try-catch blocks
|
|
113
|
-
const tryCatchCount = (code.match(/try\s*\{/g) || []).length;
|
|
114
|
-
if (tryCatchCount > 0) {
|
|
115
|
-
score += 0.2 * Math.min(tryCatchCount, 3);
|
|
116
|
-
}
|
|
117
|
-
// Check for error type checking
|
|
118
|
-
if (/instanceof\s+(?:Error|TypeError|RangeError)/i.test(code)) {
|
|
119
|
-
score += 0.1;
|
|
120
|
-
}
|
|
121
|
-
// Check for null/undefined checks
|
|
122
|
-
const nullChecks = (code.match(/(?:!==?\s*(?:null|undefined)|\?\?|\.?\?\.)/g) || []).length;
|
|
123
|
-
if (nullChecks > 0) {
|
|
124
|
-
score += 0.1 * Math.min(nullChecks / 3, 1);
|
|
125
|
-
}
|
|
126
|
-
// Check for error logging
|
|
127
|
-
if (/(?:console\.error|logger\.error|throw\s+new)/i.test(code)) {
|
|
128
|
-
score += 0.1;
|
|
129
|
-
}
|
|
130
|
-
// Check for finally blocks (cleanup)
|
|
131
|
-
if (/finally\s*\{/.test(code)) {
|
|
132
|
-
score += 0.1;
|
|
133
|
-
}
|
|
134
|
-
return Math.max(0, Math.min(1, score));
|
|
135
|
-
}
|
|
136
|
-
/**
|
|
137
|
-
* Calculate documentation score.
|
|
138
|
-
*/
|
|
139
|
-
function calculateDocumentationScore(code, lines) {
|
|
140
|
-
let score = 0.2;
|
|
141
|
-
// Check for JSDoc/docstring comments
|
|
142
|
-
const docComments = (code.match(/\/\*\*[\s\S]*?\*\/|"""[\s\S]*?"""|'''[\s\S]*?'''/g) || []).length;
|
|
143
|
-
if (docComments > 0) {
|
|
144
|
-
score += 0.3 * Math.min(docComments / 3, 1);
|
|
145
|
-
}
|
|
146
|
-
// Check for inline comments
|
|
147
|
-
const inlineComments = lines.filter((line) => /(?:\/\/|#)\s*\w/.test(line)).length;
|
|
148
|
-
const commentRatio = inlineComments / lines.length;
|
|
149
|
-
if (commentRatio > 0.05 && commentRatio < 0.3) {
|
|
150
|
-
score += 0.2;
|
|
151
|
-
}
|
|
152
|
-
// Check for type annotations (TypeScript/Python type hints)
|
|
153
|
-
if (/:\s*(?:string|number|boolean|any|\w+\[\]|Dict|List|Optional)/i.test(code)) {
|
|
154
|
-
score += 0.2;
|
|
155
|
-
}
|
|
156
|
-
// Check for meaningful variable names (longer than 2 chars)
|
|
157
|
-
const shortNames = (code.match(/\b[a-z]{1,2}\b/g) || []).length;
|
|
158
|
-
if (shortNames / lines.length < 0.5) {
|
|
159
|
-
score += 0.1;
|
|
160
|
-
}
|
|
161
|
-
return Math.max(0, Math.min(1, score));
|
|
162
|
-
}
|
|
163
|
-
/**
|
|
164
|
-
* Calculate maintainability score.
|
|
165
|
-
*/
|
|
166
|
-
function calculateMaintainabilityScore(code, lines, totalLines) {
|
|
167
|
-
let score = 0.5;
|
|
168
|
-
// Check function length (prefer smaller functions)
|
|
169
|
-
const functionMatches = code.match(/(?:function|def|=>\s*\{)/g) || [];
|
|
170
|
-
if (functionMatches.length > 0) {
|
|
171
|
-
const avgFunctionLength = totalLines / functionMatches.length;
|
|
172
|
-
if (avgFunctionLength < 30) {
|
|
173
|
-
score += 0.2;
|
|
174
|
-
}
|
|
175
|
-
else if (avgFunctionLength > 100) {
|
|
176
|
-
score -= 0.2;
|
|
177
|
-
}
|
|
178
|
-
}
|
|
179
|
-
// Check for single responsibility (low coupling indicators)
|
|
180
|
-
const importCount = (code.match(/(?:import|require|from\s+['"])/g) || []).length;
|
|
181
|
-
if (importCount < 10) {
|
|
182
|
-
score += 0.1;
|
|
183
|
-
}
|
|
184
|
-
// Check for constants (uppercase naming)
|
|
185
|
-
if (/const\s+[A-Z_]+\s*=/.test(code)) {
|
|
186
|
-
score += 0.1;
|
|
187
|
-
}
|
|
188
|
-
// Penalize deeply nested code
|
|
189
|
-
const maxIndentation = Math.max(...lines.map((line) => {
|
|
190
|
-
const match = line.match(/^(\s*)/);
|
|
191
|
-
return match ? match[1].length : 0;
|
|
192
|
-
}));
|
|
193
|
-
if (maxIndentation > 20) {
|
|
194
|
-
score -= 0.15;
|
|
195
|
-
}
|
|
196
|
-
return Math.max(0, Math.min(1, score));
|
|
197
|
-
}
|
|
198
|
-
/**
|
|
199
|
-
* Calculate security score.
|
|
200
|
-
*/
|
|
201
|
-
function calculateSecurityScore(code) {
|
|
202
|
-
let score = 0.7; // Assume secure by default
|
|
203
|
-
// Check for potential injection vulnerabilities
|
|
204
|
-
const dangerousPatterns = [
|
|
205
|
-
/eval\s*\(/i,
|
|
206
|
-
/exec\s*\(/i,
|
|
207
|
-
/Function\s*\(/i,
|
|
208
|
-
/innerHTML\s*=/i,
|
|
209
|
-
/dangerouslySetInnerHTML/i,
|
|
210
|
-
/document\.write/i,
|
|
211
|
-
];
|
|
212
|
-
for (const pattern of dangerousPatterns) {
|
|
213
|
-
if (pattern.test(code)) {
|
|
214
|
-
score -= 0.15;
|
|
215
|
-
}
|
|
216
|
-
}
|
|
217
|
-
// Check for hardcoded secrets
|
|
218
|
-
if (/(?:password|secret|api[_-]?key|token)\s*=\s*['"][^'"]+['"]/i.test(code)) {
|
|
219
|
-
score -= 0.3;
|
|
220
|
-
}
|
|
221
|
-
// Check for SQL injection risks
|
|
222
|
-
if (/(?:SELECT|INSERT|UPDATE|DELETE)[\s\S]*?\$\{/.test(code)) {
|
|
223
|
-
score -= 0.2;
|
|
224
|
-
}
|
|
225
|
-
// Check for input validation
|
|
226
|
-
if (/(?:validate|sanitize|escape|parameterized)/i.test(code)) {
|
|
227
|
-
score += 0.1;
|
|
228
|
-
}
|
|
229
|
-
return Math.max(0, Math.min(1, score));
|
|
230
|
-
}
|
|
231
|
-
/**
|
|
232
|
-
* Check for consistent indentation.
|
|
233
|
-
*/
|
|
234
|
-
function checkIndentationConsistency(lines) {
|
|
235
|
-
const indentSizes = new Set();
|
|
236
|
-
for (const line of lines) {
|
|
237
|
-
if (line.trim().length === 0)
|
|
238
|
-
continue;
|
|
239
|
-
const match = line.match(/^(\s*)/);
|
|
240
|
-
if (match && match[1]) {
|
|
241
|
-
const size = match[1].length;
|
|
242
|
-
if (size > 0) {
|
|
243
|
-
indentSizes.add(size);
|
|
244
|
-
}
|
|
245
|
-
}
|
|
246
|
-
}
|
|
247
|
-
// Check if all indentations are multiples of a common base
|
|
248
|
-
const sizes = Array.from(indentSizes).sort((a, b) => a - b);
|
|
249
|
-
if (sizes.length < 2)
|
|
250
|
-
return true;
|
|
251
|
-
const base = sizes[0];
|
|
252
|
-
return sizes.every((size) => size % base === 0);
|
|
253
|
-
}
|
|
254
|
-
/**
|
|
255
|
-
* Calculate a composite reward score from metrics.
|
|
256
|
-
*/
|
|
257
|
-
export function calculateRewardScore(metrics) {
|
|
258
|
-
const weights = {
|
|
259
|
-
codeQuality: 0.25,
|
|
260
|
-
efficiency: 0.2,
|
|
261
|
-
errorHandling: 0.2,
|
|
262
|
-
documentation: 0.15,
|
|
263
|
-
maintainability: 0.1,
|
|
264
|
-
security: 0.1,
|
|
265
|
-
};
|
|
266
|
-
return (metrics.codeQualityScore * weights.codeQuality +
|
|
267
|
-
metrics.algorithmEfficiency * weights.efficiency +
|
|
268
|
-
metrics.errorHandlingScore * weights.errorHandling +
|
|
269
|
-
metrics.documentationScore * weights.documentation +
|
|
270
|
-
metrics.maintainabilityScore * weights.maintainability +
|
|
271
|
-
metrics.securityScore * weights.security) * 100;
|
|
272
|
-
}
|
|
273
|
-
//# sourceMappingURL=codeEvaluator.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"codeEvaluator.js","sourceRoot":"","sources":["../../src/alpha-zero/codeEvaluator.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAIH;;GAEG;AACH,MAAM,UAAU,iBAAiB,CAAC,QAAgB;IAChD,MAAM,cAAc,GAAG,6BAA6B,CAAC;IACrD,MAAM,MAAM,GAAa,EAAE,CAAC;IAC5B,IAAI,KAAK,CAAC;IAEV,OAAO,CAAC,KAAK,GAAG,cAAc,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,KAAK,IAAI,EAAE,CAAC;QACxD,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,EAAE,IAAI,EAAE,CAAC;QAC9B,IAAI,IAAI,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC5B,MAAM,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACpB,CAAC;IACH,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;;;;GAKG;AACH,MAAM,UAAU,mBAAmB,CAAC,IAAY;IAC9C,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC;IAC/B,MAAM,UAAU,GAAG,KAAK,CAAC,MAAM,CAAC;IAEhC,8BAA8B;IAC9B,MAAM,gBAAgB,GAAG,yBAAyB,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;IAChE,MAAM,mBAAmB,GAAG,wBAAwB,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;IAClE,MAAM,kBAAkB,GAAG,2BAA2B,CAAC,IAAI,CAAC,CAAC;IAC7D,MAAM,kBAAkB,GAAG,2BAA2B,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;IACpE,MAAM,oBAAoB,GAAG,6BAA6B,CAAC,IAAI,EAAE,KAAK,EAAE,UAAU,CAAC,CAAC;IACpF,MAAM,aAAa,GAAG,sBAAsB,CAAC,IAAI,CAAC,CAAC;IAEnD,OAAO;QACL,gBAAgB;QAChB,mBAAmB;QACnB,kBAAkB;QAClB,kBAAkB;QAClB,oBAAoB;QACpB,aAAa;KACd,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,yBAAyB,CAAC,IAAY,EAAE,KAAe;IAC9D,IAAI,KAAK,GAAG,GAAG,CAAC,CAAC,aAAa;IAE9B,mCAAmC;IACnC,MAAM,qBAAqB,GAAG,2BAA2B,CAAC,KAAK,CAAC,CAAC;IACjE,IAAI,qBAAqB,EAAE,CAAC;QAC1B,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,oCAAoC;IACpC,MAAM,SAAS,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAI,CAAC,MAAM,GAAG,GAAG,CAAC,CAAC,MAAM,CAAC;IACnE,IAAI,SAAS,GAAG,KAAK,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;QACnC,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yDAAyD;IACzD,IAAI,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACnD,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,kDAAkD;IAClD,IAAI,0DAA0D,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC1E,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yBAAyB;IACzB,MAAM,YAAY,GAAG,IAAI,CAAC,KAAK,CAAC,8BAA8B,CAAC,IAAI,EAAE,CAAC;IACtE,IAAI,YAAY,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC5B,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,wBAAwB,CAAC,IAAY,EAAE,MAAgB;IAC9D,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,sCAAsC;IACtC,IAAI,2CAA2C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC3D,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,oDAAoD;IACpD,MAAM,WAAW,GACf,IAAI,CAAC,KAAK,CAAC,qCAAqC,CAAC,EAAE,MAAM,IAAI,CAAC,CAAC;IACjE,IAAI,WAAW,GAAG,CAAC,EAAE,CAAC;QACpB,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,mDAAmD;IACnD,IAAI,6BAA6B,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7C,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yCAAyC;IACzC,IAAI,+BAA+B,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC/C,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,yCAAyC;IACzC,IAAI,qCAAqC,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACrD,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,2BAA2B,CAAC,IAAY;IAC/C,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,6BAA6B;IAC7B,MAAM,aAAa,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IAC7D,IAAI,aAAa,GAAG,CAAC,EAAE,CAAC;QACtB,KAAK,IAAI,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,aAAa,EAAE,CAAC,CAAC,CAAC;IAC5C,CAAC;IAED,gCAAgC;IAChC,IAAI,8CAA8C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC9D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,kCAAkC;IAClC,MAAM,UAAU,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,6CAA6C,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IAC5F,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;QACnB,KAAK,IAAI,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,UAAU,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC;IAC7C,CAAC;IAED,0BAA0B;IAC1B,IAAI,+CAA+C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC/D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,qCAAqC;IACrC,IAAI,cAAc,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC9B,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,2BAA2B,CAAC,IAAY,EAAE,KAAe;IAChE,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,qCAAqC;IACrC,MAAM,WAAW,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,mDAAmD,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IACnG,IAAI,WAAW,GAAG,CAAC,EAAE,CAAC;QACpB,KAAK,IAAI,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,WAAW,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC;IAC9C,CAAC;IAED,4BAA4B;IAC5B,MAAM,cAAc,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAC3C,iBAAiB,CAAC,IAAI,CAAC,IAAI,CAAC,CAC7B,CAAC,MAAM,CAAC;IACT,MAAM,YAAY,GAAG,cAAc,GAAG,KAAK,CAAC,MAAM,CAAC;IACnD,IAAI,YAAY,GAAG,IAAI,IAAI,YAAY,GAAG,GAAG,EAAE,CAAC;QAC9C,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,4DAA4D;IAC5D,IAAI,+DAA+D,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC/E,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,4DAA4D;IAC5D,MAAM,UAAU,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,iBAAiB,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IAChE,IAAI,UAAU,GAAG,KAAK,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;QACpC,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,6BAA6B,CACpC,IAAY,EACZ,KAAe,EACf,UAAkB;IAElB,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,mDAAmD;IACnD,MAAM,eAAe,GAAG,IAAI,CAAC,KAAK,CAAC,2BAA2B,CAAC,IAAI,EAAE,CAAC;IACtE,IAAI,eAAe,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC/B,MAAM,iBAAiB,GAAG,UAAU,GAAG,eAAe,CAAC,MAAM,CAAC;QAC9D,IAAI,iBAAiB,GAAG,EAAE,EAAE,CAAC;YAC3B,KAAK,IAAI,GAAG,CAAC;QACf,CAAC;aAAM,IAAI,iBAAiB,GAAG,GAAG,EAAE,CAAC;YACnC,KAAK,IAAI,GAAG,CAAC;QACf,CAAC;IACH,CAAC;IAED,4DAA4D;IAC5D,MAAM,WAAW,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,iCAAiC,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IACjF,IAAI,WAAW,GAAG,EAAE,EAAE,CAAC;QACrB,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yCAAyC;IACzC,IAAI,qBAAqB,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACrC,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,8BAA8B;IAC9B,MAAM,cAAc,GAAG,IAAI,CAAC,GAAG,CAC7B,GAAG,KAAK,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE;QACpB,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC;QACnC,OAAO,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAE,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC;IACtC,CAAC,CAAC,CACH,CAAC;IACF,IAAI,cAAc,GAAG,EAAE,EAAE,CAAC;QACxB,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,sBAAsB,CAAC,IAAY;IAC1C,IAAI,KAAK,GAAG,GAAG,CAAC,CAAC,2BAA2B;IAE5C,gDAAgD;IAChD,MAAM,iBAAiB,GAAG;QACxB,YAAY;QACZ,YAAY;QACZ,gBAAgB;QAChB,gBAAgB;QAChB,0BAA0B;QAC1B,kBAAkB;KACnB,CAAC;IAEF,KAAK,MAAM,OAAO,IAAI,iBAAiB,EAAE,CAAC;QACxC,IAAI,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;YACvB,KAAK,IAAI,IAAI,CAAC;QAChB,CAAC;IACH,CAAC;IAED,8BAA8B;IAC9B,IAAI,6DAA6D,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7E,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,gCAAgC;IAChC,IAAI,6CAA6C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,6BAA6B;IAC7B,IAAI,6CAA6C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,2BAA2B,CAAC,KAAe;IAClD,MAAM,WAAW,GAAG,IAAI,GAAG,EAAU,CAAC;IAEtC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,IAAI,IAAI,CAAC,IAAI,EAAE,CAAC,MAAM,KAAK,CAAC;YAAE,SAAS;QAEvC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC;QACnC,IAAI,KAAK,IAAI,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC;YACtB,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC;YAC7B,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;gBACb,WAAW,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;YACxB,CAAC;QACH,CAAC;IACH,CAAC;IAED,2DAA2D;IAC3D,MAAM,KAAK,GAAG,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;IAC5D,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC;QAAE,OAAO,IAAI,CAAC;IAElC,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;IACtB,OAAO,KAAK,CAAC,KAAK,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAK,GAAG,IAAK,KAAK,CAAC,CAAC,CAAC;AACpD,CAAC;AAED;;GAEG;AACH,MAAM,UAAU,oBAAoB,CAAC,OAA2B;IAC9D,MAAM,OAAO,GAAG;QACd,WAAW,EAAE,IAAI;QACjB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,GAAG;QAClB,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,GAAG;QACpB,QAAQ,EAAE,GAAG;KACd,CAAC;IAEF,OAAO,CACL,OAAO,CAAC,gBAAgB,GAAG,OAAO,CAAC,WAAW;QAC9C,OAAO,CAAC,mBAAmB,GAAG,OAAO,CAAC,UAAU;QAChD,OAAO,CAAC,kBAAkB,GAAG,OAAO,CAAC,aAAa;QAClD,OAAO,CAAC,kBAAkB,GAAG,OAAO,CAAC,aAAa;QAClD,OAAO,CAAC,oBAAoB,GAAG,OAAO,CAAC,eAAe;QACtD,OAAO,CAAC,aAAa,GAAG,OAAO,CAAC,QAAQ,CACzC,GAAG,GAAG,CAAC;AACV,CAAC"}
|
|
@@ -1,66 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Competitive Agent Runner
|
|
3
|
-
*
|
|
4
|
-
* Runs competitive comparisons between two AI agents.
|
|
5
|
-
*
|
|
6
|
-
* Principal Investigator: Bo Shang
|
|
7
|
-
* Framework: erosolar-cli
|
|
8
|
-
*/
|
|
9
|
-
import type { CompetitionRoundResult, CompetitionStandings, TournamentConfig, TournamentResult, TournamentCallbacks, TournamentStatus } from './types.js';
|
|
10
|
-
import { AlphaZeroAgentWrapper } from './agentWrapper.js';
|
|
11
|
-
/**
|
|
12
|
-
* Run competitive comparisons between two agents.
|
|
13
|
-
*/
|
|
14
|
-
export declare class CompetitiveAgentRunner {
|
|
15
|
-
private readonly agent1;
|
|
16
|
-
private readonly agent2;
|
|
17
|
-
private readonly roundResults;
|
|
18
|
-
constructor(agent1: AlphaZeroAgentWrapper, agent2: AlphaZeroAgentWrapper);
|
|
19
|
-
/**
|
|
20
|
-
* Run both agents on the same prompt and compare results.
|
|
21
|
-
*/
|
|
22
|
-
runComparison(prompt: string, evaluateCode?: boolean): Promise<CompetitionRoundResult>;
|
|
23
|
-
/**
|
|
24
|
-
* Run a single agent and return results.
|
|
25
|
-
*/
|
|
26
|
-
private runAgent;
|
|
27
|
-
/**
|
|
28
|
-
* Get current competition standings.
|
|
29
|
-
*/
|
|
30
|
-
getStandings(): CompetitionStandings;
|
|
31
|
-
/**
|
|
32
|
-
* Get all round results.
|
|
33
|
-
*/
|
|
34
|
-
getRoundResults(): CompetitionRoundResult[];
|
|
35
|
-
/**
|
|
36
|
-
* Reset competition history.
|
|
37
|
-
*/
|
|
38
|
-
reset(): void;
|
|
39
|
-
}
|
|
40
|
-
/**
|
|
41
|
-
* Tournament runner for multi-round competitions.
|
|
42
|
-
*/
|
|
43
|
-
export declare class TournamentRunner {
|
|
44
|
-
private readonly agent1;
|
|
45
|
-
private readonly agent2;
|
|
46
|
-
private status;
|
|
47
|
-
private currentResult;
|
|
48
|
-
constructor(agent1: AlphaZeroAgentWrapper, agent2: AlphaZeroAgentWrapper);
|
|
49
|
-
/**
|
|
50
|
-
* Run a tournament with the given configuration.
|
|
51
|
-
*/
|
|
52
|
-
run(config: TournamentConfig, callbacks?: TournamentCallbacks): Promise<TournamentResult>;
|
|
53
|
-
/**
|
|
54
|
-
* Get current tournament status.
|
|
55
|
-
*/
|
|
56
|
-
getStatus(): TournamentStatus;
|
|
57
|
-
/**
|
|
58
|
-
* Get the tournament result (if completed).
|
|
59
|
-
*/
|
|
60
|
-
getResult(): TournamentResult | null;
|
|
61
|
-
}
|
|
62
|
-
/**
|
|
63
|
-
* Generate a summary of tournament results.
|
|
64
|
-
*/
|
|
65
|
-
export declare function formatTournamentSummary(result: TournamentResult): string;
|
|
66
|
-
//# sourceMappingURL=competitiveRunner.d.ts.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"competitiveRunner.d.ts","sourceRoot":"","sources":["../../src/alpha-zero/competitiveRunner.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAEH,OAAO,KAAK,EACV,sBAAsB,EACtB,oBAAoB,EACpB,gBAAgB,EAChB,gBAAgB,EAChB,mBAAmB,EACnB,gBAAgB,EACjB,MAAM,YAAY,CAAC;AACpB,OAAO,EAAE,qBAAqB,EAAE,MAAM,mBAAmB,CAAC;AAG1D;;GAEG;AACH,qBAAa,sBAAsB;IACjC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAgC;gBAEjD,MAAM,EAAE,qBAAqB,EAAE,MAAM,EAAE,qBAAqB;IAKxE;;OAEG;IACG,aAAa,CAAC,MAAM,EAAE,MAAM,EAAE,YAAY,UAAO,GAAG,OAAO,CAAC,sBAAsB,CAAC;IAqDzF;;OAEG;YACW,QAAQ;IAgCtB;;OAEG;IACH,YAAY,IAAI,oBAAoB;IA0BpC;;OAEG;IACH,eAAe,IAAI,sBAAsB,EAAE;IAI3C;;OAEG;IACH,KAAK,IAAI,IAAI;CAGd;AAED;;GAEG;AACH,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,MAAM,CAA+B;IAC7C,OAAO,CAAC,aAAa,CAAiC;gBAE1C,MAAM,EAAE,qBAAqB,EAAE,MAAM,EAAE,qBAAqB;IAKxE;;OAEG;IACG,GAAG,CAAC,MAAM,EAAE,gBAAgB,EAAE,SAAS,CAAC,EAAE,mBAAmB,GAAG,OAAO,CAAC,gBAAgB,CAAC;IA2C/F;;OAEG;IACH,SAAS,IAAI,gBAAgB;IAI7B;;OAEG;IACH,SAAS,IAAI,gBAAgB,GAAG,IAAI;CAGrC;AAED;;GAEG;AACH,wBAAgB,uBAAuB,CAAC,MAAM,EAAE,gBAAgB,GAAG,MAAM,CAyBxE"}
|
|
@@ -1,224 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Competitive Agent Runner
|
|
3
|
-
*
|
|
4
|
-
* Runs competitive comparisons between two AI agents.
|
|
5
|
-
*
|
|
6
|
-
* Principal Investigator: Bo Shang
|
|
7
|
-
* Framework: erosolar-cli
|
|
8
|
-
*/
|
|
9
|
-
import { extractCodeBlocks, evaluateCodeQuality, calculateRewardScore } from './codeEvaluator.js';
|
|
10
|
-
/**
|
|
11
|
-
* Run competitive comparisons between two agents.
|
|
12
|
-
*/
|
|
13
|
-
export class CompetitiveAgentRunner {
|
|
14
|
-
agent1;
|
|
15
|
-
agent2;
|
|
16
|
-
roundResults = [];
|
|
17
|
-
constructor(agent1, agent2) {
|
|
18
|
-
this.agent1 = agent1;
|
|
19
|
-
this.agent2 = agent2;
|
|
20
|
-
}
|
|
21
|
-
/**
|
|
22
|
-
* Run both agents on the same prompt and compare results.
|
|
23
|
-
*/
|
|
24
|
-
async runComparison(prompt, evaluateCode = true) {
|
|
25
|
-
const startTime = Date.now();
|
|
26
|
-
// Run both agents concurrently
|
|
27
|
-
const [result1, result2] = await Promise.allSettled([
|
|
28
|
-
this.runAgent(this.agent1, prompt, evaluateCode),
|
|
29
|
-
this.runAgent(this.agent2, prompt, evaluateCode),
|
|
30
|
-
]);
|
|
31
|
-
const agent1Result = result1.status === 'fulfilled'
|
|
32
|
-
? result1.value
|
|
33
|
-
: { response: '', error: String(result1.reason), score: 0, timeMs: 0 };
|
|
34
|
-
const agent2Result = result2.status === 'fulfilled'
|
|
35
|
-
? result2.value
|
|
36
|
-
: { response: '', error: String(result2.reason), score: 0, timeMs: 0 };
|
|
37
|
-
const totalTimeMs = Date.now() - startTime;
|
|
38
|
-
// Determine winner
|
|
39
|
-
let winner;
|
|
40
|
-
if (agent1Result.score > agent2Result.score) {
|
|
41
|
-
winner = this.agent1.getAgentId();
|
|
42
|
-
}
|
|
43
|
-
else if (agent2Result.score > agent1Result.score) {
|
|
44
|
-
winner = this.agent2.getAgentId();
|
|
45
|
-
}
|
|
46
|
-
else {
|
|
47
|
-
winner = 'tie';
|
|
48
|
-
}
|
|
49
|
-
const result = {
|
|
50
|
-
prompt: prompt.slice(0, 100),
|
|
51
|
-
agent1: {
|
|
52
|
-
id: this.agent1.getAgentId(),
|
|
53
|
-
score: agent1Result.score,
|
|
54
|
-
responseLength: agent1Result.response.length,
|
|
55
|
-
timeMs: agent1Result.timeMs,
|
|
56
|
-
error: agent1Result.error,
|
|
57
|
-
},
|
|
58
|
-
agent2: {
|
|
59
|
-
id: this.agent2.getAgentId(),
|
|
60
|
-
score: agent2Result.score,
|
|
61
|
-
responseLength: agent2Result.response.length,
|
|
62
|
-
timeMs: agent2Result.timeMs,
|
|
63
|
-
error: agent2Result.error,
|
|
64
|
-
},
|
|
65
|
-
winner,
|
|
66
|
-
totalTimeMs,
|
|
67
|
-
};
|
|
68
|
-
this.roundResults.push(result);
|
|
69
|
-
return result;
|
|
70
|
-
}
|
|
71
|
-
/**
|
|
72
|
-
* Run a single agent and return results.
|
|
73
|
-
*/
|
|
74
|
-
async runAgent(agent, prompt, evaluateCode) {
|
|
75
|
-
const startTime = Date.now();
|
|
76
|
-
try {
|
|
77
|
-
const response = await agent.send(prompt);
|
|
78
|
-
const timeMs = Date.now() - startTime;
|
|
79
|
-
// Calculate score
|
|
80
|
-
let score = 50; // Base score
|
|
81
|
-
if (evaluateCode && response.includes('```')) {
|
|
82
|
-
const codeBlocks = extractCodeBlocks(response);
|
|
83
|
-
if (codeBlocks.length > 0) {
|
|
84
|
-
const metrics = evaluateCodeQuality(codeBlocks[0]);
|
|
85
|
-
score = calculateRewardScore(metrics);
|
|
86
|
-
}
|
|
87
|
-
}
|
|
88
|
-
return { response, score, timeMs };
|
|
89
|
-
}
|
|
90
|
-
catch (error) {
|
|
91
|
-
return {
|
|
92
|
-
response: '',
|
|
93
|
-
score: 0,
|
|
94
|
-
timeMs: Date.now() - startTime,
|
|
95
|
-
error: error instanceof Error ? error.message : String(error),
|
|
96
|
-
};
|
|
97
|
-
}
|
|
98
|
-
}
|
|
99
|
-
/**
|
|
100
|
-
* Get current competition standings.
|
|
101
|
-
*/
|
|
102
|
-
getStandings() {
|
|
103
|
-
const agent1Wins = this.roundResults.filter((r) => r.winner === this.agent1.getAgentId()).length;
|
|
104
|
-
const agent2Wins = this.roundResults.filter((r) => r.winner === this.agent2.getAgentId()).length;
|
|
105
|
-
const ties = this.roundResults.filter((r) => r.winner === 'tie').length;
|
|
106
|
-
const total = this.roundResults.length;
|
|
107
|
-
return {
|
|
108
|
-
totalRounds: total,
|
|
109
|
-
agent1: {
|
|
110
|
-
id: this.agent1.getAgentId(),
|
|
111
|
-
wins: agent1Wins,
|
|
112
|
-
winRate: total > 0 ? agent1Wins / total : 0,
|
|
113
|
-
},
|
|
114
|
-
agent2: {
|
|
115
|
-
id: this.agent2.getAgentId(),
|
|
116
|
-
wins: agent2Wins,
|
|
117
|
-
winRate: total > 0 ? agent2Wins / total : 0,
|
|
118
|
-
},
|
|
119
|
-
ties,
|
|
120
|
-
};
|
|
121
|
-
}
|
|
122
|
-
/**
|
|
123
|
-
* Get all round results.
|
|
124
|
-
*/
|
|
125
|
-
getRoundResults() {
|
|
126
|
-
return [...this.roundResults];
|
|
127
|
-
}
|
|
128
|
-
/**
|
|
129
|
-
* Reset competition history.
|
|
130
|
-
*/
|
|
131
|
-
reset() {
|
|
132
|
-
this.roundResults.length = 0;
|
|
133
|
-
}
|
|
134
|
-
}
|
|
135
|
-
/**
|
|
136
|
-
* Tournament runner for multi-round competitions.
|
|
137
|
-
*/
|
|
138
|
-
export class TournamentRunner {
|
|
139
|
-
agent1;
|
|
140
|
-
agent2;
|
|
141
|
-
status = 'pending';
|
|
142
|
-
currentResult = null;
|
|
143
|
-
constructor(agent1, agent2) {
|
|
144
|
-
this.agent1 = agent1;
|
|
145
|
-
this.agent2 = agent2;
|
|
146
|
-
}
|
|
147
|
-
/**
|
|
148
|
-
* Run a tournament with the given configuration.
|
|
149
|
-
*/
|
|
150
|
-
async run(config, callbacks) {
|
|
151
|
-
this.status = 'running';
|
|
152
|
-
const startTime = new Date();
|
|
153
|
-
const runner = new CompetitiveAgentRunner(this.agent1, this.agent2);
|
|
154
|
-
const rounds = [];
|
|
155
|
-
try {
|
|
156
|
-
for (let i = 0; i < config.rounds; i++) {
|
|
157
|
-
const prompt = config.prompts[i % config.prompts.length];
|
|
158
|
-
callbacks?.onRoundStart?.(i + 1, prompt);
|
|
159
|
-
const result = await runner.runComparison(prompt, config.evaluateCode);
|
|
160
|
-
rounds.push(result);
|
|
161
|
-
callbacks?.onRoundComplete?.(i + 1, result);
|
|
162
|
-
}
|
|
163
|
-
const endTime = new Date();
|
|
164
|
-
const totalDurationMs = endTime.getTime() - startTime.getTime();
|
|
165
|
-
const result = {
|
|
166
|
-
tournamentId: config.tournamentId,
|
|
167
|
-
config,
|
|
168
|
-
rounds,
|
|
169
|
-
standings: runner.getStandings(),
|
|
170
|
-
startTime: startTime.toISOString(),
|
|
171
|
-
endTime: endTime.toISOString(),
|
|
172
|
-
totalDurationMs,
|
|
173
|
-
};
|
|
174
|
-
this.currentResult = result;
|
|
175
|
-
this.status = 'completed';
|
|
176
|
-
callbacks?.onTournamentComplete?.(result);
|
|
177
|
-
return result;
|
|
178
|
-
}
|
|
179
|
-
catch (error) {
|
|
180
|
-
this.status = 'failed';
|
|
181
|
-
const err = error instanceof Error ? error : new Error(String(error));
|
|
182
|
-
callbacks?.onError?.(err);
|
|
183
|
-
throw err;
|
|
184
|
-
}
|
|
185
|
-
}
|
|
186
|
-
/**
|
|
187
|
-
* Get current tournament status.
|
|
188
|
-
*/
|
|
189
|
-
getStatus() {
|
|
190
|
-
return this.status;
|
|
191
|
-
}
|
|
192
|
-
/**
|
|
193
|
-
* Get the tournament result (if completed).
|
|
194
|
-
*/
|
|
195
|
-
getResult() {
|
|
196
|
-
return this.currentResult;
|
|
197
|
-
}
|
|
198
|
-
}
|
|
199
|
-
/**
|
|
200
|
-
* Generate a summary of tournament results.
|
|
201
|
-
*/
|
|
202
|
-
export function formatTournamentSummary(result) {
|
|
203
|
-
const lines = [
|
|
204
|
-
`Tournament: ${result.tournamentId}`,
|
|
205
|
-
'='.repeat(50),
|
|
206
|
-
'',
|
|
207
|
-
'Final Standings:',
|
|
208
|
-
` ${result.standings.agent1.id}: ${result.standings.agent1.wins} wins (${(result.standings.agent1.winRate * 100).toFixed(1)}%)`,
|
|
209
|
-
` ${result.standings.agent2.id}: ${result.standings.agent2.wins} wins (${(result.standings.agent2.winRate * 100).toFixed(1)}%)`,
|
|
210
|
-
` Ties: ${result.standings.ties}`,
|
|
211
|
-
'',
|
|
212
|
-
`Total Rounds: ${result.standings.totalRounds}`,
|
|
213
|
-
`Duration: ${(result.totalDurationMs / 1000).toFixed(2)}s`,
|
|
214
|
-
'',
|
|
215
|
-
'Round Results:',
|
|
216
|
-
];
|
|
217
|
-
for (let i = 0; i < result.rounds.length; i++) {
|
|
218
|
-
const round = result.rounds[i];
|
|
219
|
-
lines.push(` Round ${i + 1}: ${round.winner === 'tie' ? 'Tie' : `${round.winner} wins`} ` +
|
|
220
|
-
`(${round.agent1.score.toFixed(1)} vs ${round.agent2.score.toFixed(1)})`);
|
|
221
|
-
}
|
|
222
|
-
return lines.join('\n');
|
|
223
|
-
}
|
|
224
|
-
//# sourceMappingURL=competitiveRunner.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"competitiveRunner.js","sourceRoot":"","sources":["../../src/alpha-zero/competitiveRunner.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAWH,OAAO,EAAE,iBAAiB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,oBAAoB,CAAC;AAElG;;GAEG;AACH,MAAM,OAAO,sBAAsB;IAChB,MAAM,CAAwB;IAC9B,MAAM,CAAwB;IAC9B,YAAY,GAA6B,EAAE,CAAC;IAE7D,YAAY,MAA6B,EAAE,MAA6B;QACtE,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;QACrB,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;IACvB,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,aAAa,CAAC,MAAc,EAAE,YAAY,GAAG,IAAI;QACrD,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAE7B,+BAA+B;QAC/B,MAAM,CAAC,OAAO,EAAE,OAAO,CAAC,GAAG,MAAM,OAAO,CAAC,UAAU,CAAC;YAClD,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,MAAM,EAAE,MAAM,EAAE,YAAY,CAAC;YAChD,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,MAAM,EAAE,MAAM,EAAE,YAAY,CAAC;SACjD,CAAC,CAAC;QAEH,MAAM,YAAY,GAAG,OAAO,CAAC,MAAM,KAAK,WAAW;YACjD,CAAC,CAAC,OAAO,CAAC,KAAK;YACf,CAAC,CAAC,EAAE,QAAQ,EAAE,EAAE,EAAE,KAAK,EAAE,MAAM,CAAE,OAAiC,CAAC,MAAM,CAAC,EAAE,KAAK,EAAE,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,CAAC;QAEpG,MAAM,YAAY,GAAG,OAAO,CAAC,MAAM,KAAK,WAAW;YACjD,CAAC,CAAC,OAAO,CAAC,KAAK;YACf,CAAC,CAAC,EAAE,QAAQ,EAAE,EAAE,EAAE,KAAK,EAAE,MAAM,CAAE,OAAiC,CAAC,MAAM,CAAC,EAAE,KAAK,EAAE,CAAC,EAAE,MAAM,EAAE,CAAC,EAAE,CAAC;QAEpG,MAAM,WAAW,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;QAE3C,mBAAmB;QACnB,IAAI,MAAc,CAAC;QACnB,IAAI,YAAY,CAAC,KAAK,GAAG,YAAY,CAAC,KAAK,EAAE,CAAC;YAC5C,MAAM,GAAG,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAAC;QACpC,CAAC;aAAM,IAAI,YAAY,CAAC,KAAK,GAAG,YAAY,CAAC,KAAK,EAAE,CAAC;YACnD,MAAM,GAAG,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAAC;QACpC,CAAC;aAAM,CAAC;YACN,MAAM,GAAG,KAAK,CAAC;QACjB,CAAC;QAED,MAAM,MAAM,GAA2B;YACrC,MAAM,EAAE,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC;YAC5B,MAAM,EAAE;gBACN,EAAE,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE;gBAC5B,KAAK,EAAE,YAAY,CAAC,KAAK;gBACzB,cAAc,EAAE,YAAY,CAAC,QAAQ,CAAC,MAAM;gBAC5C,MAAM,EAAE,YAAY,CAAC,MAAM;gBAC3B,KAAK,EAAE,YAAY,CAAC,KAAK;aAC1B;YACD,MAAM,EAAE;gBACN,EAAE,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE;gBAC5B,KAAK,EAAE,YAAY,CAAC,KAAK;gBACzB,cAAc,EAAE,YAAY,CAAC,QAAQ,CAAC,MAAM;gBAC5C,MAAM,EAAE,YAAY,CAAC,MAAM;gBAC3B,KAAK,EAAE,YAAY,CAAC,KAAK;aAC1B;YACD,MAAM;YACN,WAAW;SACZ,CAAC;QAEF,IAAI,CAAC,YAAY,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QAC/B,OAAO,MAAM,CAAC;IAChB,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,QAAQ,CACpB,KAA4B,EAC5B,MAAc,EACd,YAAqB;QAErB,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAE7B,IAAI,CAAC;YACH,MAAM,QAAQ,GAAG,MAAM,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC1C,MAAM,MAAM,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;YAEtC,kBAAkB;YAClB,IAAI,KAAK,GAAG,EAAE,CAAC,CAAC,aAAa;YAC7B,IAAI,YAAY,IAAI,QAAQ,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;gBAC7C,MAAM,UAAU,GAAG,iBAAiB,CAAC,QAAQ,CAAC,CAAC;gBAC/C,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;oBAC1B,MAAM,OAAO,GAAG,mBAAmB,CAAC,UAAU,CAAC,CAAC,CAAE,CAAC,CAAC;oBACpD,KAAK,GAAG,oBAAoB,CAAC,OAAO,CAAC,CAAC;gBACxC,CAAC;YACH,CAAC;YAED,OAAO,EAAE,QAAQ,EAAE,KAAK,EAAE,MAAM,EAAE,CAAC;QACrC,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,OAAO;gBACL,QAAQ,EAAE,EAAE;gBACZ,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS;gBAC9B,KAAK,EAAE,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC;aAC9D,CAAC;QACJ,CAAC;IACH,CAAC;IAED;;OAEG;IACH,YAAY;QACV,MAAM,UAAU,GAAG,IAAI,CAAC,YAAY,CAAC,MAAM,CACzC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,KAAK,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAC7C,CAAC,MAAM,CAAC;QACT,MAAM,UAAU,GAAG,IAAI,CAAC,YAAY,CAAC,MAAM,CACzC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,KAAK,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAC7C,CAAC,MAAM,CAAC;QACT,MAAM,IAAI,GAAG,IAAI,CAAC,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,KAAK,KAAK,CAAC,CAAC,MAAM,CAAC;QACxE,MAAM,KAAK,GAAG,IAAI,CAAC,YAAY,CAAC,MAAM,CAAC;QAEvC,OAAO;YACL,WAAW,EAAE,KAAK;YAClB,MAAM,EAAE;gBACN,EAAE,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE;gBAC5B,IAAI,EAAE,UAAU;gBAChB,OAAO,EAAE,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,UAAU,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;aAC5C;YACD,MAAM,EAAE;gBACN,EAAE,EAAE,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE;gBAC5B,IAAI,EAAE,UAAU;gBAChB,OAAO,EAAE,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,UAAU,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;aAC5C;YACD,IAAI;SACL,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,eAAe;QACb,OAAO,CAAC,GAAG,IAAI,CAAC,YAAY,CAAC,CAAC;IAChC,CAAC;IAED;;OAEG;IACH,KAAK;QACH,IAAI,CAAC,YAAY,CAAC,MAAM,GAAG,CAAC,CAAC;IAC/B,CAAC;CACF;AAED;;GAEG;AACH,MAAM,OAAO,gBAAgB;IACV,MAAM,CAAwB;IAC9B,MAAM,CAAwB;IACvC,MAAM,GAAqB,SAAS,CAAC;IACrC,aAAa,GAA4B,IAAI,CAAC;IAEtD,YAAY,MAA6B,EAAE,MAA6B;QACtE,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;QACrB,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;IACvB,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,GAAG,CAAC,MAAwB,EAAE,SAA+B;QACjE,IAAI,CAAC,MAAM,GAAG,SAAS,CAAC;QACxB,MAAM,SAAS,GAAG,IAAI,IAAI,EAAE,CAAC;QAC7B,MAAM,MAAM,GAAG,IAAI,sBAAsB,CAAC,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;QACpE,MAAM,MAAM,GAA6B,EAAE,CAAC;QAE5C,IAAI,CAAC;YACH,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;gBACvC,MAAM,MAAM,GAAG,MAAM,CAAC,OAAO,CAAC,CAAC,GAAG,MAAM,CAAC,OAAO,CAAC,MAAM,CAAE,CAAC;gBAC1D,SAAS,EAAE,YAAY,EAAE,CAAC,CAAC,GAAG,CAAC,EAAE,MAAM,CAAC,CAAC;gBAEzC,MAAM,MAAM,GAAG,MAAM,MAAM,CAAC,aAAa,CAAC,MAAM,EAAE,MAAM,CAAC,YAAY,CAAC,CAAC;gBACvE,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;gBAEpB,SAAS,EAAE,eAAe,EAAE,CAAC,CAAC,GAAG,CAAC,EAAE,MAAM,CAAC,CAAC;YAC9C,CAAC;YAED,MAAM,OAAO,GAAG,IAAI,IAAI,EAAE,CAAC;YAC3B,MAAM,eAAe,GAAG,OAAO,CAAC,OAAO,EAAE,GAAG,SAAS,CAAC,OAAO,EAAE,CAAC;YAEhE,MAAM,MAAM,GAAqB;gBAC/B,YAAY,EAAE,MAAM,CAAC,YAAY;gBACjC,MAAM;gBACN,MAAM;gBACN,SAAS,EAAE,MAAM,CAAC,YAAY,EAAE;gBAChC,SAAS,EAAE,SAAS,CAAC,WAAW,EAAE;gBAClC,OAAO,EAAE,OAAO,CAAC,WAAW,EAAE;gBAC9B,eAAe;aAChB,CAAC;YAEF,IAAI,CAAC,aAAa,GAAG,MAAM,CAAC;YAC5B,IAAI,CAAC,MAAM,GAAG,WAAW,CAAC;YAC1B,SAAS,EAAE,oBAAoB,EAAE,CAAC,MAAM,CAAC,CAAC;YAE1C,OAAO,MAAM,CAAC;QAChB,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,IAAI,CAAC,MAAM,GAAG,QAAQ,CAAC;YACvB,MAAM,GAAG,GAAG,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,IAAI,KAAK,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC;YACtE,SAAS,EAAE,OAAO,EAAE,CAAC,GAAG,CAAC,CAAC;YAC1B,MAAM,GAAG,CAAC;QACZ,CAAC;IACH,CAAC;IAED;;OAEG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,MAAM,CAAC;IACrB,CAAC;IAED;;OAEG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,aAAa,CAAC;IAC5B,CAAC;CACF;AAED;;GAEG;AACH,MAAM,UAAU,uBAAuB,CAAC,MAAwB;IAC9D,MAAM,KAAK,GAAa;QACtB,eAAe,MAAM,CAAC,YAAY,EAAE;QACpC,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC;QACd,EAAE;QACF,kBAAkB;QAClB,KAAK,MAAM,CAAC,SAAS,CAAC,MAAM,CAAC,EAAE,KAAK,MAAM,CAAC,SAAS,CAAC,MAAM,CAAC,IAAI,UAAU,CAAC,MAAM,CAAC,SAAS,CAAC,MAAM,CAAC,OAAO,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI;QAChI,KAAK,MAAM,CAAC,SAAS,CAAC,MAAM,CAAC,EAAE,KAAK,MAAM,CAAC,SAAS,CAAC,MAAM,CAAC,IAAI,UAAU,CAAC,MAAM,CAAC,SAAS,CAAC,MAAM,CAAC,OAAO,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI;QAChI,WAAW,MAAM,CAAC,SAAS,CAAC,IAAI,EAAE;QAClC,EAAE;QACF,iBAAiB,MAAM,CAAC,SAAS,CAAC,WAAW,EAAE;QAC/C,aAAa,CAAC,MAAM,CAAC,eAAe,GAAG,IAAI,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG;QAC1D,EAAE;QACF,gBAAgB;KACjB,CAAC;IAEF,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;QAC9C,MAAM,KAAK,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,CAAE,CAAC;QAChC,KAAK,CAAC,IAAI,CACR,WAAW,CAAC,GAAG,CAAC,KAAK,KAAK,CAAC,MAAM,KAAK,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,GAAG,KAAK,CAAC,MAAM,OAAO,GAAG;YAC/E,IAAI,KAAK,CAAC,MAAM,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,OAAO,KAAK,CAAC,MAAM,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,CACzE,CAAC;IACJ,CAAC;IAED,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;AAC1B,CAAC"}
|
|
@@ -1,67 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Multi-Agent Competitive RL Framework
|
|
3
|
-
*
|
|
4
|
-
* A competitive reinforcement learning framework where two autonomous erosolar-cli
|
|
5
|
-
* agents compete on code optimization tasks while recursively improving their own
|
|
6
|
-
* implementations.
|
|
7
|
-
*
|
|
8
|
-
* Principal Investigator: Bo Shang
|
|
9
|
-
* Framework: erosolar-cli
|
|
10
|
-
* Status: Active Development
|
|
11
|
-
*
|
|
12
|
-
* Core Innovations:
|
|
13
|
-
* - Recursive Self-Modification Engine: Agents modify their own tool source code
|
|
14
|
-
* - Competitive Multi-Agent Framework: Tournament system with parallel execution
|
|
15
|
-
* - Version-Controlled Self-Improvement: SHA-256 checkpoints with automatic rollback
|
|
16
|
-
* - AST-Based Code Quality Metrics: Comprehensive evaluation across 10+ dimensions
|
|
17
|
-
*
|
|
18
|
-
* Structure:
|
|
19
|
-
* - Core: Types, metrics tracking, code evaluation
|
|
20
|
-
* - Self-Modification: Version-controlled code self-improvement
|
|
21
|
-
* - Introspection: Runtime analysis and self-awareness
|
|
22
|
-
* - Competitive: Multi-agent tournament framework
|
|
23
|
-
* - Security: Optional security research module (lazy loaded)
|
|
24
|
-
*
|
|
25
|
-
* Tech Stack (erosolar-cli):
|
|
26
|
-
* - Python: typer, rich, prompt-toolkit, pydantic, aiohttp, tiktoken
|
|
27
|
-
* - TypeScript: chalk, ora, gradient-string, boxen, nanospinner
|
|
28
|
-
* - AI Providers: anthropic, openai, google-generativeai
|
|
29
|
-
* - Testing: pytest, pytest-asyncio, mypy, ruff, eslint
|
|
30
|
-
*
|
|
31
|
-
* Research Contributions:
|
|
32
|
-
* - Demonstrated practical recursive self-improvement in autonomous agents
|
|
33
|
-
* - Proved competitive dynamics accelerate capability development
|
|
34
|
-
* - Established version control patterns for safe code self-modification
|
|
35
|
-
* - Created comprehensive metrics for evaluating code generation quality
|
|
36
|
-
*
|
|
37
|
-
* Citation:
|
|
38
|
-
* @software{alpha_zero_2,
|
|
39
|
-
* title={Alpha Zero 2: Recursive Self-Improvement in Competitive Multi-Agent Systems},
|
|
40
|
-
* author={Bo Shang},
|
|
41
|
-
* year={2024},
|
|
42
|
-
* framework={erosolar-cli},
|
|
43
|
-
* url={https://github.com/ErosolarAI/erosolar-by-bo}
|
|
44
|
-
* }
|
|
45
|
-
*/
|
|
46
|
-
export type { AgentPerformanceMetrics, CompetitiveAgentConfig, CompetitionRoundResult, CompetitionStandings, CodeQualityMetrics, ExecutionTrace, ImprovementSuggestion, TournamentConfig, TournamentResult, TournamentStatus, TournamentCallbacks, ResearchMetadata, } from './types.js';
|
|
47
|
-
export { ALPHA_ZERO_2_METADATA } from './types.js';
|
|
48
|
-
export { MetricsTracker, createDefaultMetrics } from './metricsTracker.js';
|
|
49
|
-
export { extractCodeBlocks, evaluateCodeQuality, calculateRewardScore, } from './codeEvaluator.js';
|
|
50
|
-
export { AlphaZeroAgentWrapper, type AlphaZeroAgentOptions } from './agentWrapper.js';
|
|
51
|
-
export { CompetitiveAgentRunner, TournamentRunner, formatTournamentSummary, } from './competitiveRunner.js';
|
|
52
|
-
export { SelfModificationEngine, createSelfModificationEngine, type ToolVersion, type TestResult, type PerformanceMetrics as SelfModPerformanceMetrics, type ModificationResult, type SelfModificationConfig, } from './selfModification.js';
|
|
53
|
-
export { IntrospectionEngine, createIntrospectionEngine, type PerformanceProfile, type CodeAnalysis, type IntrospectionConfig, } from './introspection.js';
|
|
54
|
-
export { isGoogleEnabled, getGoogleModule } from './security/googleLoader.js';
|
|
55
|
-
export * from './security/index.js';
|
|
56
|
-
/**
|
|
57
|
-
* Version information
|
|
58
|
-
*/
|
|
59
|
-
export declare const ALPHA_ZERO_VERSION = "1.0.0";
|
|
60
|
-
export declare const ALPHA_ZERO_AUTHOR = "Bo Shang";
|
|
61
|
-
export declare const ALPHA_ZERO_FRAMEWORK = "erosolar-cli";
|
|
62
|
-
export declare function isSecurityEnabled(): boolean;
|
|
63
|
-
/**
|
|
64
|
-
* Get security module (lazy load)
|
|
65
|
-
*/
|
|
66
|
-
export declare function getSecurityModule(): Promise<typeof import("./security/index.js")>;
|
|
67
|
-
//# sourceMappingURL=index.d.ts.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/alpha-zero/index.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA4CG;AAGH,YAAY,EACV,uBAAuB,EACvB,sBAAsB,EACtB,sBAAsB,EACtB,oBAAoB,EACpB,kBAAkB,EAClB,cAAc,EACd,qBAAqB,EACrB,gBAAgB,EAChB,gBAAgB,EAChB,gBAAgB,EAChB,mBAAmB,EACnB,gBAAgB,GACjB,MAAM,YAAY,CAAC;AAEpB,OAAO,EAAE,qBAAqB,EAAE,MAAM,YAAY,CAAC;AAGnD,OAAO,EAAE,cAAc,EAAE,oBAAoB,EAAE,MAAM,qBAAqB,CAAC;AAG3E,OAAO,EACL,iBAAiB,EACjB,mBAAmB,EACnB,oBAAoB,GACrB,MAAM,oBAAoB,CAAC;AAG5B,OAAO,EAAE,qBAAqB,EAAE,KAAK,qBAAqB,EAAE,MAAM,mBAAmB,CAAC;AAGtF,OAAO,EACL,sBAAsB,EACtB,gBAAgB,EAChB,uBAAuB,GACxB,MAAM,wBAAwB,CAAC;AAGhC,OAAO,EACL,sBAAsB,EACtB,4BAA4B,EAC5B,KAAK,WAAW,EAChB,KAAK,UAAU,EACf,KAAK,kBAAkB,IAAI,yBAAyB,EACpD,KAAK,kBAAkB,EACvB,KAAK,sBAAsB,GAC5B,MAAM,uBAAuB,CAAC;AAG/B,OAAO,EACL,mBAAmB,EACnB,yBAAyB,EACzB,KAAK,kBAAkB,EACvB,KAAK,YAAY,EACjB,KAAK,mBAAmB,GACzB,MAAM,oBAAoB,CAAC;AAG5B,OAAO,EAAE,eAAe,EAAE,eAAe,EAAE,MAAM,4BAA4B,CAAC;AAC9E,cAAc,qBAAqB,CAAC;AAEpC;;GAEG;AACH,eAAO,MAAM,kBAAkB,UAAU,CAAC;AAC1C,eAAO,MAAM,iBAAiB,aAAa,CAAC;AAC5C,eAAO,MAAM,oBAAoB,iBAAiB,CAAC;AAOnD,wBAAgB,iBAAiB,IAAI,OAAO,CAU3C;AAED;;GAEG;AACH,wBAAsB,iBAAiB,kDAYtC"}
|