erosolar-cli 1.7.356 → 1.7.358
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +24 -148
- package/dist/bin/erosolar.js +5 -21
- package/dist/bin/erosolar.js.map +1 -1
- package/dist/capabilities/agentSpawningCapability.d.ts.map +1 -1
- package/dist/capabilities/agentSpawningCapability.js +56 -31
- package/dist/capabilities/agentSpawningCapability.js.map +1 -1
- package/dist/contracts/agent-schemas.json +0 -15
- package/dist/contracts/tools.schema.json +0 -9
- package/dist/core/agent.d.ts +2 -2
- package/dist/core/agent.d.ts.map +1 -1
- package/dist/core/agent.js.map +1 -1
- package/dist/core/customCommands.d.ts +1 -0
- package/dist/core/customCommands.d.ts.map +1 -1
- package/dist/core/customCommands.js +3 -0
- package/dist/core/customCommands.js.map +1 -1
- package/dist/core/hooks.d.ts +113 -0
- package/dist/core/hooks.d.ts.map +1 -0
- package/dist/core/hooks.js +267 -0
- package/dist/core/hooks.js.map +1 -0
- package/dist/core/metricsTracker.d.ts +122 -0
- package/dist/core/metricsTracker.d.ts.map +1 -0
- package/dist/{alpha-zero → core}/metricsTracker.js +2 -5
- package/dist/core/metricsTracker.js.map +1 -0
- package/dist/core/securityAssessment.d.ts +91 -0
- package/dist/core/securityAssessment.d.ts.map +1 -0
- package/dist/core/securityAssessment.js +580 -0
- package/dist/core/securityAssessment.js.map +1 -0
- package/dist/core/sessionStore.d.ts +2 -0
- package/dist/core/sessionStore.d.ts.map +1 -1
- package/dist/core/sessionStore.js +1 -0
- package/dist/core/sessionStore.js.map +1 -1
- package/dist/core/toolPreconditions.d.ts.map +1 -1
- package/dist/core/toolPreconditions.js +0 -14
- package/dist/core/toolPreconditions.js.map +1 -1
- package/dist/core/toolRuntime.d.ts +22 -1
- package/dist/core/toolRuntime.d.ts.map +1 -1
- package/dist/core/toolRuntime.js +0 -5
- package/dist/core/toolRuntime.js.map +1 -1
- package/dist/core/toolValidation.d.ts.map +1 -1
- package/dist/core/toolValidation.js +14 -3
- package/dist/core/toolValidation.js.map +1 -1
- package/dist/core/validationRunner.d.ts +1 -3
- package/dist/core/validationRunner.d.ts.map +1 -1
- package/dist/core/validationRunner.js.map +1 -1
- package/dist/core/verification.d.ts +137 -0
- package/dist/core/verification.d.ts.map +1 -0
- package/dist/core/verification.js +323 -0
- package/dist/core/verification.js.map +1 -0
- package/dist/headless/headlessApp.d.ts.map +1 -1
- package/dist/headless/headlessApp.js +21 -0
- package/dist/headless/headlessApp.js.map +1 -1
- package/dist/mcp/sseClient.d.ts.map +1 -1
- package/dist/mcp/sseClient.js +9 -18
- package/dist/mcp/sseClient.js.map +1 -1
- package/dist/plugins/tools/build/buildPlugin.d.ts +0 -6
- package/dist/plugins/tools/build/buildPlugin.d.ts.map +1 -1
- package/dist/plugins/tools/build/buildPlugin.js +4 -10
- package/dist/plugins/tools/build/buildPlugin.js.map +1 -1
- package/dist/plugins/tools/nodeDefaults.d.ts.map +1 -1
- package/dist/plugins/tools/nodeDefaults.js +0 -2
- package/dist/plugins/tools/nodeDefaults.js.map +1 -1
- package/dist/runtime/agentSession.d.ts +2 -2
- package/dist/runtime/agentSession.d.ts.map +1 -1
- package/dist/runtime/agentSession.js +2 -2
- package/dist/runtime/agentSession.js.map +1 -1
- package/dist/shell/interactiveShell.d.ts +41 -7
- package/dist/shell/interactiveShell.d.ts.map +1 -1
- package/dist/shell/interactiveShell.js +399 -166
- package/dist/shell/interactiveShell.js.map +1 -1
- package/dist/shell/shellApp.d.ts +2 -0
- package/dist/shell/shellApp.d.ts.map +1 -1
- package/dist/shell/shellApp.js +82 -9
- package/dist/shell/shellApp.js.map +1 -1
- package/dist/shell/systemPrompt.d.ts.map +1 -1
- package/dist/shell/systemPrompt.js +1 -4
- package/dist/shell/systemPrompt.js.map +1 -1
- package/dist/shell/terminalInput.d.ts +250 -125
- package/dist/shell/terminalInput.d.ts.map +1 -1
- package/dist/shell/terminalInput.js +1061 -612
- package/dist/shell/terminalInput.js.map +1 -1
- package/dist/shell/terminalInputAdapter.d.ts +106 -24
- package/dist/shell/terminalInputAdapter.d.ts.map +1 -1
- package/dist/shell/terminalInputAdapter.js +137 -30
- package/dist/shell/terminalInputAdapter.js.map +1 -1
- package/dist/subagents/agentConfig.d.ts +27 -0
- package/dist/subagents/agentConfig.d.ts.map +1 -0
- package/dist/subagents/agentConfig.js +89 -0
- package/dist/subagents/agentConfig.js.map +1 -0
- package/dist/subagents/agentRegistry.d.ts +33 -0
- package/dist/subagents/agentRegistry.d.ts.map +1 -0
- package/dist/subagents/agentRegistry.js +162 -0
- package/dist/subagents/agentRegistry.js.map +1 -0
- package/dist/subagents/taskRunner.d.ts +7 -1
- package/dist/subagents/taskRunner.d.ts.map +1 -1
- package/dist/subagents/taskRunner.js +200 -49
- package/dist/subagents/taskRunner.js.map +1 -1
- package/dist/ui/ShellUIAdapter.d.ts +7 -1
- package/dist/ui/ShellUIAdapter.d.ts.map +1 -1
- package/dist/ui/ShellUIAdapter.js +42 -18
- package/dist/ui/ShellUIAdapter.js.map +1 -1
- package/dist/ui/display.d.ts +24 -45
- package/dist/ui/display.d.ts.map +1 -1
- package/dist/ui/display.js +148 -274
- package/dist/ui/display.js.map +1 -1
- package/dist/ui/theme.d.ts.map +1 -1
- package/dist/ui/theme.js +6 -8
- package/dist/ui/theme.js.map +1 -1
- package/dist/ui/toolDisplay.d.ts +0 -158
- package/dist/ui/toolDisplay.d.ts.map +1 -1
- package/dist/ui/toolDisplay.js +0 -348
- package/dist/ui/toolDisplay.js.map +1 -1
- package/dist/ui/unified/layout.d.ts +20 -0
- package/dist/ui/unified/layout.d.ts.map +1 -1
- package/dist/ui/unified/layout.js +105 -216
- package/dist/ui/unified/layout.js.map +1 -1
- package/dist/utils/frontmatter.d.ts +10 -0
- package/dist/utils/frontmatter.d.ts.map +1 -0
- package/dist/utils/frontmatter.js +78 -0
- package/dist/utils/frontmatter.js.map +1 -0
- package/package.json +4 -4
- package/dist/alpha-zero/agentWrapper.d.ts +0 -84
- package/dist/alpha-zero/agentWrapper.d.ts.map +0 -1
- package/dist/alpha-zero/agentWrapper.js +0 -171
- package/dist/alpha-zero/agentWrapper.js.map +0 -1
- package/dist/alpha-zero/codeEvaluator.d.ts +0 -25
- package/dist/alpha-zero/codeEvaluator.d.ts.map +0 -1
- package/dist/alpha-zero/codeEvaluator.js +0 -273
- package/dist/alpha-zero/codeEvaluator.js.map +0 -1
- package/dist/alpha-zero/competitiveRunner.d.ts +0 -66
- package/dist/alpha-zero/competitiveRunner.d.ts.map +0 -1
- package/dist/alpha-zero/competitiveRunner.js +0 -224
- package/dist/alpha-zero/competitiveRunner.js.map +0 -1
- package/dist/alpha-zero/index.d.ts +0 -67
- package/dist/alpha-zero/index.d.ts.map +0 -1
- package/dist/alpha-zero/index.js +0 -99
- package/dist/alpha-zero/index.js.map +0 -1
- package/dist/alpha-zero/introspection.d.ts +0 -128
- package/dist/alpha-zero/introspection.d.ts.map +0 -1
- package/dist/alpha-zero/introspection.js +0 -300
- package/dist/alpha-zero/introspection.js.map +0 -1
- package/dist/alpha-zero/metricsTracker.d.ts +0 -71
- package/dist/alpha-zero/metricsTracker.d.ts.map +0 -1
- package/dist/alpha-zero/metricsTracker.js.map +0 -1
- package/dist/alpha-zero/security/core.d.ts +0 -125
- package/dist/alpha-zero/security/core.d.ts.map +0 -1
- package/dist/alpha-zero/security/core.js +0 -271
- package/dist/alpha-zero/security/core.js.map +0 -1
- package/dist/alpha-zero/security/google.d.ts +0 -125
- package/dist/alpha-zero/security/google.d.ts.map +0 -1
- package/dist/alpha-zero/security/google.js +0 -311
- package/dist/alpha-zero/security/google.js.map +0 -1
- package/dist/alpha-zero/security/googleLoader.d.ts +0 -17
- package/dist/alpha-zero/security/googleLoader.d.ts.map +0 -1
- package/dist/alpha-zero/security/googleLoader.js +0 -41
- package/dist/alpha-zero/security/googleLoader.js.map +0 -1
- package/dist/alpha-zero/security/index.d.ts +0 -29
- package/dist/alpha-zero/security/index.d.ts.map +0 -1
- package/dist/alpha-zero/security/index.js +0 -32
- package/dist/alpha-zero/security/index.js.map +0 -1
- package/dist/alpha-zero/security/simulation.d.ts +0 -124
- package/dist/alpha-zero/security/simulation.d.ts.map +0 -1
- package/dist/alpha-zero/security/simulation.js +0 -277
- package/dist/alpha-zero/security/simulation.js.map +0 -1
- package/dist/alpha-zero/selfModification.d.ts +0 -109
- package/dist/alpha-zero/selfModification.d.ts.map +0 -1
- package/dist/alpha-zero/selfModification.js +0 -233
- package/dist/alpha-zero/selfModification.js.map +0 -1
- package/dist/alpha-zero/types.d.ts +0 -170
- package/dist/alpha-zero/types.d.ts.map +0 -1
- package/dist/alpha-zero/types.js +0 -31
- package/dist/alpha-zero/types.js.map +0 -1
- package/dist/capabilities/securityTestingCapability.d.ts +0 -13
- package/dist/capabilities/securityTestingCapability.d.ts.map +0 -1
- package/dist/capabilities/securityTestingCapability.js +0 -25
- package/dist/capabilities/securityTestingCapability.js.map +0 -1
- package/dist/core/aiFlowOptimizer.d.ts +0 -26
- package/dist/core/aiFlowOptimizer.d.ts.map +0 -1
- package/dist/core/aiFlowOptimizer.js +0 -31
- package/dist/core/aiFlowOptimizer.js.map +0 -1
- package/dist/core/aiOptimizationEngine.d.ts +0 -158
- package/dist/core/aiOptimizationEngine.d.ts.map +0 -1
- package/dist/core/aiOptimizationEngine.js +0 -428
- package/dist/core/aiOptimizationEngine.js.map +0 -1
- package/dist/core/aiOptimizationIntegration.d.ts +0 -93
- package/dist/core/aiOptimizationIntegration.d.ts.map +0 -1
- package/dist/core/aiOptimizationIntegration.js +0 -250
- package/dist/core/aiOptimizationIntegration.js.map +0 -1
- package/dist/core/enhancedErrorRecovery.d.ts +0 -100
- package/dist/core/enhancedErrorRecovery.d.ts.map +0 -1
- package/dist/core/enhancedErrorRecovery.js +0 -345
- package/dist/core/enhancedErrorRecovery.js.map +0 -1
- package/dist/core/hooksSystem.d.ts +0 -65
- package/dist/core/hooksSystem.d.ts.map +0 -1
- package/dist/core/hooksSystem.js +0 -273
- package/dist/core/hooksSystem.js.map +0 -1
- package/dist/core/memorySystem.d.ts +0 -48
- package/dist/core/memorySystem.d.ts.map +0 -1
- package/dist/core/memorySystem.js +0 -271
- package/dist/core/memorySystem.js.map +0 -1
- package/dist/core/unified/errors.d.ts +0 -189
- package/dist/core/unified/errors.d.ts.map +0 -1
- package/dist/core/unified/errors.js +0 -497
- package/dist/core/unified/errors.js.map +0 -1
- package/dist/core/unified/index.d.ts +0 -19
- package/dist/core/unified/index.d.ts.map +0 -1
- package/dist/core/unified/index.js +0 -68
- package/dist/core/unified/index.js.map +0 -1
- package/dist/core/unified/schema.d.ts +0 -101
- package/dist/core/unified/schema.d.ts.map +0 -1
- package/dist/core/unified/schema.js +0 -350
- package/dist/core/unified/schema.js.map +0 -1
- package/dist/core/unified/toolRuntime.d.ts +0 -179
- package/dist/core/unified/toolRuntime.d.ts.map +0 -1
- package/dist/core/unified/toolRuntime.js +0 -517
- package/dist/core/unified/toolRuntime.js.map +0 -1
- package/dist/core/unified/tools.d.ts +0 -127
- package/dist/core/unified/tools.d.ts.map +0 -1
- package/dist/core/unified/tools.js +0 -1333
- package/dist/core/unified/tools.js.map +0 -1
- package/dist/core/unified/types.d.ts +0 -352
- package/dist/core/unified/types.d.ts.map +0 -1
- package/dist/core/unified/types.js +0 -12
- package/dist/core/unified/types.js.map +0 -1
- package/dist/core/unified/version.d.ts +0 -209
- package/dist/core/unified/version.d.ts.map +0 -1
- package/dist/core/unified/version.js +0 -454
- package/dist/core/unified/version.js.map +0 -1
- package/dist/plugins/tools/security/securityPlugin.d.ts +0 -3
- package/dist/plugins/tools/security/securityPlugin.d.ts.map +0 -1
- package/dist/plugins/tools/security/securityPlugin.js +0 -12
- package/dist/plugins/tools/security/securityPlugin.js.map +0 -1
- package/dist/security/active-stack-security.d.ts +0 -112
- package/dist/security/active-stack-security.d.ts.map +0 -1
- package/dist/security/active-stack-security.js +0 -296
- package/dist/security/active-stack-security.js.map +0 -1
- package/dist/security/advanced-persistence-research.d.ts +0 -92
- package/dist/security/advanced-persistence-research.d.ts.map +0 -1
- package/dist/security/advanced-persistence-research.js +0 -195
- package/dist/security/advanced-persistence-research.js.map +0 -1
- package/dist/security/advanced-targeting.d.ts +0 -119
- package/dist/security/advanced-targeting.d.ts.map +0 -1
- package/dist/security/advanced-targeting.js +0 -233
- package/dist/security/advanced-targeting.js.map +0 -1
- package/dist/security/assessment/vulnerabilityAssessment.d.ts +0 -104
- package/dist/security/assessment/vulnerabilityAssessment.d.ts.map +0 -1
- package/dist/security/assessment/vulnerabilityAssessment.js +0 -315
- package/dist/security/assessment/vulnerabilityAssessment.js.map +0 -1
- package/dist/security/authorization/securityAuthorization.d.ts +0 -88
- package/dist/security/authorization/securityAuthorization.d.ts.map +0 -1
- package/dist/security/authorization/securityAuthorization.js +0 -172
- package/dist/security/authorization/securityAuthorization.js.map +0 -1
- package/dist/security/comprehensive-targeting.d.ts +0 -85
- package/dist/security/comprehensive-targeting.d.ts.map +0 -1
- package/dist/security/comprehensive-targeting.js +0 -438
- package/dist/security/comprehensive-targeting.js.map +0 -1
- package/dist/security/global-security-integration.d.ts +0 -91
- package/dist/security/global-security-integration.d.ts.map +0 -1
- package/dist/security/global-security-integration.js +0 -218
- package/dist/security/global-security-integration.js.map +0 -1
- package/dist/security/index.d.ts +0 -38
- package/dist/security/index.d.ts.map +0 -1
- package/dist/security/index.js +0 -47
- package/dist/security/index.js.map +0 -1
- package/dist/security/persistence-analyzer.d.ts +0 -56
- package/dist/security/persistence-analyzer.d.ts.map +0 -1
- package/dist/security/persistence-analyzer.js +0 -187
- package/dist/security/persistence-analyzer.js.map +0 -1
- package/dist/security/persistence-cli.d.ts +0 -36
- package/dist/security/persistence-cli.d.ts.map +0 -1
- package/dist/security/persistence-cli.js +0 -160
- package/dist/security/persistence-cli.js.map +0 -1
- package/dist/security/persistence-research.d.ts +0 -92
- package/dist/security/persistence-research.d.ts.map +0 -1
- package/dist/security/persistence-research.js +0 -364
- package/dist/security/persistence-research.js.map +0 -1
- package/dist/security/research/persistenceResearch.d.ts +0 -97
- package/dist/security/research/persistenceResearch.d.ts.map +0 -1
- package/dist/security/research/persistenceResearch.js +0 -282
- package/dist/security/research/persistenceResearch.js.map +0 -1
- package/dist/security/security-integration.d.ts +0 -74
- package/dist/security/security-integration.d.ts.map +0 -1
- package/dist/security/security-integration.js +0 -137
- package/dist/security/security-integration.js.map +0 -1
- package/dist/security/security-testing-framework.d.ts +0 -112
- package/dist/security/security-testing-framework.d.ts.map +0 -1
- package/dist/security/security-testing-framework.js +0 -364
- package/dist/security/security-testing-framework.js.map +0 -1
- package/dist/security/simulation/attackSimulation.d.ts +0 -93
- package/dist/security/simulation/attackSimulation.d.ts.map +0 -1
- package/dist/security/simulation/attackSimulation.js +0 -341
- package/dist/security/simulation/attackSimulation.js.map +0 -1
- package/dist/security/strategic-operations.d.ts +0 -100
- package/dist/security/strategic-operations.d.ts.map +0 -1
- package/dist/security/strategic-operations.js +0 -276
- package/dist/security/strategic-operations.js.map +0 -1
- package/dist/security/tool-security-wrapper.d.ts +0 -58
- package/dist/security/tool-security-wrapper.d.ts.map +0 -1
- package/dist/security/tool-security-wrapper.js +0 -156
- package/dist/security/tool-security-wrapper.js.map +0 -1
- package/dist/shell/claudeCodeStreamHandler.d.ts +0 -145
- package/dist/shell/claudeCodeStreamHandler.d.ts.map +0 -1
- package/dist/shell/claudeCodeStreamHandler.js +0 -322
- package/dist/shell/claudeCodeStreamHandler.js.map +0 -1
- package/dist/shell/inputQueueManager.d.ts +0 -144
- package/dist/shell/inputQueueManager.d.ts.map +0 -1
- package/dist/shell/inputQueueManager.js +0 -290
- package/dist/shell/inputQueueManager.js.map +0 -1
- package/dist/shell/metricsTracker.d.ts +0 -60
- package/dist/shell/metricsTracker.d.ts.map +0 -1
- package/dist/shell/metricsTracker.js +0 -119
- package/dist/shell/metricsTracker.js.map +0 -1
- package/dist/shell/streamingOutputManager.d.ts +0 -115
- package/dist/shell/streamingOutputManager.d.ts.map +0 -1
- package/dist/shell/streamingOutputManager.js +0 -225
- package/dist/shell/streamingOutputManager.js.map +0 -1
- package/dist/tools/securityTools.d.ts +0 -22
- package/dist/tools/securityTools.d.ts.map +0 -1
- package/dist/tools/securityTools.js +0 -448
- package/dist/tools/securityTools.js.map +0 -1
- package/dist/ui/persistentPrompt.d.ts +0 -50
- package/dist/ui/persistentPrompt.d.ts.map +0 -1
- package/dist/ui/persistentPrompt.js +0 -92
- package/dist/ui/persistentPrompt.js.map +0 -1
- package/dist/ui/terminalUISchema.d.ts +0 -195
- package/dist/ui/terminalUISchema.d.ts.map +0 -1
- package/dist/ui/terminalUISchema.js +0 -113
- package/dist/ui/terminalUISchema.js.map +0 -1
- package/scripts/deploy-security-capabilities.js +0 -178
|
@@ -1,171 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Agent Wrapper
|
|
3
|
-
*
|
|
4
|
-
* Wraps the AgentRuntime with Alpha Zero 2 capabilities for
|
|
5
|
-
* performance tracking, code quality evaluation, and competitive metrics.
|
|
6
|
-
*
|
|
7
|
-
* Principal Investigator: Bo Shang
|
|
8
|
-
* Framework: erosolar-cli
|
|
9
|
-
*/
|
|
10
|
-
import { MetricsTracker } from './metricsTracker.js';
|
|
11
|
-
import { extractCodeBlocks, evaluateCodeQuality, calculateRewardScore } from './codeEvaluator.js';
|
|
12
|
-
/**
|
|
13
|
-
* Wrapper around AgentRuntime that adds Alpha Zero 2 capabilities.
|
|
14
|
-
*
|
|
15
|
-
* Provides:
|
|
16
|
-
* - Performance introspection
|
|
17
|
-
* - Code quality evaluation
|
|
18
|
-
* - Competitive metrics tracking
|
|
19
|
-
* - Self-improvement suggestions
|
|
20
|
-
*/
|
|
21
|
-
export class AlphaZeroAgentWrapper {
|
|
22
|
-
agent;
|
|
23
|
-
agentId;
|
|
24
|
-
enableIntrospection;
|
|
25
|
-
enableCodeEvaluation;
|
|
26
|
-
metricsTracker;
|
|
27
|
-
currentTraceId = 0;
|
|
28
|
-
constructor(options) {
|
|
29
|
-
this.agent = options.agent;
|
|
30
|
-
this.agentId = options.agentId ?? 'agent';
|
|
31
|
-
this.enableIntrospection = options.enableIntrospection ?? true;
|
|
32
|
-
this.enableCodeEvaluation = options.enableCodeEvaluation ?? true;
|
|
33
|
-
this.metricsTracker = new MetricsTracker(this.agentId);
|
|
34
|
-
}
|
|
35
|
-
/**
|
|
36
|
-
* Send a message with performance tracking.
|
|
37
|
-
*/
|
|
38
|
-
async send(text, useStreaming = false) {
|
|
39
|
-
const startTime = Date.now();
|
|
40
|
-
const traceId = `trace-${this.currentTraceId++}`;
|
|
41
|
-
const toolCalls = [];
|
|
42
|
-
try {
|
|
43
|
-
const response = await this.agent.send(text, useStreaming);
|
|
44
|
-
const elapsedMs = Date.now() - startTime;
|
|
45
|
-
// Track metrics
|
|
46
|
-
this.metricsTracker.recordMessage(elapsedMs);
|
|
47
|
-
// Evaluate code quality if response contains code
|
|
48
|
-
if (this.enableCodeEvaluation && response.includes('```')) {
|
|
49
|
-
await this.evaluateResponseCode(response);
|
|
50
|
-
}
|
|
51
|
-
// Add execution trace if introspection is enabled
|
|
52
|
-
if (this.enableIntrospection) {
|
|
53
|
-
const trace = {
|
|
54
|
-
traceId,
|
|
55
|
-
timestamp: new Date().toISOString(),
|
|
56
|
-
prompt: text,
|
|
57
|
-
response,
|
|
58
|
-
toolCalls,
|
|
59
|
-
totalDurationMs: elapsedMs,
|
|
60
|
-
};
|
|
61
|
-
this.metricsTracker.addTrace(trace);
|
|
62
|
-
}
|
|
63
|
-
return response;
|
|
64
|
-
}
|
|
65
|
-
catch (error) {
|
|
66
|
-
const elapsedMs = Date.now() - startTime;
|
|
67
|
-
this.metricsTracker.recordMessage(elapsedMs);
|
|
68
|
-
throw error;
|
|
69
|
-
}
|
|
70
|
-
}
|
|
71
|
-
/**
|
|
72
|
-
* Evaluate code quality in a response.
|
|
73
|
-
*/
|
|
74
|
-
async evaluateResponseCode(response) {
|
|
75
|
-
const codeBlocks = extractCodeBlocks(response);
|
|
76
|
-
if (codeBlocks.length === 0) {
|
|
77
|
-
return;
|
|
78
|
-
}
|
|
79
|
-
this.metricsTracker.recordCodeGeneration(codeBlocks.length);
|
|
80
|
-
// Evaluate each code block
|
|
81
|
-
for (const code of codeBlocks) {
|
|
82
|
-
try {
|
|
83
|
-
const metrics = evaluateCodeQuality(code);
|
|
84
|
-
this.metricsTracker.recordCodeQuality(metrics);
|
|
85
|
-
}
|
|
86
|
-
catch {
|
|
87
|
-
// Ignore evaluation errors
|
|
88
|
-
}
|
|
89
|
-
}
|
|
90
|
-
}
|
|
91
|
-
/**
|
|
92
|
-
* Record a tool call result.
|
|
93
|
-
*/
|
|
94
|
-
recordToolCall(success) {
|
|
95
|
-
this.metricsTracker.recordToolCall(success);
|
|
96
|
-
}
|
|
97
|
-
/**
|
|
98
|
-
* Get current performance metrics.
|
|
99
|
-
*/
|
|
100
|
-
getMetrics() {
|
|
101
|
-
return this.metricsTracker.getMetrics();
|
|
102
|
-
}
|
|
103
|
-
/**
|
|
104
|
-
* Get human-readable performance summary.
|
|
105
|
-
*/
|
|
106
|
-
getPerformanceSummary() {
|
|
107
|
-
return this.metricsTracker.getPerformanceSummary();
|
|
108
|
-
}
|
|
109
|
-
/**
|
|
110
|
-
* Get execution traces.
|
|
111
|
-
*/
|
|
112
|
-
getTraces() {
|
|
113
|
-
return this.metricsTracker.getTraces();
|
|
114
|
-
}
|
|
115
|
-
/**
|
|
116
|
-
* Get improvement suggestions based on metrics.
|
|
117
|
-
*/
|
|
118
|
-
getImprovementSuggestions() {
|
|
119
|
-
return this.metricsTracker.getImprovementSuggestions();
|
|
120
|
-
}
|
|
121
|
-
/**
|
|
122
|
-
* Get metrics as a dictionary for serialization.
|
|
123
|
-
*/
|
|
124
|
-
getMetricsDict() {
|
|
125
|
-
const metrics = this.metricsTracker.getMetrics();
|
|
126
|
-
return {
|
|
127
|
-
sessionId: metrics.sessionId,
|
|
128
|
-
totalMessages: metrics.totalMessages,
|
|
129
|
-
totalTimeMs: metrics.totalTimeMs,
|
|
130
|
-
avgResponseTimeMs: metrics.avgResponseTimeMs,
|
|
131
|
-
codeBlocksGenerated: metrics.codeBlocksGenerated,
|
|
132
|
-
tokenUsage: metrics.totalTokensUsed,
|
|
133
|
-
toolUsage: {
|
|
134
|
-
totalCalls: metrics.totalToolCalls,
|
|
135
|
-
successfulCalls: metrics.successfulToolCalls,
|
|
136
|
-
failedCalls: metrics.failedToolCalls,
|
|
137
|
-
},
|
|
138
|
-
codeQuality: {
|
|
139
|
-
qualityScore: metrics.avgCodeQuality,
|
|
140
|
-
algorithmEfficiency: metrics.avgAlgorithmEfficiency,
|
|
141
|
-
errorHandling: metrics.avgErrorHandling,
|
|
142
|
-
},
|
|
143
|
-
};
|
|
144
|
-
}
|
|
145
|
-
/**
|
|
146
|
-
* Reset all metrics.
|
|
147
|
-
*/
|
|
148
|
-
resetMetrics() {
|
|
149
|
-
this.metricsTracker.reset();
|
|
150
|
-
}
|
|
151
|
-
/**
|
|
152
|
-
* Get the underlying agent runtime.
|
|
153
|
-
*/
|
|
154
|
-
getAgent() {
|
|
155
|
-
return this.agent;
|
|
156
|
-
}
|
|
157
|
-
/**
|
|
158
|
-
* Get the agent ID.
|
|
159
|
-
*/
|
|
160
|
-
getAgentId() {
|
|
161
|
-
return this.agentId;
|
|
162
|
-
}
|
|
163
|
-
/**
|
|
164
|
-
* Evaluate a single code snippet and return a reward score.
|
|
165
|
-
*/
|
|
166
|
-
evaluateCode(code) {
|
|
167
|
-
const metrics = evaluateCodeQuality(code);
|
|
168
|
-
return calculateRewardScore(metrics);
|
|
169
|
-
}
|
|
170
|
-
}
|
|
171
|
-
//# sourceMappingURL=agentWrapper.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"agentWrapper.js","sourceRoot":"","sources":["../../src/alpha-zero/agentWrapper.ts"],"names":[],"mappings":"AAAA;;;;;;;;GAQG;AAQH,OAAO,EAAE,cAAc,EAAE,MAAM,qBAAqB,CAAC;AACrD,OAAO,EAAE,iBAAiB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,oBAAoB,CAAC;AASlG;;;;;;;;GAQG;AACH,MAAM,OAAO,qBAAqB;IACf,KAAK,CAAe;IACpB,OAAO,CAAS;IAChB,mBAAmB,CAAU;IAC7B,oBAAoB,CAAU;IAC9B,cAAc,CAAiB;IACxC,cAAc,GAAG,CAAC,CAAC;IAE3B,YAAY,OAA8B;QACxC,IAAI,CAAC,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC;QAC3B,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC,OAAO,IAAI,OAAO,CAAC;QAC1C,IAAI,CAAC,mBAAmB,GAAG,OAAO,CAAC,mBAAmB,IAAI,IAAI,CAAC;QAC/D,IAAI,CAAC,oBAAoB,GAAG,OAAO,CAAC,oBAAoB,IAAI,IAAI,CAAC;QACjE,IAAI,CAAC,cAAc,GAAG,IAAI,cAAc,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;IACzD,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,IAAI,CAAC,IAAY,EAAE,YAAY,GAAG,KAAK;QAC3C,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAC7B,MAAM,OAAO,GAAG,SAAS,IAAI,CAAC,cAAc,EAAE,EAAE,CAAC;QACjD,MAAM,SAAS,GAAgC,EAAE,CAAC;QAElD,IAAI,CAAC;YACH,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,IAAI,EAAE,YAAY,CAAC,CAAC;YAC3D,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;YAEzC,gBAAgB;YAChB,IAAI,CAAC,cAAc,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;YAE7C,kDAAkD;YAClD,IAAI,IAAI,CAAC,oBAAoB,IAAI,QAAQ,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;gBAC1D,MAAM,IAAI,CAAC,oBAAoB,CAAC,QAAQ,CAAC,CAAC;YAC5C,CAAC;YAED,kDAAkD;YAClD,IAAI,IAAI,CAAC,mBAAmB,EAAE,CAAC;gBAC7B,MAAM,KAAK,GAAmB;oBAC5B,OAAO;oBACP,SAAS,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;oBACnC,MAAM,EAAE,IAAI;oBACZ,QAAQ;oBACR,SAAS;oBACT,eAAe,EAAE,SAAS;iBAC3B,CAAC;gBACF,IAAI,CAAC,cAAc,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC;YACtC,CAAC;YAED,OAAO,QAAQ,CAAC;QAClB,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;YACzC,IAAI,CAAC,cAAc,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;YAC7C,MAAM,KAAK,CAAC;QACd,CAAC;IACH,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,oBAAoB,CAAC,QAAgB;QACjD,MAAM,UAAU,GAAG,iBAAiB,CAAC,QAAQ,CAAC,CAAC;QAC/C,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YAC5B,OAAO;QACT,CAAC;QAED,IAAI,CAAC,cAAc,CAAC,oBAAoB,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC;QAE5D,2BAA2B;QAC3B,KAAK,MAA
M,IAAI,IAAI,UAAU,EAAE,CAAC;YAC9B,IAAI,CAAC;gBACH,MAAM,OAAO,GAAG,mBAAmB,CAAC,IAAI,CAAC,CAAC;gBAC1C,IAAI,CAAC,cAAc,CAAC,iBAAiB,CAAC,OAAO,CAAC,CAAC;YACjD,CAAC;YAAC,MAAM,CAAC;gBACP,2BAA2B;YAC7B,CAAC;QACH,CAAC;IACH,CAAC;IAED;;OAEG;IACH,cAAc,CAAC,OAAgB;QAC7B,IAAI,CAAC,cAAc,CAAC,cAAc,CAAC,OAAO,CAAC,CAAC;IAC9C,CAAC;IAED;;OAEG;IACH,UAAU;QACR,OAAO,IAAI,CAAC,cAAc,CAAC,UAAU,EAAE,CAAC;IAC1C,CAAC;IAED;;OAEG;IACH,qBAAqB;QACnB,OAAO,IAAI,CAAC,cAAc,CAAC,qBAAqB,EAAE,CAAC;IACrD,CAAC;IAED;;OAEG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,cAAc,CAAC,SAAS,EAAE,CAAC;IACzC,CAAC;IAED;;OAEG;IACH,yBAAyB;QACvB,OAAO,IAAI,CAAC,cAAc,CAAC,yBAAyB,EAAE,CAAC;IACzD,CAAC;IAED;;OAEG;IACH,cAAc;QACZ,MAAM,OAAO,GAAG,IAAI,CAAC,cAAc,CAAC,UAAU,EAAE,CAAC;QACjD,OAAO;YACL,SAAS,EAAE,OAAO,CAAC,SAAS;YAC5B,aAAa,EAAE,OAAO,CAAC,aAAa;YACpC,WAAW,EAAE,OAAO,CAAC,WAAW;YAChC,iBAAiB,EAAE,OAAO,CAAC,iBAAiB;YAC5C,mBAAmB,EAAE,OAAO,CAAC,mBAAmB;YAChD,UAAU,EAAE,OAAO,CAAC,eAAe;YACnC,SAAS,EAAE;gBACT,UAAU,EAAE,OAAO,CAAC,cAAc;gBAClC,eAAe,EAAE,OAAO,CAAC,mBAAmB;gBAC5C,WAAW,EAAE,OAAO,CAAC,eAAe;aACrC;YACD,WAAW,EAAE;gBACX,YAAY,EAAE,OAAO,CAAC,cAAc;gBACpC,mBAAmB,EAAE,OAAO,CAAC,sBAAsB;gBACnD,aAAa,EAAE,OAAO,CAAC,gBAAgB;aACxC;SACF,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,YAAY;QACV,IAAI,CAAC,cAAc,CAAC,KAAK,EAAE,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,QAAQ;QACN,OAAO,IAAI,CAAC,KAAK,CAAC;IACpB,CAAC;IAED;;OAEG;IACH,UAAU;QACR,OAAO,IAAI,CAAC,OAAO,CAAC;IACtB,CAAC;IAED;;OAEG;IACH,YAAY,CAAC,IAAY;QACvB,MAAM,OAAO,GAAG,mBAAmB,CAAC,IAAI,CAAC,CAAC;QAC1C,OAAO,oBAAoB,CAAC,OAAO,CAAC,CAAC;IACvC,CAAC;CACF"}
|
|
@@ -1,25 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Code Evaluator
|
|
3
|
-
*
|
|
4
|
-
* AST-based code quality evaluation for generated code.
|
|
5
|
-
*
|
|
6
|
-
* Principal Investigator: Bo Shang
|
|
7
|
-
* Framework: erosolar-cli
|
|
8
|
-
*/
|
|
9
|
-
import type { CodeQualityMetrics } from './types.js';
|
|
10
|
-
/**
|
|
11
|
-
* Extract code blocks from a response string.
|
|
12
|
-
*/
|
|
13
|
-
export declare function extractCodeBlocks(response: string): string[];
|
|
14
|
-
/**
|
|
15
|
-
* Evaluate code quality metrics.
|
|
16
|
-
*
|
|
17
|
-
* This is a heuristic-based evaluation that analyzes code patterns.
|
|
18
|
-
* For production use, consider integrating actual AST parsers.
|
|
19
|
-
*/
|
|
20
|
-
export declare function evaluateCodeQuality(code: string): CodeQualityMetrics;
|
|
21
|
-
/**
|
|
22
|
-
* Calculate a composite reward score from metrics.
|
|
23
|
-
*/
|
|
24
|
-
export declare function calculateRewardScore(metrics: CodeQualityMetrics): number;
|
|
25
|
-
//# sourceMappingURL=codeEvaluator.d.ts.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"codeEvaluator.d.ts","sourceRoot":"","sources":["../../src/alpha-zero/codeEvaluator.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAEH,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,YAAY,CAAC;AAErD;;GAEG;AACH,wBAAgB,iBAAiB,CAAC,QAAQ,EAAE,MAAM,GAAG,MAAM,EAAE,CAa5D;AAED;;;;;GAKG;AACH,wBAAgB,mBAAmB,CAAC,IAAI,EAAE,MAAM,GAAG,kBAAkB,CAoBpE;AAkQD;;GAEG;AACH,wBAAgB,oBAAoB,CAAC,OAAO,EAAE,kBAAkB,GAAG,MAAM,CAkBxE"}
|
|
@@ -1,273 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Code Evaluator
|
|
3
|
-
*
|
|
4
|
-
* AST-based code quality evaluation for generated code.
|
|
5
|
-
*
|
|
6
|
-
* Principal Investigator: Bo Shang
|
|
7
|
-
* Framework: erosolar-cli
|
|
8
|
-
*/
|
|
9
|
-
/**
|
|
10
|
-
* Extract code blocks from a response string.
|
|
11
|
-
*/
|
|
12
|
-
export function extractCodeBlocks(response) {
|
|
13
|
-
const codeBlockRegex = /```(?:\w+)?\n([\s\S]*?)```/g;
|
|
14
|
-
const blocks = [];
|
|
15
|
-
let match;
|
|
16
|
-
while ((match = codeBlockRegex.exec(response)) !== null) {
|
|
17
|
-
const code = match[1]?.trim();
|
|
18
|
-
if (code && code.length > 0) {
|
|
19
|
-
blocks.push(code);
|
|
20
|
-
}
|
|
21
|
-
}
|
|
22
|
-
return blocks;
|
|
23
|
-
}
|
|
24
|
-
/**
|
|
25
|
-
* Evaluate code quality metrics.
|
|
26
|
-
*
|
|
27
|
-
* This is a heuristic-based evaluation that analyzes code patterns.
|
|
28
|
-
* For production use, consider integrating actual AST parsers.
|
|
29
|
-
*/
|
|
30
|
-
export function evaluateCodeQuality(code) {
|
|
31
|
-
const lines = code.split('\n');
|
|
32
|
-
const totalLines = lines.length;
|
|
33
|
-
// Calculate individual scores
|
|
34
|
-
const codeQualityScore = calculateCodeQualityScore(code, lines);
|
|
35
|
-
const algorithmEfficiency = calculateEfficiencyScore(code, lines);
|
|
36
|
-
const errorHandlingScore = calculateErrorHandlingScore(code);
|
|
37
|
-
const documentationScore = calculateDocumentationScore(code, lines);
|
|
38
|
-
const maintainabilityScore = calculateMaintainabilityScore(code, lines, totalLines);
|
|
39
|
-
const securityScore = calculateSecurityScore(code);
|
|
40
|
-
return {
|
|
41
|
-
codeQualityScore,
|
|
42
|
-
algorithmEfficiency,
|
|
43
|
-
errorHandlingScore,
|
|
44
|
-
documentationScore,
|
|
45
|
-
maintainabilityScore,
|
|
46
|
-
securityScore,
|
|
47
|
-
};
|
|
48
|
-
}
|
|
49
|
-
/**
|
|
50
|
-
* Calculate overall code quality score.
|
|
51
|
-
*/
|
|
52
|
-
function calculateCodeQualityScore(code, lines) {
|
|
53
|
-
let score = 0.5; // Base score
|
|
54
|
-
// Check for consistent indentation
|
|
55
|
-
const indentationConsistent = checkIndentationConsistency(lines);
|
|
56
|
-
if (indentationConsistent) {
|
|
57
|
-
score += 0.1;
|
|
58
|
-
}
|
|
59
|
-
// Check for reasonable line lengths
|
|
60
|
-
const longLines = lines.filter((line) => line.length > 120).length;
|
|
61
|
-
if (longLines / lines.length < 0.1) {
|
|
62
|
-
score += 0.1;
|
|
63
|
-
}
|
|
64
|
-
// Check for naming conventions (camelCase or snake_case)
|
|
65
|
-
if (/[a-z][A-Z]/.test(code) || /_[a-z]/.test(code)) {
|
|
66
|
-
score += 0.1;
|
|
67
|
-
}
|
|
68
|
-
// Check for modular structure (functions/classes)
|
|
69
|
-
if (/(?:function|def|class|const\s+\w+\s*=\s*(?:async\s*)?\()/.test(code)) {
|
|
70
|
-
score += 0.1;
|
|
71
|
-
}
|
|
72
|
-
// Penalize magic numbers
|
|
73
|
-
const magicNumbers = code.match(/(?<![.\w])[2-9]\d*(?![.\w])/g) || [];
|
|
74
|
-
if (magicNumbers.length > 5) {
|
|
75
|
-
score -= 0.1;
|
|
76
|
-
}
|
|
77
|
-
return Math.max(0, Math.min(1, score));
|
|
78
|
-
}
|
|
79
|
-
/**
|
|
80
|
-
* Calculate algorithm efficiency score.
|
|
81
|
-
*/
|
|
82
|
-
function calculateEfficiencyScore(code, _lines) {
|
|
83
|
-
let score = 0.5;
|
|
84
|
-
// Check for efficient data structures
|
|
85
|
-
if (/(?:Map|Set|WeakMap|WeakSet|dict|set)\s*\(/.test(code)) {
|
|
86
|
-
score += 0.15;
|
|
87
|
-
}
|
|
88
|
-
// Penalize nested loops (potential O(n^2) or worse)
|
|
89
|
-
const nestedLoops = code.match(/(?:for|while)[\s\S]*?(?:for|while)/g)?.length || 0;
|
|
90
|
-
if (nestedLoops > 2) {
|
|
91
|
-
score -= 0.2;
|
|
92
|
-
}
|
|
93
|
-
// Check for early returns (efficient control flow)
|
|
94
|
-
if (/return\s+(?!undefined|null)/.test(code)) {
|
|
95
|
-
score += 0.1;
|
|
96
|
-
}
|
|
97
|
-
// Check for caching/memoization patterns
|
|
98
|
-
if (/(?:cache|memo|stored|cached)/i.test(code)) {
|
|
99
|
-
score += 0.15;
|
|
100
|
-
}
|
|
101
|
-
// Penalize string concatenation in loops
|
|
102
|
-
if (/(?:for|while)[\s\S]*?\+\s*=\s*['"`]/.test(code)) {
|
|
103
|
-
score -= 0.1;
|
|
104
|
-
}
|
|
105
|
-
return Math.max(0, Math.min(1, score));
|
|
106
|
-
}
|
|
107
|
-
/**
|
|
108
|
-
* Calculate error handling score.
|
|
109
|
-
*/
|
|
110
|
-
function calculateErrorHandlingScore(code) {
|
|
111
|
-
let score = 0.3;
|
|
112
|
-
// Check for try-catch blocks
|
|
113
|
-
const tryCatchCount = (code.match(/try\s*\{/g) || []).length;
|
|
114
|
-
if (tryCatchCount > 0) {
|
|
115
|
-
score += 0.2 * Math.min(tryCatchCount, 3);
|
|
116
|
-
}
|
|
117
|
-
// Check for error type checking
|
|
118
|
-
if (/instanceof\s+(?:Error|TypeError|RangeError)/i.test(code)) {
|
|
119
|
-
score += 0.1;
|
|
120
|
-
}
|
|
121
|
-
// Check for null/undefined checks
|
|
122
|
-
const nullChecks = (code.match(/(?:!==?\s*(?:null|undefined)|\?\?|\.?\?\.)/g) || []).length;
|
|
123
|
-
if (nullChecks > 0) {
|
|
124
|
-
score += 0.1 * Math.min(nullChecks / 3, 1);
|
|
125
|
-
}
|
|
126
|
-
// Check for error logging
|
|
127
|
-
if (/(?:console\.error|logger\.error|throw\s+new)/i.test(code)) {
|
|
128
|
-
score += 0.1;
|
|
129
|
-
}
|
|
130
|
-
// Check for finally blocks (cleanup)
|
|
131
|
-
if (/finally\s*\{/.test(code)) {
|
|
132
|
-
score += 0.1;
|
|
133
|
-
}
|
|
134
|
-
return Math.max(0, Math.min(1, score));
|
|
135
|
-
}
|
|
136
|
-
/**
|
|
137
|
-
* Calculate documentation score.
|
|
138
|
-
*/
|
|
139
|
-
function calculateDocumentationScore(code, lines) {
|
|
140
|
-
let score = 0.2;
|
|
141
|
-
// Check for JSDoc/docstring comments
|
|
142
|
-
const docComments = (code.match(/\/\*\*[\s\S]*?\*\/|"""[\s\S]*?"""|'''[\s\S]*?'''/g) || []).length;
|
|
143
|
-
if (docComments > 0) {
|
|
144
|
-
score += 0.3 * Math.min(docComments / 3, 1);
|
|
145
|
-
}
|
|
146
|
-
// Check for inline comments
|
|
147
|
-
const inlineComments = lines.filter((line) => /(?:\/\/|#)\s*\w/.test(line)).length;
|
|
148
|
-
const commentRatio = inlineComments / lines.length;
|
|
149
|
-
if (commentRatio > 0.05 && commentRatio < 0.3) {
|
|
150
|
-
score += 0.2;
|
|
151
|
-
}
|
|
152
|
-
// Check for type annotations (TypeScript/Python type hints)
|
|
153
|
-
if (/:\s*(?:string|number|boolean|any|\w+\[\]|Dict|List|Optional)/i.test(code)) {
|
|
154
|
-
score += 0.2;
|
|
155
|
-
}
|
|
156
|
-
// Check for meaningful variable names (longer than 2 chars)
|
|
157
|
-
const shortNames = (code.match(/\b[a-z]{1,2}\b/g) || []).length;
|
|
158
|
-
if (shortNames / lines.length < 0.5) {
|
|
159
|
-
score += 0.1;
|
|
160
|
-
}
|
|
161
|
-
return Math.max(0, Math.min(1, score));
|
|
162
|
-
}
|
|
163
|
-
/**
|
|
164
|
-
* Calculate maintainability score.
|
|
165
|
-
*/
|
|
166
|
-
function calculateMaintainabilityScore(code, lines, totalLines) {
|
|
167
|
-
let score = 0.5;
|
|
168
|
-
// Check function length (prefer smaller functions)
|
|
169
|
-
const functionMatches = code.match(/(?:function|def|=>\s*\{)/g) || [];
|
|
170
|
-
if (functionMatches.length > 0) {
|
|
171
|
-
const avgFunctionLength = totalLines / functionMatches.length;
|
|
172
|
-
if (avgFunctionLength < 30) {
|
|
173
|
-
score += 0.2;
|
|
174
|
-
}
|
|
175
|
-
else if (avgFunctionLength > 100) {
|
|
176
|
-
score -= 0.2;
|
|
177
|
-
}
|
|
178
|
-
}
|
|
179
|
-
// Check for single responsibility (low coupling indicators)
|
|
180
|
-
const importCount = (code.match(/(?:import|require|from\s+['"])/g) || []).length;
|
|
181
|
-
if (importCount < 10) {
|
|
182
|
-
score += 0.1;
|
|
183
|
-
}
|
|
184
|
-
// Check for constants (uppercase naming)
|
|
185
|
-
if (/const\s+[A-Z_]+\s*=/.test(code)) {
|
|
186
|
-
score += 0.1;
|
|
187
|
-
}
|
|
188
|
-
// Penalize deeply nested code
|
|
189
|
-
const maxIndentation = Math.max(...lines.map((line) => {
|
|
190
|
-
const match = line.match(/^(\s*)/);
|
|
191
|
-
return match ? match[1].length : 0;
|
|
192
|
-
}));
|
|
193
|
-
if (maxIndentation > 20) {
|
|
194
|
-
score -= 0.15;
|
|
195
|
-
}
|
|
196
|
-
return Math.max(0, Math.min(1, score));
|
|
197
|
-
}
|
|
198
|
-
/**
|
|
199
|
-
* Calculate security score.
|
|
200
|
-
*/
|
|
201
|
-
function calculateSecurityScore(code) {
|
|
202
|
-
let score = 0.7; // Assume secure by default
|
|
203
|
-
// Check for potential injection vulnerabilities
|
|
204
|
-
const dangerousPatterns = [
|
|
205
|
-
/eval\s*\(/i,
|
|
206
|
-
/exec\s*\(/i,
|
|
207
|
-
/Function\s*\(/i,
|
|
208
|
-
/innerHTML\s*=/i,
|
|
209
|
-
/dangerouslySetInnerHTML/i,
|
|
210
|
-
/document\.write/i,
|
|
211
|
-
];
|
|
212
|
-
for (const pattern of dangerousPatterns) {
|
|
213
|
-
if (pattern.test(code)) {
|
|
214
|
-
score -= 0.15;
|
|
215
|
-
}
|
|
216
|
-
}
|
|
217
|
-
// Check for hardcoded secrets
|
|
218
|
-
if (/(?:password|secret|api[_-]?key|token)\s*=\s*['"][^'"]+['"]/i.test(code)) {
|
|
219
|
-
score -= 0.3;
|
|
220
|
-
}
|
|
221
|
-
// Check for SQL injection risks
|
|
222
|
-
if (/(?:SELECT|INSERT|UPDATE|DELETE)[\s\S]*?\$\{/.test(code)) {
|
|
223
|
-
score -= 0.2;
|
|
224
|
-
}
|
|
225
|
-
// Check for input validation
|
|
226
|
-
if (/(?:validate|sanitize|escape|parameterized)/i.test(code)) {
|
|
227
|
-
score += 0.1;
|
|
228
|
-
}
|
|
229
|
-
return Math.max(0, Math.min(1, score));
|
|
230
|
-
}
|
|
231
|
-
/**
 * Check for consistent indentation.
 *
 * Gathers the distinct non-zero leading-whitespace widths of all non-blank
 * lines and reports whether each one is a multiple of the smallest. Fewer
 * than two distinct widths is treated as consistent.
 *
 * @param {string[]} lines - Source lines to inspect.
 * @returns {boolean} True when every indentation width is a multiple of the smallest one.
 */
function checkIndentationConsistency(lines) {
    const widths = [];
    for (const text of lines) {
        // Blank and whitespace-only lines say nothing about indentation.
        if (text.trim() === '') {
            continue;
        }
        const leading = text.match(/^\s*/);
        const width = leading ? leading[0].length : 0;
        if (width > 0) {
            widths.push(width);
        }
    }
    const distinct = [...new Set(widths)].sort((left, right) => left - right);
    if (distinct.length < 2) {
        return true;
    }
    const [smallest] = distinct;
    return !distinct.some((width) => width % smallest !== 0);
}
|
|
254
|
-
/**
|
|
255
|
-
* Calculate a composite reward score from metrics.
|
|
256
|
-
*/
|
|
257
|
-
export function calculateRewardScore(metrics) {
|
|
258
|
-
const weights = {
|
|
259
|
-
codeQuality: 0.25,
|
|
260
|
-
efficiency: 0.2,
|
|
261
|
-
errorHandling: 0.2,
|
|
262
|
-
documentation: 0.15,
|
|
263
|
-
maintainability: 0.1,
|
|
264
|
-
security: 0.1,
|
|
265
|
-
};
|
|
266
|
-
return (metrics.codeQualityScore * weights.codeQuality +
|
|
267
|
-
metrics.algorithmEfficiency * weights.efficiency +
|
|
268
|
-
metrics.errorHandlingScore * weights.errorHandling +
|
|
269
|
-
metrics.documentationScore * weights.documentation +
|
|
270
|
-
metrics.maintainabilityScore * weights.maintainability +
|
|
271
|
-
metrics.securityScore * weights.security) * 100;
|
|
272
|
-
}
|
|
273
|
-
//# sourceMappingURL=codeEvaluator.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"codeEvaluator.js","sourceRoot":"","sources":["../../src/alpha-zero/codeEvaluator.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAIH;;GAEG;AACH,MAAM,UAAU,iBAAiB,CAAC,QAAgB;IAChD,MAAM,cAAc,GAAG,6BAA6B,CAAC;IACrD,MAAM,MAAM,GAAa,EAAE,CAAC;IAC5B,IAAI,KAAK,CAAC;IAEV,OAAO,CAAC,KAAK,GAAG,cAAc,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,KAAK,IAAI,EAAE,CAAC;QACxD,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,EAAE,IAAI,EAAE,CAAC;QAC9B,IAAI,IAAI,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC5B,MAAM,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QACpB,CAAC;IACH,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;;;;GAKG;AACH,MAAM,UAAU,mBAAmB,CAAC,IAAY;IAC9C,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC;IAC/B,MAAM,UAAU,GAAG,KAAK,CAAC,MAAM,CAAC;IAEhC,8BAA8B;IAC9B,MAAM,gBAAgB,GAAG,yBAAyB,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;IAChE,MAAM,mBAAmB,GAAG,wBAAwB,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;IAClE,MAAM,kBAAkB,GAAG,2BAA2B,CAAC,IAAI,CAAC,CAAC;IAC7D,MAAM,kBAAkB,GAAG,2BAA2B,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;IACpE,MAAM,oBAAoB,GAAG,6BAA6B,CAAC,IAAI,EAAE,KAAK,EAAE,UAAU,CAAC,CAAC;IACpF,MAAM,aAAa,GAAG,sBAAsB,CAAC,IAAI,CAAC,CAAC;IAEnD,OAAO;QACL,gBAAgB;QAChB,mBAAmB;QACnB,kBAAkB;QAClB,kBAAkB;QAClB,oBAAoB;QACpB,aAAa;KACd,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,yBAAyB,CAAC,IAAY,EAAE,KAAe;IAC9D,IAAI,KAAK,GAAG,GAAG,CAAC,CAAC,aAAa;IAE9B,mCAAmC;IACnC,MAAM,qBAAqB,GAAG,2BAA2B,CAAC,KAAK,CAAC,CAAC;IACjE,IAAI,qBAAqB,EAAE,CAAC;QAC1B,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,oCAAoC;IACpC,MAAM,SAAS,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAI,CAAC,MAAM,GAAG,GAAG,CAAC,CAAC,MAAM,CAAC;IACnE,IAAI,SAAS,GAAG,KAAK,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;QACnC,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yDAAyD;IACzD,IAAI,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACnD,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,kDAAkD;IAClD,IAAI,0DAA0D,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC1E,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yBAAyB;IACzB,MAAM,YAAY,GAAG,IAAI,CAAC,KAAK,CAAC,8BAA8B,CAAC,IAAI,EAAE,CAAC;IACtE,IAAI,YAAY,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC5B,KAAK,IAAI,GAAG,CAAC;IACf,CA
AC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,wBAAwB,CAAC,IAAY,EAAE,MAAgB;IAC9D,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,sCAAsC;IACtC,IAAI,2CAA2C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC3D,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,oDAAoD;IACpD,MAAM,WAAW,GACf,IAAI,CAAC,KAAK,CAAC,qCAAqC,CAAC,EAAE,MAAM,IAAI,CAAC,CAAC;IACjE,IAAI,WAAW,GAAG,CAAC,EAAE,CAAC;QACpB,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,mDAAmD;IACnD,IAAI,6BAA6B,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7C,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yCAAyC;IACzC,IAAI,+BAA+B,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC/C,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,yCAAyC;IACzC,IAAI,qCAAqC,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACrD,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,2BAA2B,CAAC,IAAY;IAC/C,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,6BAA6B;IAC7B,MAAM,aAAa,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IAC7D,IAAI,aAAa,GAAG,CAAC,EAAE,CAAC;QACtB,KAAK,IAAI,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,aAAa,EAAE,CAAC,CAAC,CAAC;IAC5C,CAAC;IAED,gCAAgC;IAChC,IAAI,8CAA8C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC9D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,kCAAkC;IAClC,MAAM,UAAU,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,6CAA6C,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IAC5F,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;QACnB,KAAK,IAAI,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,UAAU,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC;IAC7C,CAAC;IAED,0BAA0B;IAC1B,IAAI,+CAA+C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC/D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,qCAAqC;IACrC,IAAI,cAAc,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC9B,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,2BAA2B,CAAC,IAAY,EAAE,KAAe;IAChE,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,qCAAqC;IACrC,MAAM,WAAW,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,mDAAmD,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IACnG,IAAI,WAAW,GAAG,CAAC,EAAE,CAAC;QACpB,KAAK,IAA
I,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,WAAW,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC;IAC9C,CAAC;IAED,4BAA4B;IAC5B,MAAM,cAAc,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAC3C,iBAAiB,CAAC,IAAI,CAAC,IAAI,CAAC,CAC7B,CAAC,MAAM,CAAC;IACT,MAAM,YAAY,GAAG,cAAc,GAAG,KAAK,CAAC,MAAM,CAAC;IACnD,IAAI,YAAY,GAAG,IAAI,IAAI,YAAY,GAAG,GAAG,EAAE,CAAC;QAC9C,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,4DAA4D;IAC5D,IAAI,+DAA+D,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC/E,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,4DAA4D;IAC5D,MAAM,UAAU,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,iBAAiB,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IAChE,IAAI,UAAU,GAAG,KAAK,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;QACpC,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,6BAA6B,CACpC,IAAY,EACZ,KAAe,EACf,UAAkB;IAElB,IAAI,KAAK,GAAG,GAAG,CAAC;IAEhB,mDAAmD;IACnD,MAAM,eAAe,GAAG,IAAI,CAAC,KAAK,CAAC,2BAA2B,CAAC,IAAI,EAAE,CAAC;IACtE,IAAI,eAAe,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC/B,MAAM,iBAAiB,GAAG,UAAU,GAAG,eAAe,CAAC,MAAM,CAAC;QAC9D,IAAI,iBAAiB,GAAG,EAAE,EAAE,CAAC;YAC3B,KAAK,IAAI,GAAG,CAAC;QACf,CAAC;aAAM,IAAI,iBAAiB,GAAG,GAAG,EAAE,CAAC;YACnC,KAAK,IAAI,GAAG,CAAC;QACf,CAAC;IACH,CAAC;IAED,4DAA4D;IAC5D,MAAM,WAAW,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,iCAAiC,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC;IACjF,IAAI,WAAW,GAAG,EAAE,EAAE,CAAC;QACrB,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,yCAAyC;IACzC,IAAI,qBAAqB,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QACrC,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,8BAA8B;IAC9B,MAAM,cAAc,GAAG,IAAI,CAAC,GAAG,CAC7B,GAAG,KAAK,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE;QACpB,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC;QACnC,OAAO,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAE,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC;IACtC,CAAC,CAAC,CACH,CAAC;IACF,IAAI,cAAc,GAAG,EAAE,EAAE,CAAC;QACxB,KAAK,IAAI,IAAI,CAAC;IAChB,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,sBAAsB,CAAC,IAAY;IAC1C,IAAI,KAAK,GAAG,GAAG,CAAC,CAAC,2BAA2B;IAE5C,gDAAgD;IAChD,MAAM,iBAAiB,G
AAG;QACxB,YAAY;QACZ,YAAY;QACZ,gBAAgB;QAChB,gBAAgB;QAChB,0BAA0B;QAC1B,kBAAkB;KACnB,CAAC;IAEF,KAAK,MAAM,OAAO,IAAI,iBAAiB,EAAE,CAAC;QACxC,IAAI,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;YACvB,KAAK,IAAI,IAAI,CAAC;QAChB,CAAC;IACH,CAAC;IAED,8BAA8B;IAC9B,IAAI,6DAA6D,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7E,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,gCAAgC;IAChC,IAAI,6CAA6C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,6BAA6B;IAC7B,IAAI,6CAA6C,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7D,KAAK,IAAI,GAAG,CAAC;IACf,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AACzC,CAAC;AAED;;GAEG;AACH,SAAS,2BAA2B,CAAC,KAAe;IAClD,MAAM,WAAW,GAAG,IAAI,GAAG,EAAU,CAAC;IAEtC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,IAAI,IAAI,CAAC,IAAI,EAAE,CAAC,MAAM,KAAK,CAAC;YAAE,SAAS;QAEvC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC;QACnC,IAAI,KAAK,IAAI,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC;YACtB,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC;YAC7B,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;gBACb,WAAW,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;YACxB,CAAC;QACH,CAAC;IACH,CAAC;IAED,2DAA2D;IAC3D,MAAM,KAAK,GAAG,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;IAC5D,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC;QAAE,OAAO,IAAI,CAAC;IAElC,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;IACtB,OAAO,KAAK,CAAC,KAAK,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAK,GAAG,IAAK,KAAK,CAAC,CAAC,CAAC;AACpD,CAAC;AAED;;GAEG;AACH,MAAM,UAAU,oBAAoB,CAAC,OAA2B;IAC9D,MAAM,OAAO,GAAG;QACd,WAAW,EAAE,IAAI;QACjB,UAAU,EAAE,GAAG;QACf,aAAa,EAAE,GAAG;QAClB,aAAa,EAAE,IAAI;QACnB,eAAe,EAAE,GAAG;QACpB,QAAQ,EAAE,GAAG;KACd,CAAC;IAEF,OAAO,CACL,OAAO,CAAC,gBAAgB,GAAG,OAAO,CAAC,WAAW;QAC9C,OAAO,CAAC,mBAAmB,GAAG,OAAO,CAAC,UAAU;QAChD,OAAO,CAAC,kBAAkB,GAAG,OAAO,CAAC,aAAa;QAClD,OAAO,CAAC,kBAAkB,GAAG,OAAO,CAAC,aAAa;QAClD,OAAO,CAAC,oBAAoB,GAAG,OAAO,CAAC,eAAe;QACtD,OAAO,CAAC,aAAa,GAAG,OAAO,CAAC,QAAQ,CACzC,GAAG,GAAG,CAAC;AACV,CAAC"}
|
|
@@ -1,66 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Alpha Zero 2 - Competitive Agent Runner
|
|
3
|
-
*
|
|
4
|
-
* Runs competitive comparisons between two AI agents.
|
|
5
|
-
*
|
|
6
|
-
* Principal Investigator: Bo Shang
|
|
7
|
-
* Framework: erosolar-cli
|
|
8
|
-
*/
|
|
9
|
-
import type { CompetitionRoundResult, CompetitionStandings, TournamentConfig, TournamentResult, TournamentCallbacks, TournamentStatus } from './types.js';
|
|
10
|
-
import { AlphaZeroAgentWrapper } from './agentWrapper.js';
|
|
11
|
-
/**
 * Runs head-to-head comparisons between two wrapped agents and keeps the
 * per-round results so standings can be derived from them.
 */
export declare class CompetitiveAgentRunner {
    private readonly agent1;
    private readonly agent2;
    private readonly roundResults;
    /**
     * @param agent1 - First competitor.
     * @param agent2 - Second competitor.
     */
    constructor(agent1: AlphaZeroAgentWrapper, agent2: AlphaZeroAgentWrapper);
    /**
     * Gives the same prompt to both agents and compares what they produce.
     *
     * @param prompt - Prompt handed to each agent.
     * @param evaluateCode - Optional flag; presumably toggles code evaluation
     *   of the outputs — confirm against the implementation.
     * @returns A promise resolving to the result of this round.
     */
    runComparison(prompt: string, evaluateCode?: boolean): Promise<CompetitionRoundResult>;
    /**
     * Internal helper that runs one agent and returns its result.
     */
    private runAgent;
    /**
     * @returns The current competition standings.
     */
    getStandings(): CompetitionStandings;
    /**
     * @returns Every round result recorded so far.
     */
    getRoundResults(): CompetitionRoundResult[];
    /**
     * Clears the recorded competition history.
     */
    reset(): void;
}
|
|
40
|
-
/**
 * Drives a multi-round tournament between two wrapped agents and exposes
 * its status and final result.
 */
export declare class TournamentRunner {
    private readonly agent1;
    private readonly agent2;
    private status;
    private currentResult;
    /**
     * @param agent1 - First competitor.
     * @param agent2 - Second competitor.
     */
    constructor(agent1: AlphaZeroAgentWrapper, agent2: AlphaZeroAgentWrapper);
    /**
     * Runs a tournament described by `config`.
     *
     * @param config - Tournament configuration.
     * @param callbacks - Optional tournament callbacks.
     * @returns A promise resolving to the tournament result.
     */
    run(config: TournamentConfig, callbacks?: TournamentCallbacks): Promise<TournamentResult>;
    /**
     * @returns The tournament's current status.
     */
    getStatus(): TournamentStatus;
    /**
     * @returns The tournament result if the tournament has completed, otherwise `null`.
     */
    getResult(): TournamentResult | null;
}
|
|
62
|
-
/**
 * Builds a textual summary of a tournament's results.
 *
 * @param result - The tournament result to summarise.
 * @returns The summary as a string.
 */
export declare function formatTournamentSummary(result: TournamentResult): string;
|
|
66
|
-
//# sourceMappingURL=competitiveRunner.d.ts.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"competitiveRunner.d.ts","sourceRoot":"","sources":["../../src/alpha-zero/competitiveRunner.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAEH,OAAO,KAAK,EACV,sBAAsB,EACtB,oBAAoB,EACpB,gBAAgB,EAChB,gBAAgB,EAChB,mBAAmB,EACnB,gBAAgB,EACjB,MAAM,YAAY,CAAC;AACpB,OAAO,EAAE,qBAAqB,EAAE,MAAM,mBAAmB,CAAC;AAG1D;;GAEG;AACH,qBAAa,sBAAsB;IACjC,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAgC;gBAEjD,MAAM,EAAE,qBAAqB,EAAE,MAAM,EAAE,qBAAqB;IAKxE;;OAEG;IACG,aAAa,CAAC,MAAM,EAAE,MAAM,EAAE,YAAY,UAAO,GAAG,OAAO,CAAC,sBAAsB,CAAC;IAqDzF;;OAEG;YACW,QAAQ;IAgCtB;;OAEG;IACH,YAAY,IAAI,oBAAoB;IA0BpC;;OAEG;IACH,eAAe,IAAI,sBAAsB,EAAE;IAI3C;;OAEG;IACH,KAAK,IAAI,IAAI;CAGd;AAED;;GAEG;AACH,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAwB;IAC/C,OAAO,CAAC,MAAM,CAA+B;IAC7C,OAAO,CAAC,aAAa,CAAiC;gBAE1C,MAAM,EAAE,qBAAqB,EAAE,MAAM,EAAE,qBAAqB;IAKxE;;OAEG;IACG,GAAG,CAAC,MAAM,EAAE,gBAAgB,EAAE,SAAS,CAAC,EAAE,mBAAmB,GAAG,OAAO,CAAC,gBAAgB,CAAC;IA2C/F;;OAEG;IACH,SAAS,IAAI,gBAAgB;IAI7B;;OAEG;IACH,SAAS,IAAI,gBAAgB,GAAG,IAAI;CAGrC;AAED;;GAEG;AACH,wBAAgB,uBAAuB,CAAC,MAAM,EAAE,gBAAgB,GAAG,MAAM,CAyBxE"}
|