npm - testchimp-runner-core - Versions diffs - 0.0.34 → 0.0.35 - Mend

testchimp-runner-core 0.0.34 → 0.0.35

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (114) hide show

package/dist/execution-service.d.ts +1 -4
package/dist/execution-service.d.ts.map +1 -1
package/dist/execution-service.js +155 -468
package/dist/execution-service.js.map +1 -1
package/dist/index.d.ts +3 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +11 -1
package/dist/index.js.map +1 -1
package/dist/orchestrator/decision-parser.d.ts +18 -0
package/dist/orchestrator/decision-parser.d.ts.map +1 -0
package/dist/orchestrator/decision-parser.js +127 -0
package/dist/orchestrator/decision-parser.js.map +1 -0
package/dist/orchestrator/index.d.ts +4 -2
package/dist/orchestrator/index.d.ts.map +1 -1
package/dist/orchestrator/index.js +14 -2
package/dist/orchestrator/index.js.map +1 -1
package/dist/orchestrator/orchestrator-agent.d.ts +17 -14
package/dist/orchestrator/orchestrator-agent.d.ts.map +1 -1
package/dist/orchestrator/orchestrator-agent.js +534 -204
package/dist/orchestrator/orchestrator-agent.js.map +1 -1
package/dist/orchestrator/orchestrator-prompts.d.ts +14 -2
package/dist/orchestrator/orchestrator-prompts.d.ts.map +1 -1
package/dist/orchestrator/orchestrator-prompts.js +529 -247
package/dist/orchestrator/orchestrator-prompts.js.map +1 -1
package/dist/orchestrator/page-som-handler.d.ts +106 -0
package/dist/orchestrator/page-som-handler.d.ts.map +1 -0
package/dist/orchestrator/page-som-handler.js +1353 -0
package/dist/orchestrator/page-som-handler.js.map +1 -0
package/dist/orchestrator/som-types.d.ts +149 -0
package/dist/orchestrator/som-types.d.ts.map +1 -0
package/dist/orchestrator/som-types.js +87 -0
package/dist/orchestrator/som-types.js.map +1 -0
package/dist/orchestrator/tool-registry.d.ts +2 -0
package/dist/orchestrator/tool-registry.d.ts.map +1 -1
package/dist/orchestrator/tool-registry.js.map +1 -1
package/dist/orchestrator/tools/index.d.ts +4 -1
package/dist/orchestrator/tools/index.d.ts.map +1 -1
package/dist/orchestrator/tools/index.js +7 -2
package/dist/orchestrator/tools/index.js.map +1 -1
package/dist/orchestrator/tools/refresh-som-markers.d.ts +12 -0
package/dist/orchestrator/tools/refresh-som-markers.d.ts.map +1 -0
package/dist/orchestrator/tools/refresh-som-markers.js +64 -0
package/dist/orchestrator/tools/refresh-som-markers.js.map +1 -0
package/dist/orchestrator/tools/view-previous-screenshot.d.ts +15 -0
package/dist/orchestrator/tools/view-previous-screenshot.d.ts.map +1 -0
package/dist/orchestrator/tools/view-previous-screenshot.js +92 -0
package/dist/orchestrator/tools/view-previous-screenshot.js.map +1 -0
package/dist/orchestrator/types.d.ts +23 -1
package/dist/orchestrator/types.d.ts.map +1 -1
package/dist/orchestrator/types.js +11 -1
package/dist/orchestrator/types.js.map +1 -1
package/dist/scenario-service.d.ts +5 -0
package/dist/scenario-service.d.ts.map +1 -1
package/dist/scenario-service.js +17 -0
package/dist/scenario-service.js.map +1 -1
package/dist/scenario-worker-class.d.ts +4 -0
package/dist/scenario-worker-class.d.ts.map +1 -1
package/dist/scenario-worker-class.js +18 -3
package/dist/scenario-worker-class.js.map +1 -1
package/dist/testing/agent-tester.d.ts +35 -0
package/dist/testing/agent-tester.d.ts.map +1 -0
package/dist/testing/agent-tester.js +84 -0
package/dist/testing/agent-tester.js.map +1 -0
package/dist/testing/ref-translator-tester.d.ts +44 -0
package/dist/testing/ref-translator-tester.d.ts.map +1 -0
package/dist/testing/ref-translator-tester.js +104 -0
package/dist/testing/ref-translator-tester.js.map +1 -0
package/dist/utils/hierarchical-selector.d.ts +47 -0
package/dist/utils/hierarchical-selector.d.ts.map +1 -0
package/dist/utils/hierarchical-selector.js +212 -0
package/dist/utils/hierarchical-selector.js.map +1 -0
package/dist/utils/page-info-retry.d.ts +14 -0
package/dist/utils/page-info-retry.d.ts.map +1 -0
package/dist/utils/page-info-retry.js +60 -0
package/dist/utils/page-info-retry.js.map +1 -0
package/dist/utils/page-info-utils.d.ts +1 -0
package/dist/utils/page-info-utils.d.ts.map +1 -1
package/dist/utils/page-info-utils.js +46 -18
package/dist/utils/page-info-utils.js.map +1 -1
package/dist/utils/ref-attacher.d.ts +21 -0
package/dist/utils/ref-attacher.d.ts.map +1 -0
package/dist/utils/ref-attacher.js +149 -0
package/dist/utils/ref-attacher.js.map +1 -0
package/dist/utils/ref-translator.d.ts +49 -0
package/dist/utils/ref-translator.d.ts.map +1 -0
package/dist/utils/ref-translator.js +276 -0
package/dist/utils/ref-translator.js.map +1 -0
package/package.json +1 -1
package/plandocs/exploratory-mode-support-v2.plan.md +953 -0
package/plandocs/exploratory-mode-support.plan.md +928 -0
package/plandocs/journey-id-tracking-addendum.md +227 -0
package/src/execution-service.ts +179 -596
package/src/index.ts +10 -0
package/src/orchestrator/decision-parser.ts +139 -0
package/src/orchestrator/index.ts +25 -1
package/src/orchestrator/orchestrator-agent.ts +656 -236
package/src/orchestrator/orchestrator-prompts.ts +559 -247
package/src/orchestrator/page-som-handler.ts +1565 -0
package/src/orchestrator/som-types.ts +188 -0
package/src/orchestrator/tool-registry.ts +2 -0
package/src/orchestrator/tools/index.ts +4 -1
package/src/orchestrator/tools/refresh-som-markers.ts +69 -0
package/src/orchestrator/tools/view-previous-screenshot.ts +103 -0
package/src/orchestrator/types.ts +49 -6
package/src/scenario-service.ts +20 -0
package/src/scenario-worker-class.ts +24 -3
package/src/utils/page-info-retry.ts +65 -0
package/src/utils/page-info-utils.ts +53 -18
package/testchimp-runner-core-0.0.35.tgz +0 -0
package/src/orchestrator/orchestrator-agent.ts.backup +0 -1386
package/testchimp-runner-core-0.0.33.tgz +0 -0
/package/{RELEASE_0.0.26.md → releasenotes/RELEASE_0.0.26.md} +0 -0
/package/{RELEASE_0.0.27.md → releasenotes/RELEASE_0.0.27.md} +0 -0
/package/{RELEASE_0.0.28.md → releasenotes/RELEASE_0.0.28.md} +0 -0

package/src/index.ts CHANGED Viewed

@@ -45,6 +45,7 @@ export {
   SelfReflection,
   ToolCall,
   ToolResult,
+  ExplorationMode,
   DEFAULT_AGENT_CONFIG,
   // Tools (information-gathering only)
   TakeScreenshotTool,
@@ -58,6 +59,9 @@ export {
 export * from './types';
 export { PageInfo, InteractiveElement } from './utils/page-info-utils';
+// Model constants
+export { DEFAULT_MODEL, DEFAULT_SIMPLER_MODEL, VISION_MODEL } from './model-constants';
 // Authentication
 export * from './auth-config';
@@ -359,6 +363,12 @@ export class TestChimpService {
     return this.executeScript(repairRequest);
   }
+  /**
+   * Exploration mode execution.
+   *
+   * Forwards its three arguments, unchanged and in the same order, to
+   * `this.scenarioService.executeExploration` and returns that call's result.
+   * No validation or transformation happens in this method.
+   *
+   * @param page - Passed through as the first argument; typed `any` here
+   *   (presumably a browser page handle — confirm against the scenario service).
+   * @param explorationConfig - Passed through as the second argument; typed `any` here.
+   * @param jobId - Passed through as the third argument.
+   * @returns The value produced by the delegated `executeExploration` call.
+   */
+  async executeExploration(page: any, explorationConfig: any, jobId: string): Promise<any> {
+    // Delegate to scenario service's orchestrator
+    return this.scenarioService.executeExploration(page, explorationConfig, jobId);
+  }
   // Credit usage reporting methods
   async reportScriptGenerationCredit(jobId?: string): Promise<void> {
     return this.creditUsageService.reportScriptGenerationCredit(jobId);

package/src/orchestrator/decision-parser.ts ADDED Viewed

@@ -0,0 +1,139 @@
+/**
+ * Decision Parser Utility
+ * Parses and validates agent decisions from LLM responses
+ */
+import { AgentDecision } from './types';
+import { isSomVerification, isSomCommand } from './som-types';
+/**
+ * Turns raw LLM text into an AgentDecision and writes decisions to an optional logger.
+ *
+ * Both methods are safe to call without a logger: every log call is optional-chained.
+ */
+export class DecisionParser {
+  /** Longest command preview, in characters, written to the log before truncation. */
+  private static readonly COMMAND_PREVIEW_LENGTH = 80;
+  /** Number of commands listed individually by log(); the rest are summarised as a count. */
+  private static readonly MAX_LOGGED_COMMANDS = 3;
+  private logger?: (message: string, level?: 'log' | 'error' | 'warn') => void;
+  /**
+   * @param logger - Optional sink for diagnostic messages; when omitted nothing is logged.
+   */
+  constructor(logger?: (message: string, level?: 'log' | 'error' | 'warn') => void) {
+    this.logger = logger;
+  }
+  /**
+   * Shorten text for a single log line, appending "..." only when characters were dropped.
+   */
+  private static preview(text: string): string {
+    const limit = DecisionParser.COMMAND_PREVIEW_LENGTH;
+    return text.length > limit ? `${text.substring(0, limit)}...` : text;
+  }
+  /**
+   * Parse agent decision from LLM response.
+   *
+   * Takes the span from the first "{" to the last "}" in the response, parses it as JSON,
+   * and requires a truthy `status` plus at least one of `reasoning` / `statusReasoning`.
+   * When only `statusReasoning` is present it is copied into `reasoning`.
+   *
+   * @param response - Raw text returned by the LLM.
+   * @returns The parsed object cast to AgentDecision (fields beyond those above are not
+   *   validated), or a fallback decision with status 'stuck' when extraction, parsing
+   *   or validation fails. This method never throws to the caller.
+   */
+  parse(response: string): AgentDecision {
+    // Records whether the raw response has already been written to the log, so the
+    // catch block does not have to guess that from the wording of the error message
+    // (a JSON.parse SyntaxError may quote arbitrary response text).
+    let responseLogged = false;
+    try {
+      // Extract JSON from response
+      const jsonMatch = response.match(/\{[\s\S]*\}/);
+      if (!jsonMatch) {
+        this.logger?.(`[DecisionParser] ✗ No JSON found in LLM response`, 'error');
+        this.logger?.(`[DecisionParser] 📄 FULL LLM RESPONSE:\n${response}`, 'error');
+        responseLogged = true;
+        throw new Error('No JSON found in response');
+      }
+      const parsed = JSON.parse(jsonMatch[0]);
+      // Validate required fields
+      // Accept either "reasoning" or "statusReasoning" (LLMs sometimes only provide one)
+      if (!parsed.status || (!parsed.reasoning && !parsed.statusReasoning)) {
+        this.logger?.(`[DecisionParser] ✗ Missing required fields in parsed JSON`, 'error');
+        this.logger?.(`[DecisionParser] 📄 FULL LLM RESPONSE:\n${response}`, 'error');
+        this.logger?.(`[DecisionParser] 📄 PARSED JSON:\n${JSON.stringify(parsed, null, 2)}`, 'error');
+        this.logger?.(`[DecisionParser] ❌ Has status: ${!!parsed.status}, Has reasoning: ${!!parsed.reasoning}, Has statusReasoning: ${!!parsed.statusReasoning}`, 'error');
+        responseLogged = true;
+        throw new Error('Missing required fields: status and (reasoning or statusReasoning)');
+      }
+      // Normalize: if reasoning is missing but statusReasoning exists, use statusReasoning as reasoning
+      if (!parsed.reasoning && parsed.statusReasoning) {
+        parsed.reasoning = parsed.statusReasoning;
+      }
+      return parsed as AgentDecision;
+    } catch (error: any) {
+      // Anything can be thrown in JavaScript; fall back to String() when there is no message.
+      const message = error?.message ?? String(error);
+      this.logger?.(`[DecisionParser] ✗ Failed to parse agent decision: ${message}`, 'error');
+      // Only log full response if not already logged above
+      if (!responseLogged) {
+        this.logger?.(`[DecisionParser] 📄 FULL LLM RESPONSE:\n${response}`, 'error');
+      }
+      // Return fallback
+      return {
+        status: 'stuck',
+        statusReasoning: 'Failed to parse agent response',
+        reasoning: `Parse error: ${message}`
+      };
+    }
+  }
+  /**
+   * Log agent decision for debugging.
+   *
+   * Emits the reasoning, then each optional section that is present: self-reflection,
+   * tool calls, blocker, step re-evaluation, the first few commands, and any
+   * meta-learning suggestion. The decision is only read, never modified.
+   *
+   * @param decision - Decision to describe; typically the value returned by parse().
+   * @param iteration - Not used by this method; kept so existing callers keep compiling.
+   */
+  log(decision: AgentDecision, iteration: number): void {
+    this.logger?.(`[Orchestrator] 💭 REASONING: ${decision.reasoning}`);
+    if (decision.selfReflection) {
+      this.logger?.(`[Orchestrator] 🧠 SELF-REFLECTION:`);
+      this.logger?.(`[Orchestrator]    Next: ${decision.selfReflection.guidanceForNext}`);
+      if (decision.selfReflection.detectingLoop) {
+        this.logger?.(`[Orchestrator]    🔄 LOOP DETECTED: ${decision.selfReflection.loopReasoning}`, 'warn');
+      }
+    }
+    if (decision.toolCalls && decision.toolCalls.length > 0) {
+      this.logger?.(`[Orchestrator] 🔧 TOOLS: ${decision.toolCalls.map(t => t.name).join(', ')}`);
+      if (decision.toolReasoning) {
+        this.logger?.(`[Orchestrator] 📋 Why: ${decision.toolReasoning}`);
+      }
+    }
+    if (decision.blockerDetected) {
+      // parse() casts unvalidated LLM JSON, so clearingCommands may be missing at runtime;
+      // a logging helper must not throw because of that.
+      const clearingCount = decision.blockerDetected.clearingCommands?.length ?? 0;
+      this.logger?.(`[Orchestrator] 🚧 BLOCKER: ${decision.blockerDetected.description}`, 'warn');
+      this.logger?.(`[Orchestrator] 🧹 Clearing with ${clearingCount} command(s)`);
+    }
+    if (decision.stepReEvaluation?.detected) {
+      this.logger?.(`[Orchestrator] 🔍 STEP RE-EVALUATION: ${decision.stepReEvaluation.issue}`, 'warn');
+      this.logger?.(`[Orchestrator] 📝 Explanation: ${decision.stepReEvaluation.explanation}`);
+    }
+    if (decision.commands && decision.commands.length > 0) {
+      const listed = DecisionParser.MAX_LOGGED_COMMANDS;
+      this.logger?.(`[Orchestrator] 📝 COMMANDS (${decision.commands.length}):`);
+      decision.commands.slice(0, listed).forEach((cmd: any, i) => {
+        // Handle string commands (standard mode), SomCommand, and SomVerification objects
+        if (typeof cmd === 'string') {
+          this.logger?.(`[Orchestrator]    ${i + 1}. ${DecisionParser.preview(cmd)}`);
+        } else if (isSomVerification(cmd)) {
+          const ref = cmd.elementRef || cmd.selector || 'unknown';
+          this.logger?.(`[Orchestrator]    ${i + 1}. [VERIFY] ${cmd.verificationType} on ${ref}: ${cmd.expected}`);
+        } else if (isSomCommand(cmd)) {
+          this.logger?.(`[Orchestrator]    ${i + 1}. [ACTION] ${cmd.action} on ${cmd.elementRef || 'coord'}`);
+        } else {
+          // JSON.stringify yields undefined for values such as undefined or functions.
+          const serialized = JSON.stringify(cmd) ?? String(cmd);
+          this.logger?.(`[Orchestrator]    ${i + 1}. ${DecisionParser.preview(serialized)}`);
+        }
+      });
+      if (decision.commands.length > listed) {
+        this.logger?.(`[Orchestrator]    ... and ${decision.commands.length - listed} more`);
+      }
+      if (decision.commandReasoning) {
+        this.logger?.(`[Orchestrator] 💡 Why: ${decision.commandReasoning}`);
+      }
+    }
+    // Log meta-learning suggestions with clear demarcations
+    if (decision.debugInfo?.suggestedPromptUpdates) {
+      this.logger?.(``, 'warn');
+      this.logger?.(`═══════════════════════════════════════════════════════════════`, 'warn');
+      this.logger?.(`[Orchestrator] 🧠 META-LEARNING SUGGESTION FROM AGENT`, 'warn');
+      this.logger?.(`═══════════════════════════════════════════════════════════════`, 'warn');
+      this.logger?.(``, 'warn');
+      this.logger?.(`SUGGESTED PROMPT UPDATE:`, 'warn');
+      this.logger?.(`  ${decision.debugInfo.suggestedPromptUpdates}`, 'warn');
+      this.logger?.(``, 'warn');
+      if (decision.debugInfo.reasoning) {
+        this.logger?.(`REASONING:`, 'warn');
+        this.logger?.(`  ${decision.debugInfo.reasoning}`, 'warn');
+        this.logger?.(``, 'warn');
+      }
+      this.logger?.(`═══════════════════════════════════════════════════════════════`, 'warn');
+      this.logger?.(``, 'warn');
+    }
+  }
+}

package/src/orchestrator/index.ts CHANGED Viewed

@@ -5,12 +5,17 @@
 // Core orchestrator
 export { OrchestratorAgent } from './orchestrator-agent';
+// SoM (Set-of-Marks) handler
+export { PageSoMHandler } from './page-som-handler';
 // Tool system
 export { ToolRegistry, Tool, ToolParameter, ToolExecutionContext } from './tool-registry';
-// 6 information-gathering tools (state changes via Playwright commands)
+// 8 information-gathering tools (state changes via Playwright commands)
 export {
   TakeScreenshotTool,
+  ViewPreviousScreenshotTool,
+  RefreshSomMarkersTool,
   RecallHistoryTool,
   InspectPageTool,
   CheckPageReadyTool,
@@ -29,6 +34,25 @@ export {
   SelfReflection,
   ToolCall,
   ToolResult,
+  ExplorationMode,
   DEFAULT_AGENT_CONFIG
 } from './types';
+// SoM Types
+export {
+  SomCommand,
+  SomElement,
+  SemanticCommandResult,
+  CommandRunStatus,
+  CommandAttempt,
+  DomMutation,
+  InteractionAction,
+  Coordinate,
+  TypedSelector,
+  SomVerification,
+  VerificationType,
+  SomCommandOrVerification,
+  isSomVerification,
+  isSomCommand
+} from './som-types';