npm - testchimp-runner-core - Versions diffs - 0.0.35 → 0.0.37 - Mend

testchimp-runner-core 0.0.35 → 0.0.37

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (81)

package/dist/orchestrator/orchestrator-agent.d.ts.map +1 -1
package/dist/orchestrator/orchestrator-agent.js +7 -4
package/dist/orchestrator/orchestrator-agent.js.map +1 -1
package/dist/orchestrator/orchestrator-prompts.d.ts.map +1 -1
package/dist/orchestrator/orchestrator-prompts.js +73 -15
package/dist/orchestrator/orchestrator-prompts.js.map +1 -1
package/dist/orchestrator/page-som-handler.d.ts +1 -2
package/dist/orchestrator/page-som-handler.d.ts.map +1 -1
package/dist/orchestrator/page-som-handler.js +51 -25
package/dist/orchestrator/page-som-handler.js.map +1 -1
package/package.json +6 -1
package/plandocs/BEFORE_AFTER_VERIFICATION.md +0 -148
package/plandocs/COORDINATE_MODE_DIAGNOSIS.md +0 -144
package/plandocs/CREDIT_CALLBACK_ARCHITECTURE.md +0 -253
package/plandocs/HUMAN_LIKE_IMPROVEMENTS.md +0 -642
package/plandocs/IMPLEMENTATION_STATUS.md +0 -108
package/plandocs/INTEGRATION_COMPLETE.md +0 -322
package/plandocs/MULTI_AGENT_ARCHITECTURE_REVIEW.md +0 -844
package/plandocs/ORCHESTRATOR_MVP_SUMMARY.md +0 -539
package/plandocs/PHASE1_ABSTRACTION_COMPLETE.md +0 -241
package/plandocs/PHASE1_FINAL_STATUS.md +0 -210
package/plandocs/PHASE_1_COMPLETE.md +0 -165
package/plandocs/PHASE_1_SUMMARY.md +0 -184
package/plandocs/PLANNING_SESSION_SUMMARY.md +0 -372
package/plandocs/PROMPT_OPTIMIZATION_ANALYSIS.md +0 -120
package/plandocs/PROMPT_SANITY_CHECK.md +0 -120
package/plandocs/SCRIPT_CLEANUP_FEATURE.md +0 -201
package/plandocs/SCRIPT_GENERATION_ARCHITECTURE.md +0 -364
package/plandocs/SELECTOR_IMPROVEMENTS.md +0 -139
package/plandocs/SESSION_SUMMARY_v0.0.33.md +0 -151
package/plandocs/TROUBLESHOOTING_SESSION.md +0 -72
package/plandocs/VISION_DIAGNOSTICS_IMPROVEMENTS.md +0 -336
package/plandocs/VISUAL_AGENT_EVOLUTION_PLAN.md +0 -396
package/plandocs/WHATS_NEW_v0.0.33.md +0 -183
package/plandocs/exploratory-mode-support-v2.plan.md +0 -953
package/plandocs/exploratory-mode-support.plan.md +0 -928
package/plandocs/journey-id-tracking-addendum.md +0 -227
package/releasenotes/RELEASE_0.0.26.md +0 -165
package/releasenotes/RELEASE_0.0.27.md +0 -236
package/releasenotes/RELEASE_0.0.28.md +0 -286
package/src/auth-config.ts +0 -84
package/src/credit-usage-service.ts +0 -188
package/src/env-loader.ts +0 -103
package/src/execution-service.ts +0 -996
package/src/file-handler.ts +0 -104
package/src/index.ts +0 -432
package/src/llm-facade.ts +0 -821
package/src/llm-provider.ts +0 -53
package/src/model-constants.ts +0 -35
package/src/orchestrator/decision-parser.ts +0 -139
package/src/orchestrator/index.ts +0 -58
package/src/orchestrator/orchestrator-agent.ts +0 -1282
package/src/orchestrator/orchestrator-prompts.ts +0 -786
package/src/orchestrator/page-som-handler.ts +0 -1565
package/src/orchestrator/som-types.ts +0 -188
package/src/orchestrator/tool-registry.ts +0 -184
package/src/orchestrator/tools/check-page-ready.ts +0 -75
package/src/orchestrator/tools/extract-data.ts +0 -92
package/src/orchestrator/tools/index.ts +0 -15
package/src/orchestrator/tools/inspect-page.ts +0 -42
package/src/orchestrator/tools/recall-history.ts +0 -72
package/src/orchestrator/tools/refresh-som-markers.ts +0 -69
package/src/orchestrator/tools/take-screenshot.ts +0 -128
package/src/orchestrator/tools/verify-action-result.ts +0 -159
package/src/orchestrator/tools/view-previous-screenshot.ts +0 -103
package/src/orchestrator/types.ts +0 -291
package/src/playwright-mcp-service.ts +0 -224
package/src/progress-reporter.ts +0 -144
package/src/prompts.ts +0 -842
package/src/providers/backend-proxy-llm-provider.ts +0 -91
package/src/providers/local-llm-provider.ts +0 -38
package/src/scenario-service.ts +0 -252
package/src/scenario-worker-class.ts +0 -1110
package/src/script-utils.ts +0 -203
package/src/types.ts +0 -239
package/src/utils/browser-utils.ts +0 -348
package/src/utils/coordinate-converter.ts +0 -162
package/src/utils/page-info-retry.ts +0 -65
package/src/utils/page-info-utils.ts +0 -285
package/testchimp-runner-core-0.0.35.tgz +0 -0
package/tsconfig.json +0 -19

package/src/script-utils.ts DELETED

@@ -1,203 +0,0 @@
-/**
- * Script Generation Utilities
- *
- * This module provides utilities for generating and formatting test scripts
- * with TestChimp-specific markers and comments.
- */
-/**
- * TestChimp smart test comment that should be added to all generated scripts
- */
-export const TESTCHIMP_SMART_COMMENT = `/*
-This is a TestChimp Smart Test.
-Version: 1.0
-*/`;
-/**
- * Generates TestChimp smart test comment with optional repair advice and hashtags
- * @param repairAdvice Optional repair advice to include in the comment
- * @param hashtags Optional hashtags for semantic grouping
- * @returns The complete comment block
- */
-export function generateTestChimpComment(repairAdvice?: string, hashtags?: string[]): string {
-  const hashtagString = hashtags ? hashtags.map(tag => tag.startsWith('#') ? tag : `#${tag}`).join(' ') : '';
-  if (repairAdvice) {
-    return `/*
-This is a TestChimp Smart Test.
-Version: 1.0
-${hashtagString}
-Repair Advice:
-${repairAdvice}
-*/`;
-  }
-  return `/*
-This is a TestChimp Smart Test.
-Version: 1.0
-${hashtagString}
-*/`;
-}
-/**
- * Extracts hashtags from an existing TestChimp comment
- * @param script The script content containing the comment
- * @returns Array of hashtags found in the comment
- */
-export function extractHashtagsFromComment(script: string): string[] {
-  const commentMatch = script.match(/\/\*[\s\S]*?This is a TestChimp (Managed|Smart) Test\.[\s\S]*?\*\//);
-  if (!commentMatch) {
-    return [];
-  }
-  const comment = commentMatch[0];
-  // Look for any line in the comment that starts with #
-  const hashtags: string[] = [];
-  const lines = comment.split('\n');
-  for (const line of lines) {
-    const trimmedLine = line.trim();
-    if (trimmedLine.startsWith('#')) {
-      // Extract hashtags from this line
-      const lineHashtags = trimmedLine.match(/#\w+/g) || [];
-      hashtags.push(...lineHashtags);
-    }
-  }
-  return hashtags;
-}
-/**
- * Adds the TestChimp smart test comment to the beginning of a script
- * @param script The original script content
- * @param repairAdvice Optional repair advice to include in the comment
- * @param hashtags Optional hashtags for semantic grouping
- * @returns The script with TestChimp comment prepended
- */
-export function addTestChimpComment(script: string, repairAdvice?: string, hashtags?: string[]): string {
-  // If the script already has the TestChimp comment, update it with repair advice if provided
-  // Prioritize Smart Test detection, fallback to Managed Test for backward compatibility
-  if (script.includes('This is a TestChimp Smart Test') || script.includes('This is a TestChimp Managed Test')) {
-    if (repairAdvice) {
-      // Extract existing hashtags from the current comment
-      const existingHashtags = extractHashtagsFromComment(script);
-      // Use existing hashtags if no new ones provided, otherwise use new ones
-      const finalHashtags = hashtags && hashtags.length > 0 ? hashtags : existingHashtags;
-      // Replace existing comment with new one that includes repair advice and preserved hashtags
-      const commentRegex = /\/\*[\s\S]*?This is a TestChimp (Managed|Smart) Test\.[\s\S]*?\*\//;
-      const newComment = generateTestChimpComment(repairAdvice, finalHashtags);
-      return script.replace(commentRegex, newComment);
-    }
-    return script;
-  }
-  // Add the comment at the beginning of the script
-  const comment = generateTestChimpComment(repairAdvice, hashtags);
-  return `${comment}\n\n${script}`;
-}
-/**
- * Generates a complete test script with TestChimp comment, imports, and test structure
- * @param testName The name of the test
- * @param steps Array of test steps with descriptions and commands
- * @param repairAdvice Optional repair advice to include in the comment
- * @param hashtags Optional hashtags for semantic grouping
- * @returns The complete test script
- */
-export function generateTestScript(
-  testName: string,
-  steps: Array<{
-    stepNumber: number;
-    description: string;
-    playwrightCommand?: string;
-    playwrightCommands?: string[];
-    success?: boolean;
-    error?: string;
-  }>,
-  repairAdvice?: string,
-  hashtags?: string[]
-): string {
-  const scriptLines: string[] = [];
-  // Always add TestChimp comment
-  const comment = generateTestChimpComment(repairAdvice, hashtags);
-  scriptLines.push(comment);
-  scriptLines.push('');
-  // Add imports
-  scriptLines.push(`import { test, expect } from '@playwright/test';`);
-  // Add test structure
-  scriptLines.push(`test('${testName.replace(/'/g, "\\'")}', async ({ page, browser, context }) => {`);
-  // Add steps
-  for (const step of steps) {
-    // Check if step was skipped
-    const isSkipped = step.error?.includes('Skipped due to') ||
-                     (step.success === false && (!step.playwrightCommand && (!step.playwrightCommands || step.playwrightCommands.length === 0)));
-    if (isSkipped) {
-      // Step was skipped due to previous failures
-      scriptLines.push(`  // ${step.description} [SKIPPED]`);
-    } else if (step.success === false) {
-      // Step failed - only show command if this step actually attempted any commands
-      if (step.playwrightCommands && step.playwrightCommands.length > 0) {
-        // Failed after attempting commands - show them
-        scriptLines.push(`  // ${step.description} [FAILED]`);
-        step.playwrightCommands.forEach((cmd: string) => {
-          scriptLines.push(`  // Attempted: ${cmd}`);
-        });
-      } else if (step.playwrightCommand) {
-        // Single command attempted (backward compatibility)
-        scriptLines.push(`  // ${step.description} [FAILED] - ${step.playwrightCommand}`);
-      } else {
-        // Failed without attempting any commands
-        scriptLines.push(`  // ${step.description} [FAILED]`);
-      }
-    } else {
-      // Step succeeded or in progress
-      // Only add comment if step has commands to show
-      const hasCommands = (step.playwrightCommands && step.playwrightCommands.length > 0) || step.playwrightCommand;
-      if (hasCommands) {
-        scriptLines.push(`  // ${step.description}`);
-        // Handle multiple commands per step
-        if (step.playwrightCommands && step.playwrightCommands.length > 0) {
-          // Multiple commands - output all of them
-          step.playwrightCommands.forEach((cmd: string) => {
-            scriptLines.push(`  ${cmd}`);
-          });
-        } else if (step.playwrightCommand) {
-          // Single command (backward compatibility)
-          scriptLines.push(`  ${step.playwrightCommand}`);
-        }
-      }
-      // If step has no commands, skip it entirely (work was done in previous step)
-    }
-  }
-  scriptLines.push(`});`);
-  return scriptLines.join('\n');
-}
-/**
- * Checks if a script is a TestChimp managed/smart test
- * Prioritizes detection of "Smart Test" format while maintaining backward compatibility with "Managed Test"
- * @param script The script content to check
- * @returns True if the script contains the TestChimp smart/managed test comment
- */
-export function isTestChimpManagedTest(script: string): boolean {
-  // Prioritize Smart Test detection, fallback to Managed Test for backward compatibility
-  return script.includes('This is a TestChimp Smart Test') || script.includes('This is a TestChimp Managed Test');
-}

package/src/types.ts DELETED

@@ -1,239 +0,0 @@
-// ============================================================================
-// CORE TYPES
-// ============================================================================
-/**
- * Playwright MCP configuration - JavaScript config file content (playwright.config.js)
- */
-export type PlaywrightConfig = string;
-// ============================================================================
-// SCRIPT EXECUTION TYPES
-// ============================================================================
-/**
- * Request structure for the Playwright script executor
- */
-export interface PlaywrightExecutionRequest {
-  /** Main Playwright script content */
-  script: string;
-  /** Optional pre-script to run before the main script */
-  prescript?: string;
-  /** Optional post-script to run after the main script */
-  postscript?: string;
-  /** Playwright configuration file content */
-  playwrightConfig: string;
-  /** Optional GPT model to use for AI operations */
-  model?: string;
-}
-/**
- * Response structure for the Playwright script executor
- */
-export interface PlaywrightExecutionResponse {
-  /** Whether the execution was successful */
-  success: boolean;
-  /** Execution results from each script phase */
-  results: {
-    prescript?: ScriptResult;
-    script: ScriptResult;
-    postscript?: ScriptResult;
-  };
-  /** Overall execution time in milliseconds */
-  executionTime: number;
-  /** Any errors that occurred during execution */
-  error?: string;
-}
-/**
- * Individual script execution result
- */
-export interface ScriptResult {
-  /** Whether this specific script executed successfully */
-  success: boolean;
-  /** Output from the script execution */
-  output: string;
-  /** Any errors from this script */
-  error?: string;
-  /** Execution time for this script in milliseconds */
-  executionTime: number;
-}
-// ============================================================================
-// SCENARIO EXECUTION TYPES
-// ============================================================================
-/**
- * Scenario execution request
- */
-export interface ScenarioRequest {
-  scenario: string;
-  testName?: string;
-  playwrightConfig?: PlaywrightConfig;
-  model?: string;
-}
-/**
- * Scenario execution job for worker queue
- */
-export interface ScenarioRunJob {
-  id: string;
-  scenario: string;
-  testName?: string;
-  playwrightConfig?: PlaywrightConfig;
-  model?: string;
-  scenarioFileName?: string;
-  // Optional: Provide existing browser/page/context (for server-side usage)
-  existingBrowser?: any;
-  existingContext?: any;
-  existingPage?: any;
-}
-/**
- * Scenario execution response
- */
-export interface ScenarioResponse {
-  success: boolean;
-  steps: ScenarioStep[];
-  generatedScript: string;
-  executionLog: string;
-  executionTime: number;
-  testName?: string;
-  preferredFileName?: string;
-  error?: string;
-}
-/**
- * Individual sub-action within a step
- */
-export interface SubAction {
-  command: string;
-  success: boolean;
-  error?: string;
-  retryCount: number;
-}
-/**
- * Individual scenario step
- */
-export interface ScenarioStep {
-  stepNumber: number;
-  description: string;
-  playwrightCommand?: string; // For backward compatibility - last successful command or aggregated command
-  playwrightCommands?: string[]; // Multiple commands for complex steps
-  subActions?: SubAction[]; // Detailed tracking of all sub-actions
-  success?: boolean;
-  error?: string;
-  retryCount?: number;
-  attempts?: Array<{
-    attemptNumber: number;
-    command?: string;
-    success: boolean;
-    error?: string;
-    timestamp: number;
-  }>;
-}
-/**
- * Legacy scenario job interface (for backward compatibility)
- */
-export interface ScenarioJob {
-  id: string;
-  scenario: string;
-  config?: PlaywrightConfig;
-  resolve: (result: ScenarioResponse) => void;
-  reject: (error: Error) => void;
-  // Optional: Provide existing browser/page/context (for server-side usage)
-  existingBrowser?: any;
-  existingContext?: any;
-  existingPage?: any;
-}
-// ============================================================================
-// AI REPAIR TYPES
-// ============================================================================
-/**
- * Execution mode for script execution
- */
-export enum ExecutionMode {
-  RUN_EXACTLY = 'RUN_EXACTLY',
-  RUN_WITH_AI_REPAIR = 'RUN_WITH_AI_REPAIR'
-}
-/**
- * Script execution request with AI repair capabilities
- */
-export interface ScriptExecutionRequest {
-  script?: string; // Optional if scriptFilePath is provided
-  scriptFilePath?: string; // Path to script file (alternative to script content)
-  mode: ExecutionMode;
-  repairFlexibility?: number; // 0-5, defaults to 3
-  playwrightConfig?: PlaywrightConfig;
-  playwrightConfigFilePath?: string; // Path to playwright config file (alternative to playwrightConfig content)
-  model?: string;
-  headless?: boolean; // defaults to false (headed)
-  deflakeRunCount?: number; // Number of deflake attempts (defaults to 0, no deflaking)
-  jobId?: string; // Optional job ID for progress tracking
-  // For RUN_WITH_AI_REPAIR mode: whether to attempt runExactly first
-  attemptRunExactlyFirst?: boolean; // defaults to false
-  // For RUN_WITH_AI_REPAIR mode: pre-parsed steps (if provided, skip parsing)
-  // This preserves step IDs from sources like canonical trees
-  steps?: ScriptStep[]; // Optional pre-parsed steps with IDs
-  // Optional: Provide existing browser/page/context (for server-side usage)
-  // If not provided, runner-core will create its own
-  existingBrowser?: any; // Browser instance
-  existingContext?: any; // BrowserContext instance
-  existingPage?: any; // Page instance
-}
-/**
- * Script execution response with repair information
- */
-export interface ScriptExecutionResponse {
-  runStatus: 'success' | 'failed';
-  repairStatus?: 'success' | 'failed' | 'partial';
-  repairConfidence?: number; // 0-5
-  repairAdvice?: string;
-  updatedScript?: string;
-  executionTime: number;
-  numDeflakeRuns?: number; // Number of deflaking runs made (excluding original run)
-  error?: string;
-}
-/**
- * Individual script step for AI repair
- */
-export interface ScriptStep {
-  id?: string; // Optional step ID (preserved from source, e.g., canonical tree)
-  description: string;
-  code: string;
-  success?: boolean;
-  error?: string;
-}
-/**
- * Step operation types for AI repair
- */
-export enum StepOperation {
-  MODIFY = 'MODIFY',
-  INSERT = 'INSERT',
-  REMOVE = 'REMOVE'
-}
-/**
- * Step repair action
- */
-export interface StepRepairAction {
-  operation: StepOperation;
-  stepIndex?: number; // For MODIFY and REMOVE operations
-  newStep?: ScriptStep; // For MODIFY and INSERT operations
-  insertAfterIndex?: number; // For INSERT operation
-}
-// Repair suggestion and confidence interfaces are now in llm-facade.ts