npm - superghost - Versions diffs - 0.1.0 - Mend

superghost 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25) hide show

package/LICENSE +21 -0
package/README.md +172 -0
package/package.json +77 -0
package/src/agent/agent-runner.ts +69 -0
package/src/agent/mcp-manager.ts +78 -0
package/src/agent/model-factory.ts +71 -0
package/src/agent/prompt.ts +47 -0
package/src/agent/types.ts +28 -0
package/src/cache/cache-manager.ts +105 -0
package/src/cache/step-recorder.ts +50 -0
package/src/cache/step-replayer.ts +51 -0
package/src/cache/types.ts +27 -0
package/src/cli.ts +128 -0
package/src/config/loader.ts +76 -0
package/src/config/schema.ts +26 -0
package/src/config/types.ts +8 -0
package/src/dist/paths.ts +52 -0
package/src/dist/setup.ts +66 -0
package/src/infra/process-manager.ts +34 -0
package/src/infra/signals.ts +20 -0
package/src/output/reporter.ts +75 -0
package/src/output/types.ts +8 -0
package/src/runner/test-executor.ts +145 -0
package/src/runner/test-runner.ts +66 -0
package/src/runner/types.ts +26 -0

package/src/runner/test-executor.ts ADDED Viewed

@@ -0,0 +1,145 @@
+import type { CacheManager } from "../cache/cache-manager.ts";
+import type { StepReplayer } from "../cache/step-replayer.ts";
+import type { AgentExecutionResult } from "../agent/types.ts";
+import type { Config } from "../config/types.ts";
+import type { TestResult } from "./types.ts";
+/**
+ * Function signature for executing a test via the AI agent.
+ *
+ * Receives a single options object and resolves to an AgentExecutionResult.
+ * TestExecutor calls it once per attempt and reads `passed`, `steps` and
+ * `message` from the resolved value.
+ */
+type ExecuteAgentFn = (config: {
+  model: any; // forwarded unchanged from the TestExecutor constructor options
+  tools: Record<string, any>; // TestExecutor passes {} when no tools were supplied
+  testCase: string; // same string TestExecutor hands to the cache manager together with baseUrl
+  baseUrl: string;
+  recursionLimit: number; // TestExecutor fills this from config.recursionLimit
+  globalContext?: string; // same value for every test run by one TestExecutor instance
+  testContext?: string; // optional, supplied per execute() call
+}) => Promise<AgentExecutionResult>;
+/** Slice of the run configuration that TestExecutor reads. */
+type TestExecutorConfig = Pick<
+  Config,
+  "maxAttempts" | "recursionLimit" | "model" | "modelProvider"
+> & { context?: string };
+/**
+ * Executes a single test case following the cache-first-then-AI strategy:
+ * 1. Try replaying from cache (fast path)
+ * 2. On cache miss or replay failure, invoke the AI agent, retrying up to
+ *    `config.maxAttempts` times (always at least once)
+ * 3. Save new steps on AI success; delete the stale cache entry when a
+ *    self-heal run exhausts every attempt
+ */
+export class TestExecutor {
+  private readonly cacheManager: CacheManager;
+  private readonly replayer: StepReplayer;
+  private readonly executeAgentFn: ExecuteAgentFn;
+  private readonly model: any;
+  private readonly tools: Record<string, any>;
+  private readonly config: TestExecutorConfig;
+  private readonly globalContext?: string;
+  /**
+   * @param opts Collaborators and settings. `tools` defaults to an empty
+   *   object when omitted; `model` and `globalContext` are forwarded to the
+   *   agent function as given.
+   */
+  constructor(opts: {
+    cacheManager: CacheManager;
+    replayer: StepReplayer;
+    executeAgentFn: ExecuteAgentFn;
+    model?: any;
+    tools?: Record<string, any>;
+    config: TestExecutorConfig;
+    globalContext?: string;
+  }) {
+    this.cacheManager = opts.cacheManager;
+    this.replayer = opts.replayer;
+    this.executeAgentFn = opts.executeAgentFn;
+    this.model = opts.model;
+    this.tools = opts.tools ?? {};
+    this.config = opts.config;
+    this.globalContext = opts.globalContext;
+  }
+  /**
+   * Execute a single test case with cache-first strategy.
+   *
+   * @param testCase Test case text; also used as `testName` in the result.
+   * @param baseUrl Base URL passed to the cache manager and the agent.
+   * @param testContext Optional per-test context forwarded to the agent.
+   * @returns A "passed" result with source "cache" when the cached steps
+   *   replay successfully; otherwise the outcome of the AI agent path.
+   */
+  async execute(
+    testCase: string,
+    baseUrl: string,
+    testContext?: string,
+  ): Promise<TestResult> {
+    const start = Date.now();
+    // Phase 1: Try cache replay
+    const cached = await this.cacheManager.load(testCase, baseUrl);
+    if (cached) {
+      const replay = await this.replayer.replay(cached.steps);
+      if (replay.success) {
+        return {
+          testName: testCase,
+          testCase,
+          status: "passed",
+          source: "cache",
+          durationMs: Date.now() - start,
+        };
+      }
+      // Cache stale — fall through to AI with self-heal flag
+      return this.executeWithAgent(testCase, baseUrl, start, true, testContext);
+    }
+    // Phase 2: No cache — go directly to AI
+    return this.executeWithAgent(testCase, baseUrl, start, false, testContext);
+  }
+  /**
+   * Run the agent until it passes or the attempt budget is used up.
+   *
+   * @param startTime Timestamp (from Date.now()) taken when execute() began;
+   *   reported durations are measured from it.
+   * @param selfHeal True when a cached replay just failed. A pass is then
+   *   flagged `selfHealed`, and a final failure deletes the stale cache entry.
+   * @returns "passed" on the first successful attempt (after saving the
+   *   steps to the cache), otherwise "failed" carrying the last agent message.
+   */
+  private async executeWithAgent(
+    testCase: string,
+    baseUrl: string,
+    startTime: number,
+    selfHeal: boolean,
+    testContext?: string,
+  ): Promise<TestResult> {
+    // A configured value below 1 (or NaN) would skip the loop entirely: the
+    // test would be reported as failed with an empty error, and a self-heal
+    // run would delete the cache, without the agent ever being invoked.
+    // Values >= 1 behave exactly as before.
+    const configuredAttempts = this.config.maxAttempts;
+    const attempts = configuredAttempts >= 1 ? configuredAttempts : 1;
+    let lastError = "";
+    for (let attempt = 0; attempt < attempts; attempt++) {
+      const result = await this.executeAgentFn({
+        model: this.model,
+        tools: this.tools,
+        testCase,
+        baseUrl,
+        recursionLimit: this.config.recursionLimit,
+        globalContext: this.globalContext,
+        testContext,
+      });
+      if (result.passed) {
+        // Save cache for future replays
+        await this.cacheManager.save(testCase, baseUrl, result.steps, {
+          model: this.config.model,
+          provider: this.config.modelProvider,
+          stepCount: result.steps.length,
+          aiMessage: result.message,
+          durationMs: Date.now() - startTime,
+        });
+        return {
+          testName: testCase,
+          testCase,
+          status: "passed",
+          source: "ai",
+          durationMs: Date.now() - startTime,
+          ...(selfHeal ? { selfHealed: true } : {}),
+        };
+      }
+      // Keep only the most recent failure message for the final report
+      lastError = result.message;
+    }
+    // All attempts exhausted
+    if (selfHeal) {
+      // Delete stale cache that triggered self-heal
+      await this.cacheManager.delete(testCase, baseUrl);
+    }
+    return {
+      testName: testCase,
+      testCase,
+      status: "failed",
+      source: "ai",
+      durationMs: Date.now() - startTime,
+      error: lastError,
+    };
+  }
+}

package/src/runner/test-runner.ts ADDED Viewed

@@ -0,0 +1,66 @@
+import type { Config } from "../config/types.ts";
+import type { Reporter } from "../output/types.ts";
+import type { TestResult, RunResult } from "./types.ts";
+/**
+ * Function signature for executing a single test case.
+ *
+ * TestRunner awaits it once per configured test, in order, passing the
+ * test's `case` text, the resolved base URL (the test's own `baseUrl`, else
+ * the config-level `baseUrl`, else an empty string) and the test's optional
+ * `context`. The `testName` of the resolved result is replaced by the runner
+ * with the configured test name.
+ */
+export type ExecuteFn = (
+  testCase: string,
+  baseUrl: string,
+  testContext?: string,
+) => Promise<TestResult>;
+/**
+ * Drives the whole test run, one test at a time.
+ * Notifies the reporter when each test starts and completes, and once more
+ * with the aggregated summary when the run is over.
+ * The actual execution of a test is delegated to the injected function.
+ */
+export class TestRunner {
+  private readonly config: Config;
+  private readonly reporter: Reporter;
+  private readonly executeFn: ExecuteFn;
+  constructor(config: Config, reporter: Reporter, executeFn: ExecuteFn) {
+    this.executeFn = executeFn;
+    this.reporter = reporter;
+    this.config = config;
+  }
+  /**
+   * Execute the configured tests in order, strictly sequentially.
+   *
+   * @returns The aggregate summary, after it has been handed to the reporter.
+   */
+  async run(): Promise<RunResult> {
+    const { config, reporter } = this;
+    const runStartedAt = Date.now();
+    const collected: TestResult[] = [];
+    for (const entry of config.tests) {
+      // Test-level URL wins, then the config-level one, then an empty string
+      const effectiveBaseUrl = entry.baseUrl ?? config.baseUrl ?? "";
+      reporter.onTestStart(entry.name);
+      const outcome = await this.executeFn(
+        entry.case,
+        effectiveBaseUrl,
+        entry.context,
+      );
+      // Report under the configured display name rather than the raw case text
+      const labelled = { ...outcome, testName: entry.name };
+      collected.push(labelled);
+      reporter.onTestComplete(labelled);
+    }
+    const elapsedMs = Date.now() - runStartedAt;
+    const summary = aggregateResults(collected, elapsedMs);
+    reporter.onRunComplete(summary);
+    return summary;
+  }
+}
+/**
+ * Build the run summary from the per-test results.
+ *
+ * `cached` counts only results that both came from the cache and passed.
+ *
+ * @param results Per-test results, returned as-is in the summary.
+ * @param totalDurationMs Total run duration, copied into the summary.
+ */
+function aggregateResults(
+  results: TestResult[],
+  totalDurationMs: number,
+): RunResult {
+  // Single pass over the results instead of one filter per counter
+  const tally = results.reduce(
+    (counts, { status, source }) => {
+      if (status === "passed") {
+        counts.passed += 1;
+        if (source === "cache") {
+          counts.cached += 1;
+        }
+      } else if (status === "failed") {
+        counts.failed += 1;
+      }
+      return counts;
+    },
+    { passed: 0, failed: 0, cached: 0 },
+  );
+  return { results, totalDurationMs, ...tally };
+}

package/src/runner/types.ts ADDED Viewed

@@ -0,0 +1,26 @@
+/**
+ * Status of a completed test.
+ * The run summary counts "passed" and "failed" results separately.
+ */
+export type TestStatus = "passed" | "failed";
+/**
+ * Source of the test result.
+ * "cache" is reported when cached steps replayed successfully; "ai" is
+ * reported for every result produced by the agent path, pass or fail.
+ */
+export type TestSource = "cache" | "ai";
+/**
+ * Result of executing a single test case.
+ *
+ * TestExecutor fills `testName` with the test case text; TestRunner then
+ * replaces it with the configured test name before reporting.
+ */
+export interface TestResult {
+  testName: string; // display name shown by the reporter
+  testCase: string; // test case text that was executed
+  status: TestStatus;
+  source: TestSource;
+  durationMs: number; // elapsed milliseconds, measured with Date.now() from the start of execution
+  error?: string; // on failure: message of the last failed agent attempt
+  /** Whether this test self-healed from a stale cache (set only when the AI passes after a cached replay failed) */
+  selfHealed?: boolean;
+}
+/**
+ * Overall run result from the test runner.
+ * The three counters are derived from `results` when the run finishes.
+ */
+export interface RunResult {
+  results: TestResult[]; // per-test results in execution order
+  totalDurationMs: number; // elapsed milliseconds for the whole run
+  passed: number; // results with status "passed"
+  failed: number; // results with status "failed"
+  cached: number; // results that passed with source "cache" (a subset of passed)
+}