npm - outcome-cli - Versions diffs - 1.0.0 - Mend

outcome-cli 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (113) hide show

package/README.md +261 -0
package/package.json +95 -0
package/src/agents/README.md +139 -0
package/src/agents/adapters/anthropic.adapter.ts +166 -0
package/src/agents/adapters/dalle.adapter.ts +145 -0
package/src/agents/adapters/gemini.adapter.ts +134 -0
package/src/agents/adapters/imagen.adapter.ts +106 -0
package/src/agents/adapters/nano-banana.adapter.ts +129 -0
package/src/agents/adapters/openai.adapter.ts +165 -0
package/src/agents/adapters/veo.adapter.ts +130 -0
package/src/agents/agent.schema.property.test.ts +379 -0
package/src/agents/agent.schema.test.ts +148 -0
package/src/agents/agent.schema.ts +263 -0
package/src/agents/index.ts +60 -0
package/src/agents/registered-agent.schema.ts +356 -0
package/src/agents/registry.ts +97 -0
package/src/agents/tournament-configs.property.test.ts +266 -0
package/src/cli/README.md +145 -0
package/src/cli/commands/define.ts +79 -0
package/src/cli/commands/list.ts +46 -0
package/src/cli/commands/logs.ts +83 -0
package/src/cli/commands/run.ts +416 -0
package/src/cli/commands/verify.ts +110 -0
package/src/cli/index.ts +81 -0
package/src/config/README.md +128 -0
package/src/config/env.ts +262 -0
package/src/config/index.ts +19 -0
package/src/eval/README.md +318 -0
package/src/eval/ai-judge.test.ts +435 -0
package/src/eval/ai-judge.ts +368 -0
package/src/eval/code-validators.ts +414 -0
package/src/eval/evaluateOutcome.property.test.ts +1174 -0
package/src/eval/evaluateOutcome.ts +591 -0
package/src/eval/immigration-validators.ts +122 -0
package/src/eval/index.ts +90 -0
package/src/eval/judge-cache.ts +402 -0
package/src/eval/tournament-validators.property.test.ts +439 -0
package/src/eval/validators.property.test.ts +1118 -0
package/src/eval/validators.ts +1199 -0
package/src/eval/weighted-scorer.ts +285 -0
package/src/index.ts +17 -0
package/src/league/README.md +188 -0
package/src/league/health-check.ts +353 -0
package/src/league/index.ts +93 -0
package/src/league/killAgent.ts +151 -0
package/src/league/league.test.ts +1151 -0
package/src/league/runLeague.ts +843 -0
package/src/league/scoreAgent.ts +175 -0
package/src/modules/omnibridge/__tests__/.gitkeep +1 -0
package/src/modules/omnibridge/__tests__/auth-tunnel.property.test.ts +524 -0
package/src/modules/omnibridge/__tests__/deterministic-logger.property.test.ts +965 -0
package/src/modules/omnibridge/__tests__/ghost-api.property.test.ts +461 -0
package/src/modules/omnibridge/__tests__/omnibridge-integration.test.ts +542 -0
package/src/modules/omnibridge/__tests__/parallel-executor.property.test.ts +671 -0
package/src/modules/omnibridge/__tests__/semantic-normalizer.property.test.ts +521 -0
package/src/modules/omnibridge/__tests__/semantic-normalizer.test.ts +254 -0
package/src/modules/omnibridge/__tests__/session-vault.property.test.ts +367 -0
package/src/modules/omnibridge/__tests__/shadow-session.property.test.ts +523 -0
package/src/modules/omnibridge/__tests__/triangulation-engine.property.test.ts +292 -0
package/src/modules/omnibridge/__tests__/verification-engine.property.test.ts +769 -0
package/src/modules/omnibridge/api/.gitkeep +1 -0
package/src/modules/omnibridge/api/ghost-api.ts +1087 -0
package/src/modules/omnibridge/auth/.gitkeep +1 -0
package/src/modules/omnibridge/auth/auth-tunnel.ts +843 -0
package/src/modules/omnibridge/auth/session-vault.ts +577 -0
package/src/modules/omnibridge/core/.gitkeep +1 -0
package/src/modules/omnibridge/core/semantic-normalizer.ts +702 -0
package/src/modules/omnibridge/core/triangulation-engine.ts +530 -0
package/src/modules/omnibridge/core/types.ts +610 -0
package/src/modules/omnibridge/execution/.gitkeep +1 -0
package/src/modules/omnibridge/execution/deterministic-logger.ts +629 -0
package/src/modules/omnibridge/execution/parallel-executor.ts +542 -0
package/src/modules/omnibridge/execution/shadow-session.ts +794 -0
package/src/modules/omnibridge/index.ts +212 -0
package/src/modules/omnibridge/omnibridge.ts +510 -0
package/src/modules/omnibridge/verification/.gitkeep +1 -0
package/src/modules/omnibridge/verification/verification-engine.ts +783 -0
package/src/outcomes/README.md +75 -0
package/src/outcomes/acquire-pilot-customer.ts +297 -0
package/src/outcomes/code-delivery-outcomes.ts +89 -0
package/src/outcomes/code-outcomes.ts +256 -0
package/src/outcomes/code_review_battle.test.ts +135 -0
package/src/outcomes/code_review_battle.ts +135 -0
package/src/outcomes/cold_email_battle.ts +97 -0
package/src/outcomes/content_creation_battle.ts +160 -0
package/src/outcomes/f1_stem_opt_compliance.ts +61 -0
package/src/outcomes/index.ts +107 -0
package/src/outcomes/lead_gen_battle.test.ts +113 -0
package/src/outcomes/lead_gen_battle.ts +99 -0
package/src/outcomes/outcome.schema.property.test.ts +229 -0
package/src/outcomes/outcome.schema.ts +187 -0
package/src/outcomes/qualified_sales_interest.ts +118 -0
package/src/outcomes/swarm_planner.property.test.ts +370 -0
package/src/outcomes/swarm_planner.ts +96 -0
package/src/outcomes/web_extraction.ts +234 -0
package/src/runtime/README.md +220 -0
package/src/runtime/agentRunner.test.ts +341 -0
package/src/runtime/agentRunner.ts +746 -0
package/src/runtime/claudeAdapter.ts +232 -0
package/src/runtime/costTracker.ts +123 -0
package/src/runtime/index.ts +34 -0
package/src/runtime/modelAdapter.property.test.ts +305 -0
package/src/runtime/modelAdapter.ts +144 -0
package/src/runtime/openaiAdapter.ts +235 -0
package/src/utils/README.md +122 -0
package/src/utils/command-runner.ts +134 -0
package/src/utils/cost-guard.ts +379 -0
package/src/utils/errors.test.ts +290 -0
package/src/utils/errors.ts +442 -0
package/src/utils/index.ts +37 -0
package/src/utils/logger.test.ts +361 -0
package/src/utils/logger.ts +419 -0
package/src/utils/output-parsers.ts +216 -0

package/src/league/health-check.ts ADDED Viewed

@@ -0,0 +1,353 @@
+/**
+ * Health Check System - Monitors agent availability
+ *
+ * Periodically checks registered agents to verify they are online
+ * and responsive. Updates agent deployment status accordingly.
+ *
+ * @module league/health-check
+ */
+import type {
+  RegisteredAgent,
+  HealthCheckResponse,
+  DeploymentInfo,
+} from '../agents/registered-agent.schema.js';
+/**
+ * Health check result for a single agent.
+ *
+ * Produced by `checkAgentHealth` and consumed by `updateDeploymentInfo`.
+ */
+export interface HealthCheckResult {
+  /** ID of the checked agent (copied from `agent.id`) */
+  agentId: string;
+  /** Name of the checked agent (copied from `agent.name`) */
+  agentName: string;
+  /**
+   * Status taken from the health endpoint's response body, or 'unhealthy'
+   * when the request failed or returned a non-OK HTTP status.
+   */
+  status: 'healthy' | 'degraded' | 'unhealthy';
+  /** Milliseconds between starting the check and the response (or failure) */
+  latencyMs: number;
+  /** Time at which this result object was created */
+  checkedAt: Date;
+  /** Failure description (e.g. `HTTP 503` or a thrown error's message) */
+  error?: string;
+  /** Parsed body returned by the health endpoint; absent on failure results */
+  response?: HealthCheckResponse;
+}
+/**
+ * Configuration for the health check service.
+ *
+ * Every function in this module that accepts a config defaults it to
+ * `DEFAULT_HEALTH_CHECK_CONFIG`.
+ */
+export interface HealthCheckConfig {
+  /**
+   * Timeout for health check requests in milliseconds.
+   * `checkAgentHealth` aborts the request once this much time has elapsed.
+   */
+  timeoutMs: number;
+  /**
+   * Number of consecutive failures before marking offline.
+   * `shouldMarkOffline` returns true once the counter is >= this value.
+   */
+  failureThreshold: number;
+  /**
+   * Interval between health checks in milliseconds.
+   * Used as the `setInterval` period by `HealthCheckService.start`.
+   */
+  checkIntervalMs: number;
+}
+/**
+ * Default health check configuration.
+ *
+ * Used as the default `config` argument throughout this module and as the
+ * base that `HealthCheckService` merges caller overrides onto.
+ */
+export const DEFAULT_HEALTH_CHECK_CONFIG: HealthCheckConfig = {
+  timeoutMs: 5000, // 5 seconds per request
+  failureThreshold: 3, // offline after 3 consecutive failures
+  checkIntervalMs: 60000, // 1 minute
+};
+/**
+ * Tracks consecutive failures per agent.
+ *
+ * Keyed by agent ID. This is module-level state, so it is shared by every
+ * caller of the functions in this file (including all HealthCheckService
+ * instances). Within this file entries are only ever set (to 0 or an
+ * incremented count), never deleted.
+ */
+const failureCounters: Map<string, number> = new Map();
+/**
+ * Perform a health check on a single agent.
+ *
+ * Sends a GET request to the health endpoint derived from the agent's
+ * endpoint URL, aborting it after `config.timeoutMs`. Request failures are
+ * reported through the returned result rather than thrown: network errors,
+ * timeouts, unparsable bodies, non-OK HTTP statuses and bodies without a
+ * recognised `status` all yield an 'unhealthy' result.
+ *
+ * Every such failure increments the agent's consecutive-failure counter
+ * (the value read by `shouldMarkOffline`); a valid response resets it to 0.
+ *
+ * @param agent - The agent to check
+ * @param config - Health check configuration
+ * @returns Health check result
+ */
+export async function checkAgentHealth(
+  agent: RegisteredAgent,
+  config: HealthCheckConfig = DEFAULT_HEALTH_CHECK_CONFIG
+): Promise<HealthCheckResult> {
+  const startTime = Date.now();
+  const controller = new AbortController();
+  const timeout = setTimeout(() => controller.abort(), config.timeoutMs);
+  // Count one more consecutive failure and build the matching result.
+  // Shared by every failure path so none of them can forget the counter.
+  const recordFailure = (
+    latencyMs: number,
+    message: string
+  ): HealthCheckResult => {
+    failureCounters.set(agent.id, (failureCounters.get(agent.id) ?? 0) + 1);
+    return createUnhealthyResult(agent, latencyMs, message);
+  };
+  try {
+    // Determine health endpoint URL
+    const healthUrl = getHealthEndpoint(agent.endpoint.url);
+    const response = await fetch(healthUrl, {
+      method: 'GET',
+      headers: buildHeaders(agent),
+      signal: controller.signal,
+    });
+    const latencyMs = Date.now() - startTime;
+    if (!response.ok) {
+      // A non-OK status is a failed check and must count toward the
+      // offline threshold, just like a network error does.
+      return recordFailure(latencyMs, `HTTP ${response.status}`);
+    }
+    const data: HealthCheckResponse = await response.json();
+    // The body comes from a remote service: verify it carries one of the
+    // statuses HealthCheckResult allows before trusting it.
+    const reportedStatus: unknown = data?.status;
+    if (
+      reportedStatus !== 'healthy' &&
+      reportedStatus !== 'degraded' &&
+      reportedStatus !== 'unhealthy'
+    ) {
+      return recordFailure(latencyMs, 'Invalid health check response');
+    }
+    // Reset failure counter on success
+    failureCounters.set(agent.id, 0);
+    return {
+      agentId: agent.id,
+      agentName: agent.name,
+      status: data.status,
+      latencyMs,
+      checkedAt: new Date(),
+      response: data,
+    };
+  } catch (error) {
+    const errorMessage =
+      error instanceof Error ? error.message : 'Unknown error';
+    return recordFailure(Date.now() - startTime, errorMessage);
+  } finally {
+    // Always release the abort timer, whichever path returned.
+    clearTimeout(timeout);
+  }
+}
+/**
+ * Run health checks for a list of agents concurrently.
+ *
+ * One `checkAgentHealth` call is started per agent and all of them are
+ * awaited together; results come back in the same order as `agents`.
+ *
+ * @param agents - Agents to check
+ * @param config - Health check configuration applied to every check
+ * @returns One health check result per agent
+ */
+export async function checkMultipleAgents(
+  agents: RegisteredAgent[],
+  config: HealthCheckConfig = DEFAULT_HEALTH_CHECK_CONFIG
+): Promise<HealthCheckResult[]> {
+  const pendingChecks = agents.map((candidate) =>
+    checkAgentHealth(candidate, config)
+  );
+  return await Promise.all(pendingChecks);
+}
+/**
+ * Decide whether an agent has failed often enough to be marked offline.
+ *
+ * Agents with no recorded failures are treated as having zero.
+ *
+ * @param agentId - The agent ID
+ * @param config - Health check configuration (supplies `failureThreshold`)
+ * @returns True once the consecutive-failure count reaches the threshold
+ */
+export function shouldMarkOffline(
+  agentId: string,
+  config: HealthCheckConfig = DEFAULT_HEALTH_CHECK_CONFIG
+): boolean {
+  return (failureCounters.get(agentId) ?? 0) >= config.failureThreshold;
+}
+/**
+ * Look up how many consecutive failures are recorded for an agent.
+ *
+ * @param agentId - The agent ID
+ * @returns The recorded count, or 0 when the agent has no entry
+ */
+export function getFailureCount(agentId: string): number {
+  const recorded = failureCounters.get(agentId);
+  return recorded ?? 0;
+}
+/**
+ * Clear the consecutive-failure count for an agent.
+ *
+ * The entry is kept in the map and set to zero rather than removed.
+ *
+ * @param agentId - The agent ID
+ */
+export function resetFailureCount(agentId: string): void {
+  const noFailures = 0;
+  failureCounters.set(agentId, noFailures);
+}
+/**
+ * Derive the next deployment info from a health check result.
+ *
+ * Status: 'offline' once the failure threshold is reached; otherwise a
+ * 'healthy' result maps to 'online', 'degraded' stays 'degraded', and any
+ * other result leaves the current status untouched.
+ * Latency: the first sample (current average of 0) is taken as-is; later
+ * samples are averaged with the previous value and rounded.
+ * Uptime: +1 when the new status is online, -5 when leaving online,
+ * unchanged otherwise; always clamped to the range 0..100.
+ *
+ * @param currentInfo - Current deployment info (not mutated)
+ * @param result - Health check result
+ * @param config - Health check configuration
+ * @returns A new deployment info object
+ */
+export function updateDeploymentInfo(
+  currentInfo: DeploymentInfo,
+  result: HealthCheckResult,
+  config: HealthCheckConfig = DEFAULT_HEALTH_CHECK_CONFIG
+): DeploymentInfo {
+  const resolveStatus = (): DeploymentInfo['status'] => {
+    if (shouldMarkOffline(result.agentId, config)) {
+      return 'offline';
+    }
+    switch (result.status) {
+      case 'healthy':
+        return 'online';
+      case 'degraded':
+        return 'degraded';
+      default:
+        // Below the threshold a failing check does not change the status.
+        return currentInfo.status;
+    }
+  };
+  const nextStatus = resolveStatus();
+  const previousAverage = currentInfo.averageLatencyMs;
+  const averageLatencyMs =
+    previousAverage === 0
+      ? result.latencyMs
+      : Math.round((previousAverage + result.latencyMs) / 2);
+  // Simplified uptime model: reward online checks, penalise leaving online.
+  let uptimeDelta = 0;
+  if (nextStatus === 'online') {
+    uptimeDelta = 1;
+  } else if (currentInfo.status === 'online') {
+    uptimeDelta = -5;
+  }
+  const uptimePercent = Math.max(
+    0,
+    Math.min(100, currentInfo.uptimePercent + uptimeDelta)
+  );
+  return {
+    ...currentInfo,
+    status: nextStatus,
+    lastHealthCheck: result.checkedAt,
+    averageLatencyMs,
+    uptimePercent,
+  };
+}
+/**
+ * Derive the health endpoint URL from an agent's chat endpoint URL.
+ *
+ * A trailing `/chat` or `/v1/chat/completions` path segment is swapped for
+ * `/health`; any other path gets `/health` appended (after dropping one
+ * trailing slash). Everything else in the URL is left as parsed.
+ */
+function getHealthEndpoint(chatUrl: string): string {
+  const target = new URL(chatUrl);
+  const { pathname } = target;
+  let healthPath: string;
+  if (pathname.endsWith('/chat')) {
+    healthPath = pathname.replace(/\/chat$/, '/health');
+  } else if (pathname.endsWith('/v1/chat/completions')) {
+    healthPath = pathname.replace(/\/v1\/chat\/completions$/, '/health');
+  } else {
+    // Unknown layout: treat the path as the base and append /health
+    healthPath = pathname.replace(/\/$/, '') + '/health';
+  }
+  target.pathname = healthPath;
+  return target.toString();
+}
+/**
+ * Build the authentication header for a health check request.
+ *
+ * Returns no headers for auth type 'none'. Otherwise returns a single
+ * header, named by `authHeader` (default 'Authorization'), whose value is
+ * the stored token, prefixed with `Bearer ` for the 'bearer' auth type.
+ */
+function buildHeaders(agent: RegisteredAgent): Record<string, string> {
+  const { endpoint } = agent;
+  if (endpoint.authType === 'none') {
+    return {};
+  }
+  // Note: In production, this would decrypt the token
+  const token = endpoint.encryptedAuthToken ?? '';
+  const headerName = endpoint.authHeader ?? 'Authorization';
+  if (endpoint.authType === 'bearer') {
+    return { [headerName]: `Bearer ${token}` };
+  }
+  return { [headerName]: token };
+}
+/**
+ * Build an 'unhealthy' HealthCheckResult for an agent.
+ *
+ * The result is stamped with the current time and carries the supplied
+ * error text; it has no `response` field.
+ */
+function createUnhealthyResult(
+  agent: RegisteredAgent,
+  latencyMs: number,
+  error: string
+): HealthCheckResult {
+  const { id: agentId, name: agentName } = agent;
+  const unhealthy: HealthCheckResult = {
+    agentId,
+    agentName,
+    status: 'unhealthy',
+    latencyMs,
+    checkedAt: new Date(),
+    error,
+  };
+  return unhealthy;
+}
+/**
+ * Health Check Service class for managing periodic checks.
+ *
+ * `start` runs one check cycle immediately and then one every
+ * `checkIntervalMs`. A cycle that is still running when the next tick
+ * fires causes that tick to be skipped, and errors thrown inside a cycle
+ * are logged instead of escaping as unhandled promise rejections.
+ */
+export class HealthCheckService {
+  private config: HealthCheckConfig;
+  private intervalId: NodeJS.Timeout | null = null;
+  private onStatusChange?: (
+    agentId: string,
+    oldStatus: string,
+    newStatus: string
+  ) => void;
+  /**
+   * @param config - Overrides merged on top of DEFAULT_HEALTH_CHECK_CONFIG
+   * @param onStatusChange - Optional callback invoked when a check cycle
+   *   computes a deployment status different from the agent's current one
+   */
+  constructor(
+    config: Partial<HealthCheckConfig> = {},
+    onStatusChange?: (
+      agentId: string,
+      oldStatus: string,
+      newStatus: string
+    ) => void
+  ) {
+    this.config = { ...DEFAULT_HEALTH_CHECK_CONFIG, ...config };
+    this.onStatusChange = onStatusChange;
+  }
+  /**
+   * Start periodic health checks.
+   *
+   * If the service is already running it is stopped first, so only one
+   * timer is ever active.
+   *
+   * @param getAgents - Function to get current list of agents
+   * @param updateAgent - Function to update agent deployment info
+   */
+  start(
+    getAgents: () => RegisteredAgent[],
+    updateAgent: (agentId: string, deployment: DeploymentInfo) => void
+  ): void {
+    if (this.intervalId) {
+      this.stop();
+    }
+    // Scoped to this start() call so a restart is never blocked by a cycle
+    // left over from an earlier start().
+    let cycleInFlight = false;
+    const runChecks = async (): Promise<void> => {
+      // Skip the tick when the previous cycle is still running; overlapping
+      // cycles would apply deployment updates out of order.
+      if (cycleInFlight) return;
+      cycleInFlight = true;
+      try {
+        const agents = getAgents();
+        const results = await checkMultipleAgents(agents, this.config);
+        for (const result of results) {
+          const agent = agents.find((a) => a.id === result.agentId);
+          if (!agent) continue;
+          const oldStatus = agent.deployment.status;
+          const newDeployment = updateDeploymentInfo(
+            agent.deployment,
+            result,
+            this.config
+          );
+          if (oldStatus !== newDeployment.status && this.onStatusChange) {
+            this.onStatusChange(agent.id, oldStatus, newDeployment.status);
+          }
+          updateAgent(agent.id, newDeployment);
+        }
+      } catch (error) {
+        // Nothing awaits this promise (it is started by a timer), so a
+        // throwing callback would otherwise be an unhandled rejection.
+        console.error('Health check cycle failed:', error);
+      } finally {
+        cycleInFlight = false;
+      }
+    };
+    // Run immediately
+    void runChecks();
+    // Then run periodically
+    this.intervalId = setInterval(() => {
+      void runChecks();
+    }, this.config.checkIntervalMs);
+  }
+  /**
+   * Stop periodic health checks.
+   *
+   * Cancels the timer only; a cycle that is already in flight still runs
+   * to completion.
+   */
+  stop(): void {
+    if (this.intervalId) {
+      clearInterval(this.intervalId);
+      this.intervalId = null;
+    }
+  }
+  /**
+   * Check if the service is running.
+   *
+   * @returns True while a periodic timer is active
+   */
+  isRunning(): boolean {
+    return this.intervalId !== null;
+  }
+}

package/src/league/index.ts ADDED Viewed

@@ -0,0 +1,93 @@
+/**
+ * League Module - Parallel agent competition system
+ *
+ * @module league
+ */
+export {
+  type LeagueConfig,
+  type AgentResult,
+  type LeagueResult,
+  runLeague,
+  runLeagueMock,
+} from './runLeague.js';
+export {
+  type KillReason,
+  type AgentLimits,
+  type RunningAgent,
+  shouldKillAgent,
+  killAgent,
+  checkAllAgents,
+} from './killAgent.js';
+export {
+  type AgentMetrics,
+  type AgentScore,
+  scoreAgent,
+  determineWinner,
+  rankAgents,
+  calculateLeagueStats,
+} from './scoreAgent.js';
+// Battle Orchestrator - Production battle management
+// NOTE(review): no battle-orchestrator source file appears among the files
+// listed for this published version (src/league lists only README.md,
+// health-check, index, killAgent, league.test, runLeague and scoreAgent).
+// Confirm the module actually ships; otherwise importing this index will
+// fail to resolve './battle-orchestrator.js'.
+export {
+  type BattleConfig,
+  type BattleTask,
+  type BattleResult,
+  type AgentBattleRequest,
+  type AgentBattleResponse,
+  type AgentBattleResult,
+  BattleOrchestrator,
+  AgentOfflineError,
+  createBattleOrchestrator,
+} from './battle-orchestrator.js';
+// Health Check System - Agent availability monitoring
+export {
+  type HealthCheckResult,
+  type HealthCheckConfig,
+  DEFAULT_HEALTH_CHECK_CONFIG,
+  checkAgentHealth,
+  checkMultipleAgents,
+  shouldMarkOffline,
+  getFailureCount,
+  resetFailureCount,
+  updateDeploymentInfo,
+  HealthCheckService,
+} from './health-check.js';
+// Team Coordinator - Team battle management
+// NOTE(review): no team-coordinator source file appears among the files
+// listed for this published version (src/league lists only README.md,
+// health-check, index, killAgent, league.test, runLeague and scoreAgent).
+// Confirm the module actually ships; otherwise importing this index will
+// fail to resolve './team-coordinator.js'.
+export {
+  type TeamConfig,
+  type TeamState,
+  type StateUpdateResult,
+  type MemberContribution,
+  type TeamPayoutDistribution,
+  type TeamStateChangeEvent,
+  type TeamStateChangeListener,
+  StateConflictError,
+  TeamNotFoundError,
+  NotTeamMemberError,
+  TeamCoordinator,
+  createTeamCoordinator,
+} from './team-coordinator.js';
+// Multi-Step Orchestrator - Multi-step bounty execution
+// NOTE(review): no multi-step-orchestrator source file appears among the
+// files listed for this published version (src/league lists only README.md,
+// health-check, index, killAgent, league.test, runLeague and scoreAgent).
+// Confirm the module actually ships; otherwise importing this index will
+// fail to resolve './multi-step-orchestrator.js'.
+export {
+  type TaskNode,
+  type MultiStepBounty,
+  type TaskExecutionResult,
+  type MultiStepResult,
+  type TaskContext,
+  type MultiStepAgent,
+  CyclicDependencyError,
+  InvalidDependencyError,
+  InvalidFinalTaskError,
+  TaskExecutionError,
+  validateTaskGraph,
+  validateMultiStepBounty,
+  getTopologicalOrder,
+  MultiStepOrchestrator,
+  createMultiStepOrchestrator,
+} from './multi-step-orchestrator.js';

package/src/league/killAgent.ts ADDED Viewed

@@ -0,0 +1,151 @@
+/**
+ * Kill Agent - Agent termination logic
+ *
+ * Handles agent termination conditions and cleanup.
+ *
+ * @module league/killAgent
+ * @see Requirements 4.3, 4.4, 10.2
+ */
+import type { CostTracker } from '../runtime/costTracker.js';
+/**
+ * Reason for agent termination.
+ *
+ * Returned by `shouldKillAgent` and passed to `killAgent`.
+ */
+export interface KillReason {
+  /**
+   * Type of termination:
+   * - 'competitor_won': the agent's `competitorWon` flag is set
+   * - 'cost_exceeded': tokens spent are above `maxTokens`
+   * - 'attempts_exceeded': attempt count has reached `maxAttempts`
+   * - 'timeout': elapsed runtime has reached `maxRuntimeMs`
+   */
+  type: 'cost_exceeded' | 'attempts_exceeded' | 'timeout' | 'competitor_won';
+  /** Human-readable details */
+  details: string;
+}
+/**
+ * Limits that trigger agent termination.
+ *
+ * The comparisons noted below are the ones `shouldKillAgent` applies.
+ */
+export interface AgentLimits {
+  /** Maximum tokens allowed; exceeded only when tokens spent are strictly greater */
+  maxTokens: number;
+  /** Maximum attempts allowed; triggers once the attempt count is >= this value */
+  maxAttempts: number;
+  /** Maximum runtime in milliseconds; triggers once elapsed time is >= this value */
+  maxRuntimeMs: number;
+}
+/**
+ * State of a running agent.
+ *
+ * This is the snapshot `shouldKillAgent` inspects to decide on termination.
+ */
+export interface RunningAgent {
+  /** Agent ID */
+  agentId: string;
+  /** Current attempt count */
+  attempts: number;
+  /** Cost tracker for the agent; its `tokensSpent` is compared against `maxTokens` */
+  costTracker: CostTracker;
+  /** Start time of the agent run, on the same clock as `Date.now()` (epoch milliseconds) */
+  startTime: number;
+  /** Whether a competitor has already won */
+  competitorWon: boolean;
+}
+/**
+ * Decide whether a running agent must be terminated.
+ *
+ * Conditions are evaluated in a fixed order and the first match wins:
+ * competitor already won, token ceiling exceeded, attempt limit reached,
+ * runtime limit reached.
+ *
+ * @param agent - Current agent state
+ * @param limits - Termination limits
+ * @returns KillReason if agent should be killed, null otherwise
+ *
+ * @example
+ * const reason = shouldKillAgent(agent, {
+ *   maxTokens: 10000,
+ *   maxAttempts: 5,
+ *   maxRuntimeMs: 300000
+ * });
+ * if (reason) {
+ *   await killAgent(agent.agentId, reason);
+ * }
+ *
+ * @see Requirements 4.3, 4.4, 10.2
+ */
+export function shouldKillAgent(
+  agent: RunningAgent,
+  limits: AgentLimits
+): KillReason | null {
+  const { maxTokens, maxAttempts, maxRuntimeMs } = limits;
+  // A competitor finishing first takes priority over every limit (Requirement 4.5)
+  if (agent.competitorWon) {
+    const details = `Another agent achieved success first`;
+    return { type: 'competitor_won', details };
+  }
+  // Cost ceiling (Requirement 4.4, 10.1): only strictly-over counts
+  const tokensSpent = agent.costTracker.tokensSpent;
+  if (tokensSpent > maxTokens) {
+    const details = `Token usage ${tokensSpent} exceeded ceiling ${maxTokens}`;
+    return { type: 'cost_exceeded', details };
+  }
+  // Attempt limit (Requirement 4.3): reaching the limit is enough
+  const attemptsUsed = agent.attempts;
+  if (attemptsUsed >= maxAttempts) {
+    const details = `Attempt count ${attemptsUsed} reached limit ${maxAttempts}`;
+    return { type: 'attempts_exceeded', details };
+  }
+  // Runtime limit (Requirement 10.2), measured from the agent's start time
+  const runtimeMs = Date.now() - agent.startTime;
+  if (runtimeMs >= maxRuntimeMs) {
+    const details = `Runtime ${runtimeMs}ms exceeded limit ${maxRuntimeMs}ms`;
+    return { type: 'timeout', details };
+  }
+  return null;
+}
+/**
+ * Terminates an agent with the given reason.
+ *
+ * The current implementation only writes a termination line to the
+ * console; no signal is sent and nothing is cleaned up.
+ *
+ * @param agentId - ID of the agent to terminate
+ * @param reason - Reason for termination
+ *
+ * @see Requirements 4.3, 4.4
+ */
+export async function killAgent(
+  agentId: string,
+  reason: KillReason
+): Promise<void> {
+  const { type, details } = reason;
+  // Log termination
+  const terminationLine = `🔴 Agent ${agentId} terminated: ${type} - ${details}`;
+  console.log(terminationLine);
+  // In production, this would:
+  // 1. Send termination signal to the agent
+  // 2. Clean up any resources
+  // 3. Record termination in Durable Objects
+}
+/**
+ * Evaluate every running agent against the termination limits.
+ *
+ * Agents that do not need to be killed are left out of the result.
+ *
+ * @param agents - Array of running agents
+ * @param limits - Termination limits
+ * @returns Map of agentId to KillReason for agents that should be killed
+ */
+export function checkAllAgents(
+  agents: RunningAgent[],
+  limits: AgentLimits
+): Map<string, KillReason> {
+  const verdicts = new Map<string, KillReason>();
+  for (const candidate of agents) {
+    const verdict = shouldKillAgent(candidate, limits);
+    if (!verdict) continue;
+    verdicts.set(candidate.agentId, verdict);
+  }
+  return verdicts;
+}