npm - coding-agent-benchmarks - Versions diffs - 0.3.3 → 0.5.0 - Mend

coding-agent-benchmarks 0.3.3 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42) hide show

package/README.md +80 -257
package/dist/adapters/claudeCodeCLI.d.ts.map +1 -1
package/dist/adapters/claudeCodeCLI.js +0 -6
package/dist/adapters/claudeCodeCLI.js.map +1 -1
package/dist/adapters/copilotCLI.d.ts.map +1 -1
package/dist/adapters/copilotCLI.js +0 -6
package/dist/adapters/copilotCLI.js.map +1 -1
package/dist/config/loader.d.ts.map +1 -1
package/dist/config/loader.js +0 -7
package/dist/config/loader.js.map +1 -1
package/dist/evaluator.d.ts +0 -12
package/dist/evaluator.d.ts.map +1 -1
package/dist/evaluator.js +0 -36
package/dist/evaluator.js.map +1 -1
package/dist/index.d.ts +2 -0
package/dist/index.d.ts.map +1 -1
package/dist/index.js +4 -1
package/dist/index.js.map +1 -1
package/dist/runner.js +12 -14
package/dist/runner.js.map +1 -1
package/dist/types.d.ts +1 -1
package/dist/utils/baselineManager.d.ts.map +1 -1
package/dist/utils/baselineManager.js +0 -4
package/dist/utils/baselineManager.js.map +1 -1
package/dist/utils/gitUtils.d.ts.map +1 -1
package/dist/utils/gitUtils.js +0 -6
package/dist/utils/gitUtils.js.map +1 -1
package/dist/utils/updateChecker.d.ts +9 -0
package/dist/utils/updateChecker.d.ts.map +1 -0
package/dist/utils/updateChecker.js +100 -0
package/dist/utils/updateChecker.js.map +1 -0
package/dist/utils/updateNotifier.d.ts +3 -0
package/dist/utils/updateNotifier.d.ts.map +1 -0
package/dist/utils/updateNotifier.js +39 -0
package/dist/utils/updateNotifier.js.map +1 -0
package/dist/utils/workspaceUtils.d.ts.map +1 -1
package/dist/utils/workspaceUtils.js +0 -5
package/dist/utils/workspaceUtils.js.map +1 -1
package/dist/validators/llmJudge.d.ts.map +1 -1
package/dist/validators/llmJudge.js +3 -3
package/dist/validators/llmJudge.js.map +1 -1
package/package.json +2 -1

package/README.md CHANGED Viewed

@@ -1,12 +1,18 @@
 # coding-agent-benchmarks
+**[📖 Documentation](https://chiItepin.github.io/coding-agent-benchmarks)** | **[📦 npm](https://www.npmjs.com/package/coding-agent-benchmarks)** | **[⭐ GitHub](https://github.com/chiItepin/coding-agent-benchmarks)**
 Open-source framework for evaluating how well AI coding assistants (like GitHub Copilot CLI or Claude Code) follow your coding standards. Here's the workflow:
 1. You give it a prompt → 2. AI generates code → 3. Library validates → 4. You get a score
 ![WhatsApp Image 2026-01-23 at 9 04 49 AM](https://github.com/user-attachments/assets/3544d04f-37a5-47b0-a013-669c6015d26f)
+*Figure 1: Evaluation workflow - prompt → generate → validate → score*
 ![WhatsApp Image 2026-01-24 at 1 58 31 PM](https://github.com/user-attachments/assets/f93ea3e0-74f8-4789-ab43-97245acc91b6)
+*Figure 2: Example terminal output showing scenario evaluation results*
 ## Features
@@ -135,7 +141,7 @@ module.exports = {
   defaultAdapter: 'copilot',
   // Default LLM model for judge
-  defaultModel: 'openai/gpt-4.1',
+  defaultModel: 'openai/gpt-5',
   // Default timeout for code generation (milliseconds)
   // Individual scenarios can override this
@@ -172,33 +178,15 @@ module.exports = {
       id: 'react-no-inline-styles',
       category: 'react',
       severity: 'major',
-      tags: ['react', 'styling', 'best-practices'],
       description: 'Forbid inline style objects in React components',
-      prompt: 'Create a React functional component called Button that accepts a "label" prop and renders a styled button. Use CSS classes instead of inline styles.',
       validationStrategy: {
         patterns: {
-          forbiddenPatterns: [/style\s*=\s*\{\{/, /style\s*=\s*\{[^}]*\}/],
+          forbiddenPatterns: [/style\s*=\s*\{\{/],
           requiredPatterns: [/className/],
         },
       },
     },
-    {
-      id: 'async-error-handling',
-      category: 'general',
-      severity: 'critical',
-      tags: ['async', 'error-handling', 'robustness'],
-      description: 'Ensure async functions have proper error handling',
-      prompt: 'Create an async function called fetchUserData that takes a userId parameter, makes an HTTP request to fetch user data, and returns the user object. Handle errors appropriately.',
-      validationStrategy: {
-        patterns: {
-          requiredPatterns: [/async\s+function\s+fetchUserData|const\s+fetchUserData.*async/, /try|catch|\.catch\(/],
-        },
-        llmJudge: {
-          enabled: true,
-          judgmentPrompt: 'Evaluate the error handling in this async function. Does it use try/catch or .catch()? Are errors logged or re-thrown appropriately?',
-        },
-      },
-    },
+    // Add more scenarios...
   ],
 };
 ```
@@ -211,29 +199,6 @@ You can configure timeouts at three levels (in order of precedence):
 2. **Global default**: Set `defaultTimeout` in your config file
 3. **Built-in default**: 120000ms (2 minutes) if nothing else is specified
-```javascript
-// In benchmarks.config.js
-module.exports = {
-  // Global default applies to all scenarios
-  defaultTimeout: 180000, // 3 minutes
-  scenarios: [
-    {
-      id: 'quick-check',
-      prompt: '...',
-      timeout: 60000, // Override: 1 minute for this scenario
-      // ...
-    },
-    {
-      id: 'complex-task',
-      prompt: '...',
-      // Will use defaultTimeout (3 minutes)
-      // ...
-    },
-  ],
-};
-```
 **Why configure timeouts?**
 - Complex code generation tasks may need more time
 - Simple checks can complete faster with shorter timeouts
@@ -271,133 +236,73 @@ validationStrategy: {
 ### LLM-as-Judge
-Semantic evaluation using AI:
+Semantic evaluation using AI (requires `GITHUB_TOKEN`):
 ```javascript
 validationStrategy: {
   llmJudge: {
     enabled: true,
-    model: 'openai/gpt-4.1', // or 'gpt-4o'
+    model: 'openai/gpt-5',
     judgmentPrompt: `Evaluate if the code follows best practices...`,
   },
 }
 ```
-The LLM judge requires a `GITHUB_TOKEN` environment variable with access to GitHub Models API.
 ### ESLint Integration
 ![WhatsApp Image 2026-01-24 at 2 09 11 PM](https://github.com/user-attachments/assets/12af93e8-ed7c-4153-a183-20601a925965)
+*Figure 3: ESLint validator detecting code quality issues in generated code*
 Run ESLint on generated code:
 ```javascript
 validationStrategy: {
-  eslint: {
-    enabled: true,
-    configPath: '.eslintrc.js', // optional
-  },
+  eslint: { enabled: true, configPath: '.eslintrc.js' },
 }
 ```
 ## Scoring System
-The scoring system operates at three levels: per-validator scoring, per-scenario scoring, and summary scoring.
 ### Per-Validator Scoring
-Each validator (Pattern, LLM Judge, ESLint) independently evaluates the generated code and produces a score from 0.0 to 1.0:
-#### Pattern Validator
-Uses exponential decay based on weighted violations:
-```
-score = e^(-totalWeight)
-```
-Where `totalWeight` is the sum of violation weights:
-- **Critical violations**: 1.0 weight each
-- **Major violations**: 0.7 weight each
-- **Minor violations**: 0.3 weight each
-**Examples**:
-- 0 violations → score = 1.0 (perfect)
-- 1 critical violation → score ≈ 0.37
-- 1 major violation → score ≈ 0.50
-- 2 minor violations → score ≈ 0.55
-#### LLM Judge Validator
-The LLM (GPT-4 or other model) evaluates the code semantically and returns:
-- An `overallScore` from 0.0 to 1.0
-- A list of violations with explanations
-- Passed if: score ≥ 0.7 AND no violations
-The LLM judge provides semantic understanding beyond pattern matching, evaluating whether the code actually solves the problem correctly and follows best practices.
-#### ESLint Validator
-This validator runs ESLint on the generated code and scores based on the number and severity of linting violations. Note that ESLint must be installed and configured in your project for this validator to work. If you don't have ESLint set up globally, disable this validator or provide a custom validator.
-Uses exponential decay with a dampening factor:
-```
-score = e^(-totalWeight / 2)
-```
+Each validator independently evaluates generated code and produces a score from 0.0 to 1.0:
-ESLint violations are mapped to severity:
-- ESLint error (severity 2) → **Major** violation (0.7 weight)
-- ESLint warning (severity 1) → **Minor** violation (0.3 weight)
-The `/2` dampening factor makes ESLint less punitive since projects often have many minor linting issues.
+| Validator | Scoring Method | Notes |
+|-----------|----------------|-------|
+| **Pattern** | Exponential decay based on weighted violations: `score = e^(-totalWeight)` | Critical: 1.0 weight, Major: 0.7 weight, Minor: 0.3 weight |
+| **LLM Judge** | AI evaluates semantically, returns 0.0-1.0 score | Passes if score ≥ 0.7 AND no violations |
+| **ESLint** | Exponential decay with dampening factor (÷2) | ESLint errors → Major (0.7), warnings → Minor (0.3) |
 ### Per-Scenario Scoring
-Each scenario receives an **overall score** calculated as:
-```
-overallScore = average of all active validator scores
-```
+Each scenario receives an **overall score** equal to the **average of all active validator scores**.
-**Active validators** are those that:
-- Are configured in the scenario's `validationStrategy`
-- Successfully ran (did not return score = -1)
+**Active validators** are those configured in `validationStrategy` that successfully ran (score ≠ -1).
 **Pass/Fail Criteria**:
 - ✅ **PASS**: `overallScore ≥ 0.8` AND `violations.length === 0`
 - ❌ **FAIL**: `overallScore < 0.8` OR `violations.length > 0`
 - ⚠️ **SKIP**: An error occurred during evaluation (timeout, adapter failure, etc.)
-**Example**: If Pattern validator returns 0.9, LLM Judge returns 0.8, and ESLint is skipped:
-```
-overallScore = (0.9 + 0.8) / 2 = 0.85
-```
+**Example**: Pattern (0.9) + LLM Judge (0.8) + ESLint (skipped) → `overallScore = (0.9 + 0.8) / 2 = 0.85`
 ### Summary Scoring
-After evaluating all scenarios, the framework calculates summary statistics:
+After evaluating all scenarios, the framework calculates:
 ```javascript
 {
-  total: 10,              // Total number of scenarios
-  passed: 7,              // Scenarios with overallScore ≥ 0.8 and no violations
-  failed: 2,              // Scenarios evaluated but didn't pass
-  skipped: 1,             // Scenarios that encountered errors
-  averageScore: 0.78,     // Average of all scenario overallScores
+  total: 10,              // Total scenarios
+  passed: 7,              // overallScore ≥ 0.8 and no violations
+  failed: 2,              // Evaluated but didn't pass
+  skipped: 1,             // Encountered errors
+  averageScore: 0.78,     // Average of all scenario scores
   totalViolations: 8      // Sum of violations across all scenarios
 }
 ```
-**Average Score Calculation**:
-```
-averageScore = (sum of all scenario scores) / total scenarios
-```
-This includes scores from failed scenarios, providing an overall quality metric across your entire test suite.
-**Transparency**: When baselines are saved, the per-validator breakdown is included in the baseline file, allowing you to trace exactly which validator contributed what score. See [Baseline File Format](#baseline-file-format) for details.
+**Transparency**: Baselines include per-validator breakdowns. See [Baseline File Format](#baseline-file-format) for details.
 ### Score Interpretation
@@ -417,11 +322,6 @@ When baseline tracking is enabled, you'll see delta metrics:
     ↑ +18.5% improvement from baseline
 ```
-The percentage is calculated as:
-```
-percentage = (currentScore - baselineScore) / baselineScore * 100
-```
 ## Baseline Tracking
 Track evaluation results over time by enabling baseline management in your config file:
@@ -449,42 +349,21 @@ When `compareBaseline` is enabled, the report will show score deltas and whether
 ### Baseline File Format
-Each baseline file contains complete transparency into how the score was calculated:
+Path: `.benchmarks/baselines/{adapter}/{model}/{scenario-id}.json`
+Each baseline file provides complete score traceability:
 ```json
 {
   "scenarioId": "typescript-no-any",
   "score": 0.85,
   "violations": [
-    {
-      "type": "pattern",
-      "message": "Forbidden pattern found: :\\s*any\\b",
-      "file": "src/types.ts",
-      "line": 12,
-      "severity": "critical",
-      "details": "Matched: \"metadata: any\""
-    }
+    { "type": "pattern", "message": "Forbidden pattern found: :\\s*any\\b", "file": "src/types.ts", ... }
   ],
   "validationResults": [
-    {
-      "passed": false,
-      "score": 0.37,
-      "violations": [...],
-      "validatorType": "pattern"
-    },
-    {
-      "passed": true,
-      "score": 1.0,
-      "violations": [],
-      "validatorType": "llm-judge"
-    },
-    {
-      "passed": true,
-      "score": -1,
-      "violations": [],
-      "validatorType": "eslint",
-      "error": "ESLint not found"
-    }
+    { "passed": false, "score": 0.37, "validatorType": "pattern", "violations": [...] },
+    { "passed": true, "score": 1.0, "validatorType": "llm-judge", "violations": [] },
+    { "passed": true, "score": -1, "validatorType": "eslint", "error": "ESLint not found" }
   ],
   "timestamp": "2026-01-23T22:28:32.216Z",
   "adapter": "copilot",
@@ -493,15 +372,11 @@ Each baseline file contains complete transparency into how the score was calcula
 ```
 **Key fields**:
-- `score`: Overall scenario score (average of active validators)
-- `violations`: All violations from all validators combined
-- `validationResults`: Per-validator breakdown showing:
-  - Individual validator score
-  - Whether that validator passed
-  - Violations specific to that validator
-  - Any errors that occurred (`score: -1` means skipped)
+- `score` - Overall scenario score (average of active validators)
+- `violations` - All violations from all validators combined
+- `validationResults` - Per-validator breakdown (score, passed, violations, errors)
-**Score Traceability**: With this format, you can always trace the overall score back to individual validator scores. For example, if you see `score: 0.067`, you can look at `validationResults` to see which validators contributed what scores (e.g., Pattern: 0.135, LLM Judge: 0.00).
+**Traceability**: You can always trace the overall score back to individual validator scores (e.g., `score: 0.067` → check `validationResults` for Pattern: 0.135, LLM Judge: 0.00).
 ## CLI Commands
@@ -509,24 +384,26 @@ Each baseline file contains complete transparency into how the score was calcula
 Run benchmark evaluations.
-**Options:**
-- `--scenario <pattern>`: Filter by scenario ID (supports wildcards like `typescript-*`)
-- `--category <categories>`: Filter by category (comma-separated)
-- `--tag <tags>`: Filter by tags (comma-separated)
-- `--adapter <type>`: Adapter to use (`copilot` or `claude-code`)
-- `--model <model>`: LLM model for judge (default: `openai/gpt-4.1`)
-- `--threshold <number>`: Minimum passing score (default: `0.8`)
-- `--verbose`: Show detailed output
-- `--output <file>`: Export JSON report
-- `--workspace-root <path>`: Workspace root directory
+| Option | Description | Default/Example |
+|--------|-------------|-----------------|
+| `--scenario <pattern>` | Filter by scenario ID (supports wildcards) | `typescript-*` |
+| `--category <categories>` | Filter by category (comma-separated) | `typescript,react` |
+| `--tag <tags>` | Filter by tags (comma-separated) | `safety,types` |
+| `--adapter <type>` | Adapter to use | `copilot` or `claude-code` |
+| `--model <model>` | LLM model for judge | `openai/gpt-5` |
+| `--threshold <number>` | Minimum passing score | `0.8` |
+| `--verbose` | Show detailed output | - |
+| `--output <file>` | Export JSON report | `report.json` |
+| `--workspace-root <path>` | Workspace root directory | Current directory |
 ### `list`
 List available test scenarios.
-**Options:**
-- `--category <categories>`: Filter by category
-- `--tag <tags>`: Filter by tags
+| Option | Description |
+|--------|-------------|
+| `--category <categories>` | Filter by category (comma-separated) |
+| `--tag <tags>` | Filter by tags (comma-separated) |
 ### `check`
@@ -536,8 +413,9 @@ Check if coding agent CLIs are available.
 Test LLM judge with a custom prompt (for debugging).
-**Options:**
-- `--model <model>`: LLM model to use
+| Option | Description |
+|--------|-------------|
+| `--model <model>` | LLM model to use |
 ## Understanding Output
@@ -586,26 +464,15 @@ import { Evaluator, loadConfig } from 'coding-agent-benchmarks';
 async function runEvaluation() {
   const { config, scenarios } = await loadConfig();
-  // Create evaluator
   const evaluator = new Evaluator({
     adapter: 'copilot',
-    model: 'openai/gpt-4.1',
+    model: 'openai/gpt-5',
     verbose: true,
     saveBaseline: config.saveBaseline,
     compareBaseline: config.compareBaseline,
   });
-  // Check adapter availability
-  const available = await evaluator.checkAdapterAvailability();
-  if (!available) {
-    throw new Error('Adapter not available');
-  }
-  // Run evaluation
   const report = await evaluator.evaluate(scenarios);
-  console.log(`Passed: ${report.summary.passed}/${report.summary.total}`);
-  console.log(`Average score: ${report.summary.averageScore.toFixed(2)}`);
 }
 runEvaluation();
@@ -616,106 +483,62 @@ runEvaluation();
 Implement the `CodeValidator` interface:
 ```typescript
-import { CodeValidator, ValidationResult, TestScenario } from 'coding-agent-benchmarks';
+import { CodeValidator, ValidationResult } from 'coding-agent-benchmarks';
 export class CustomValidator implements CodeValidator {
   public readonly type = 'custom';
-  async validate(
-    files: readonly string[],
-    scenario: TestScenario
-  ): Promise<ValidationResult> {
+  async validate(files: readonly string[], scenario: TestScenario): Promise<ValidationResult> {
     // Your validation logic here
-    return {
-      passed: true,
-      score: 1.0,
-      violations: [],
-      validatorType: 'custom',
-    };
+    return { passed: true, score: 1.0, violations: [], validatorType: 'custom' };
   }
 }
 ```
+See CONTRIBUTING.md for complete examples.
 ## Creating Custom Adapters
 Implement the `CodeGenerationAdapter` interface:
 ```typescript
-import { CodeGenerationAdapter, AdapterType } from 'coding-agent-benchmarks';
+import { CodeGenerationAdapter } from 'coding-agent-benchmarks';
 export class CustomAdapter implements CodeGenerationAdapter {
-  public readonly type: AdapterType = 'copilot'; // or extend the type
-  async checkAvailability(): Promise<boolean> {
-    // Check if CLI is available
-    return true;
-  }
+  public readonly type = 'custom-adapter';
-  async generate(
-    prompt: string,
-    contextFiles?: readonly string[],
-    timeout?: number
-  ): Promise<string[]> {
-    // Generate code and return changed files
-    return ['path/to/generated/file.ts'];
-  }
+  async checkAvailability(): Promise<boolean> { /* ... */ }
+  async generate(prompt: string, contextFiles?: readonly string[], timeout?: number): Promise<string[]> { /* ... */ }
 }
 ```
+See CONTRIBUTING.md for complete examples.
 ## GitHub Authentication (for LLM Judge)
-LLM-as-judge validation requires GitHub authentication to access GitHub Models API. There are **two easy options** - no OAuth registration needed!
+LLM-as-judge validation requires GitHub authentication to access GitHub Models API. Choose one option:
 ### Option 1: Personal Access Token (Recommended)
-1. Create token at https://github.com/settings/tokens
-2. Click "Generate new token (classic)"
-3. Give it a name (e.g., "coding-agent-benchmarks")
-4. Select scope: **`models:read`**
-5. Generate and copy the token
-6. Set environment variable:
-   ```bash
-   export GITHUB_TOKEN=ghp_xxxxxxxxxxxxxxxxxxxx
-   ```
+Create a token at https://github.com/settings/tokens with the **`models:read`** scope, then set it as an environment variable:
+```bash
+export GITHUB_TOKEN=ghp_xxxxxxxxxxxxxxxxxxxx
+```
 ### Option 2: GitHub CLI (Automatic)
-If you have GitHub CLI installed, tokens are auto-detected:
+If GitHub CLI is installed, tokens are auto-detected:
 ```bash
-# Install GitHub CLI
-brew install gh          # macOS
-# or download from https://cli.github.com
-# Authenticate (one time)
+brew install gh  # or download from https://cli.github.com
 gh auth login
 # Token will be used automatically - no GITHUB_TOKEN needed!
 ```
-### Check Authentication Status
-```bash
-npx coding-agent-benchmarks check
-```
-Output:
-```
-Checking adapter availability...
-  GitHub Copilot CLI: ✓ Available
-  Claude Code CLI: ✗ Not found
-Checking GitHub authentication...
-  ✓ Using token from GitHub CLI (gh auth token)
-```
-## How It Works
+### Check Authentication
-1. **Code Generation**: The adapter spawns a coding agent CLI with a prompt
-2. **File Tracking**: Git is used to detect which files were created/modified
-3. **Validation**: Multiple validators check the generated code
-4. **Scoring**: Results are aggregated and compared against thresholds
-5. **Reporting**: Results are displayed in terminal and optionally exported as JSON
+Run `npx coding-agent-benchmarks check` to verify authentication status.
 ## Requirements

package/dist/adapters/claudeCodeCLI.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"claudeCodeCLI.d.ts","sourceRoot":"","sources":["../../src/adapters/claudeCodeCLI.ts"],"names":[],"mappings":"AAAA;;GAEG;AAKH,OAAO,EAAE,qBAAqB,EAAE,MAAM,UAAU,CAAC;AAOjD,MAAM,WAAW,2BAA2B;IAC1C,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAID,qBAAa,oBAAqB,YAAW,qBAAqB;IAChE,SAAgB,IAAI,EAAG,aAAa,CAAU;IAC9C,OAAO,CAAC,aAAa,CAAS;IAC9B,OAAO,CAAC,KAAK,CAAS;gBAEV,OAAO,CAAC,EAAE,2BAA2B;IAKjD;;OAEG;IACG,iBAAiB,IAAI,OAAO,CAAC,OAAO,CAAC;IAgB3C;;OAEG;IACH,QAAQ,IAAI,MAAM;IAIlB;;OAEG;IACH,OAAO,CAAC,WAAW;IA8BnB;;;OAGG;IACG,QAAQ,CACZ,MAAM,EAAE,MAAM,EACd,YAAY,CAAC,EAAE,SAAS,MAAM,EAAE,EAChC,OAAO,CAAC,EAAE,MAAM,GAAG,IAAI,GACtB,OAAO,CAAC,MAAM,EAAE,CAAC;~~CA6GrB~~"}
1	+ {"version":3,"file":"claudeCodeCLI.d.ts","sourceRoot":"","sources":["../../src/adapters/claudeCodeCLI.ts"],"names":[],"mappings":"AAAA;;GAEG;AAKH,OAAO,EAAE,qBAAqB,EAAE,MAAM,UAAU,CAAC;AAOjD,MAAM,WAAW,2BAA2B;IAC1C,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAID,qBAAa,oBAAqB,YAAW,qBAAqB;IAChE,SAAgB,IAAI,EAAG,aAAa,CAAU;IAC9C,OAAO,CAAC,aAAa,CAAS;IAC9B,OAAO,CAAC,KAAK,CAAS;gBAEV,OAAO,CAAC,EAAE,2BAA2B;IAKjD;;OAEG;IACG,iBAAiB,IAAI,OAAO,CAAC,OAAO,CAAC;IAgB3C;;OAEG;IACH,QAAQ,IAAI,MAAM;IAIlB;;OAEG;IACH,OAAO,CAAC,WAAW;IA8BnB;;;OAGG;IACG,QAAQ,CACZ,MAAM,EAAE,MAAM,EACd,YAAY,CAAC,EAAE,SAAS,MAAM,EAAE,EAChC,OAAO,CAAC,EAAE,MAAM,GAAG,IAAI,GACtB,OAAO,CAAC,MAAM,EAAE,CAAC;CAuGrB"}

package/dist/adapters/claudeCodeCLI.js CHANGED Viewed

@@ -105,13 +105,10 @@ class ClaudeCodeCLIAdapter {
             throw new Error("Claude Code CLI is not available. Please install it first: https://docs.anthropic.com/en/docs/build-with-claude/claude-code");
         }
         const fullPrompt = this.buildPrompt(prompt, contextFiles);
-        // Capture git status before generation
         const statusBefore = (0, gitUtils_1.getGitStatusPorcelain)(this.workspaceRoot);
-        // Write prompt to temp file and pipe via stdin (matches @copilot-evals pattern)
         return new Promise((resolve, reject) => {
             const tempFile = path.join(this.workspaceRoot, ".claude-eval-prompt.txt");
             fs.writeFileSync(tempFile, fullPrompt, "utf8");
-            // Cleanup function
             const cleanup = () => {
                 try {
                     if (fs.existsSync(tempFile)) {
@@ -122,7 +119,6 @@ class ClaudeCodeCLIAdapter {
                     // Ignore cleanup errors
                 }
             };
-            // Register cleanup on process termination
             const cleanupOnExit = () => {
                 cleanup();
             };
@@ -142,7 +138,6 @@ class ClaudeCodeCLIAdapter {
             proc.stderr?.on("data", (data) => {
                 stderr += data.toString();
             });
-            // Set timeout only if specified (null/undefined = no timeout)
             let timeoutHandle = null;
             if (timeout !== null && timeout !== undefined) {
                 timeoutHandle = setTimeout(() => {
@@ -164,7 +159,6 @@ class ClaudeCodeCLIAdapter {
                     reject(new Error(`Claude Code CLI exited with code ${code}\nStderr: ${stderr}`));
                     return;
                 }
-                // Get files changed during generation (diff before/after)
                 try {
                     const statusAfter = (0, gitUtils_1.getGitStatusPorcelain)(this.workspaceRoot);
                     const changedFiles = (0, gitUtils_1.getChangedFilesDiff)(statusBefore, statusAfter, this.workspaceRoot);

package/dist/adapters/claudeCodeCLI.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"claudeCodeCLI.js","sourceRoot":"","sources":["../../src/adapters/claudeCodeCLI.ts"],"names":[],"mappings":";AAAA;;GAEG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAEH,iDAAsC;AACtC,uCAAyB;AACzB,2CAA6B;AAE7B,gDAA+E;AAC/E,4DAGiC;AAOjC,MAAM,aAAa,GAAG,QAAQ,CAAC;AAE/B,MAAa,oBAAoB;IAK/B,YAAY,OAAqC;QAJjC,SAAI,GAAG,aAAsB,CAAC;QAK5C,IAAI,CAAC,aAAa,GAAG,IAAA,qCAAoB,EAAC,OAAO,EAAE,aAAa,CAAC,CAAC;QAClE,IAAI,CAAC,KAAK,GAAG,OAAO,EAAE,KAAK,IAAI,aAAa,CAAC;IAC/C,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,iBAAiB;QACrB,OAAO,IAAI,OAAO,CAAC,CAAC,OAAO,EAAE,EAAE;YAC7B,MAAM,IAAI,GAAG,IAAA,qBAAK,EAAC,OAAO,EAAE,CAAC,QAAQ,CAAC,EAAE;gBACtC,KAAK,EAAE,MAAM;aACd,CAAC,CAAC;YAEH,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,CAAC,IAAI,EAAE,EAAE;gBACxB,OAAO,CAAC,IAAI,KAAK,CAAC,CAAC,CAAC;YACtB,CAAC,CAAC,CAAC;YAEH,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,GAAG,EAAE;gBACpB,OAAO,CAAC,KAAK,CAAC,CAAC;YACjB,CAAC,CAAC,CAAC;QACL,CAAC,CAAC,CAAC;IACL,CAAC;IAED;;OAEG;IACH,QAAQ;QACN,OAAO,IAAI,CAAC,KAAK,CAAC;IACpB,CAAC;IAED;;OAEG;IACK,WAAW,CACjB,MAAc,EACd,YAAgC;QAEhC,MAAM,KAAK,GAAa,EAAE,CAAC;QAE3B,IAAI,YAAY,IAAI,YAAY,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC5C,MAAM,QAAQ,GAAG,IAAA,iCAAgB,EAAC,IAAI,CAAC,aAAa,EAAE,YAAY,CAAC,CAAC;YACpE,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBACxB,KAAK,CAAC,IAAI,CAAC,qBAAqB,CAAC,CAAC;gBAClC,MAAM,cAAc,GAAG,QAAQ;qBAC5B,GAAG,CAAC,CAAC,GAAG,EAAE,EAAE;oBACX,MAAM,GAAG,GAAG,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,IAAI,YAAY,CAAC;oBAC5D,OAAO,OAAO,GAAG,CAAC,IAAI,WAAW,GAAG,KAAK,GAAG,CAAC,OAAO,UAAU,CAAC;gBACjE,CAAC,CAAC;qBACD,IAAI,CAAC,MAAM,CAAC,CAAC;gBAChB,KAAK,CAAC,IAAI,CAAC,cAAc,CAAC,CAAC;gBAC3B,KAAK,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;YACxB,CAAC;QACH,CAAC;QAED,KAAK,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;QACvB,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QACnB,KAAK,CAAC,IAAI,CACR,0GAA0G,CAC3G,CAAC;QAEF,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC1B,CAAC;IAED;;;OAGG;IACH,KAAK,CAAC,QAAQ,CACZ,MAAc,EACd,YAAgC,EAChC,OAAuB;QAEvB,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,iBAAiB,EAAE,CAAC;QACnD,IAAI,CAAC,WAAW,EAAE,CAAC;YACjB,MAAM,IAAI,KAAK,CACb
,6HAA6H,CAC9H,CAAC;QACJ,CAAC;QAED,MAAM,UAAU,GAAG,IAAI,CAAC,WAAW,CAAC,MAAM,EAAE,YAAY,CAAC,CAAC;QAE1D,~~uCAAuC;QACvC,~~MAAM,YAAY,GAAG,IAAA,gCAAqB,EAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAE/D,~~gFAAgF;QAChF,~~OAAO,IAAI,OAAO,CAAC,CAAC,OAAO,EAAE,MAAM,EAAE,EAAE;YACrC,MAAM,QAAQ,GAAG,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,aAAa,EAAE,yBAAyB,CAAC,CAAC;YAC1E,EAAE,CAAC,aAAa,CAAC,QAAQ,EAAE,UAAU,EAAE,MAAM,CAAC,CAAC;YAE/C,~~mBAAmB;YACnB,~~MAAM,OAAO,GAAG,GAAS,EAAE;gBACzB,IAAI,CAAC;oBACH,IAAI,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;wBAC5B,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC;oBAC1B,CAAC;gBACH,CAAC;gBAAC,MAAM,CAAC;oBACP,wBAAwB;gBAC1B,CAAC;YACH,CAAC,CAAC;YAEF,~~0CAA0C;YAC1C,~~MAAM,aAAa,GAAG,GAAS,EAAE;gBAC/B,OAAO,EAAE,CAAC;YACZ,CAAC,CAAC;YACF,OAAO,CAAC,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;YACtC,OAAO,CAAC,IAAI,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;YAEvC,MAAM,OAAO,GAAG,QAAQ,QAAQ,sBAAsB,IAAI,CAAC,KAAK,yIAAyI,CAAC;YAC1M,MAAM,IAAI,GAAG,IAAA,qBAAK,EAAC,IAAI,EAAE,CAAC,IAAI,EAAE,OAAO,CAAC,EAAE;gBACxC,GAAG,EAAE,IAAI,CAAC,aAAa;gBACvB,KAAK,EAAE,CAAC,MAAM,EAAE,MAAM,EAAE,MAAM,CAAC;aAChC,CAAC,CAAC;YAEH,6DAA6D;YAC7D,IAAI,MAAM,GAAG,EAAE,CAAC;YAChB,IAAI,MAAM,GAAG,EAAE,CAAC;YAEhB,IAAI,CAAC,MAAM,EAAE,EAAE,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,EAAE;gBAC/B,MAAM,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;YAC5B,CAAC,CAAC,CAAC;YAEH,IAAI,CAAC,MAAM,EAAE,EAAE,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,EAAE;gBAC/B,MAAM,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;YAC5B,CAAC,CAAC,CAAC;YAEH,~~8DAA8D;YAC9D,~~IAAI,aAAa,GAA0B,IAAI,CAAC;YAChD,IAAI,OAAO,KAAK,IAAI,IAAI,OAAO,KAAK,SAAS,EAAE,CAAC;gBAC9C,aAAa,GAAG,UAAU,CAAC,GAAG,EAAE;oBAC9B,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;oBACrB,OAAO,EAAE,CAAC;oBACV,OAAO,CAAC,cAAc,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;oBAChD,OAAO,CAAC,cAAc,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;oBACjD,MAAM,CAAC,IAAI,KAAK,CAAC,mCAAmC,OAAO,IAAI,CAAC,CAAC,CAAC;gBACpE,CAAC,EAAE,OAAO,CAAC,CAAC;YACd,CAAC;YAED,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,CAAC,IAAI,EAAE,EAAE;gBACxB,IAAI,aAAa,EAAE,CAAC;oBAClB,YAAY,CAAC,aAAa,CAAC,CAAC;gBAC9B,CAAC;gBAED,OAAO,EAAE,CAAC;gBACV,OAAO,CAAC,cAAc,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;gBAChD,
OAAO,CAAC,cAAc,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;gBAEjD,IAAI,IAAI,KAAK,CAAC,EAAE,CAAC;oBACf,MAAM,CACJ,IAAI,KAAK,CACP,oCAAoC,IAAI,aAAa,MAAM,EAAE,CAC9D,CACF,CAAC;oBACF,OAAO;gBACT,CAAC;gBAED,~~0DAA0D;gBAC1D,~~IAAI,CAAC;oBACH,MAAM,WAAW,GAAG,IAAA,gCAAqB,EAAC,IAAI,CAAC,aAAa,CAAC,CAAC;oBAC9D,MAAM,YAAY,GAAG,IAAA,8BAAmB,EACtC,YAAY,EACZ,WAAW,EACX,IAAI,CAAC,aAAa,CACnB,CAAC;oBACF,OAAO,CAAC,YAAY,CAAC,CAAC;gBACxB,CAAC;gBAAC,OAAO,KAAK,EAAE,CAAC;oBACf,MAAM,CAAC,IAAI,KAAK,CAAC,gCAAgC,KAAK,EAAE,CAAC,CAAC,CAAC;gBAC7D,CAAC;YACH,CAAC,CAAC,CAAC;YAEH,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,CAAC,KAAK,EAAE,EAAE;gBACzB,IAAI,aAAa,EAAE,CAAC;oBAClB,YAAY,CAAC,aAAa,CAAC,CAAC;gBAC9B,CAAC;gBACD,OAAO,EAAE,CAAC;gBACV,OAAO,CAAC,cAAc,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;gBAChD,OAAO,CAAC,cAAc,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;gBACjD,MAAM,CAAC,IAAI,KAAK,CAAC,oCAAoC,KAAK,EAAE,CAAC,CAAC,CAAC;YACjE,CAAC,CAAC,CAAC;QACL,CAAC,CAAC,CAAC;IACL,CAAC;CACF;~~AA1LD~~,~~oDA0LC~~"}
1	+ {"version":3,"file":"claudeCodeCLI.js","sourceRoot":"","sources":["../../src/adapters/claudeCodeCLI.ts"],"names":[],"mappings":";AAAA;;GAEG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAEH,iDAAsC;AACtC,uCAAyB;AACzB,2CAA6B;AAE7B,gDAA+E;AAC/E,4DAGiC;AAOjC,MAAM,aAAa,GAAG,QAAQ,CAAC;AAE/B,MAAa,oBAAoB;IAK/B,YAAY,OAAqC;QAJjC,SAAI,GAAG,aAAsB,CAAC;QAK5C,IAAI,CAAC,aAAa,GAAG,IAAA,qCAAoB,EAAC,OAAO,EAAE,aAAa,CAAC,CAAC;QAClE,IAAI,CAAC,KAAK,GAAG,OAAO,EAAE,KAAK,IAAI,aAAa,CAAC;IAC/C,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,iBAAiB;QACrB,OAAO,IAAI,OAAO,CAAC,CAAC,OAAO,EAAE,EAAE;YAC7B,MAAM,IAAI,GAAG,IAAA,qBAAK,EAAC,OAAO,EAAE,CAAC,QAAQ,CAAC,EAAE;gBACtC,KAAK,EAAE,MAAM;aACd,CAAC,CAAC;YAEH,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,CAAC,IAAI,EAAE,EAAE;gBACxB,OAAO,CAAC,IAAI,KAAK,CAAC,CAAC,CAAC;YACtB,CAAC,CAAC,CAAC;YAEH,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,GAAG,EAAE;gBACpB,OAAO,CAAC,KAAK,CAAC,CAAC;YACjB,CAAC,CAAC,CAAC;QACL,CAAC,CAAC,CAAC;IACL,CAAC;IAED;;OAEG;IACH,QAAQ;QACN,OAAO,IAAI,CAAC,KAAK,CAAC;IACpB,CAAC;IAED;;OAEG;IACK,WAAW,CACjB,MAAc,EACd,YAAgC;QAEhC,MAAM,KAAK,GAAa,EAAE,CAAC;QAE3B,IAAI,YAAY,IAAI,YAAY,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC5C,MAAM,QAAQ,GAAG,IAAA,iCAAgB,EAAC,IAAI,CAAC,aAAa,EAAE,YAAY,CAAC,CAAC;YACpE,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBACxB,KAAK,CAAC,IAAI,CAAC,qBAAqB,CAAC,CAAC;gBAClC,MAAM,cAAc,GAAG,QAAQ;qBAC5B,GAAG,CAAC,CAAC,GAAG,EAAE,EAAE;oBACX,MAAM,GAAG,GAAG,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,IAAI,YAAY,CAAC;oBAC5D,OAAO,OAAO,GAAG,CAAC,IAAI,WAAW,GAAG,KAAK,GAAG,CAAC,OAAO,UAAU,CAAC;gBACjE,CAAC,CAAC;qBACD,IAAI,CAAC,MAAM,CAAC,CAAC;gBAChB,KAAK,CAAC,IAAI,CAAC,cAAc,CAAC,CAAC;gBAC3B,KAAK,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;YACxB,CAAC;QACH,CAAC;QAED,KAAK,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;QACvB,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QACnB,KAAK,CAAC,IAAI,CACR,0GAA0G,CAC3G,CAAC;QAEF,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC1B,CAAC;IAED;;;OAGG;IACH,KAAK,CAAC,QAAQ,CACZ,MAAc,EACd,YAAgC,EAChC,OAAuB;QAEvB,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,iBAAiB,EAAE,CAAC;QACnD,IAAI,CAAC,WAAW,EAAE,CAAC;YACjB,MAAM,IAAI,KAAK,CACb
,6HAA6H,CAC9H,CAAC;QACJ,CAAC;QAED,MAAM,UAAU,GAAG,IAAI,CAAC,WAAW,CAAC,MAAM,EAAE,YAAY,CAAC,CAAC;QAE1D,MAAM,YAAY,GAAG,IAAA,gCAAqB,EAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAE/D,OAAO,IAAI,OAAO,CAAC,CAAC,OAAO,EAAE,MAAM,EAAE,EAAE;YACrC,MAAM,QAAQ,GAAG,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,aAAa,EAAE,yBAAyB,CAAC,CAAC;YAC1E,EAAE,CAAC,aAAa,CAAC,QAAQ,EAAE,UAAU,EAAE,MAAM,CAAC,CAAC;YAE/C,MAAM,OAAO,GAAG,GAAS,EAAE;gBACzB,IAAI,CAAC;oBACH,IAAI,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;wBAC5B,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC;oBAC1B,CAAC;gBACH,CAAC;gBAAC,MAAM,CAAC;oBACP,wBAAwB;gBAC1B,CAAC;YACH,CAAC,CAAC;YAEF,MAAM,aAAa,GAAG,GAAS,EAAE;gBAC/B,OAAO,EAAE,CAAC;YACZ,CAAC,CAAC;YACF,OAAO,CAAC,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;YACtC,OAAO,CAAC,IAAI,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;YAEvC,MAAM,OAAO,GAAG,QAAQ,QAAQ,sBAAsB,IAAI,CAAC,KAAK,yIAAyI,CAAC;YAC1M,MAAM,IAAI,GAAG,IAAA,qBAAK,EAAC,IAAI,EAAE,CAAC,IAAI,EAAE,OAAO,CAAC,EAAE;gBACxC,GAAG,EAAE,IAAI,CAAC,aAAa;gBACvB,KAAK,EAAE,CAAC,MAAM,EAAE,MAAM,EAAE,MAAM,CAAC;aAChC,CAAC,CAAC;YAEH,6DAA6D;YAC7D,IAAI,MAAM,GAAG,EAAE,CAAC;YAChB,IAAI,MAAM,GAAG,EAAE,CAAC;YAEhB,IAAI,CAAC,MAAM,EAAE,EAAE,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,EAAE;gBAC/B,MAAM,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;YAC5B,CAAC,CAAC,CAAC;YAEH,IAAI,CAAC,MAAM,EAAE,EAAE,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,EAAE;gBAC/B,MAAM,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;YAC5B,CAAC,CAAC,CAAC;YAEH,IAAI,aAAa,GAA0B,IAAI,CAAC;YAChD,IAAI,OAAO,KAAK,IAAI,IAAI,OAAO,KAAK,SAAS,EAAE,CAAC;gBAC9C,aAAa,GAAG,UAAU,CAAC,GAAG,EAAE;oBAC9B,IAAI,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;oBACrB,OAAO,EAAE,CAAC;oBACV,OAAO,CAAC,cAAc,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;oBAChD,OAAO,CAAC,cAAc,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;oBACjD,MAAM,CAAC,IAAI,KAAK,CAAC,mCAAmC,OAAO,IAAI,CAAC,CAAC,CAAC;gBACpE,CAAC,EAAE,OAAO,CAAC,CAAC;YACd,CAAC;YAED,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,CAAC,IAAI,EAAE,EAAE;gBACxB,IAAI,aAAa,EAAE,CAAC;oBAClB,YAAY,CAAC,aAAa,CAAC,CAAC;gBAC9B,CAAC;gBAED,OAAO,EAAE,CAAC;gBACV,OAAO,CAAC,cAAc,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;gBAChD,OAAO,CAAC,cAAc,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;gBAEjD,IAAI,IAAI,KAAK,CAAC,EAAE,CAAC;oBA
Cf,MAAM,CACJ,IAAI,KAAK,CACP,oCAAoC,IAAI,aAAa,MAAM,EAAE,CAC9D,CACF,CAAC;oBACF,OAAO;gBACT,CAAC;gBAED,IAAI,CAAC;oBACH,MAAM,WAAW,GAAG,IAAA,gCAAqB,EAAC,IAAI,CAAC,aAAa,CAAC,CAAC;oBAC9D,MAAM,YAAY,GAAG,IAAA,8BAAmB,EACtC,YAAY,EACZ,WAAW,EACX,IAAI,CAAC,aAAa,CACnB,CAAC;oBACF,OAAO,CAAC,YAAY,CAAC,CAAC;gBACxB,CAAC;gBAAC,OAAO,KAAK,EAAE,CAAC;oBACf,MAAM,CAAC,IAAI,KAAK,CAAC,gCAAgC,KAAK,EAAE,CAAC,CAAC,CAAC;gBAC7D,CAAC;YACH,CAAC,CAAC,CAAC;YAEH,IAAI,CAAC,EAAE,CAAC,OAAO,EAAE,CAAC,KAAK,EAAE,EAAE;gBACzB,IAAI,aAAa,EAAE,CAAC;oBAClB,YAAY,CAAC,aAAa,CAAC,CAAC;gBAC9B,CAAC;gBACD,OAAO,EAAE,CAAC;gBACV,OAAO,CAAC,cAAc,CAAC,QAAQ,EAAE,aAAa,CAAC,CAAC;gBAChD,OAAO,CAAC,cAAc,CAAC,SAAS,EAAE,aAAa,CAAC,CAAC;gBACjD,MAAM,CAAC,IAAI,KAAK,CAAC,oCAAoC,KAAK,EAAE,CAAC,CAAC,CAAC;YACjE,CAAC,CAAC,CAAC;QACL,CAAC,CAAC,CAAC;IACL,CAAC;CACF;AApLD,oDAoLC"}

package/dist/adapters/copilotCLI.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"copilotCLI.d.ts","sourceRoot":"","sources":["../../src/adapters/copilotCLI.ts"],"names":[],"mappings":"AAAA;;GAEG;AAKH,OAAO,EAAE,qBAAqB,EAAE,MAAM,UAAU,CAAC;AAOjD,MAAM,WAAW,wBAAwB;IACvC,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAID,qBAAa,iBAAkB,YAAW,qBAAqB;IAC7D,SAAgB,IAAI,EAAG,SAAS,CAAU;IAC1C,OAAO,CAAC,aAAa,CAAS;IAC9B,OAAO,CAAC,KAAK,CAAS;gBAEV,OAAO,CAAC,EAAE,wBAAwB;IAKxC,iBAAiB,IAAI,OAAO,CAAC,OAAO,CAAC;IAgB3C;;OAEG;IACH,QAAQ,IAAI,MAAM;IAIlB;;OAEG;IACH,OAAO,CAAC,WAAW;IA8BnB;;;OAGG;IACG,QAAQ,CACZ,MAAM,EAAE,MAAM,EACd,YAAY,CAAC,EAAE,SAAS,MAAM,EAAE,EAChC,OAAO,CAAC,EAAE,MAAM,GAAG,IAAI,GACtB,OAAO,CAAC,MAAM,EAAE,CAAC;~~CA+GrB~~"}
1	+ {"version":3,"file":"copilotCLI.d.ts","sourceRoot":"","sources":["../../src/adapters/copilotCLI.ts"],"names":[],"mappings":"AAAA;;GAEG;AAKH,OAAO,EAAE,qBAAqB,EAAE,MAAM,UAAU,CAAC;AAOjD,MAAM,WAAW,wBAAwB;IACvC,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAID,qBAAa,iBAAkB,YAAW,qBAAqB;IAC7D,SAAgB,IAAI,EAAG,SAAS,CAAU;IAC1C,OAAO,CAAC,aAAa,CAAS;IAC9B,OAAO,CAAC,KAAK,CAAS;gBAEV,OAAO,CAAC,EAAE,wBAAwB;IAKxC,iBAAiB,IAAI,OAAO,CAAC,OAAO,CAAC;IAgB3C;;OAEG;IACH,QAAQ,IAAI,MAAM;IAIlB;;OAEG;IACH,OAAO,CAAC,WAAW;IA8BnB;;;OAGG;IACG,QAAQ,CACZ,MAAM,EAAE,MAAM,EACd,YAAY,CAAC,EAAE,SAAS,MAAM,EAAE,EAChC,OAAO,CAAC,EAAE,MAAM,GAAG,IAAI,GACtB,OAAO,CAAC,MAAM,EAAE,CAAC;CAyGrB"}

package/dist/adapters/copilotCLI.js CHANGED Viewed

@@ -102,13 +102,10 @@ class CopilotCLIAdapter {
             throw new Error("GitHub Copilot CLI is not available. Please install it first: https://docs.github.com/en/copilot/how-tos/set-up/install-copilot-cli");
         }
         const fullPrompt = this.buildPrompt(prompt, contextFiles);
-        // Capture git status before generation
         const statusBefore = (0, gitUtils_1.getGitStatusPorcelain)(this.workspaceRoot);
-        // Write prompt to temp file and pipe via stdin (matches @copilot-evals pattern)
         return new Promise((resolve, reject) => {
             const tempFile = path.join(this.workspaceRoot, ".copilot-eval-prompt.txt");
             fs.writeFileSync(tempFile, fullPrompt, "utf8");
-            // Cleanup function
             const cleanup = () => {
                 try {
                     if (fs.existsSync(tempFile)) {
@@ -119,7 +116,6 @@ class CopilotCLIAdapter {
                     // Ignore cleanup errors
                 }
             };
-            // Register cleanup on process termination
             const cleanupOnExit = () => {
                 cleanup();
             };
@@ -138,7 +134,6 @@ class CopilotCLIAdapter {
             proc.stderr?.on("data", (data) => {
                 stderr += data.toString();
             });
-            // Set timeout only if specified (null/undefined = no timeout)
             let timeoutHandle = null;
             if (timeout !== null && timeout !== undefined) {
                 timeoutHandle = setTimeout(() => {
@@ -160,7 +155,6 @@ class CopilotCLIAdapter {
                     reject(new Error(`Copilot CLI exited with code ${code}\nStderr: ${stderr}`));
                     return;
                 }
-                // Get files changed during generation (diff before/after)
                 try {
                     const statusAfter = (0, gitUtils_1.getGitStatusPorcelain)(this.workspaceRoot);
                     const changedFiles = (0, gitUtils_1.getChangedFilesDiff)(statusBefore, statusAfter, this.workspaceRoot);