chorus-cli 0.5.1 → 0.5.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/index.js CHANGED
@@ -62,7 +62,7 @@ async function getMachineId() {
62
62
  }
63
63
 
64
64
  // Run coder.py with real-time stderr streaming so progress is visible
65
- function runCoder(prompt) {
65
+ function runCoder(prompt, { model } = {}) {
66
66
  return new Promise((resolve, reject) => {
67
67
  const env = { ...process.env };
68
68
  if (CONFIG.ai.chorusApiKey) {
@@ -72,7 +72,12 @@ function runCoder(prompt) {
72
72
  if (CONFIG.ai.machineId) {
73
73
  env.CHORUS_MACHINE_ID = CONFIG.ai.machineId;
74
74
  }
75
- const proc = spawn(CONFIG.ai.venvPython, [CONFIG.ai.coderPath, '--prompt', prompt], {
75
+ if (isFreeModel(model)) {
76
+ env.CHORUS_FREE = '1';
77
+ }
78
+ const coderArgs = [CONFIG.ai.coderPath, '--prompt', prompt];
79
+ if (model) { coderArgs.push('--model', model); }
80
+ const proc = spawn(CONFIG.ai.venvPython, coderArgs, {
76
81
  cwd: process.cwd(),
77
82
  env,
78
83
  stdio: ['ignore', 'pipe', 'pipe'],
@@ -103,7 +108,7 @@ function runCoder(prompt) {
103
108
  }
104
109
 
105
110
  // Run qa.py with issue context on stdin, capture JSON from stdout
106
- function runQAChat(issue, enrichedDetails, qaName, useSuper = false) {
111
+ function runQAChat(issue, enrichedDetails, qaName, useSuper = false, { model } = {}) {
107
112
  return new Promise((resolve, reject) => {
108
113
  const input = JSON.stringify({
109
114
  issue_number: issue.number,
@@ -117,6 +122,7 @@ function runQAChat(issue, enrichedDetails, qaName, useSuper = false) {
117
122
  args.push('--auth', CONFIG.teams.authPath);
118
123
  }
119
124
  if (useSuper) {args.push('--super');}
125
+ if (model) {args.push('--model', model);}
120
126
 
121
127
  const env = { ...process.env };
122
128
  if (CONFIG.ai.chorusApiKey) {
@@ -126,6 +132,9 @@ function runQAChat(issue, enrichedDetails, qaName, useSuper = false) {
126
132
  if (CONFIG.ai.machineId) {
127
133
  env.CHORUS_MACHINE_ID = CONFIG.ai.machineId;
128
134
  }
135
+ if (isFreeModel(model)) {
136
+ env.CHORUS_FREE = '1';
137
+ }
129
138
  if (CONFIG.messenger === 'slack' && CONFIG.slack.botToken) {
130
139
  env.SLACK_BOT_TOKEN = CONFIG.slack.botToken;
131
140
  }
@@ -202,7 +211,7 @@ const CONFIG = {
202
211
  // Use createProvider(CONFIG, issueArg) to get the right provider.
203
212
 
204
213
  // ===== AI ENRICHMENT =====
205
- async function enrichWithAI(issue) {
214
+ async function enrichWithAI(issue, { model } = {}) {
206
215
  const prompt = `Analyze this GitHub issue and write questions for QA clarification.
207
216
 
208
217
  ISSUE DETAILS:
@@ -253,7 +262,7 @@ IMPORTANT: Output ONLY the message above. Do not include any preamble, thinking
253
262
  const openai = new OpenAI(openaiOpts);
254
263
 
255
264
  const response = await openai.chat.completions.create({
256
- model: 'chorus-default',
265
+ model: model || 'chorus-default',
257
266
  max_tokens: 2000,
258
267
  messages: [
259
268
  {
@@ -262,7 +271,10 @@ IMPORTANT: Output ONLY the message above. Do not include any preamble, thinking
262
271
  }
263
272
  ]
264
273
  }, {
265
- headers: { 'X-Chorus-Mode': 'enrich' },
274
+ headers: {
275
+ 'X-Chorus-Mode': 'enrich',
276
+ ...(isFreeModel(model) && { 'X-Chorus-Free': '1' }),
277
+ },
266
278
  });
267
279
 
268
280
  if (response.usage) {
@@ -279,7 +291,7 @@ IMPORTANT: Output ONLY the message above. Do not include any preamble, thinking
279
291
  }
280
292
 
281
293
  // ===== CODE GENERATION =====
282
- async function generateCode(issue, enrichedDetails, qaResponse) {
294
+ async function generateCode(issue, enrichedDetails, qaResponse, { model } = {}) {
283
295
  const tool = CONFIG.ai.codingTool;
284
296
 
285
297
  if (tool === 'coder') {
@@ -304,7 +316,7 @@ Instructions:
304
316
 
305
317
  console.log('🔨 Generating code with Coder agent...');
306
318
 
307
- return await runCoder(prompt);
319
+ return await runCoder(prompt, { model });
308
320
  }
309
321
 
310
322
  // Fallback: kimi
@@ -423,7 +435,7 @@ async function getCodeRabbitReview(solution, issue, provider) {
423
435
  }
424
436
  }
425
437
 
426
- async function refineCode(solution, review) {
438
+ async function refineCode(solution, review, { model } = {}) {
427
439
  const tool = CONFIG.ai.codingTool;
428
440
 
429
441
  if (tool === 'coder') {
@@ -448,7 +460,7 @@ Instructions:
448
460
 
449
461
  console.log('🔄 Refining code with Coder agent...');
450
462
 
451
- return await runCoder(prompt);
463
+ return await runCoder(prompt, { model });
452
464
  }
453
465
 
454
466
  // Fallback: kimi
@@ -535,6 +547,10 @@ ${lintOutput.slice(0, 5000)}`;
535
547
 
536
548
  // ===== TOKEN LIMIT =====
537
549
 
550
+ function isFreeModel(model) {
551
+ return model && FREE_MODELS.has(model);
552
+ }
553
+
538
554
  function isTokenLimitError(err) {
539
555
  const msg = typeof err === 'string' ? err : (err?.message || err?.error || '');
540
556
  return msg.includes('token limit exceeded') || msg.includes('rate_limit_error');
@@ -576,7 +592,7 @@ async function printTokenLimitMessage() {
576
592
  }
577
593
 
578
594
  // ===== MAIN WORKFLOW =====
579
- async function processTicket(issueArg, { useSuper = false, skipQA = false, qaName: qaNameOverride } = {}) {
595
+ async function processTicket(issueArg, { useSuper = false, skipQA = false, qaName: qaNameOverride, model } = {}) {
580
596
  try {
581
597
  console.log('🚀 Starting ticket processing...\n');
582
598
 
@@ -600,7 +616,25 @@ async function processTicket(issueArg, { useSuper = false, skipQA = false, qaNam
600
616
  efs(CONFIG.ai.venvPython, ['-m', 'pip', 'install', '-r', reqFile], { stdio: 'inherit' });
601
617
  }
602
618
 
603
- // 0a. Verify no modified tracked files (untracked files like .chorus/ are fine)
619
+ // 0a. Check token balance — free models can proceed with zero balance
620
+ const usingFree = isFreeModel(model);
621
+ const email = await fetchAccountEmail();
622
+ const balance = await fetchCreditBalance(email);
623
+
624
+ if (balance !== null && balance <= 0 && !usingFree) {
625
+ await printTokenLimitMessage();
626
+ console.log(' Tip: Use --free to run with a free model\n');
627
+ process.exit(1);
628
+ }
629
+ if (usingFree) {
630
+ if (balance !== null && balance <= 0) {
631
+ console.log(`🆓 Using free model "${model}"\n`);
632
+ } else {
633
+ console.log(`🆓 Using free model "${model}"\n`);
634
+ }
635
+ }
636
+
637
+ // 0b. Verify no modified tracked files (untracked files like .chorus/ are fine)
604
638
  const { stdout: gitStatus } = await execPromise('git status --porcelain --untracked-files=no');
605
639
  if (gitStatus.trim()) {
606
640
  console.error('⚠️ Working directory has uncommitted changes. Commit or stash first:');
@@ -640,7 +674,7 @@ async function processTicket(issueArg, { useSuper = false, skipQA = false, qaNam
640
674
  console.log(`Found issue #${issue.number}: ${issue.title}\n`);
641
675
 
642
676
  // 2. Enrich with AI
643
- const enrichedDetails = await enrichWithAI(issue);
677
+ const enrichedDetails = await enrichWithAI(issue, { model });
644
678
  console.log('Enrichment complete\n', enrichedDetails);
645
679
 
646
680
  // 3. Multi-turn QA conversation via qa.py
@@ -650,12 +684,13 @@ async function processTicket(issueArg, { useSuper = false, skipQA = false, qaNam
650
684
  } else {
651
685
  const qaName = qaNameOverride || await provider.getUserDisplayName(issue.user.login);
652
686
  console.log(`💬 Starting QA conversation with ${qaName?.login}...`);
653
- const qaResult = await runQAChat(issue, enrichedDetails, qaName, useSuper);
687
+ const qaResult = await runQAChat(issue, enrichedDetails, qaName, useSuper, { model });
654
688
  qaResponse = qaResult.requirements;
655
689
 
656
690
  if (!qaResult.completed) {
657
- if (isTokenLimitError(qaResult.error)) {
691
+ if (isTokenLimitError(qaResult.error) && !usingFree) {
658
692
  await printTokenLimitMessage();
693
+ console.log(' Tip: Use --free to run with a free model\n');
659
694
  process.exit(1);
660
695
  }
661
696
  console.warn('⚠️ QA chat did not complete successfully:', qaResult.error || 'unknown');
@@ -678,7 +713,7 @@ async function processTicket(issueArg, { useSuper = false, skipQA = false, qaNam
678
713
 
679
714
  for (let attempt = 1; attempt <= maxCodeAttempts; attempt++) {
680
715
  if (attempt === 1) {
681
- solution = await generateCode(issue, enrichedDetails, qaResponse);
716
+ solution = await generateCode(issue, enrichedDetails, qaResponse, { model });
682
717
  } else {
683
718
  // Reprompt with explicit instruction that files must be written
684
719
  const retryPrompt = `You previously attempted to implement this issue but DID NOT write any files. Your task is NOT complete until you have actually created or modified files using write_file or edit_file.
@@ -699,13 +734,14 @@ ${qaResponse}
699
734
  CRITICAL: You MUST write code to actual files. Do not just describe changes — use write_file or edit_file to make them. If you are unsure where to make changes, explore the codebase first, then write the code.`;
700
735
 
701
736
  console.log(`🔁 Reprompting coder (attempt ${attempt}/${maxCodeAttempts})...`);
702
- solution = await runCoder(retryPrompt);
737
+ solution = await runCoder(retryPrompt, { model });
703
738
  }
704
739
 
705
740
  if (solution.completed === false) {
706
741
  const errs = solution.errors || [solution.summary || ''];
707
- if (errs.some(e => isTokenLimitError(e))) {
742
+ if (errs.some(e => isTokenLimitError(e)) && !usingFree) {
708
743
  printTokenLimitMessage();
744
+ console.log(' Tip: Use --free to run with a free model\n');
709
745
  process.exit(1);
710
746
  }
711
747
  console.error('❌ Code generation failed:', errs);
@@ -765,7 +801,7 @@ CRITICAL: You MUST write code to actual files. Do not just describe changes —
765
801
  while (review.needsChanges && iterations < maxIterations) {
766
802
  console.log(`Iteration ${iterations + 1}/${maxIterations}...`);
767
803
 
768
- const refined = await refineCode(solution, review);
804
+ const refined = await refineCode(solution, review, { model });
769
805
 
770
806
  if (refined.completed === false) {
771
807
  console.warn('⚠️ Refinement had errors:', refined.errors);
@@ -843,8 +879,9 @@ Instructions:
843
879
 
844
880
  if (revised.completed === false) {
845
881
  const errs = revised.errors || [revised.summary || ''];
846
- if (errs.some(e => isTokenLimitError(e))) {
882
+ if (errs.some(e => isTokenLimitError(e)) && !usingFree) {
847
883
  printTokenLimitMessage();
884
+ console.log(' Tip: Use --free to run with a free model\n');
848
885
  rl.close();
849
886
  process.exit(1);
850
887
  }
@@ -874,8 +911,9 @@ Instructions:
874
911
  console.log('\n✨ Ticket processing complete!');
875
912
 
876
913
  } catch (error) {
877
- if (isTokenLimitError(error)) {
914
+ if (isTokenLimitError(error) && !isFreeModel(model)) {
878
915
  await printTokenLimitMessage();
916
+ console.log(' Tip: Use --free to run with a free model\n');
879
917
  process.exit(1);
880
918
  }
881
919
  console.error('❌ Error processing ticket:', error);
@@ -1271,21 +1309,89 @@ function printZEP() {
1271
1309
  const command = process.argv[2];
1272
1310
  const _envExists = require('fs').existsSync(path.join(os.homedir(), '.config', 'chorus', '.env'));
1273
1311
 
1312
+ const FREE_MODELS = new Set([
1313
+ 'gpt-oss', 'gpt-oss-20b', 'qwen-coder', 'qwen', 'llama', 'hermes',
1314
+ 'nemotron', 'gemma', 'mistral', 'glm', 'step', 'solar'
1315
+ ]);
1316
+
1317
+ const PAID_MODELS = new Set([
1318
+ 'claude', 'chatgpt', 'deepseek', 'kimi', 'gemini', 'grok', 'command-r'
1319
+ ]);
1320
+
1321
+ const ALLOWED_MODELS = new Set([...FREE_MODELS, ...PAID_MODELS]);
1322
+
1323
+ const DEFAULT_FREE_MODEL = 'gpt-oss';
1324
+
1325
+ function printModelTable(out = console.error) {
1326
+ out('\n Free models:');
1327
+ out(' ┌─────────────────────┬──────────────────────────────────┐');
1328
+ out(' │ Flag value │ Model │');
1329
+ out(' ├─────────────────────┼──────────────────────────────────┤');
1330
+ out(' │ gpt-oss │ GPT-OSS 120B (default) │');
1331
+ out(' │ gpt-oss-20b │ GPT-OSS 20B │');
1332
+ out(' │ qwen-coder │ Qwen3 Coder 480B │');
1333
+ out(' │ qwen │ Qwen3 Next 80B │');
1334
+ out(' │ llama │ Llama 3.3 70B │');
1335
+ out(' │ hermes │ Hermes 3 405B │');
1336
+ out(' │ nemotron │ Nemotron 3 Nano 30B │');
1337
+ out(' │ gemma │ Gemma 3 27B │');
1338
+ out(' │ mistral │ Mistral Small 3.1 24B │');
1339
+ out(' │ glm │ GLM 4.5 Air │');
1340
+ out(' │ step │ Step 3.5 Flash │');
1341
+ out(' │ solar │ Solar Pro 3 │');
1342
+ out(' └─────────────────────┴──────────────────────────────────┘');
1343
+ out('\n Paid models:');
1344
+ out(' ┌─────────────────────┬──────────────────────────────────┐');
1345
+ out(' │ Flag value │ Model │');
1346
+ out(' ├─────────────────────┼──────────────────────────────────┤');
1347
+ out(' │ claude │ Claude │');
1348
+ out(' │ chatgpt │ ChatGPT │');
1349
+ out(' │ deepseek │ DeepSeek │');
1350
+ out(' │ kimi │ Kimi │');
1351
+ out(' │ gemini │ Gemini │');
1352
+ out(' │ grok │ Grok │');
1353
+ out(' │ command-r │ Command R │');
1354
+ out(' └─────────────────────┴──────────────────────────────────┘');
1355
+ }
1356
+
1274
1357
  function parseRunArgs() {
1275
1358
  const args = process.argv.slice(3);
1276
- const opts = { useSuper: false, skipQA: false, qaName: null, issueArg: null };
1359
+ const opts = { useSuper: false, skipQA: false, qaName: null, issueArg: null, model: null, free: false };
1277
1360
 
1278
1361
  for (let i = 0; i < args.length; i++) {
1279
1362
  if (args[i] === '--super') {
1280
1363
  opts.useSuper = true;
1281
1364
  } else if (args[i] === '--skip-qa') {
1282
1365
  opts.skipQA = true;
1366
+ } else if (args[i] === '--free') {
1367
+ opts.free = true;
1283
1368
  } else if (args[i] === '--qa' && i + 1 < args.length) {
1284
1369
  opts.qaName = args[++i];
1370
+ } else if (args[i] === '--model' && i + 1 < args.length) {
1371
+ const val = args[++i];
1372
+ if (!ALLOWED_MODELS.has(val)) {
1373
+ console.error(`Error: invalid model "${val}". Allowed models: ${[...ALLOWED_MODELS].join(', ')}`);
1374
+ printModelTable();
1375
+ process.exit(1);
1376
+ }
1377
+ opts.model = val;
1285
1378
  } else if (!args[i].startsWith('--')) {
1286
1379
  opts.issueArg = args[i];
1287
1380
  }
1288
1381
  }
1382
+
1383
+ // --free: default to best free model, or validate that --model is free
1384
+ if (opts.free) {
1385
+ if (opts.model && !FREE_MODELS.has(opts.model)) {
1386
+ console.error(`Error: "${opts.model}" is a paid model and cannot be used with --free.`);
1387
+ printModelTable();
1388
+ process.exit(1);
1389
+ }
1390
+ if (!opts.model) {
1391
+ opts.model = DEFAULT_FREE_MODEL;
1392
+ }
1393
+ }
1394
+
1289
1395
  return opts;
1290
1396
  }
1291
1397
 
@@ -1303,6 +1409,13 @@ if (command === 'setup') {
1303
1409
  const { issueArg, ...opts } = parseRunArgs();
1304
1410
  processTicket(issueArg, opts).catch(console.error);
1305
1411
  }
1412
+ } else if (command === 'models') {
1413
+ console.log('\nChorus — Available Models');
1414
+ printModelTable(console.log);
1415
+ console.log('\nUsage:');
1416
+ console.log(' chorus run 4464 --model deepseek Use a specific model');
1417
+ console.log(' chorus run 4464 --free Use the best free model (GPT-OSS 120B)');
1418
+ console.log(' chorus run 4464 --free --model qwen-coder Use a specific free model\n');
1306
1419
  } else if (command === 'zep') {
1307
1420
  printZEP()
1308
1421
  } else {
@@ -1321,10 +1434,14 @@ Chorus — AI-powered ticket automation (GitHub & Azure DevOps)
1321
1434
 
1322
1435
  Usage:
1323
1436
  chorus setup - Set up provider, Chorus auth + messenger
1437
+ chorus models - List all available models (free & paid)
1324
1438
  chorus run - Process latest assigned issue
1325
1439
  chorus run 4464 - Process specific issue by number
1326
1440
  chorus run <url> - Process issue from full URL (auto-detects provider)
1327
1441
  chorus run 4464 --super - Use Opus 4.6 for QA evaluation
1442
+ chorus run 4464 --model deepseek - Use a specific model (see --free for free options)
1443
+ chorus run 4464 --free - Use the best free model (GPT-OSS 120B)
1444
+ chorus run 4464 --free --model qwen-coder - Use a specific free model
1328
1445
  chorus run 4464 --qa 'John Doe' - Specify QA contact name for chat
1329
1446
  chorus run 4464 --skip-qa - Skip QA conversation, go straight to coding
1330
1447
 
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "chorus-cli",
3
- "version": "0.5.1",
3
+ "version": "0.5.4",
4
4
  "description": "Automated ticket resolution with AI, Teams, and Slack integration",
5
5
  "main": "index.js",
6
6
  "bin": {
package/tools/coder.py CHANGED
@@ -878,8 +878,13 @@ def run_prompt(client, prompt, chorus_context):
878
878
  def main():
879
879
  parser = argparse.ArgumentParser(description="Coder — AI coding agent powered by Claude via Chorus")
880
880
  parser.add_argument("-p", "--prompt", help="Run a single prompt headlessly and output JSON")
881
+ parser.add_argument("--model", help="Override the model sent to the proxy")
881
882
  args = parser.parse_args()
882
883
 
884
+ global MODEL
885
+ if args.model:
886
+ MODEL = args.model
887
+
883
888
  api_key = os.environ.get("CHORUS_API_KEY")
884
889
  if not api_key:
885
890
  print(f"{C.RED}Error: CHORUS_API_KEY not set. Run 'chorus setup' to configure.{C.RESET}", file=sys.stderr)
@@ -887,9 +892,15 @@ def main():
887
892
 
888
893
  base_url = os.environ.get("CHORUS_API_URL", "https://chorus-bad0f.web.app/v1")
889
894
  machine_id = os.environ.get("CHORUS_MACHINE_ID")
890
- client_kwargs = {"api_key": api_key, "base_url": base_url}
895
+ chorus_free = os.environ.get("CHORUS_FREE", "")
896
+ default_headers = {}
891
897
  if machine_id:
892
- client_kwargs["default_headers"] = {"X-Machine-Id": machine_id}
898
+ default_headers["X-Machine-Id"] = machine_id
899
+ if chorus_free:
900
+ default_headers["X-Chorus-Free"] = "1"
901
+ client_kwargs = {"api_key": api_key, "base_url": base_url}
902
+ if default_headers:
903
+ client_kwargs["default_headers"] = default_headers
893
904
  client = OpenAI(**client_kwargs)
894
905
  cwd = os.getcwd()
895
906
 
package/tools/qa.py CHANGED
@@ -408,9 +408,15 @@ def run_qa_chat(issue_context, messenger, qa_name):
408
408
  api_key = os.environ.get("CHORUS_API_KEY")
409
409
  base_url = os.environ.get("CHORUS_API_URL", "https://chorus-bad0f.web.app/v1")
410
410
  machine_id = os.environ.get("CHORUS_MACHINE_ID")
411
- client_kwargs = {"api_key": api_key, "base_url": base_url}
411
+ chorus_free = os.environ.get("CHORUS_FREE", "")
412
+ default_headers = {}
412
413
  if machine_id:
413
- client_kwargs["default_headers"] = {"X-Machine-Id": machine_id}
414
+ default_headers["X-Machine-Id"] = machine_id
415
+ if chorus_free:
416
+ default_headers["X-Chorus-Free"] = "1"
417
+ client_kwargs = {"api_key": api_key, "base_url": base_url}
418
+ if default_headers:
419
+ client_kwargs["default_headers"] = default_headers
414
420
  client = OpenAI(**client_kwargs)
415
421
  conversation = []
416
422
  raw_responses = []
@@ -483,8 +489,14 @@ def main():
483
489
  parser.add_argument("--auth", help="Path to Teams auth state JSON (required for --messenger teams)")
484
490
  parser.add_argument("--qa", required=True, help="QA person's name")
485
491
  parser.add_argument("--super", action="store_true", help="Use Opus 4.6 instead of Sonnet")
492
+ parser.add_argument("--model", help="Override the model sent to the proxy")
486
493
  args = parser.parse_args()
487
494
 
495
+ # Override model if specified
496
+ global MODEL
497
+ if args.model:
498
+ MODEL = args.model
499
+
488
500
  # chorus_mode tells the proxy which model to use
489
501
  global QA_CHORUS_MODE
490
502
  if args.super: