npm - navada-edge-cli - Versions diffs - 3.3.0 → 3.4.1 - Mend

navada-edge-cli 3.3.0 → 3.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

package/README.md +499 -191
package/architecture.svg +171 -0
package/lib/agent.js +178 -20
package/lib/commands/ai.js +61 -3
package/lib/commands/conversations.js +139 -0
package/lib/commands/index.js +1 -1
package/lib/commands/system.js +5 -0
package/package.json +2 -2
package/network.svg +0 -207

package/architecture.svg ADDED Viewed

@@ -0,0 +1,171 @@
+<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 800 500" width="800" height="500">
+  <style>
+    text { font-family: 'SF Mono', 'Fira Code', monospace; fill: #e0e0e0; }
+    .label { font-size: 9px; fill: #666; }
+    .title { font-size: 11px; font-weight: bold; }
+    .small { font-size: 8px; fill: #888; }
+    .accent { fill: #a855f7; }
+    .box { fill: #0a0a0a; stroke: #1a1a1a; stroke-width: 1; }
+    .box-accent { fill: #0a0a0a; stroke: #a855f7; stroke-width: 1; }
+    .line { stroke: #333; stroke-width: 1; fill: none; }
+    .line-accent { stroke: #a855f7; stroke-width: 1; fill: none; }
+    .arrow { fill: #a855f7; }
+  </style>
+  <rect width="800" height="500" fill="#0a0a0a"/>
+  <!-- Title -->
+  <text x="400" y="24" text-anchor="middle" font-size="13" font-weight="bold" fill="#e0e0e0">NAVADA Edge CLI — Architecture</text>
+  <text x="400" y="38" text-anchor="middle" class="label">v3.3.0</text>
+  <!-- USER -->
+  <rect x="20" y="60" width="110" height="40" rx="2" class="box-accent"/>
+  <text x="75" y="78" text-anchor="middle" class="title">USER</text>
+  <text x="75" y="90" text-anchor="middle" class="label">Terminal</text>
+  <!-- Arrow: User -> CLI -->
+  <line x1="130" y1="80" x2="178" y2="80" class="line-accent"/>
+  <polygon points="178,76 186,80 178,84" class="arrow"/>
+  <!-- CLI Core -->
+  <rect x="188" y="55" width="140" height="50" rx="2" class="box-accent"/>
+  <text x="258" y="76" text-anchor="middle" class="title" fill="#a855f7">NAVADA Edge CLI</text>
+  <text x="258" y="90" text-anchor="middle" class="label">agent.md + config</text>
+  <!-- Three output arrows from CLI -->
+  <!-- Arrow: CLI -> AI Router -->
+  <line x1="328" y1="70" x2="410" y2="70" class="line-accent"/>
+  <line x1="410" y1="70" x2="410" y2="140" class="line-accent"/>
+  <polygon points="406,140 410,148 414,140" class="arrow"/>
+  <!-- Arrow: CLI -> Tool Engine -->
+  <line x1="328" y1="80" x2="540" y2="80" class="line-accent"/>
+  <line x1="540" y1="80" x2="540" y2="140" class="line-accent"/>
+  <polygon points="536,140 540,148 544,140" class="arrow"/>
+  <!-- Arrow: CLI -> Edge Network -->
+  <line x1="328" y1="90" x2="680" y2="90" class="line-accent"/>
+  <line x1="680" y1="90" x2="680" y2="140" class="line-accent"/>
+  <polygon points="676,140 680,148 684,140" class="arrow"/>
+  <!-- === COLUMN 1: AI Router === -->
+  <rect x="340" y="150" width="140" height="36" rx="2" class="box-accent"/>
+  <text x="410" y="170" text-anchor="middle" class="title">AI Router</text>
+  <text x="410" y="180" text-anchor="middle" class="label">model selection</text>
+  <!-- Provider grid: 3x2 -->
+  <rect x="310" y="200" width="90" height="28" rx="2" class="box"/>
+  <text x="355" y="215" text-anchor="middle" font-size="9" fill="#a855f7">NAVADA Free</text>
+  <rect x="410" y="200" width="90" height="28" rx="2" class="box"/>
+  <text x="455" y="215" text-anchor="middle" font-size="9">Anthropic</text>
+  <rect x="310" y="236" width="90" height="28" rx="2" class="box"/>
+  <text x="355" y="251" text-anchor="middle" font-size="9">OpenAI</text>
+  <rect x="410" y="236" width="90" height="28" rx="2" class="box"/>
+  <text x="455" y="251" text-anchor="middle" font-size="9">Gemini</text>
+  <rect x="310" y="272" width="90" height="28" rx="2" class="box"/>
+  <text x="355" y="287" text-anchor="middle" font-size="9">NVIDIA</text>
+  <rect x="410" y="272" width="90" height="28" rx="2" class="box"/>
+  <text x="455" y="287" text-anchor="middle" font-size="9">HuggingFace</text>
+  <!-- Connector lines from router to providers -->
+  <line x1="410" y1="186" x2="355" y2="200" class="line"/>
+  <line x1="410" y1="186" x2="455" y2="200" class="line"/>
+  <line x1="355" y1="228" x2="355" y2="236" class="line"/>
+  <line x1="455" y1="228" x2="455" y2="236" class="line"/>
+  <line x1="355" y1="264" x2="355" y2="272" class="line"/>
+  <line x1="455" y1="264" x2="455" y2="272" class="line"/>
+  <!-- === COLUMN 2: Tool Engine === -->
+  <rect x="510" y="150" width="120" height="36" rx="2" class="box-accent"/>
+  <text x="570" y="170" text-anchor="middle" class="title">Tool Engine</text>
+  <text x="570" y="180" text-anchor="middle" class="label">execution layer</text>
+  <!-- Tools: Local (left col) + Network (right col) -->
+  <text x="540" y="207" text-anchor="middle" class="label">LOCAL</text>
+  <text x="620" y="207" text-anchor="middle" class="label">NETWORK</text>
+  <rect x="510" y="214" width="56" height="24" rx="2" class="box"/>
+  <text x="538" y="229" text-anchor="middle" font-size="8">Shell</text>
+  <rect x="510" y="244" width="56" height="24" rx="2" class="box"/>
+  <text x="538" y="259" text-anchor="middle" font-size="8">Files</text>
+  <rect x="510" y="274" width="56" height="24" rx="2" class="box"/>
+  <text x="538" y="289" text-anchor="middle" font-size="8">Python</text>
+  <rect x="510" y="304" width="56" height="24" rx="2" class="box"/>
+  <text x="538" y="319" text-anchor="middle" font-size="8">Docker</text>
+  <rect x="576" y="214" width="56" height="24" rx="2" class="box"/>
+  <text x="604" y="229" text-anchor="middle" font-size="8">MCP</text>
+  <rect x="576" y="244" width="56" height="24" rx="2" class="box"/>
+  <text x="604" y="259" text-anchor="middle" font-size="8">SSH</text>
+  <rect x="576" y="274" width="56" height="24" rx="2" class="box"/>
+  <text x="604" y="289" text-anchor="middle" font-size="8">Email</text>
+  <rect x="576" y="304" width="56" height="24" rx="2" class="box"/>
+  <text x="604" y="319" text-anchor="middle" font-size="8">Registry</text>
+  <!-- Connector lines from engine to tools -->
+  <line x1="550" y1="186" x2="538" y2="214" class="line"/>
+  <line x1="590" y1="186" x2="604" y2="214" class="line"/>
+  <!-- === COLUMN 3: Edge Network === -->
+  <rect x="645" y="150" width="130" height="36" rx="2" class="box-accent"/>
+  <text x="710" y="170" text-anchor="middle" class="title">Edge Network</text>
+  <text x="710" y="180" text-anchor="middle" class="label">Tailscale mesh</text>
+  <!-- 4 Node boxes -->
+  <rect x="650" y="200" width="120" height="34" rx="2" class="box"/>
+  <text x="710" y="215" text-anchor="middle" font-size="9" fill="#a855f7">ASUS</text>
+  <text x="710" y="226" text-anchor="middle" class="small">Production Engine</text>
+  <rect x="650" y="242" width="120" height="34" rx="2" class="box"/>
+  <text x="710" y="257" text-anchor="middle" font-size="9">HP</text>
+  <text x="710" y="268" text-anchor="middle" class="small">Database (PG17)</text>
+  <rect x="650" y="284" width="120" height="34" rx="2" class="box"/>
+  <text x="710" y="299" text-anchor="middle" font-size="9">EC2</text>
+  <text x="710" y="310" text-anchor="middle" class="small">24/7 Monitoring</text>
+  <rect x="650" y="326" width="120" height="34" rx="2" class="box"/>
+  <text x="710" y="341" text-anchor="middle" font-size="9">Oracle</text>
+  <text x="710" y="352" text-anchor="middle" class="small">Infra + Tunnel</text>
+  <!-- Connector lines from network to nodes -->
+  <line x1="710" y1="186" x2="710" y2="200" class="line"/>
+  <line x1="710" y1="234" x2="710" y2="242" class="line"/>
+  <line x1="710" y1="276" x2="710" y2="284" class="line"/>
+  <line x1="710" y1="318" x2="710" y2="326" class="line"/>
+  <!-- Mesh lines between nodes (subtle) -->
+  <line x1="650" y1="217" x2="645" y2="259" stroke="#1a1a1a" stroke-width="1" stroke-dasharray="2,3"/>
+  <line x1="650" y1="259" x2="645" y2="301" stroke="#1a1a1a" stroke-width="1" stroke-dasharray="2,3"/>
+  <line x1="650" y1="301" x2="645" y2="343" stroke="#1a1a1a" stroke-width="1" stroke-dasharray="2,3"/>
+  <!-- Bottom bar -->
+  <line x1="40" y1="400" x2="760" y2="400" stroke="#1a1a1a" stroke-width="1"/>
+  <!-- Legend -->
+  <text x="40" y="425" class="label">FLOW</text>
+  <line x1="70" y1="422" x2="100" y2="422" class="line-accent"/>
+  <polygon points="100,419 106,422 100,425" class="arrow"/>
+  <text x="112" y="425" class="small">data path</text>
+  <rect x="170" y="414" width="14" height="14" rx="2" class="box-accent"/>
+  <text x="190" y="425" class="small">core module</text>
+  <rect x="260" y="414" width="14" height="14" rx="2" class="box"/>
+  <text x="280" y="425" class="small">component</text>
+  <!-- Footer -->
+  <text x="400" y="470" text-anchor="middle" class="label">navada-edge-cli@3.3.0 | npm i -g navada-edge-cli | github.com/navada25/edge-cli</text>
+  <text x="400" y="484" text-anchor="middle" font-size="8" fill="#333">NAVADA Edge Network 2026</text>
+</svg>

package/lib/agent.js CHANGED Viewed

@@ -32,6 +32,8 @@ You also connect to the NAVADA Edge Network (4 nodes via Tailscale VPN):
   - send_email / generate_image: communications and AI image generation
   - founder_info: information about Lee Akpareva, the creator of NAVADA
 When users ask you to DO something — DO IT. Use write_file to create files. Use shell to run commands. Never say "I can't" when you have a tool for it.
+When asked to generate diagrams — use write_file to create Mermaid (.mmd), SVG, or HTML files. You can also use python_exec with matplotlib/graphviz for complex diagrams.
+When asked to create, edit, or delete files — use the file tools directly. You are a terminal agent with FULL access.
 Keep responses short. Code blocks when needed. No fluff.`,
   founder: {
     name: 'Leslie (Lee) Akpareva',
@@ -79,8 +81,8 @@ function getSystemPrompt() {
 // Session state — exposed for UI panels
 // ---------------------------------------------------------------------------
 const sessionState = {
-  provider: 'Grok (free)',
-  model: 'grok-3-mini',
+  provider: 'NAVADA (free)',
+  model: 'gpt-4o-mini',
   tokens: { input: 0, output: 0, total: 0 },
   cost: 0,
   messages: 0,
@@ -335,7 +337,7 @@ function streamFreeTier(endpoint, messages) {
     const req = transport.request(url, {
       method: 'POST',
       headers: { 'Content-Type': 'application/json', 'Content-Length': Buffer.byteLength(body) },
-      timeout: endpoint.includes('navada-edge-server.uk') ? 30000 : 5000,
+      timeout: endpoint.includes('navada-edge-server.uk') ? 120000 : 10000,
     }, (res) => {
       // If server doesn't support streaming, collect full response
       if (!res.headers['content-type']?.includes('text/event-stream')) {
@@ -373,10 +375,13 @@ function streamFreeTier(endpoint, messages) {
           if (data === '[DONE]') continue;
           try {
             const parsed = JSON.parse(data);
-            const delta = parsed.choices?.[0]?.delta?.content || '';
-            if (delta) {
-              process.stdout.write(delta);
-              fullContent += delta;
+            const delta = parsed.choices?.[0]?.delta;
+            // Grok-3-mini streams reasoning_content first, then content — skip reasoning
+            if (delta?.reasoning_content && !delta?.content) continue;
+            const text = delta?.content || '';
+            if (text) {
+              process.stdout.write(text);
+              fullContent += text;
             }
           } catch {}
         }
@@ -579,15 +584,84 @@ function streamOpenAI(key, messages, model = 'gpt-4o') {
   });
 }
+// ---------------------------------------------------------------------------
+// Streaming — Google Gemini API (gemini-2.0-flash)
+// ---------------------------------------------------------------------------
+/**
+ * Stream a chat completion from the Google Gemini API, echoing text to stdout
+ * as it arrives.
+ *
+ * @param {string} key - Gemini API key. Sent in the `x-goog-api-key` header so
+ *   it does not end up in the request URL.
+ * @param {Array<{role: string, content: *}>} messages - Chat turns. The
+ *   'assistant' role is mapped to Gemini's 'model' role; every other role is
+ *   sent as 'user'. Non-string content is JSON-encoded.
+ * @param {string} [model='gemini-2.0-flash'] - Gemini model id.
+ * @returns {Promise<{content: string}>} Resolves with the concatenated text.
+ *   Rejects on a non-200 status, a request/response stream error, or a timeout.
+ */
+function streamGemini(key, messages, model = 'gemini-2.0-flash') {
+  return new Promise((resolve, reject) => {
+    const contents = messages.map(m => ({
+      role: m.role === 'assistant' ? 'model' : 'user',
+      parts: [{ text: typeof m.content === 'string' ? m.content : JSON.stringify(m.content) }],
+    }));
+    const body = JSON.stringify({
+      contents,
+      generationConfig: { maxOutputTokens: 4096 },
+      systemInstruction: { parts: [{ text: getSystemPrompt() }] },
+    });
+    const url = new URL(`https://generativelanguage.googleapis.com/v1beta/models/${model}:streamGenerateContent?alt=sse`);
+    const req = https.request(url, {
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        'Content-Length': Buffer.byteLength(body),
+        // Header auth keeps the secret out of the URL (and out of URL logs).
+        'x-goog-api-key': key,
+      },
+      timeout: 120000,
+    }, (res) => {
+      // Decode as UTF-8 at the stream level so a multi-byte character that is
+      // split across two chunks is not corrupted.
+      res.setEncoding('utf8');
+      if (res.statusCode !== 200) {
+        let data = '';
+        res.on('data', c => data += c);
+        res.on('end', () => reject(new Error(`Gemini API error ${res.statusCode}: ${data.slice(0, 200)}`)));
+        return;
+      }
+      let buffer = '';
+      let fullContent = '';
+      // Handle one SSE line: print and accumulate the text of every part.
+      const handleLine = (line) => {
+        if (!line.startsWith('data: ')) return;
+        const data = line.slice(6).trim();
+        if (!data) return;
+        try {
+          const parsed = JSON.parse(data);
+          const parts = parsed.candidates?.[0]?.content?.parts;
+          const text = Array.isArray(parts) ? parts.map(p => p?.text || '').join('') : '';
+          if (text) {
+            process.stdout.write(text);
+            fullContent += text;
+          }
+        } catch {
+          // Deliberate best-effort: skip payloads that are not valid JSON.
+        }
+      };
+      res.on('data', (chunk) => {
+        buffer += chunk;
+        const lines = buffer.split('\n');
+        // The last element may be an incomplete line; keep it for the next chunk.
+        buffer = lines.pop();
+        for (const line of lines) handleLine(line);
+      });
+      // Without this, a connection dropped mid-stream could leave the promise pending.
+      res.on('error', reject);
+      res.on('end', () => {
+        // Flush a final line that arrived without a trailing newline.
+        if (buffer) handleLine(buffer);
+        if (fullContent) process.stdout.write('\n');
+        resolve({ content: fullContent });
+      });
+    });
+    req.on('error', reject);
+    req.on('timeout', () => { req.destroy(); reject(new Error('Timeout')); });
+    req.write(body);
+    req.end();
+  });
+}
+/**
+ * Build the tool definitions offered to OpenAI-compatible chat endpoints.
+ *
+ * Each definition carries a tool name, a description and a JSON-Schema
+ * `parameters` object.
+ *
+ * @returns {Array<{type: 'function', function: object}>} One entry per tool,
+ *   each definition wrapped as `{ type: 'function', function: def }`.
+ */
 function openAITools() {
   const defs = [
-    { name: 'shell', description: 'Execute a shell command on the user\'s machine', parameters: { type: 'object', properties: { command: { type: 'string' } }, required: ['command'] } },
-    { name: 'read_file', description: 'Read a file', parameters: { type: 'object', properties: { path: { type: 'string' } }, required: ['path'] } },
-    { name: 'write_file', description: 'Write to a file', parameters: { type: 'object', properties: { path: { type: 'string' }, content: { type: 'string' } }, required: ['path', 'content'] } },
-    { name: 'list_files', description: 'List directory contents', parameters: { type: 'object', properties: { path: { type: 'string' } } } },
-    { name: 'system_info', description: 'Get system info (CPU, RAM, OS)', parameters: { type: 'object', properties: {} } },
-    { name: 'python_exec', description: 'Execute Python code', parameters: { type: 'object', properties: { code: { type: 'string' } }, required: ['code'] } },
-    { name: 'python_pip', description: 'Install a Python package', parameters: { type: 'object', properties: { package: { type: 'string' } }, required: ['package'] } },
+    { name: 'shell', description: 'Execute a shell command on the user\'s machine. Use for: file operations, git, npm, docker, system commands, creating directories, running scripts.', parameters: { type: 'object', properties: { command: { type: 'string', description: 'The shell command to run' } }, required: ['command'] } },
+    { name: 'read_file', description: 'Read the contents of a file on the user\'s machine.', parameters: { type: 'object', properties: { path: { type: 'string', description: 'Absolute or relative file path' } }, required: ['path'] } },
+    { name: 'write_file', description: 'Write content to a file. Creates parent directories if needed. Use for creating new files, scripts, configs, diagrams (Mermaid, SVG, HTML), code files.', parameters: { type: 'object', properties: { path: { type: 'string', description: 'File path to write' }, content: { type: 'string', description: 'Full content to write to the file' } }, required: ['path', 'content'] } },
+    { name: 'list_files', description: 'List files and directories.', parameters: { type: 'object', properties: { path: { type: 'string', description: 'Directory path (default: current dir)' } } } },
+    { name: 'system_info', description: 'Get local system information (CPU, RAM, disk, OS, hostname).', parameters: { type: 'object', properties: {} } },
+    { name: 'python_exec', description: 'Execute Python code inline. Use for data analysis, calculations, generating content, processing files, ML tasks.', parameters: { type: 'object', properties: { code: { type: 'string', description: 'Python code to execute' } }, required: ['code'] } },
+    { name: 'python_pip', description: 'Install a Python package via pip.', parameters: { type: 'object', properties: { package: { type: 'string', description: 'Package name' } }, required: ['package'] } },
+    { name: 'python_script', description: 'Run a Python script file.', parameters: { type: 'object', properties: { path: { type: 'string', description: 'Path to .py file' } }, required: ['path'] } },
+    { name: 'sandbox_run', description: 'Run code in an isolated sandbox with syntax highlighting. Supports javascript, python, typescript.', parameters: { type: 'object', properties: { code: { type: 'string' }, language: { type: 'string', description: 'javascript, python, or typescript' } }, required: ['code'] } },
+    { name: 'founder_info', description: 'Get information about Lee Akpareva, founder of NAVADA Edge.', parameters: { type: 'object', properties: {} } },
   ];
   return defs.map(d => ({ type: 'function', function: d }));
 }
@@ -662,12 +736,14 @@ async function chat(userMessage, conversationHistory = []) {
   const anthropicKey = config.get('anthropicKey') || process.env.ANTHROPIC_API_KEY || '';
   const openaiKey = config.get('openaiKey') || process.env.OPENAI_API_KEY || '';
   const nvidiaKey = config.get('nvidiaKey') || process.env.NVIDIA_API_KEY || '';
+  const geminiKey = config.get('geminiKey') || process.env.GEMINI_API_KEY || process.env.GOOGLE_API_KEY || '';
   const apiKey = config.getApiKey() || '';
   // Determine which provider to use
   const effectiveAnthropicKey = anthropicKey || (apiKey.startsWith('sk-ant') ? apiKey : '');
   const effectiveOpenAIKey = openaiKey || (apiKey.startsWith('sk-') && !apiKey.startsWith('sk-ant') ? apiKey : '');
   const effectiveNvidiaKey = nvidiaKey || (apiKey.startsWith('nvapi-') ? apiKey : '');
+  const effectiveGeminiKey = geminiKey || (apiKey.startsWith('AIza') ? apiKey : '');
   const modelPref = config.getModel();
   const intent = detectIntent(userMessage);
@@ -675,11 +751,12 @@ async function chat(userMessage, conversationHistory = []) {
   // Track active provider for UI
   if (effectiveAnthropicKey) sessionState.provider = 'Anthropic';
   else if (effectiveOpenAIKey) sessionState.provider = 'OpenAI';
+  else if (effectiveGeminiKey) sessionState.provider = 'Gemini';
   else if (effectiveNvidiaKey) sessionState.provider = 'NVIDIA';
   else sessionState.provider = 'Grok (free)';
   // No personal key — use free tier
-  if (!effectiveAnthropicKey && !effectiveOpenAIKey && !effectiveNvidiaKey) {
+  if (!effectiveAnthropicKey && !effectiveOpenAIKey && !effectiveNvidiaKey && !effectiveGeminiKey) {
     if (intent === 'code' && navada.config.hfToken) {
       try {
         const r = await navada.ai.huggingface.qwen(userMessage);
@@ -689,6 +766,28 @@ async function chat(userMessage, conversationHistory = []) {
     return grokChat(userMessage, conversationHistory);
   }
+  // Gemini key — route to Gemini
+  if (effectiveGeminiKey && (!effectiveAnthropicKey || modelPref === 'gemini' || modelPref?.startsWith('gemini-'))) {
+    const geminiModel = config.get('geminiModel') || 'gemini-2.0-flash';
+    sessionState.provider = 'Gemini';
+    sessionState.model = geminiModel;
+    const messages = [
+      ...conversationHistory.map(m => ({ role: m.role, content: typeof m.content === 'string' ? m.content : JSON.stringify(m.content) })),
+      { role: 'user', content: userMessage },
+    ];
+    process.stdout.write(ui.dim('  NAVADA > '));
+    try {
+      const result = await streamGemini(effectiveGeminiKey, messages, geminiModel);
+      return result.content;
+    } catch (e) {
+      if (!sessionState._geminiWarned) {
+        console.log(ui.warn('Gemini API unavailable, using Grok free tier.'));
+        sessionState._geminiWarned = true;
+      }
+      return grokChat(userMessage, conversationHistory);
+    }
+  }
   // NVIDIA key — route to NVIDIA
   if (effectiveNvidiaKey && (!effectiveAnthropicKey || modelPref?.startsWith('nvidia') || modelPref?.startsWith('llama') || modelPref?.startsWith('deepseek') || modelPref?.startsWith('mistral') || modelPref?.startsWith('gemma') || modelPref?.startsWith('nemotron'))) {
     const { streamNvidia } = require('./commands/nvidia');
@@ -903,13 +1002,72 @@ async function grokChat(userMessage, conversationHistory = []) {
     { role: 'user', content: userMessage },
   ];
-  // Try streaming first
-  const result = await callFreeTier(messages, true);
-  if (result.streamed) {
-    // Already printed to stdout, return for history
+  // Send tools with the request — free tier now supports tool use
+  const tools = openAITools();
+  const endpoint = FREE_TIER_ENDPOINTS[0];
+  // Non-streaming request with tools (streaming + tools is complex, use non-streaming for tool calls)
+  let response;
+  try {
+    const r = await navada.request(endpoint, {
+      method: 'POST',
+      body: { messages, tools },
+      timeout: 120000,
+    });
+    if (r.status === 429) {
+      return `Free tier limit reached. /login <key> for unlimited access.`;
+    }
+    if (r.status !== 200) {
+      // Fall back to streaming without tools
+      const result = await callFreeTier(messages, true);
+      return result.content || 'No response from free tier.';
+    }
+    rateTracker.record();
+    response = r.data;
+  } catch {
+    // Network error — try streaming fallback
+    const result = await callFreeTier(messages, true);
     return result.content || 'No response from free tier. Try /login <key> for full agent.';
   }
-  return result.content || 'No response from free tier. Try /login <key> for full agent.';
+  // Handle tool use loop (same as OpenAI path)
+  let iterations = 0;
+  while (response?.choices?.[0]?.finish_reason === 'tool_calls' && iterations < 10) {
+    iterations++;
+    const toolCalls = response.choices[0].message.tool_calls || [];
+    if (toolCalls.length === 0) break;
+    const toolResults = [];
+    for (const tc of toolCalls) {
+      let input;
+      try { input = JSON.parse(tc.function.arguments); } catch { input = {}; }
+      console.log(ui.dim(`  [${tc.function.name}] ${JSON.stringify(input).slice(0, 80)}`));
+      const result = await executeTool(tc.function.name, input);
+      toolResults.push({ role: 'tool', tool_call_id: tc.id, content: typeof result === 'string' ? result : JSON.stringify(result) });
+    }
+    // Add assistant message with tool_calls + results, then call again
+    messages.push({ role: 'assistant', content: response.choices[0].message.content || null, tool_calls: toolCalls });
+    messages.push(...toolResults);
+    try {
+      const r = await navada.request(endpoint, {
+        method: 'POST',
+        body: { messages, tools },
+        timeout: 120000,
+      });
+      if (r.status !== 200) break;
+      rateTracker.record();
+      response = r.data;
+    } catch { break; }
+  }
+  // Extract final text
+  const content = response?.choices?.[0]?.message?.content || '';
+  if (content) console.log(`  ${content}`);
+  return content || 'No response.';
 }
 async function fallbackChat(msg) {

package/lib/commands/ai.js CHANGED Viewed

@@ -3,7 +3,7 @@
 const navada = require('navada-edge-sdk');
 const ui = require('../ui');
 const config = require('../config');
-const { chat: agentChat, reportTelemetry, rateTracker, addToHistory, getConversationHistory, clearHistory } = require('../agent');
+const { chat: agentChat, reportTelemetry, rateTracker, addToHistory, getConversationHistory, clearHistory, sessionState } = require('../agent');
 module.exports = function(reg) {
@@ -109,12 +109,14 @@ module.exports = function(reg) {
   reg('model', 'Show/set default AI model', (args) => {
     if (args[0]) {
-      const valid = ['auto', 'claude', 'gpt-4o', 'gpt-4o-mini', 'qwen', 'nvidia', 'llama-3.3-70b', 'llama-3.1-8b', 'mistral-large', 'gemma-2-27b', 'codellama-70b', 'deepseek-r1', 'phi-3-medium', 'nemotron-70b'];
+      const valid = ['auto', 'claude', 'gpt-4o', 'gpt-4o-mini', 'gemini', 'gemini-2.0-flash', 'gemini-2.5-pro', 'qwen', 'nvidia', 'llama-3.3-70b', 'llama-3.1-8b', 'mistral-large', 'gemma-2-27b', 'codellama-70b', 'deepseek-r1', 'phi-3-medium', 'nemotron-70b'];
       if (!valid.includes(args[0])) { console.log(ui.error(`Invalid model. Options: ${valid.join(', ')}`)); return; }
       config.setModel(args[0]);
       // If it's an NVIDIA model name, also set it as the nvidia model
       const nvidiaModels = ['llama-3.3-70b', 'llama-3.1-8b', 'mistral-large', 'gemma-2-27b', 'codellama-70b', 'deepseek-r1', 'phi-3-medium', 'nemotron-70b'];
       if (nvidiaModels.includes(args[0])) config.set('nvidiaModel', args[0]);
+      // If it's a Gemini model name, set it
+      if (args[0].startsWith('gemini')) config.set('geminiModel', args[0]);
       console.log(ui.success(`Model set to: ${args[0]}`));
     } else {
       console.log(ui.header('AI MODELS'));
@@ -125,6 +127,8 @@ module.exports = function(reg) {
       console.log(ui.label('auto', 'Smart routing — picks best provider per query'));
       console.log(ui.label('claude', 'Claude Sonnet 4 (Anthropic) — full agent + tools'));
       console.log(ui.label('gpt-4o', 'GPT-4o (OpenAI) — tool use + streaming'));
+      console.log(ui.label('gemini', 'Gemini 2.0 Flash (Google — FREE)'));
+      console.log(ui.label('gemini-2.5-pro', 'Gemini 2.5 Pro (Google)'));
       console.log(ui.label('qwen', 'Qwen Coder 32B (HuggingFace — FREE)'));
       console.log('');
       console.log(ui.dim('NVIDIA models (FREE via build.nvidia.com):'));
@@ -138,7 +142,61 @@ module.exports = function(reg) {
       console.log(ui.dim('Set: /model deepseek-r1'));
       console.log(ui.dim('NVIDIA key: /login nvapi-your-key (free at build.nvidia.com)'));
     }
-  }, { category: 'AI', subs: ['auto', 'claude', 'gpt-4o', 'gpt-4o-mini', 'qwen', 'nvidia', 'llama-3.3-70b', 'deepseek-r1', 'mistral-large', 'codellama-70b', 'gemma-2-27b', 'nemotron-70b'] });
+  }, { category: 'AI', subs: ['auto', 'claude', 'gpt-4o', 'gpt-4o-mini', 'gemini', 'gemini-2.0-flash', 'gemini-2.5-pro', 'qwen', 'nvidia', 'llama-3.3-70b', 'deepseek-r1', 'mistral-large', 'codellama-70b', 'gemma-2-27b', 'nemotron-70b'] });
+  // --- /retry ---
+  // Registers /retry (alias: r): re-sends the most recent user message to the
+  // agent, using only the conversation that preceded that message as context.
+  reg('retry', 'Resend the last message to the AI', async () => {
+    const history = getConversationHistory();
+    // Find the most recent user turn by index so the context can be cut exactly
+    // there, whether or not an assistant reply follows it.
+    let lastUserIdx = -1;
+    for (let i = history.length - 1; i >= 0; i--) {
+      if (history[i].role === 'user') {
+        lastUserIdx = i;
+        break;
+      }
+    }
+    if (lastUserIdx === -1) {
+      console.log(ui.warn('No previous message to retry.'));
+      return;
+    }
+    const lastUserMsg = history[lastUserIdx];
+    const msg = typeof lastUserMsg.content === 'string' ? lastUserMsg.content : JSON.stringify(lastUserMsg.content);
+    console.log(ui.dim(`  Retrying: ${msg.slice(0, 80)}${msg.length > 80 ? '...' : ''}`));
+    const hasKey = config.getApiKey() || config.get('anthropicKey') || process.env.ANTHROPIC_API_KEY;
+    let spinner;
+    if (!hasKey) {
+      // No key found by this check: print the reply prefix instead of a spinner.
+      process.stdout.write(ui.dim('  NAVADA > '));
+    } else {
+      const ora = require('ora');
+      spinner = ora({ text: '  NAVADA thinking...', color: 'white' }).start();
+    }
+    try {
+      // Drop the retried user message and everything after it. A fixed
+      // slice(0, -2) would remove an unrelated earlier turn whenever the
+      // history does not end in a user + assistant pair.
+      const trimmedHistory = history.slice(0, lastUserIdx);
+      const response = await agentChat(msg, trimmedHistory);
+      if (spinner) spinner.stop();
+      // Record the new exchange.
+      // NOTE(review): this only calls addToHistory; if that appends, the
+      // superseded exchange stays in the stored history — confirm whether it
+      // should be pruned first.
+      addToHistory('user', msg);
+      addToHistory('assistant', response);
+    } catch (e) {
+      if (spinner) spinner.stop();
+      console.log(ui.error(e.message));
+    }
+  }, { category: 'AI', aliases: ['r'] });
+  // --- /tokens ---
+  // Registers /tokens (alias: usage): prints the current session's provider,
+  // model, message and token counters, estimated cost, elapsed time and
+  // rate-limit usage.
+  reg('tokens', 'Show session token usage and cost', () => {
+    console.log(ui.header('SESSION USAGE'));
+    const { provider, model, messages, tokens, cost, startTime } = sessionState;
+    const elapsedMinutes = ((Date.now() - startTime) / 60000).toFixed(1);
+    // One [label, value] pair per output row, in display order.
+    const rows = [
+      ['Provider', provider],
+      ['Model', model || config.getModel()],
+      ['Messages', String(messages)],
+      ['Input tokens', String(tokens.input)],
+      ['Output tokens', String(tokens.output)],
+      ['Total tokens', String(tokens.total)],
+      ['Est. cost', `$${cost.toFixed(4)}`],
+      ['Session time', `${elapsedMinutes} min`],
+      ['Rate limit', `${rateTracker.used()}/${rateTracker.limit} RPM`],
+    ];
+    for (const [name, value] of rows) {
+      console.log(ui.label(name, value));
+    }
+    console.log('');
+    for (const hint of ['Free tier: Grok 3 via NAVADA Edge server', 'Upgrade: /login <key> for full agent + tools']) {
+      console.log(ui.dim(hint));
+    }
+  }, { category: 'AI', aliases: ['usage'] });
   reg('research', 'RAG search via MCP', async (args) => {
     const query = args.join(' ');