uneven-ai 1.2.2 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (37)
  1. package/CHANGELOG.md +19 -0
  2. package/README.md +1 -1
  3. package/dist/application/orchestration/engine/ask/brain.d.ts +2 -8
  4. package/dist/application/orchestration/engine/ask/brain.d.ts.map +1 -1
  5. package/dist/application/orchestration/engine/ask/brain.js +16 -14
  6. package/dist/application/orchestration/engine/ask/chat-template.d.ts +9 -0
  7. package/dist/application/orchestration/engine/ask/chat-template.d.ts.map +1 -0
  8. package/dist/application/orchestration/engine/ask/chat-template.js +82 -0
  9. package/dist/application/orchestration/engine/ask/context-assembler.js +3 -3
  10. package/dist/application/orchestration/engine/ask/prompts.d.ts +2 -0
  11. package/dist/application/orchestration/engine/ask/prompts.d.ts.map +1 -1
  12. package/dist/application/orchestration/engine/ask/prompts.js +7 -12
  13. package/dist/application/orchestration/engine/ask.js +3 -13
  14. package/dist/cli/commands/ask.d.ts.map +1 -1
  15. package/dist/cli/commands/ask.js +1 -0
  16. package/dist/cli/commands/chat.d.ts.map +1 -1
  17. package/dist/cli/commands/chat.js +1 -0
  18. package/dist/cli/commands/docs.d.ts.map +1 -1
  19. package/dist/cli/commands/docs.js +1 -0
  20. package/dist/cli/commands/explain.d.ts.map +1 -1
  21. package/dist/cli/commands/explain.js +1 -0
  22. package/dist/cli/commands/init/config-builder.js +1 -1
  23. package/dist/cli/commands/init/constants.js +8 -8
  24. package/dist/domain/entities/session/constants.d.ts +1 -1
  25. package/dist/domain/entities/session/constants.js +1 -1
  26. package/dist/infrastructure/adapters/bridge.d.ts +2 -0
  27. package/dist/infrastructure/adapters/bridge.d.ts.map +1 -1
  28. package/dist/infrastructure/adapters/bridge.js +4 -2
  29. package/dist/infrastructure/utils/config-loader.js +2 -2
  30. package/dist/infrastructure/utils/llm-error.d.ts +2 -0
  31. package/dist/infrastructure/utils/llm-error.d.ts.map +1 -0
  32. package/dist/infrastructure/utils/llm-error.js +20 -0
  33. package/package.json +1 -1
  34. package/prebuilds/darwin-arm64/uneven_core.node +0 -0
  35. package/prebuilds/linux-arm64/uneven_core.node +0 -0
  36. package/prebuilds/linux-x64/uneven_core.node +0 -0
  37. package/prebuilds/win32-x64/uneven_core.node +0 -0
package/CHANGELOG.md CHANGED
@@ -5,6 +5,25 @@ All notable changes to Uneven AI will be documented in this file.
  The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
  and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).

+ ## [1.3.0] - 2026-05-02
+
+ ### Added
+
+ - **Multi-architecture GGUF dispatcher** — The Rust inference loader now reads `general.architecture` from GGUF metadata and routes to the correct candle-transformers backend (`quantized_llama`, `quantized_qwen2`, `quantized_gemma3`, `quantized_phi3`). All seven catalog models are now supported out of the box.
+ - **Chat templates** — Each model family now receives prompts in its correct format: Llama 3 (`<|begin_of_text|>` header tokens), ChatML (`<|im_start|>`, used by Qwen and SmolLM2), DeepSeek-R1 (Unicode BOS/EOS tokens), Gemma 3 (`<start_of_turn>`), and Phi 3/4 (`<|system|>` role tokens). The `detectTemplate` helper selects the right template from the model ID automatically.
+ - **DeepSeek-R1 thinking-token stripping** — `<think>…</think>` blocks emitted by DeepSeek-R1 models are removed before the response reaches the user.
+ - **Adaptive inference timeout** — Local inference timeout is now `max(300 s, maxTokens × 1.2 s)` instead of a fixed 120 s, preventing spurious timeouts on slower hardware.
+ - **`llm-error` utility module** — `sanitizeLlmError` extracted to `src/infrastructure/utils/llm-error.ts` for isolated unit testing without the native binding mock.
+ - **Unit tests — chat templates (60 tests)** — Per-architecture token structure, content integrity, multi-turn history ordering, and per-model send/receive simulation for all seven catalog models.
+ - **Unit tests — error sanitisation (12 tests)** — Covers every error category mapped by `sanitizeLlmError`.
+
+ ### Fixed
+
+ - **Double BOS token** — `encode(prompt, true)` was adding a BOS token on top of the one already embedded in the chat template, corrupting Llama 3 prompts. Changed to `encode(prompt, false)`.
+ - **Default model ID** — Fallback model in the NAPI layer updated from `llama-3.2-1b-q8` to `llama-3.2-1b-q4` to match the catalog.
+
+ ---
+
  ## [1.2.2] - 2026-05-02

  ### Fixed
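The dispatcher in the first Added bullet lives in the Rust core, which this diff ships only as opaque prebuilt binaries (the prebuilds/*/uneven_core.node entries below show +0 -0), so none of that routing is visible here. A minimal TypeScript sketch of the idea, assuming hypothetical names (selectBackend, BACKEND_BY_ARCHITECTURE) that are not part of the package:

    // Hypothetical sketch only — the real dispatcher is Rust code inside uneven_core.node.
    // GGUF metadata carries a `general.architecture` string; the loader maps it to one
    // of the candle-transformers backends named in the changelog entry above.
    type GgufBackend = 'quantized_llama' | 'quantized_qwen2' | 'quantized_gemma3' | 'quantized_phi3';

    const BACKEND_BY_ARCHITECTURE: Record<string, GgufBackend> = {
        llama: 'quantized_llama',
        qwen2: 'quantized_qwen2',
        gemma3: 'quantized_gemma3',
        phi3: 'quantized_phi3',
    };

    function selectBackend(architecture: string): GgufBackend {
        const backend = BACKEND_BY_ARCHITECTURE[architecture];
        if (!backend)
            throw new Error(`Unsupported GGUF architecture: ${architecture}`);
        return backend;
    }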
package/README.md CHANGED
@@ -157,7 +157,7 @@ uneven-ai ci
  Run `uneven-ai` with no arguments to open the interactive shell:

  ```
- ◈ Uneven AI v1.2.0
+ ◈ Uneven AI v1.3.0
  ────────────────────────────────────────────────────────────
  Olá! O que posso fazer por você hoje?
  (Escreva sua mensagem ou "sair" para encerrar)
package/dist/application/orchestration/engine/ask/brain.d.ts CHANGED
@@ -1,14 +1,8 @@
  import type { EngineCtx } from '../context.js';
- /**
-  * EngineBrain — Encapsulates the inference logic for the engine.
-  * Handles switching between local and external providers, timeouts, and streaming.
-  */
+ import type { ChatTurn } from './chat-template.js';
  export declare class EngineBrain {
      private ctx;
      constructor(ctx: EngineCtx);
-     /**
-      * Performs an inference (completion) with the configured provider.
-      */
-     infer(prompt: string, onToken?: (token: string) => void): Promise<string>;
+     infer(user: string, onToken?: (token: string) => void, maxTokensOverride?: number, system?: string, history?: ChatTurn[]): Promise<string>;
  }
  //# sourceMappingURL=brain.d.ts.map
package/dist/application/orchestration/engine/ask/brain.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"brain.d.ts","sourceRoot":"","sources":["../../../../../src/application/orchestration/engine/ask/brain.ts"],"names":[],"mappings":"AAKA,OAAO,KAAK,EAAE,SAAS,EAAE,MAAM,eAAe,CAAA;AAE9C;;;GAGG;AACH,qBAAa,WAAW;IACV,OAAO,CAAC,GAAG;gBAAH,GAAG,EAAE,SAAS;IAElC;;OAEG;IACG,KAAK,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,CAAC,KAAK,EAAE,MAAM,KAAK,IAAI,GAAG,OAAO,CAAC,MAAM,CAAC;CAgChF"}
+ {"version":3,"file":"brain.d.ts","sourceRoot":"","sources":["../../../../../src/application/orchestration/engine/ask/brain.ts"],"names":[],"mappings":"AAMA,OAAO,KAAK,EAAE,SAAS,EAAE,MAAM,eAAe,CAAA;AAC9C,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,oBAAoB,CAAA;AAElD,qBAAa,WAAW;IACV,OAAO,CAAC,GAAG;gBAAH,GAAG,EAAE,SAAS;IAE5B,KAAK,CACT,IAAI,EAAE,MAAM,EACZ,OAAO,CAAC,EAAE,CAAC,KAAK,EAAE,MAAM,KAAK,IAAI,EACjC,iBAAiB,CAAC,EAAE,MAAM,EAC1B,MAAM,CAAC,EAAE,MAAM,EACf,OAAO,GAAE,QAAQ,EAAO,GACvB,OAAO,CAAC,MAAM,CAAC;CA2CnB"}
package/dist/application/orchestration/engine/ask/brain.js CHANGED
@@ -1,43 +1,45 @@
  import { llmInfer, llmInferStream, } from '../../../../infrastructure/adapters/bridge.js';
  import { ExternalProviders } from '../../../../infrastructure/adapters/providers/index.js';
- /**
-  * EngineBrain — Encapsulates the inference logic for the engine.
-  * Handles switching between local and external providers, timeouts, and streaming.
-  */
+ import { detectTemplate, applyTemplate, stripThinkingTokens } from './chat-template.js';
  export class EngineBrain {
      ctx;
      constructor(ctx) {
          this.ctx = ctx;
      }
-     /**
-      * Performs an inference (completion) with the configured provider.
-      */
-     async infer(prompt, onToken) {
+     async infer(user, onToken, maxTokensOverride, system, history = []) {
          const brainConfig = this.ctx.config.brain;
          const provider = brainConfig?.provider || 'local';
-         const model = brainConfig?.model || 'llama3.2';
-         const maxTokens = brainConfig?.maxTokens || 1024;
+         const model = brainConfig?.model || 'llama-3.2-1b-q4';
+         const maxTokens = maxTokensOverride ?? brainConfig?.maxTokens ?? 1024;
          const temperature = brainConfig?.temperature ?? 0.0;
-         const timeoutMs = brainConfig?.local?.inferTimeoutMs ?? 120_000;
+         const timeoutMs = brainConfig?.local?.inferTimeoutMs
+             ?? Math.max(300_000, maxTokens * 1_200);
          const withTimeout = (p) => Promise.race([
              p,
              new Promise((_, reject) => setTimeout(() => reject(new Error(`LLM inference timed out after ${timeoutMs}ms`)), timeoutMs)),
          ]);
          if (provider === 'local') {
              const threads = brainConfig?.local?.threads ?? 4;
+             const template = detectTemplate(model);
+             const prompt = system
+                 ? applyTemplate(template, system, history, user)
+                 : user;
+             const isDeepSeek = model.toLowerCase().startsWith('deepseek');
+             let content;
              if (onToken) {
                  const result = await withTimeout(llmInferStream(prompt, onToken, maxTokens, threads, temperature));
-                 return result.content;
+                 content = result.content;
              }
              else {
                  const result = await withTimeout(llmInfer(prompt, maxTokens, threads, temperature));
-                 return result.content;
+                 content = result.content;
              }
+             return isDeepSeek ? stripThinkingTokens(content) : content;
          }
          else {
              const extProviders = new ExternalProviders(this.ctx.logger);
              const apiKey = brainConfig?.apiKey;
-             const result = await withTimeout(extProviders.infer(prompt, provider, model, maxTokens, onToken, apiKey));
+             const result = await withTimeout(extProviders.infer(user, provider, model, maxTokens, onToken, apiKey));
              return result.content;
          }
      }
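For scale, the adaptive timeout in the hunk above, worked through with values that appear elsewhere in this diff (maxTokens defaults to 2048 in config-loader.js; the router call in context-assembler.js overrides it to 128):

    // Default ask: maxTokens = 2048
    Math.max(300_000, 2048 * 1_200); // → 2_457_600 ms ≈ 41 min ceiling
    // Router call: maxTokensOverride = 128
    Math.max(300_000, 128 * 1_200);  // → 300_000 ms; the 5-minute floor holds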
package/dist/application/orchestration/engine/ask/chat-template.d.ts ADDED
@@ -0,0 +1,9 @@
+ export type ChatTemplate = 'llama3' | 'chatml' | 'deepseek-r1' | 'gemma3' | 'phi3';
+ export declare function detectTemplate(modelId: string): ChatTemplate;
+ export interface ChatTurn {
+     role: 'user' | 'assistant';
+     content: string;
+ }
+ export declare function applyTemplate(template: ChatTemplate, system: string, history: ChatTurn[], user: string): string;
+ export declare function stripThinkingTokens(text: string): string;
+ //# sourceMappingURL=chat-template.d.ts.map
package/dist/application/orchestration/engine/ask/chat-template.d.ts.map ADDED
@@ -0,0 +1 @@
+ {"version":3,"file":"chat-template.d.ts","sourceRoot":"","sources":["../../../../../src/application/orchestration/engine/ask/chat-template.ts"],"names":[],"mappings":"AAAA,MAAM,MAAM,YAAY,GAAG,QAAQ,GAAG,QAAQ,GAAG,aAAa,GAAG,QAAQ,GAAG,MAAM,CAAA;AAElF,wBAAgB,cAAc,CAAC,OAAO,EAAE,MAAM,GAAG,YAAY,CAQ5D;AAED,MAAM,WAAW,QAAQ;IACvB,IAAI,EAAE,MAAM,GAAG,WAAW,CAAA;IAC1B,OAAO,EAAE,MAAM,CAAA;CAChB;AAED,wBAAgB,aAAa,CAC3B,QAAQ,EAAE,YAAY,EACtB,MAAM,EAAE,MAAM,EACd,OAAO,EAAE,QAAQ,EAAE,EACnB,IAAI,EAAE,MAAM,GACX,MAAM,CAiER;AAED,wBAAgB,mBAAmB,CAAC,IAAI,EAAE,MAAM,GAAG,MAAM,CAExD"}
package/dist/application/orchestration/engine/ask/chat-template.js ADDED
@@ -0,0 +1,82 @@
+ export function detectTemplate(modelId) {
+     const id = modelId.toLowerCase();
+     if (id.startsWith('deepseek'))
+         return 'deepseek-r1';
+     if (id.startsWith('llama') || id.startsWith('smollm'))
+         return 'llama3';
+     if (id.startsWith('qwen'))
+         return 'chatml';
+     if (id.startsWith('gemma'))
+         return 'gemma3';
+     if (id.startsWith('phi'))
+         return 'phi3';
+     return 'llama3';
+ }
+ export function applyTemplate(template, system, history, user) {
+     switch (template) {
+         case 'llama3': {
+             let prompt = `<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\n${system}<|eot_id|>`;
+             for (const turn of history) {
+                 prompt += `<|start_header_id|>${turn.role}<|end_header_id|>\n\n${turn.content}<|eot_id|>`;
+             }
+             prompt += `<|start_header_id|>user<|end_header_id|>\n\n${user}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n`;
+             return prompt;
+         }
+         case 'chatml': {
+             let prompt = `<|im_start|>system\n${system}<|im_end|>\n`;
+             for (const turn of history) {
+                 prompt += `<|im_start|>${turn.role}\n${turn.content}<|im_end|>\n`;
+             }
+             prompt += `<|im_start|>user\n${user}<|im_end|>\n<|im_start|>assistant\n`;
+             return prompt;
+         }
+         case 'deepseek-r1': {
+             // DeepSeek-R1 uses its own special tokens (Unicode full-width vertical bars)
+             // System message goes before the first User marker (no dedicated system role)
+             let prompt = `<｜begin▁of▁sentence｜>${system}\n`;
+             for (const turn of history) {
+                 if (turn.role === 'user') {
+                     prompt += `<｜User｜>${turn.content}\n`;
+                 }
+                 else {
+                     prompt += `<｜Assistant｜>${turn.content}<｜end▁of▁sentence｜>\n`;
+                 }
+             }
+             prompt += `<｜User｜>${user}\n<｜Assistant｜>`;
+             return prompt;
+         }
+         case 'gemma3': {
+             // Gemma 3 has no system role — system message goes inside the first user turn
+             let prompt = `<start_of_turn>user\n${system}\n\n`;
+             // First user turn already opened; if there's history, close it and add alternating turns
+             if (history.length > 0) {
+                 prompt += `<end_of_turn>\n`;
+                 for (const turn of history) {
+                     const role = turn.role === 'user' ? 'user' : 'model';
+                     prompt += `<start_of_turn>${role}\n${turn.content}<end_of_turn>\n`;
+                 }
+                 prompt += `<start_of_turn>user\n${user}<end_of_turn>\n<start_of_turn>model\n`;
+             }
+             else {
+                 prompt += `${user}<end_of_turn>\n<start_of_turn>model\n`;
+             }
+             return prompt;
+         }
+         case 'phi3': {
+             let prompt = `<|system|>\n${system}<|end|>\n`;
+             for (const turn of history) {
+                 if (turn.role === 'user') {
+                     prompt += `<|user|>\n${turn.content}<|end|>\n`;
+                 }
+                 else {
+                     prompt += `<|assistant|>\n${turn.content}<|end|>\n`;
+                 }
+             }
+             prompt += `<|user|>\n${user}<|end|>\n<|assistant|>\n`;
+             return prompt;
+         }
+     }
+ }
+ export function stripThinkingTokens(text) {
+     return text.replace(/<think>[\s\S]*?<\/think>\s*/g, '').trim();
+ }
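A short usage sketch for the three exports above; the inputs are illustrative and the results are traced by hand from the code:

    import { detectTemplate, applyTemplate, stripThinkingTokens } from './chat-template.js';

    const template = detectTemplate('qwen-2.5-1.5b-q8'); // 'qwen…' prefix → 'chatml'
    const prompt = applyTemplate(template, 'You are a helpful assistant.', [], 'Hello!');
    // prompt === '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n'
    //          + '<|im_start|>user\nHello!<|im_end|>\n<|im_start|>assistant\n'

    // DeepSeek-R1 reasoning blocks are removed before the answer reaches the user:
    stripThinkingTokens('<think>chain of thought</think>Final answer.'); // → 'Final answer.'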
package/dist/application/orchestration/engine/ask/context-assembler.js CHANGED
@@ -4,7 +4,7 @@ import * as path from 'path';
  import { llmEmbed, retrievalSearch } from '../../../../infrastructure/adapters/bridge.js';
  import { KnowledgeRetriever } from '../../knowledge-retriever.js';
  import { FixEngine } from '../../../development/fix/index.js';
- import { ROUTER_PROMPT } from './prompts.js';
+ import { ROUTER_SYSTEM, ROUTER_USER } from './prompts.js';
  /**
   * ContextAssembler — Responsible for gathering relevant project context.
   * Uses Knowledge Map routing, Vector Search, and Proactive Auditing.
@@ -57,9 +57,9 @@ export class ContextAssembler {
          }
      }
      async detectRelevantPaths(filesMap, question, brain) {
-         const routerPrompt = ROUTER_PROMPT(filesMap, question);
+         const routerUser = ROUTER_USER(filesMap, question);
          try {
-             const result = await brain.infer(routerPrompt);
+             const result = await brain.infer(routerUser, undefined, 128, ROUTER_SYSTEM);
              // Use [\s\S] so the match works on both compact and pretty-printed arrays.
              const jsonMatch = result.match(/\[[\s\S]*?\]/);
              if (jsonMatch) {
package/dist/application/orchestration/engine/ask/prompts.d.ts CHANGED
@@ -1,6 +1,8 @@
  /**
   * Prompts for the Ask Engine
   */
+ export declare const ROUTER_SYSTEM = "You are a context router for a coding assistant. Your only job is to identify which files (MAX 5) are relevant to the user's question and return them as a JSON array. Output ONLY the JSON array \u2014 no explanation, no markdown, no extra text.";
+ export declare const ROUTER_USER: (filesMap: string, question: string) => string;
  export declare const ROUTER_PROMPT: (filesMap: string, question: string) => string;
  export declare const SYSTEM_INSTRUCTIONS_HEADER: string;
  //# sourceMappingURL=prompts.d.ts.map
package/dist/application/orchestration/engine/ask/prompts.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"prompts.d.ts","sourceRoot":"","sources":["../../../../../src/application/orchestration/engine/ask/prompts.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,eAAO,MAAM,aAAa,GAAI,UAAU,MAAM,EAAE,UAAU,MAAM,WAexD,CAAA;AAER,eAAO,MAAM,0BAA0B,QAI/B,CAAA"}
+ {"version":3,"file":"prompts.d.ts","sourceRoot":"","sources":["../../../../../src/application/orchestration/engine/ask/prompts.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,eAAO,MAAM,aAAa,yPACyN,CAAA;AAEnP,eAAO,MAAM,WAAW,GAAI,UAAU,MAAM,EAAE,UAAU,MAAM,WAQtD,CAAA;AAER,eAAO,MAAM,aAAa,GAAI,UAAU,MAAM,EAAE,UAAU,MAAM,WACN,CAAA;AAE1D,eAAO,MAAM,0BAA0B,QAI/B,CAAA"}
package/dist/application/orchestration/engine/ask/prompts.js CHANGED
@@ -1,22 +1,17 @@
  /**
   * Prompts for the Ask Engine
   */
- export const ROUTER_PROMPT = (filesMap, question) => `
- You are a context router for a coding assistant.
- Given the following list of files in the project and the user's question, identify which files (MAX 5) are necessary to answer the question.
-
- ### PROJECT FILES:
+ export const ROUTER_SYSTEM = `You are a context router for a coding assistant. Your only job is to identify which files (MAX 5) are relevant to the user's question and return them as a JSON array. Output ONLY the JSON array — no explanation, no markdown, no extra text.`;
+ export const ROUTER_USER = (filesMap, question) => `
+ PROJECT FILES:
  ${filesMap}

- ### QUESTION:
- ${question}
+ QUESTION: ${question}

- ### INSTRUCTIONS:
- - Identify files that likely contain the answer.
- - Answer ONLY with a JSON array of relative paths.
- - If no files are relevant, return [].
- - Example: ["src/controllers/user.js", "src/models/user.ts"]
+ Answer with ONLY a JSON array of relative paths. If no files are relevant, return [].
+ Example: ["src/controllers/user.js", "src/models/user.ts"]
  `.trim();
+ export const ROUTER_PROMPT = (filesMap, question) => `${ROUTER_SYSTEM}\n\n${ROUTER_USER(filesMap, question)}`;
  export const SYSTEM_INSTRUCTIONS_HEADER = `
  You are Uneven AI (Snatchy), a senior software engineer assistant.
  Base your answers on the provided project context and conversation history.
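The ROUTER_SYSTEM / ROUTER_USER split exists so the router call can go through the new chat-template path. context-assembler.js, shown earlier in this diff, consumes it like this:

    // From detectRelevantPaths in context-assembler.js (filesMap, question, and
    // brain are in scope there):
    const result = await brain.infer(ROUTER_USER(filesMap, question), undefined, 128, ROUTER_SYSTEM);
    // EngineBrain wraps ROUTER_SYSTEM plus the user payload in the model's chat
    // template and caps the router completion at 128 tokens.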
package/dist/application/orchestration/engine/ask.js CHANGED
@@ -30,12 +30,12 @@ export async function doAsk(ctx, question, onToken, history = [], fixEngineOverr
      // 3. Context Assembly (Data Diet)
      const context = await assembler.assemble(question, brain);
      // 4. Prompt Synthesis
-     const historySection = formatHistory(history);
      const SafetyGuard = ctx.safetyGuard.constructor;
      const sysInstructions = SafetyGuard.SYSTEM_INSTRUCTIONS ?? SYSTEM_INSTRUCTIONS_HEADER;
-     const fullPrompt = `${sysInstructions}\n\n${context}${historySection}\nQuestion: ${question}\n\nAnswer:`;
+     const userContent = `${context}\nQuestion: ${question}`;
+     const chatHistory = history.map(t => ({ role: t.role, content: t.content }));
      // 5. Brain Inference (Thought Process)
-     let response = await brain.infer(fullPrompt, onToken);
+     let response = await brain.infer(userContent, onToken, undefined, sysInstructions, chatHistory);
      // 6. Sanitization & Finalization
      response = ctx.safetyGuard.sanitizeResponse(response);
      ctx.logger.info(`Ask: Generated answer (${response.length} chars)`);
@@ -52,13 +52,3 @@ export async function doAsk(ctx, question, onToken, history = [], fixEngineOverr
          throw error;
      }
  }
- /**
-  * Formats conversation history for the prompt.
-  */
- function formatHistory(history) {
-     if (history.length === 0)
-         return '';
-     return '\n## CONVERSATION HISTORY\n\n' +
-         history.map(t => t.role === 'user' ? `User: ${t.content}` : `Assistant: ${t.content}`).join('\n') +
-         '\n';
- }
package/dist/cli/commands/ask.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"ask.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/ask.ts"],"names":[],"mappings":"AAQA,wBAAsB,UAAU,CAC9B,QAAQ,EAAE,MAAM,EAChB,OAAO,GAAE;IAAE,QAAQ,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAO,GAClD,OAAO,CAAC,IAAI,CAAC,CAqEf"}
+ {"version":3,"file":"ask.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/ask.ts"],"names":[],"mappings":"AAQA,wBAAsB,UAAU,CAC9B,QAAQ,EAAE,MAAM,EAChB,OAAO,GAAE;IAAE,QAAQ,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAO,GAClD,OAAO,CAAC,IAAI,CAAC,CAsEf"}
package/dist/cli/commands/ask.js CHANGED
@@ -33,6 +33,7 @@ export async function askCommand(question, options = {}) {
          console.log(t.dim(' Action stopped to keep your machine responsive.'));
      }
      blank();
+     process.exit(0);
  });
  let streamingStarted = false;
  const answer = await uneven.ask(question, (token) => {
package/dist/cli/commands/chat.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"chat.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/chat.ts"],"names":[],"mappings":"AAOA,MAAM,WAAW,gBAAgB;IAC/B,IAAI,EAAE,MAAM,GAAG,WAAW,CAAA;IAC1B,OAAO,EAAE,MAAM,CAAA;CAChB;AAED,eAAO,MAAM,iBAAiB,KAAK,CAAA;AAEnC,wBAAgB,wBAAwB,CAAC,OAAO,EAAE,gBAAgB,EAAE,GAAG,MAAM,CAQ5E;AAED,wBAAsB,WAAW,CAC/B,OAAO,GAAE;IAAE,QAAQ,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAO,GAClD,OAAO,CAAC,IAAI,CAAC,CAgHf"}
+ {"version":3,"file":"chat.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/chat.ts"],"names":[],"mappings":"AAOA,MAAM,WAAW,gBAAgB;IAC/B,IAAI,EAAE,MAAM,GAAG,WAAW,CAAA;IAC1B,OAAO,EAAE,MAAM,CAAA;CAChB;AAED,eAAO,MAAM,iBAAiB,KAAK,CAAA;AAEnC,wBAAgB,wBAAwB,CAAC,OAAO,EAAE,gBAAgB,EAAE,GAAG,MAAM,CAQ5E;AAED,wBAAsB,WAAW,CAC/B,OAAO,GAAE;IAAE,QAAQ,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAO,GAClD,OAAO,CAAC,IAAI,CAAC,CAiHf"}
package/dist/cli/commands/chat.js CHANGED
@@ -44,6 +44,7 @@ export async function chatCommand(options = {}) {
      blank();
      console.log(t.rust(` Safety interrupt: ${reason}`));
      blank();
+     process.exit(0);
  });
  const cleanup = () => {
      guardian.stop();
package/dist/cli/commands/docs.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"docs.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/docs.ts"],"names":[],"mappings":"AASA,MAAM,MAAM,UAAU,GAAG,IAAI,GAAG,OAAO,CAAA;AAEvC,eAAO,MAAM,mBAAmB,QAAS,CAAA;AAEzC,wBAAgB,mBAAmB,CACjC,OAAO,EAAE,MAAM,EACf,QAAQ,GAAE,MAA4B,GACrC,MAAM,CAMR;AAED,wBAAgB,eAAe,CAC7B,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,MAAM,EACf,MAAM,EAAE,MAAM,EACd,MAAM,EAAE,UAAU,GACjB,MAAM,CAuCR;AAED,MAAM,WAAW,WAAW;IAC1B,MAAM,CAAC,EAAE,UAAU,CAAA;IACnB,GAAG,CAAC,EAAE,MAAM,CAAA;IACZ,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,KAAK,CAAC,EAAE,MAAM,CAAA;CACf;AAED,wBAAsB,WAAW,CAC/B,QAAQ,EAAE,MAAM,EAChB,MAAM,GAAE,MAAW,EACnB,OAAO,GAAE,WAAgB,GACxB,OAAO,CAAC,IAAI,CAAC,CA4Ef"}
+ {"version":3,"file":"docs.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/docs.ts"],"names":[],"mappings":"AASA,MAAM,MAAM,UAAU,GAAG,IAAI,GAAG,OAAO,CAAA;AAEvC,eAAO,MAAM,mBAAmB,QAAS,CAAA;AAEzC,wBAAgB,mBAAmB,CACjC,OAAO,EAAE,MAAM,EACf,QAAQ,GAAE,MAA4B,GACrC,MAAM,CAMR;AAED,wBAAgB,eAAe,CAC7B,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,MAAM,EACf,MAAM,EAAE,MAAM,EACd,MAAM,EAAE,UAAU,GACjB,MAAM,CAuCR;AAED,MAAM,WAAW,WAAW;IAC1B,MAAM,CAAC,EAAE,UAAU,CAAA;IACnB,GAAG,CAAC,EAAE,MAAM,CAAA;IACZ,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,KAAK,CAAC,EAAE,MAAM,CAAA;CACf;AAED,wBAAsB,WAAW,CAC/B,QAAQ,EAAE,MAAM,EAChB,MAAM,GAAE,MAAW,EACnB,OAAO,GAAE,WAAgB,GACxB,OAAO,CAAC,IAAI,CAAC,CA6Ef"}
package/dist/cli/commands/docs.js CHANGED
@@ -86,6 +86,7 @@ export async function docsCommand(filePath, symbol = '', options = {}) {
      guardian = new ResourceGuardian(new Logger('./.uneven/logs/guardian.md'));
      guardian.start((reason) => {
          console.error(t.rust(`\n Safety interrupt: ${reason}`));
+         process.exit(0);
      });
      blank();
      const modeLabel = format === 'jsdoc' ? 'TSDoc' : 'Markdown';
package/dist/cli/commands/explain.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"explain.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/explain.ts"],"names":[],"mappings":"AASA,eAAO,MAAM,cAAc,QAAS,CAAA;AAEpC,wBAAgB,mBAAmB,CACjC,OAAO,EAAE,MAAM,EACf,QAAQ,GAAE,MAAuB,GAChC,MAAM,CAMR;AAED,wBAAgB,kBAAkB,CAChC,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,MAAM,EACf,KAAK,EAAE,MAAM,GACZ,MAAM,CAqBR;AAED,MAAM,WAAW,cAAc;IAC7B,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,KAAK,CAAC,EAAE,MAAM,CAAA;CACf;AAED,wBAAsB,cAAc,CAClC,QAAQ,EAAE,MAAM,EAChB,KAAK,GAAE,MAAW,EAClB,OAAO,GAAE,cAAmB,GAC3B,OAAO,CAAC,IAAI,CAAC,CAiEf"}
+ {"version":3,"file":"explain.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/explain.ts"],"names":[],"mappings":"AASA,eAAO,MAAM,cAAc,QAAS,CAAA;AAEpC,wBAAgB,mBAAmB,CACjC,OAAO,EAAE,MAAM,EACf,QAAQ,GAAE,MAAuB,GAChC,MAAM,CAMR;AAED,wBAAgB,kBAAkB,CAChC,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,MAAM,EACf,KAAK,EAAE,MAAM,GACZ,MAAM,CAqBR;AAED,MAAM,WAAW,cAAc;IAC7B,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,KAAK,CAAC,EAAE,MAAM,CAAA;CACf;AAED,wBAAsB,cAAc,CAClC,QAAQ,EAAE,MAAM,EAChB,KAAK,GAAE,MAAW,EAClB,OAAO,GAAE,cAAmB,GAC3B,OAAO,CAAC,IAAI,CAAC,CAkEf"}
package/dist/cli/commands/explain.js CHANGED
@@ -66,6 +66,7 @@ export async function explainCommand(filePath, focus = '', options = {}) {
      guardian = new ResourceGuardian(new Logger(logPath));
      guardian.start((reason) => {
          console.error(t.rust(`\n Safety interrupt: ${reason}`));
+         process.exit(0);
      });
      blank();
      console.log(t.dim(' ┌─ Explanation'));
package/dist/cli/commands/init/config-builder.js CHANGED
@@ -2,7 +2,7 @@ export function defaultModelFor(provider, localModelId) {
      if (provider === 'local' && localModelId)
          return localModelId;
      const MAP = {
-         local: 'llama-3.2-1b-q8',
+         local: 'llama-3.2-1b-q4',
          ollama: 'llama3.2',
          claude: 'claude-sonnet-4-6',
          openai: 'gpt-4o-mini',
package/dist/cli/commands/init/constants.js CHANGED
@@ -18,19 +18,19 @@ export const EMBEDDING_FILES = [
  ];
  export const LOCAL_MODEL_CATALOG = [
      {
-         id: 'llama-3.2-1b-q8',
-         label: 'Llama 3.2 1B Q8',
-         ram: '~2.5 GB',
-         storage: '~1.4 GB',
+         id: 'llama-3.2-1b-q4',
+         label: 'Llama 3.2 1B Q4',
+         ram: '~1.5 GB',
+         storage: '~700 MB',
          files: [
              {
-                 url: 'https://huggingface.co/bartowski/Llama-3.2-1B-Instruct-GGUF/resolve/main/Llama-3.2-1B-Instruct-Q8_0.gguf',
-                 dest: '.uneven/models/llama-3.2-1b-q8.gguf',
-                 size: '~1.4 GB',
+                 url: 'https://huggingface.co/bartowski/Llama-3.2-1B-Instruct-GGUF/resolve/main/Llama-3.2-1B-Instruct-Q4_K_M.gguf',
+                 dest: '.uneven/models/llama-3.2-1b-q4.gguf',
+                 size: '~700 MB',
              },
              {
                  url: 'https://huggingface.co/unsloth/Llama-3.2-1B-Instruct/resolve/main/tokenizer.json',
-                 dest: '.uneven/models/llama-3.2-1b-q8-tokenizer.json',
+                 dest: '.uneven/models/llama-3.2-1b-q4-tokenizer.json',
                  size: '~1.7 MB',
              },
          ],
package/dist/domain/entities/session/constants.d.ts CHANGED
@@ -1,5 +1,5 @@
  export declare const SESSION_FILE = ".uneven/session.json";
- export declare const UNEVEN_VERSION = "1.2.2";
+ export declare const UNEVEN_VERSION = "1.3.0";
  export declare const STALE_THRESHOLD_MS: number;
  export declare const LOCK_TIMEOUT_MS = 30000;
  export declare const LOCK_DEBOUNCE_MS = 1500;
package/dist/domain/entities/session/constants.js CHANGED
@@ -1,5 +1,5 @@
  export const SESSION_FILE = '.uneven/session.json';
- export const UNEVEN_VERSION = '1.2.2';
+ export const UNEVEN_VERSION = '1.3.0';
  export const STALE_THRESHOLD_MS = 60 * 60 * 1000; // 1 hour
  export const LOCK_TIMEOUT_MS = 30_000; // 30 seconds
  export const LOCK_DEBOUNCE_MS = 1_500; // 1.5 seconds
package/dist/infrastructure/adapters/bridge.d.ts CHANGED
@@ -1,3 +1,5 @@
+ import { sanitizeLlmError } from '../utils/llm-error.js';
+ export { sanitizeLlmError };
  export interface NativeEngine {
      initEngine(config: object, threads: number): Promise<string>;
      getVersion(): string;
package/dist/infrastructure/adapters/bridge.d.ts.map CHANGED
@@ -1 +1 @@
- {"version":3,"file":"bridge.d.ts","sourceRoot":"","sources":["../../../src/infrastructure/adapters/bridge.ts"],"names":[],"mappings":"AAmEA,MAAM,WAAW,YAAY;IAC3B,UAAU,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IAC5D,UAAU,IAAI,MAAM,CAAA;IACpB,aAAa,IAAI,MAAM,CAAA;IACvB,aAAa,IAAI,MAAM,CAAA;IACvB,aAAa,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACjE,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;IACjC,QAAQ,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACvC,QAAQ,CAAC,MAAM,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,EAAE,aAAa,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACzH,cAAc,CAAC,MAAM,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,EAAE,aAAa,EAAE,MAAM,EAAE,OAAO,EAAE,CAAC,GAAG,EAAE,KAAK,GAAG,IAAI,EAAE,KAAK,CAAC,EAAE,MAAM,KAAK,IAAI,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACrL,uBAAuB,IAAI,IAAI,CAAA;IAC/B,mBAAmB,IAAI,IAAI,CAAA;IAC3B,eAAe,CAAC,SAAS,EAAE,MAAM,EAAE,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC;QAAE,SAAS,EAAE,MAAM,EAAE,CAAC;QAAC,MAAM,EAAE,MAAM,EAAE,CAAA;KAAE,CAAC,CAAA;IACtG,aAAa,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IACtH,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;IACjC,eAAe,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IAC9C,aAAa,CAAC,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;CACnG;AAED,wBAAgB,gBAAgB,IAAI,YAAY,GAAG,IAAI,CAEtD;AAED,wBAAgB,iBAAiB,IAAI,OAAO,CAE3C;AAkCD,wBAAsB,gBAAgB,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,GAAE,MAAU,GAAG,OAAO,CAAC,IAAI,CAAC,CAQzF;AAED,wBAAgB,gBAAgB,IAAI,MAAM,CAGzC;AAED,wBAAgB,mBAAmB,IAAI,MAAM,CAG5C;AAGD,wBAAgB,aAAa,IAAI,MAAM,CAGtC;AAED,wBAAsB,aAAa,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,GAAE,MAAU,GAAG,OAAO,CAAC,IAAI,CAAC,CAOxF;AAED,wBAAsB,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAOtD;AAED,wBAAsB,QAAQ,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC,CAY9D;AAED,wBAAsB,aAAa,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAgBxE;AAED,wBAAsB,mBAAmB,CACvC,MAAM,EAAO,MAAM,EAAE,EACrB,QAAQ,EAAK,MAAM,EAAE,EACrB,WAAW,EAAE,MAAM,EAAE,EACrB,QAAQ,EAAK,MAAM,EAAE,EACrB,UAAU,EAAG,MAAM,EAAE,EAAE,GACtB,OAAO,CAAC,IAAI,CAAC,CAef;AAqBD,wBAAsB,QAAQ,CAC5B,MAAM,EAAE,MAAM,EACd,SAAS,EAAE,MAAM,EACjB,OAAO,GAAE,MAAU,EACnB,WAAW,GAAE,MAAY,EAAI,oCAAoC;AACjE,aAAa,GAAE,MAAY,GAC1B,OAAO,CAAC;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,WAAW,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAA;CAAE,CAAC,CAalE;AAED,wBAAsB,cAAc,CAClC,MAAM,EAAE,MAAM,EACd,OAAO,EAAE,CAAC,KAAK,EAAE,MAAM,KAAK,IAAI,EAChC,SAAS,EAAE,MAAM,EACjB,OAAO,GAAE,MAAU,EACnB,WAAW,GAAE,MAAY,EACzB,aAAa,GAAE,MAAY,GAC1B,OAAO,CAAC;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,WAAW,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAA;CAAE,CAAC,CAgBlE;AAED,wBAAsB,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAOtD;AAED,wBAAsB,aAAa,CACjC,KAAK,EAAE,MAAM,EACb,OAAO,EAAE,MAAM,EACf,UAAU,EAAE,MAAM,EAClB,OAAO,EAAE,MAAM,EACf,SAAS,EAAE,MAAM,EAAE,GAClB,OAAO,CAAC,IAAI,CAAC,CAOf;AAED,wBAAsB,eAAe,CACnC,SAAS,EAAE,MAAM,EAAE,EACnB,IAAI,EAAE,MAAM,GACX,OAAO,CAAC;IAAE,SAAS,EAAE,MAAM,EAAE,CAAC;IAAC,MAAM,EAAE,MAAM,EAAE,CAAA;CAAE,CAAC,CAWpD;AAED,wBAAsB,aAAa,CACjC,MAAM,EAAE,MAAM,EACd,QAAQ,EAAE,MAAM,EAChB,KAAK,EAAE,MAAM,EACb,SAAS,GAAE,MAAY,GACtB,OAAO,CAAC;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,WAAW,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAC;IAAC,QAAQ,EAAE,MAAM,CAAA;CAAE,CAAC,CAYpF;AAED,wBAAgB,uBAAuB,IAAI,IAAI,CAI9C;AAED,wBAAgB,mBAAmB,IAAI,IAAI,CAI1C"}
+ {"version":3,"file":"bridge.d.ts","sourceRoot":"","sources":["../../../src/infrastructure/adapters/bridge.ts"],"names":[],"mappings":"AAKA,OAAO,EAAE,gBAAgB,EAAE,MAAM,uBAAuB,CAAA;AACxD,OAAO,EAAE,gBAAgB,EAAE,CAAA;AA+D3B,MAAM,WAAW,YAAY;IAC3B,UAAU,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IAC5D,UAAU,IAAI,MAAM,CAAA;IACpB,aAAa,IAAI,MAAM,CAAA;IACvB,aAAa,IAAI,MAAM,CAAA;IACvB,aAAa,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACjE,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;IACjC,QAAQ,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACvC,QAAQ,CAAC,MAAM,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,EAAE,aAAa,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACzH,cAAc,CAAC,MAAM,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,EAAE,aAAa,EAAE,MAAM,EAAE,OAAO,EAAE,CAAC,GAAG,EAAE,KAAK,GAAG,IAAI,EAAE,KAAK,CAAC,EAAE,MAAM,KAAK,IAAI,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IACrL,uBAAuB,IAAI,IAAI,CAAA;IAC/B,mBAAmB,IAAI,IAAI,CAAA;IAC3B,eAAe,CAAC,SAAS,EAAE,MAAM,EAAE,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC;QAAE,SAAS,EAAE,MAAM,EAAE,CAAC;QAAC,MAAM,EAAE,MAAM,EAAE,CAAA;KAAE,CAAC,CAAA;IACtG,aAAa,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IACtH,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;IACjC,eAAe,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IAC9C,aAAa,CAAC,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;CACnG;AAED,wBAAgB,gBAAgB,IAAI,YAAY,GAAG,IAAI,CAEtD;AAED,wBAAgB,iBAAiB,IAAI,OAAO,CAE3C;AAkCD,wBAAsB,gBAAgB,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,GAAE,MAAU,GAAG,OAAO,CAAC,IAAI,CAAC,CAQzF;AAED,wBAAgB,gBAAgB,IAAI,MAAM,CAGzC;AAED,wBAAgB,mBAAmB,IAAI,MAAM,CAG5C;AAGD,wBAAgB,aAAa,IAAI,MAAM,CAGtC;AAED,wBAAsB,aAAa,CAAC,QAAQ,EAAE,MAAM,EAAE,OAAO,GAAE,MAAU,GAAG,OAAO,CAAC,IAAI,CAAC,CAOxF;AAED,wBAAsB,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAOtD;AAED,wBAAsB,QAAQ,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC,CAY9D;AAED,wBAAsB,aAAa,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAgBxE;AAED,wBAAsB,mBAAmB,CACvC,MAAM,EAAO,MAAM,EAAE,EACrB,QAAQ,EAAK,MAAM,EAAE,EACrB,WAAW,EAAE,MAAM,EAAE,EACrB,QAAQ,EAAK,MAAM,EAAE,EACrB,UAAU,EAAG,MAAM,EAAE,EAAE,GACtB,OAAO,CAAC,IAAI,CAAC,CAef;AAsBD,wBAAsB,QAAQ,CAC5B,MAAM,EAAE,MAAM,EACd,SAAS,EAAE,MAAM,EACjB,OAAO,GAAE,MAAU,EACnB,WAAW,GAAE,MAAY,EAAI,oCAAoC;AACjE,aAAa,GAAE,MAAY,GAC1B,OAAO,CAAC;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,WAAW,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAA;CAAE,CAAC,CAalE;AAED,wBAAsB,cAAc,CAClC,MAAM,EAAE,MAAM,EACd,OAAO,EAAE,CAAC,KAAK,EAAE,MAAM,KAAK,IAAI,EAChC,SAAS,EAAE,MAAM,EACjB,OAAO,GAAE,MAAU,EACnB,WAAW,GAAE,MAAY,EACzB,aAAa,GAAE,MAAY,GAC1B,OAAO,CAAC;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,WAAW,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAA;CAAE,CAAC,CAgBlE;AAED,wBAAsB,gBAAgB,IAAI,OAAO,CAAC,IAAI,CAAC,CAOtD;AAED,wBAAsB,aAAa,CACjC,KAAK,EAAE,MAAM,EACb,OAAO,EAAE,MAAM,EACf,UAAU,EAAE,MAAM,EAClB,OAAO,EAAE,MAAM,EACf,SAAS,EAAE,MAAM,EAAE,GAClB,OAAO,CAAC,IAAI,CAAC,CAOf;AAED,wBAAsB,eAAe,CACnC,SAAS,EAAE,MAAM,EAAE,EACnB,IAAI,EAAE,MAAM,GACX,OAAO,CAAC;IAAE,SAAS,EAAE,MAAM,EAAE,CAAC;IAAC,MAAM,EAAE,MAAM,EAAE,CAAA;CAAE,CAAC,CAWpD;AAED,wBAAsB,aAAa,CACjC,MAAM,EAAE,MAAM,EACd,QAAQ,EAAE,MAAM,EAChB,KAAK,EAAE,MAAM,EACb,SAAS,GAAE,MAAY,GACtB,OAAO,CAAC;IAAE,OAAO,EAAE,MAAM,CAAC;IAAC,WAAW,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAC;IAAC,QAAQ,EAAE,MAAM,CAAA;CAAE,CAAC,CAYpF;AAED,wBAAgB,uBAAuB,IAAI,IAAI,CAI9C;AAED,wBAAgB,mBAAmB,IAAI,IAAI,CAI1C"}
package/dist/infrastructure/adapters/bridge.js CHANGED
@@ -3,6 +3,8 @@ import { createRequire } from 'module';
  import { resolve, dirname, join } from 'path';
  import { fileURLToPath } from 'url';
  import { withTimeout, TimeoutError } from '../utils/timeout.js';
+ import { sanitizeLlmError } from '../utils/llm-error.js';
+ export { sanitizeLlmError };
  // Embedding: fast pass through the model — 2 min covers cold-start on CPU
  const LLM_EMBED_TIMEOUT_MS = 120_000;
  // Inference: generating 300-500 tokens on CPU — 3 min
@@ -210,7 +212,7 @@ repeatPenalty = 1.1) {
      catch (error) {
          if (error instanceof TimeoutError)
              nativeBinding.interruptLocalInference();
-         throw new Error(`Failed to run inference: ${error instanceof Error ? error.message : error}`);
+         throw new Error(sanitizeLlmError(error));
      }
  }
  export async function llmInferStream(prompt, onToken, maxTokens, threads = 4, temperature = 0.0, repeatPenalty = 1.1) {
@@ -224,7 +226,7 @@ export async function llmInferStream(prompt, onToken, maxTokens, threads = 4, te
      catch (error) {
          if (error instanceof TimeoutError)
              nativeBinding.interruptLocalInference();
-         throw new Error(`Failed to run streaming inference: ${error instanceof Error ? error.message : error}`);
+         throw new Error(sanitizeLlmError(error));
      }
  }
  export async function flushVectorStore() {
package/dist/infrastructure/utils/config-loader.js CHANGED
@@ -43,7 +43,7 @@ export async function findProjectRoot(startDir = process.cwd()) {
  const DEFAULTS = {
      brain: {
          provider: 'local',
-         model: 'llama-3.2-1b-q8',
+         model: 'llama-3.2-1b-q4',
          temperature: 0.3,
          maxTokens: 2048,
          local: {
@@ -475,7 +475,7 @@ export async function saveConfig(config, projectRoot) {
  }
  // Display names for local model ids — keep in sync with init/constants LOCAL_MODEL_CATALOG
  const LOCAL_MODEL_LABELS = {
-     'llama-3.2-1b-q8': 'Llama 3.2 1B Q8',
+     'llama-3.2-1b-q4': 'Llama 3.2 1B Q4',
      'qwen-2.5-1.5b-q8': 'Qwen 2.5 1.5B Q8',
      'deepseek-r1-1.5b-q8': 'DeepSeek-R1 1.5B Q8',
      'gemma-3-1b-q8': 'Gemma 3 1B Q8',
package/dist/infrastructure/utils/llm-error.d.ts ADDED
@@ -0,0 +1,2 @@
+ export declare function sanitizeLlmError(error: unknown): string;
+ //# sourceMappingURL=llm-error.d.ts.map
package/dist/infrastructure/utils/llm-error.d.ts.map ADDED
@@ -0,0 +1 @@
+ {"version":3,"file":"llm-error.d.ts","sourceRoot":"","sources":["../../../src/infrastructure/utils/llm-error.ts"],"names":[],"mappings":"AAAA,wBAAgB,gBAAgB,CAAC,KAAK,EAAE,OAAO,GAAG,MAAM,CA2BvD"}
package/dist/infrastructure/utils/llm-error.js ADDED
@@ -0,0 +1,20 @@
+ export function sanitizeLlmError(error) {
+     const raw = error instanceof Error ? error.message : String(error);
+     if (/model.*not found|cannot open.*models|no such file/i.test(raw))
+         return 'Local model not found. Run `uneven init` to download it.';
+     if (/tokenizer not found/i.test(raw))
+         return 'Model tokenizer missing. Run `uneven init` to reinstall.';
+     if (/model not loaded/i.test(raw))
+         return 'Local model is not loaded. Run `uneven init` to set up.';
+     if (/out of memory|insufficient memory|oom/i.test(raw))
+         return 'Not enough memory for local inference. Try a smaller model.';
+     if (/timed out|timeout/i.test(raw))
+         return 'Inference timed out. The model may be too slow for your hardware.';
+     if (/interrupted/i.test(raw))
+         return 'Inference was interrupted.';
+     if (/context window.*too small|unavailable/i.test(raw))
+         return raw;
+     if (process.env.UNEVEN_DEBUG)
+         return raw;
+     return 'Local inference failed. Set UNEVEN_DEBUG=1 for technical details.';
+ }
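A usage sketch for the new module; the raw error strings are illustrative, and the mapped messages are traced from the branches above:

    import { sanitizeLlmError } from './llm-error.js';

    sanitizeLlmError(new Error('model file not found: .uneven/models/llama-3.2-1b-q4.gguf'));
    // → 'Local model not found. Run `uneven init` to download it.'

    sanitizeLlmError(new Error('LLM inference timed out after 300000ms'));
    // → 'Inference timed out. The model may be too slow for your hardware.'

    // Unrecognized errors stay generic unless UNEVEN_DEBUG=1 is set:
    sanitizeLlmError(new Error('thread panicked'));
    // → 'Local inference failed. Set UNEVEN_DEBUG=1 for technical details.'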
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
      "name": "uneven-ai",
-     "version": "1.2.2",
+     "version": "1.3.0",
      "publishConfig": {
          "access": "public",
          "registry": "https://registry.npmjs.org/"