npm - @gmickel/gno - Versions diffs - 0.9.3 → 0.9.4 - Mend

@gmickel/gno 0.9.3 → 0.9.4

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

package/README.md CHANGED Viewed

@@ -332,14 +332,14 @@ Models auto-download on first use to `~/.cache/gno/models/`.
 ### Model Presets
-| Preset     | Disk   | Best For               |
-| :--------- | :----- | :--------------------- |
-| `slim`     | ~1GB   | Fast, lower quality    |
-| `balanced` | ~2GB   | Good balance (default) |
-| `quality`  | ~2.5GB | Best answers           |
+| Preset     | Disk   | Best For                     |
+| :--------- | :----- | :--------------------------- |
+| `slim`     | ~1GB   | Fast, good quality (default) |
+| `balanced` | ~2GB   | Slightly larger model        |
+| `quality`  | ~2.5GB | Best answers                 |
 ```bash
-gno models use balanced
+gno models use slim
 gno models pull --all  # Optional: pre-download models (auto-downloads on first use)
 ```

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@gmickel/gno",
-  "version": "0.9.3",
+  "version": "0.9.4",
   "description": "Local semantic search for your documents. Index Markdown, PDF, and Office files with hybrid BM25 + vector search.",
   "keywords": [
     "embeddings",
@@ -48,6 +48,9 @@
     "test:coverage": "bun test --coverage",
     "test:coverage:html": "bun test --coverage --html",
     "test:fixtures": "bun scripts/generate-test-fixtures.ts",
+    "evals": "bun scripts/update-eval-scores.ts",
+    "eval": "bun --bun evalite",
+    "eval:watch": "bun --bun evalite watch",
     "reset": "bun run src/index.ts reset --confirm",
     "docs:verify": "bun run scripts/docs-verify.ts",
     "website:install": "cd website && bundle install",
@@ -110,6 +113,7 @@
     "zod": "^4.3.4"
   },
   "devDependencies": {
+    "@ai-sdk/openai": "^3.0.2",
     "@biomejs/biome": "2.3.10",
     "@tailwindcss/cli": "^4.1.18",
     "@types/bun": "latest",
@@ -126,7 +130,8 @@
     "oxlint-tsgolint": "^0.10.1",
     "pdf-lib": "^1.17.1",
     "pptxgenjs": "^4.0.1",
-    "ultracite": "7.0.4"
+    "ultracite": "7.0.4",
+    "vitest": "^4.0.16"
   },
   "peerDependencies": {
     "typescript": "^5"

package/src/config/types.ts CHANGED Viewed

@@ -176,7 +176,7 @@ export type ModelPreset = z.infer<typeof ModelPresetSchema>;
 export const DEFAULT_MODEL_PRESETS: ModelPreset[] = [
   {
     id: "slim",
-    name: "Slim (Fast, ~1GB)",
+    name: "Slim (Default, ~1GB)",
     embed: "hf:gpustack/bge-m3-GGUF/bge-m3-Q4_K_M.gguf",
     rerank:
       "hf:ggml-org/Qwen3-Reranker-0.6B-Q8_0-GGUF/qwen3-reranker-0.6b-q8_0.gguf",
@@ -184,11 +184,11 @@ export const DEFAULT_MODEL_PRESETS: ModelPreset[] = [
   },
   {
     id: "balanced",
-    name: "Balanced (Default, ~2GB)",
+    name: "Balanced (~2GB)",
     embed: "hf:gpustack/bge-m3-GGUF/bge-m3-Q4_K_M.gguf",
     rerank:
       "hf:ggml-org/Qwen3-Reranker-0.6B-Q8_0-GGUF/qwen3-reranker-0.6b-q8_0.gguf",
-    gen: "hf:ggml-org/SmolLM3-3B-GGUF/SmolLM3-Q4_K_M.gguf",
+    gen: "hf:bartowski/Qwen2.5-3B-Instruct-GGUF/Qwen2.5-3B-Instruct-Q4_K_M.gguf",
   },
   {
     id: "quality",
@@ -202,7 +202,7 @@ export const DEFAULT_MODEL_PRESETS: ModelPreset[] = [
 export const ModelConfigSchema = z.object({
   /** Active preset ID */
-  activePreset: z.string().default("balanced"),
+  activePreset: z.string().default("slim"),
   /** Model presets */
   presets: z.array(ModelPresetSchema).default(DEFAULT_MODEL_PRESETS),
   /** Model load timeout in ms */

package/src/llm/registry.ts CHANGED Viewed

@@ -19,7 +19,7 @@ import { DEFAULT_MODEL_PRESETS } from "../config/types";
  */
 export function getModelConfig(config: Config): ModelConfig {
   return {
-    activePreset: config.models?.activePreset ?? "balanced",
+    activePreset: config.models?.activePreset ?? "slim",
     presets: config.models?.presets?.length
       ? config.models.presets
       : DEFAULT_MODEL_PRESETS,

package/src/pipeline/answer.ts CHANGED Viewed

@@ -13,21 +13,24 @@ import type { Citation, SearchResult } from "./types";
 // Constants
 // ─────────────────────────────────────────────────────────────────────────────
-const ANSWER_PROMPT = `You are answering a question using ONLY the provided context blocks.
+const ANSWER_PROMPT = `Answer the question using ONLY the context blocks below. Cite sources with [1], [2], etc.
-Rules you MUST follow:
-1) Use ONLY facts stated in the context blocks. Do NOT use outside knowledge.
-2) Every factual statement must include an inline citation like [1] or [2] referring to a context block.
-3) If the context does not contain enough information to answer, reply EXACTLY:
-   "I don't have enough information in the provided sources to answer this question."
-4) Do not cite sources you did not use. Do not invent citation numbers.
+Example:
+Q: What is the capital of France?
+Context:
+[1] France is a country in Western Europe. Paris is the capital and largest city.
+[2] The Eiffel Tower, built in 1889, is located in Paris.
-Question: {query}
+Answer: Paris is the capital of France [1]. It is home to the Eiffel Tower [2].
-Context blocks:
+---
+Q: {query}
+Context:
 {context}
-Write a concise answer (1-3 paragraphs).`;
+Answer:`;
 /** Abstention message when LLM cannot ground answer */
 export const ABSTENTION_MESSAGE =

package/src/pipeline/search.ts CHANGED Viewed

@@ -223,7 +223,11 @@ export async function searchBm25(
   // For --full, fetch full content and build results
   if (options.full) {
-    for (const { fts, chunk } of bestByDocid.values()) {
+    // Sort by raw BM25 score (smaller = better) before building results
+    const sortedEntries = [...bestByDocid.values()].sort(
+      (a, b) => a.score - b.score
+    );
+    for (const { fts, chunk } of sortedEntries) {
       let fullContent: string | undefined;
       if (fts.mirrorHash) {
         const contentResult = await store.getContent(fts.mirrorHash);