npm - @deepsweet/mdn - Versions diffs - 0.1.3 → 0.3.0 - Mend

@deepsweet/mdn 0.1.3 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/README.md CHANGED Viewed

@@ -22,7 +22,7 @@ See [dataset repo](https://huggingface.co/datasets/deepsweet/mdn) on HuggingFace
 ### 1. Download dataset and embedding model
 ```sh
-npx -y @deepsweet/mdn download
+npx -y @deepsweet/mdn@latest download
 ```
 Both [dataset](https://huggingface.co/datasets/deepsweet/mdn) (\~260 MB) and the [embedding model GGUF file](https://huggingface.co/deepsweet/bge-m3-GGUF-Q4_K_M) (\~438 MB) will be downloaded directly from HuggingFace and stored in its default cache location (typically `~/.cache/huggingface/`), just like the `hf download` command does.
@@ -35,7 +35,8 @@ Both [dataset](https://huggingface.co/datasets/deepsweet/mdn) (\~260 MB) and the
     "mdn": {
       "command": "npx",
       "args": [
-        "@deepsweet/mdn",
+        "-y",
+        "@deepsweet/mdn@latest",
         "server"
       ],
       "env": {}
@@ -44,6 +45,9 @@ Both [dataset](https://huggingface.co/datasets/deepsweet/mdn) (\~260 MB) and the
 }
 ```
+> [!TIP]
+> Remove `@latest` for a full offline experience, but keep in mind that this will cache a fixed version without auto-updating.
 The `stdio` server will spawn [llama.cpp](https://github.com/ggml-org/llama.cpp) under the hood, load the embedding model (~655 MB RAM/VRAM), and query the dataset – all on demand.
 ## Settings
@@ -51,7 +55,6 @@ The `stdio` server will spawn [llama.cpp](https://github.com/ggml-org/llama.cpp)
 | Env variable               | Default value                                                   | Description                                                                                                       |
 |----------------------------|-----------------------------------------------------------------|-------------------------------------------------------------------------------------------------------------------|
 | `MDN_DATASET_PATH`         | HuggingFace cache                                               | Custom dataset directory path                                                                                     |
-| `MDN_DATASET_LOCALE`       | `en-us`                                                         | Dataset language, currently `en-us` only                                                                          |
 | `MDN_MODEL_PATH`           | HuggingFace cache                                               | Custom model file path                                                                                            |
 | `MDN_MODEL_TTL`            | `1800`                                                          | For how long llama.cpp with embedding model should be kept loaded in memory, in seconds; `0` to prevent unloading |
 | `MDN_QUERY_DESCRIPTION`    | `Natural language query for hybrid vector and full-text search` | Custom search query description in case your LLM does a poor job asking the MCP tool                              |
@@ -60,7 +63,6 @@ The `stdio` server will spawn [llama.cpp](https://github.com/ggml-org/llama.cpp)
 ## To do
 - [ ] figure out a better query description so that LLM doesn't over-generate keywords
-- [ ] add more dataset [translations](https://github.com/mdn/translated-content/tree/main/files/)
 - [ ] automatically update and upload the dataset artifacts monthly with GitHub Actions
 ## License

package/dist/index.js CHANGED Viewed

@@ -1,10 +1,28 @@
 #!/usr/bin/env node
+// src/huggingface.ts
+import fs from "node:fs/promises";
+import path from "path";
+import {
+  downloadFileToCacheDir,
+  getHFHubCachePath,
+  getRepoFolderName,
+  scanCachedRepo,
+  snapshotDownload
+} from "@huggingface/hub";
+// src/const.ts
+var DATASET_REPO = "deepsweet/mdn";
+var MODEL_REPO = "deepsweet/bge-m3-GGUF-Q4_K_M";
+var MODEL_FILE = "bge-m3-GGUF-Q4_K_M.gguf";
+var MODEL_MAX_TOKENS = 8192;
+var TABLE_NAME = "mdn";
+var TABLE_FILENAME = `${TABLE_NAME}.lance`;
 // src/env.ts
 import { z } from "zod";
 var env = z.object({
   MDN_DATASET_PATH: z.string().optional(),
-  MDN_DATASET_LOCALE: z.enum(["en-us"]).default("en-us"),
   MDN_MODEL_PATH: z.string().optional(),
   MDN_MODEL_TTL: z.number().default(1800),
   MDN_QUERY_DESCRIPTION: z.string().default("Natural language query for hybrid vector and full-text search"),
@@ -12,19 +30,6 @@ var env = z.object({
 }).parse(process.env);
 // src/huggingface.ts
-import fs from "node:fs/promises";
-import path from "path";
-import { getHFHubCachePath, getRepoFolderName, scanCachedRepo, snapshotDownload } from "@huggingface/hub";
-// src/utils.ts
-var getTableName = (locale) => {
-  return `mdn-${locale}`;
-};
-// src/huggingface.ts
-var DATASET_REPO = "deepsweet/mdn";
-var MODEL_REPO = "deepsweet/bge-m3-GGUF-Q4_K_M";
-var MODEL_FILE = "bge-m3-GGUF-Q4_K_M.gguf";
 var replaceSymlinksWithHardlinks = async (dir) => {
   const entries = await fs.readdir(dir, { withFileTypes: true });
   for (const entry of entries) {
@@ -57,18 +62,17 @@ var getLatestCachedRepoRevision = async (name, type) => {
   });
   return latestRevision.path;
 };
-var downloadDataset = async (locale) => {
-  const tableName = getTableName(locale);
+var downloadDataset = async () => {
   const dirPath = await snapshotDownload({
     repo: `datasets/${DATASET_REPO}`,
-    path: `data/${tableName}.lance`
+    path: `data/${TABLE_FILENAME}`
   });
   const dataPath = path.join(dirPath, "data");
   await replaceSymlinksWithHardlinks(dataPath);
 };
 var getDatasetPath = async () => {
-  if (process.env.MDN_DATASET_PATH != null) {
-    return process.env.MDN_DATASET_PATH;
+  if (env.MDN_DATASET_PATH != null) {
+    return env.MDN_DATASET_PATH;
   }
   const latestRevisionPath = await getLatestCachedRepoRevision(DATASET_REPO, "dataset");
   const datasetPath = path.join(latestRevisionPath, "data");
@@ -80,8 +84,8 @@ var downloadModel = async () => {
   });
 };
 var getModelPath = async () => {
-  if (process.env.MDN_MODEL_PATH != null) {
-    return process.env.MDN_MODEL_PATH;
+  if (env.MDN_MODEL_PATH != null) {
+    return env.MDN_MODEL_PATH;
   }
   const latestRevisionPath = await getLatestCachedRepoRevision(MODEL_REPO, "model");
   const modelPath = path.join(latestRevisionPath, MODEL_FILE);
@@ -95,15 +99,16 @@ import { StdioServerTransport } from "@modelcontextprotocol/sdk/server/stdio.js"
 import { z as z2 } from "zod";
 // src/llama.ts
+import os from "node:os";
 import { getLlama, LlamaLogLevel } from "node-llama-cpp";
-var MAX_TOKENS = 8192;
 var getLlamaContext = async (modelPath) => {
+  const threads = Math.floor(os.availableParallelism() / 2);
   const llama = await getLlama({ logLevel: LlamaLogLevel.error });
   const model = await llama.loadModel({ modelPath });
   const context = await model.createEmbeddingContext({
-    contextSize: MAX_TOKENS,
-    batchSize: MAX_TOKENS,
-    threads: 0
+    contextSize: MODEL_MAX_TOKENS,
+    batchSize: MODEL_MAX_TOKENS,
+    threads
   });
   context.onDispose.createOnceListener(() => {
     model.dispose().then(() => llama.dispose()).catch(console.error);
@@ -124,7 +129,7 @@ var vectorize = async (context, text) => {
 // src/query.ts
 var queryHybrid = async (llamaContext, table, reranker, text) => {
   const vector = await vectorize(llamaContext, text);
-  const results = await table.query().nearestTo(vector).fullTextSearch(text).rerank(reranker).limit(env.MDN_SEARCH_RESULTS_LIMIT).toArray();
+  const results = await table.query().nearestTo(vector).column("vector").fullTextSearch(text, { columns: "text" }).rerank(reranker).limit(env.MDN_SEARCH_RESULTS_LIMIT).toArray();
   return results;
 };
 var createReranker = async () => {
@@ -134,7 +139,7 @@ var createReranker = async () => {
 // package.json
 var name = "@deepsweet/mdn";
-var version = "0.1.3";
+var version = "0.3.0";
 // src/server.ts
 var startMcpServer = async () => {
@@ -142,8 +147,7 @@ var startMcpServer = async () => {
   const db = await lancedb2.connect(datasetPath);
   const reranker = await createReranker();
   const server = new McpServer({ name, version });
-  const tableName = getTableName(env.MDN_DATASET_LOCALE);
-  const table = await db.openTable(tableName);
+  const table = await db.openTable(TABLE_NAME);
   const modelPath = await getModelPath();
   const llamaTtl = env.MDN_MODEL_TTL * 1000;
   let llamaContext = null;
@@ -152,6 +156,9 @@ var startMcpServer = async () => {
     description: "Reference documentation for Web API, JavaScript, HTML, CSS, SVG and HTTP",
     inputSchema: z2.object({
       query: z2.string().describe(env.MDN_QUERY_DESCRIPTION)
+    }),
+    outputSchema: z2.object({
+      results: z2.array(z2.string())
     })
   }, async ({ query }) => {
     llamaContext ??= await getLlamaContext(modelPath);
@@ -170,7 +177,10 @@ var startMcpServer = async () => {
       content: results.map((result) => ({
         type: "text",
         text: result.text
-      }))
+      })),
+      structuredContent: {
+        results: results.map((result) => result.text)
+      }
     };
   });
   const transport = new StdioServerTransport;
@@ -196,8 +206,7 @@ var startMcpServer = async () => {
 // src/index.ts
 switch (process.argv[2]) {
   case "download": {
-    const locale = process.argv[3] ?? env.MDN_DATASET_LOCALE;
-    await downloadDataset(locale);
+    await downloadDataset();
     await downloadModel();
     break;
   }
@@ -206,7 +215,7 @@ switch (process.argv[2]) {
     break;
   }
   default: {
-    console.error('Unknown or missing command, use "download" or "server"');
+    console.error('Unknown command, use "download" or "server"');
     process.exit(1);
   }
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@deepsweet/mdn",
-  "version": "0.1.3",
+  "version": "0.3.0",
   "publishConfig": {
     "access": "public"
   },
@@ -27,13 +27,18 @@
     "eslint": "^10.1.0",
     "gray-matter": "^4.0.3",
     "marked": "^17.0.5",
+    "p-all": "^5.0.1",
     "rimraf": "^6.1.3",
     "typescript": "^6.0.2"
   },
   "scripts": {
+    "download": "bun scripts/download.ts",
     "chunk": "bun scripts/chunk.ts",
     "ingest": "bun scripts/ingest.ts",
+    "update": "bun scripts/update.ts",
     "query": "bun scripts/query.ts",
+    "upload": "bun scripts/upload.ts",
+    "test": "bun scripts/test.ts",
     "check": "tsc --noEmit && eslint --cache scripts/ src/",
     "dist": "bun build --format esm --target node --packages external --outdir dist/ src/index.ts"
   },