npm - @agentskillshub/cli - Versions diffs - 0.2.0 → 0.2.2 - Mend

@agentskillshub/cli 0.2.0 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/bin/ash.mjs +27 -1
package/package.json +1 -1

package/bin/ash.mjs CHANGED Viewed

@@ -45,6 +45,13 @@ const GRADE = {
 // CJK detection — Chinese queries have no word boundaries, so we bigram them.
 const CJK = /[一-鿿]/;
+// Generic terms that appear in ~half the catalog — they drown the distinctive
+// part of a query. Ignored during scoring unless the whole query is generic.
+const STOPWORDS = new Set([ // looked up with exact-match Set.has on query tokens
+  "ai", "mcp", "mcps", "agent", "agents", "tool", "tools", "skill", "skills",
+  "server", "servers", "app", "apps", "工具", "服务器", "服务", // CJK: tool, server, service
+]);
 // ─── tiny ANSI (auto-off when not a TTY / NO_COLOR) ──────────────────────────
 const tty = process.stdout.isTTY && !process.env.NO_COLOR;
 const c = (code, s) => (tty ? `\x1b[${code}m${s}\x1b[0m` : s);
@@ -150,8 +157,14 @@ function scoreRow(row, tokens) {
   // English-only repos via our curated scenario titles, and ranks
   // scenario-relevant skills higher. Empty/undefined on older indexes.
   const scen = (row.w || "").toLowerCase();
+  // When the query has a distinctive term, generic tokens (ai/mcp/agent/工具…)
+  // match half the catalog and drown it — "去 AI 味" would rank vercel/ai over
+  // the actual humanizer. Skip generic tokens for scoring UNLESS the whole query
+  // is generic (then they're all we have).
+  const hasContent = tokens.some((t) => !STOPWORDS.has(t));
   let score = 0;
   for (const tok of tokens) {
+    if (hasContent && STOPWORDS.has(tok)) continue;
     if (name === tok) score += 50;
     else if (name.includes(tok)) score += 20;
     if (full.includes(tok)) score += 8;
@@ -181,9 +194,22 @@ function applyFilters(skills, f) {
   });
 }
+/** Tokenize a query. Splits on whitespace AND at latin↔CJK boundaries, so a
+ *  glued mixed query like "ppt制作" becomes ["ppt", "制作"] (otherwise it's one
+ *  token that matches nothing). Pure-CJK compounds still rely on the bigram
+ *  fallback in scoreRow.
+ *
+ *  The result is lowercased, contains no empty strings, and is not
+ *  de-duplicated. Only an ASCII letter or digit directly adjacent to a
+ *  character in the [一-鿿] CJK ideograph range triggers a boundary split;
+ *  other scripts and punctuation stay glued to their neighbours.
+ *
+ *  @param {string} q - Raw query text. Must be a string: the function calls
+ *    q.toLowerCase() without a null/undefined guard.
+ *  @returns {string[]} Lowercased tokens in the order they appear in the query.
+ */
+function tokenize(q) {
+  return q
+    .toLowerCase() // lowercase first so the [a-z0-9] classes below are sufficient
+    .replace(/([a-z0-9])([一-鿿])/g, "$1 $2") // latin→CJK boundary: "ppt制作" → "ppt 制作"
+    .replace(/([一-鿿])([a-z0-9])/g, "$1 $2") // CJK→latin boundary: "去ai" → "去 ai"
+    .split(/\s+/)
+    .filter(Boolean); // drop the empty strings produced by leading/trailing whitespace
+}
 function runSearch(index, args) {
   const f = parseFilters(args);
-  const tokens = f.query.toLowerCase().split(/\s+/).filter(Boolean);
+  const tokens = tokenize(f.query);
   const pool = applyFilters(index.skills, f);
   const ranked = pool
     .map((r) => ({ r, score: scoreRow(r, tokens) }))

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@agentskillshub/cli",
-  "version": "0.2.0",
+  "version": "0.2.2",
   "description": "Search, audit, and install open-source AI agent skills & MCP servers from the terminal — security-graded, quality-scored.",
   "type": "module",
   "bin": {