npm - product-spec-mcp - Versions diffs - 0.3.21 → 0.3.26 - Mend

product-spec-mcp 0.3.21 → 0.3.26

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

package/README.md +14 -0
package/dist/index.cjs +1325 -29
package/docs/online-pm-gate.md +58 -0
package/package.json +6 -2
package/workers/pm-intent-gate.mjs +383 -0
package/workers/schema.sql +24 -0
package/workers/wrangler.toml.example +19 -0

package/docs/online-pm-gate.md ADDED Viewed

@@ -0,0 +1,58 @@
+# Online PM Gate
+The P0 online gate is an HTTP classifier that the local MCP package consults when the local PM Gate decision is low-confidence or internally conflicting. It does not generate long specs; it only helps choose the gate and returns short JSON, which the local MCP package validates and merges.
+## Local MCP Environment
+```bash
+PRODUCT_SPEC_REMOTE_GATE_URL=https://gate.example.com/v1/pm-intent
+PRODUCT_SPEC_REMOTE_GATE_TOKEN=replace-with-token
+PRODUCT_SPEC_REMOTE_GATE_TIMEOUT_MS=2500
+PRODUCT_SPEC_REMOTE_GATE_MODE=auto
+PRODUCT_SPEC_TELEMETRY=off
+```
+Modes:
+- `auto`: only call remote when local gate is low confidence, unknown, or internally conflicting.
+- `off`: never call remote.
+- `force`: call remote for debugging.
+Telemetry:
+- `off`: do not store prompt samples.
+- `minimal`: store hashes and decisions only.
+- `sample`: store redacted prompt samples.
+## Cloudflare Worker
+Files:
+- `workers/pm-intent-gate.mjs`
+- `workers/schema.sql`
+- `workers/wrangler.toml.example`
+Setup outline:
+```bash
+cd workers
+cp wrangler.toml.example wrangler.toml
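+wrangler kv namespace create PROMPT_CACHE        # copy the printed id into wrangler.toml
+wrangler d1 create product-spec-prompt-samples   # copy the printed database_id into wrangler.toml
+wrangler d1 execute product-spec-prompt-samples --remote --file schema.sql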
+wrangler secret put GATE_TOKEN
+wrangler secret put DEEPSEEK_API_KEY
+wrangler secret put RATE_LIMIT_SALT
+wrangler deploy
+```
+Runtime behavior:
+- Prompt cache key: `cache:{model}:{promptHash}:pm-gate-v1`
+- Cache TTL: 7 days
+- LLM quota: 3 non-cached requests per IP per Shanghai calendar day (quota is consumed before the LLM call, so failed LLM calls also count)
+- User message sent to LLM: max 500 characters
+- LLM max output tokens: 600
+- LLM temperature: 0.1
+If the Worker is unreachable, rate-limited, returns invalid JSON, or returns invalid enum fields, the local MCP falls back to the local PM Gate decision.

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "product-spec-mcp",
-  "version": "0.3.21",
+  "version": "0.3.26",
   "description": "MCP Server for product specification - requirement interrogation, architecture decision, UI translation, debug guidance, and acceptance generation",
   "type": "commonjs",
   "main": "dist/index.cjs",
@@ -9,7 +9,11 @@
   },
   "files": [
     "dist/index.cjs",
-    "README.md"
+    "README.md",
+    "docs/online-pm-gate.md",
+    "workers/pm-intent-gate.mjs",
+    "workers/schema.sql",
+    "workers/wrangler.toml.example"
   ],
   "engines": {
     "node": ">=18"

package/workers/pm-intent-gate.mjs ADDED Viewed

@@ -0,0 +1,383 @@
+const GATE_SCHEMA_VERSION = "pm-gate-v1"; // Reported by GET /health and appended to every prompt-cache key.
+const DEFAULT_MODEL = "deepseek-chat"; // Model name used when env.DEEPSEEK_MODEL is not set.
+const DAILY_LIMIT = 3; // Maximum quota-consuming (non-cached) requests allowed per rate-limit key.
+export default {
+  async fetch(request, env) {
+    const url = new URL(request.url);
+    if (request.method === "GET" && url.pathname === "/health") {
+      return json({ ok: true, gateSchemaVersion: GATE_SCHEMA_VERSION });
+    }
+    if (request.method !== "POST" || url.pathname !== "/v1/pm-intent") {
+      return json({ error: "not_found" }, 404);
+    }
+    if (!isAuthorized(request, env)) {
+      return json({ error: "unauthorized" }, 401);
+    }
+    let body;
+    try {
+      body = await request.json();
+    } catch {
+      return json({ error: "invalid_json" }, 400);
+    }
+    const telemetryMode = normalizeTelemetry(request.headers.get("x-product-spec-telemetry") || "off");
+    const message = String(body.message || "").slice(0, 500);
+    const messageHash = body.messageHash || await sha256(normalizeText(message));
+    const model = env.DEEPSEEK_MODEL || DEFAULT_MODEL;
+    const cacheKey = `cache:${model}:${messageHash}:${GATE_SCHEMA_VERSION}`;
+    const cached = await env.PROMPT_CACHE?.get(cacheKey, "json");
+    const ipKey = await rateLimitKey(request, env);
+    const resetAt = nextShanghaiMidnightIso();
+    if (cached?.decision) {
+      await maybeStoreSample(env, telemetryMode, body, cached.decision, cached.decision, {
+        llmUsed: 0,
+        cacheHit: 1,
+        rateLimitStatus: "cache_hit",
+      });
+      return json({
+        decision: cached.decision,
+        llmGate: {
+          used: false,
+          provider: "deepseek",
+          model,
+          promptTokensApprox: cached.promptTokensApprox || 0,
+          completionTokensApprox: cached.completionTokensApprox || 0,
+          cacheHit: true,
+        },
+        rateLimit: {
+          limit: DAILY_LIMIT,
+          remaining: await remainingForKey(env, ipKey),
+          resetAt,
+        },
+        privacy: privacyResult(telemetryMode),
+      });
+    }
+    const limit = await consumeLimit(env, ipKey, resetAt);
+    if (!limit.allowed) {
+      await maybeStoreSample(env, telemetryMode, body, null, body.ruleDecision || {}, {
+        llmUsed: 0,
+        cacheHit: 0,
+        rateLimitStatus: "limited",
+        fallbackReason: "rate_limited",
+      });
+      return json({
+        decision: fallbackDecision(body.ruleDecision),
+        llmGate: { used: false, provider: "deepseek", model, cacheHit: false },
+        rateLimit: { limit: DAILY_LIMIT, remaining: 0, resetAt },
+        privacy: privacyResult(telemetryMode),
+      }, 429);
+    }
+    const prompt = buildGatePrompt(message, body.ruleDecision || {}, body.choices || {});
+    const promptTokensApprox = approxTokens(prompt);
+    let llmDecision;
+    let completionTokensApprox = 0;
+    let fallbackReason = "";
+    try {
+      const llmText = await callDeepSeek(env, model, prompt);
+      completionTokensApprox = approxTokens(llmText);
+      llmDecision = sanitizeDecision(extractJson(llmText));
+      if (!llmDecision) fallbackReason = "invalid_llm_schema";
+    } catch (error) {
+      fallbackReason = error instanceof Error ? error.message : "llm_error";
+    }
+    const finalDecision = llmDecision || fallbackDecision(body.ruleDecision);
+    if (llmDecision && env.PROMPT_CACHE) {
+      await env.PROMPT_CACHE.put(cacheKey, JSON.stringify({
+        decision: finalDecision,
+        promptTokensApprox,
+        completionTokensApprox,
+      }), { expirationTtl: 7 * 24 * 60 * 60 });
+    }
+    await maybeStoreSample(env, telemetryMode, body, llmDecision, finalDecision, {
+      llmUsed: llmDecision ? 1 : 0,
+      cacheHit: 0,
+      promptTokensApprox,
+      completionTokensApprox,
+      rateLimitStatus: "allowed",
+      fallbackReason,
+    });
+    return json({
+      decision: finalDecision,
+      llmGate: {
+        used: Boolean(llmDecision),
+        provider: "deepseek",
+        model,
+        promptTokensApprox,
+        completionTokensApprox,
+        cacheHit: false,
+        ...(fallbackReason ? { fallbackReason } : {}),
+      },
+      rateLimit: {
+        limit: DAILY_LIMIT,
+        remaining: limit.remaining,
+        resetAt,
+      },
+      privacy: privacyResult(telemetryMode),
+    });
+  },
+};
+function isAuthorized(request, env) {
+  if (!env.GATE_TOKEN) return false;
+  return request.headers.get("authorization") === `Bearer ${env.GATE_TOKEN}`;
+}
+function buildGatePrompt(message, rule, choices) {
+  return JSON.stringify({
+    task: "Choose the best PM gate only. Return strict JSON, no markdown.",
+    output: {
+      bestGate: "one needType enum",
+      usageScope: "one usageScope enum",
+      maintenanceMode: "one maintenanceMode enum",
+      accessTopology: "one accessTopology enum",
+      confidence: "high|medium|low",
+      strongSignals: ["short strings"],
+      weakSignals: ["short strings"],
+      coreObjects: ["short strings"],
+      states: ["short strings"],
+      actions: ["short strings"],
+      mustNotUse: ["short ids"],
+      boundaryQuestionIds: ["short ids"],
+    },
+    msg: message,
+    rule: {
+      strong: rule.strongSignals || [],
+      weak: rule.weakSignals || [],
+      shape: rule.technicalShape || rule.shape || "unknown",
+      conflict: Boolean(rule.conflict),
+    },
+    choices,
+  });
+}
+/**
+ * Sends the gate prompt to the DeepSeek chat-completions endpoint and returns
+ * the text of the first choice.
+ *
+ * The request is bounded by a timeout so a stalled upstream cannot hold the
+ * Worker request open indefinitely. Failures are reported with short, stable
+ * error codes because the caller forwards `error.message` to clients as
+ * `fallbackReason`.
+ *
+ * @param {object} env - Worker environment; reads env.DEEPSEEK_API_KEY and the
+ *   optional env.DEEPSEEK_TIMEOUT_MS (milliseconds, defaults to 15000).
+ * @param {string} model - Model name placed in the request body.
+ * @param {string} prompt - User-role message content.
+ * @returns {Promise<string>} Non-empty completion text.
+ * @throws {Error} missing_deepseek_api_key, deepseek_timeout,
+ *   deepseek_http_<status>, deepseek_invalid_json or deepseek_empty_content;
+ *   other network errors from fetch are rethrown unchanged.
+ */
+async function callDeepSeek(env, model, prompt) {
+  if (!env.DEEPSEEK_API_KEY) throw new Error("missing_deepseek_api_key");
+  const configuredTimeout = Number(env.DEEPSEEK_TIMEOUT_MS);
+  const timeoutMs = Number.isFinite(configuredTimeout) && configuredTimeout > 0 ? configuredTimeout : 15000;
+  const isTimeout = (error) => error?.name === "TimeoutError" || error?.name === "AbortError";
+  let response;
+  try {
+    response = await fetch("https://api.deepseek.com/chat/completions", {
+      method: "POST",
+      headers: {
+        "content-type": "application/json",
+        authorization: `Bearer ${env.DEEPSEEK_API_KEY}`,
+      },
+      body: JSON.stringify({
+        model,
+        temperature: 0.1,
+        max_tokens: 600,
+        messages: [
+          { role: "system", content: "You are a terse product intent classifier. Output JSON only." },
+          { role: "user", content: prompt },
+        ],
+      }),
+      signal: AbortSignal.timeout(timeoutMs),
+    });
+  } catch (error) {
+    if (isTimeout(error)) throw new Error("deepseek_timeout", { cause: error });
+    throw error;
+  }
+  if (!response.ok) throw new Error(`deepseek_http_${response.status}`);
+  let data;
+  try {
+    data = await response.json();
+  } catch (error) {
+    // The abort signal also covers the body read, so keep timeouts distinguishable.
+    if (isTimeout(error)) throw new Error("deepseek_timeout", { cause: error });
+    throw new Error("deepseek_invalid_json", { cause: error });
+  }
+  const content = data?.choices?.[0]?.message?.content;
+  if (typeof content !== "string" || !content.trim()) throw new Error("deepseek_empty_content");
+  return content;
+}
+function extractJson(text) {
+  try {
+    return JSON.parse(text);
+  } catch {
+    const start = text.indexOf("{");
+    const end = text.lastIndexOf("}");
+    if (start < 0 || end <= start) return null;
+    try {
+      return JSON.parse(text.slice(start, end + 1));
+    } catch {
+      return null;
+    }
+  }
+}
+function sanitizeDecision(raw) {
+  if (!raw || typeof raw !== "object") return null;
+  const bestGate = raw.bestGate || raw.needType;
+  if (!needTypes.includes(bestGate)) return null;
+  const decision = { bestGate };
+  copyEnum(raw, decision, "usageScope", usageScopes);
+  copyEnum(raw, decision, "maintenanceMode", maintenanceModes);
+  copyEnum(raw, decision, "accessTopology", accessTopologies);
+  copyEnum(raw, decision, "confidence", confidences);
+  copyStringArray(raw, decision, "strongSignals");
+  copyStringArray(raw, decision, "weakSignals");
+  copyStringArray(raw, decision, "coreObjects");
+  copyStringArray(raw, decision, "states");
+  copyStringArray(raw, decision, "actions");
+  copyStringArray(raw, decision, "mustNotUse");
+  copyStringArray(raw, decision, "boundaryQuestionIds");
+  return decision;
+}
+function fallbackDecision(ruleDecision) {
+  return {
+    bestGate: ruleDecision?.needType || "unknown",
+    usageScope: ruleDecision?.usageScope || "unknown",
+    maintenanceMode: ruleDecision?.maintenanceMode || "unknown",
+    accessTopology: ruleDecision?.accessTopology || "unknown",
+    confidence: "low",
+    strongSignals: ruleDecision?.strongSignals || [],
+    weakSignals: ruleDecision?.weakSignals || [],
+    coreObjects: [],
+    states: [],
+    actions: [],
+    mustNotUse: ruleDecision?.mustNotUse || [],
+    boundaryQuestionIds: ruleDecision?.boundaryQuestionIds || ["usage_scope", "maintenance_mode", "data_flow"],
+  };
+}
+async function consumeLimit(env, key, resetAt) {
+  if (!env.PROMPT_CACHE) return { allowed: true, remaining: DAILY_LIMIT - 1 };
+  const current = Number(await env.PROMPT_CACHE.get(key) || "0");
+  if (current >= DAILY_LIMIT) return { allowed: false, remaining: 0 };
+  const next = current + 1;
+  const resetSeconds = Math.max(60, Math.floor((new Date(resetAt).getTime() - Date.now()) / 1000));
+  await env.PROMPT_CACHE.put(key, String(next), { expirationTtl: resetSeconds });
+  return { allowed: true, remaining: Math.max(0, DAILY_LIMIT - next) };
+}
+async function remainingForKey(env, key) {
+  if (!env.PROMPT_CACHE) return DAILY_LIMIT;
+  const current = Number(await env.PROMPT_CACHE.get(key) || "0");
+  return Math.max(0, DAILY_LIMIT - current);
+}
+async function rateLimitKey(request, env) {
+  const ip = request.headers.get("cf-connecting-ip") || request.headers.get("x-forwarded-for") || "unknown";
+  const day = shanghaiDateKey();
+  const salt = env.RATE_LIMIT_SALT || "product-spec";
+  return `rate:${day}:${await sha256(`${salt}:${ip}`)}`;
+}
+async function maybeStoreSample(env, telemetryMode, body, llmDecision, finalDecision, meta) {
+  if (!env.PROMPT_SAMPLES || telemetryMode === "off") return;
+  const id = crypto.randomUUID();
+  const message = String(body.message || "").slice(0, 500);
+  const messageHash = body.messageHash || await sha256(normalizeText(message));
+  const sample = telemetryMode === "sample" ? redact(message) : null;
+  await env.PROMPT_SAMPLES.prepare(
+    `INSERT INTO prompt_samples (
+      id, created_at, package_version, client, telemetry_mode, message_hash, message_sample,
+      rule_decision_json, llm_decision_json, final_decision_json, llm_used, cache_hit,
+      prompt_tokens_approx, completion_tokens_approx, rate_limit_status, fallback_reason
+    ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)`
+  ).bind(
+    id,
+    new Date().toISOString(),
+    body.packageVersion || null,
+    body.client || null,
+    telemetryMode,
+    messageHash,
+    sample,
+    JSON.stringify(body.ruleDecision || {}),
+    llmDecision ? JSON.stringify(llmDecision) : null,
+    JSON.stringify(finalDecision || {}),
+    meta.llmUsed,
+    meta.cacheHit,
+    meta.promptTokensApprox || null,
+    meta.completionTokensApprox || null,
+    meta.rateLimitStatus || null,
+    meta.fallbackReason || null
+  ).run();
+}
+function normalizeTelemetry(value) {
+  return ["off", "minimal", "sample"].includes(value) ? value : "off";
+}
+function privacyResult(telemetryMode) {
+  return {
+    stored: telemetryMode !== "off",
+    mode: telemetryMode,
+    redacted: telemetryMode === "sample",
+  };
+}
+function redact(text) {
+  return text
+    .replace(/[A-Z0-9._%+-]+@[A-Z0-9.-]+\.[A-Z]{2,}/gi, "[EMAIL]")
+    .replace(/(?<!\d)1[3-9]\d{9}(?!\d)/g, "[PHONE]")
+    .replace(/\b\d{15,19}\b/g, "[SENSITIVE_NUMBER]")
+    .replace(/\b(?:sk|pk|api|token|secret)[-_]?[A-Za-z0-9]{16,}\b/gi, "[SECRET]")
+    .replace(/([?&](?:token|key|secret|access_token)=)[^&\s]+/gi, "$1[SECRET]");
+}
+function shanghaiDateKey() {
+  return new Intl.DateTimeFormat("en-CA", {
+    timeZone: "Asia/Shanghai",
+    year: "numeric",
+    month: "2-digit",
+    day: "2-digit",
+  }).format(new Date());
+}
+function nextShanghaiMidnightIso() {
+  const parts = new Intl.DateTimeFormat("en-CA", {
+    timeZone: "Asia/Shanghai",
+    year: "numeric",
+    month: "2-digit",
+    day: "2-digit",
+  }).formatToParts(new Date());
+  const year = Number(parts.find((p) => p.type === "year").value);
+  const month = Number(parts.find((p) => p.type === "month").value);
+  const day = Number(parts.find((p) => p.type === "day").value);
+  const next = new Date(Date.UTC(year, month - 1, day + 1));
+  const y = next.getUTCFullYear();
+  const m = String(next.getUTCMonth() + 1).padStart(2, "0");
+  const d = String(next.getUTCDate()).padStart(2, "0");
+  return `${y}-${m}-${d}T00:00:00+08:00`;
+}
+async function sha256(text) {
+  const bytes = new TextEncoder().encode(text);
+  const digest = await crypto.subtle.digest("SHA-256", bytes);
+  return [...new Uint8Array(digest)].map((byte) => byte.toString(16).padStart(2, "0")).join("");
+}
+function normalizeText(text) {
+  return text.trim().replace(/\s+/g, " ");
+}
+function approxTokens(text) {
+  return Math.ceil(String(text || "").length / 4);
+}
+function copyEnum(raw, decision, key, allowed) {
+  if (raw[key] !== undefined && allowed.includes(raw[key])) decision[key] = raw[key];
+}
+function copyStringArray(raw, decision, key) {
+  if (Array.isArray(raw[key])) decision[key] = raw[key].filter((item) => typeof item === "string").slice(0, 12);
+}
+function json(payload, status = 200) {
+  return new Response(JSON.stringify(payload), {
+    status,
+    headers: { "content-type": "application/json; charset=utf-8" },
+  });
+}
+const needTypes = [ // Allowed gate values; sanitizeDecision rejects any LLM answer whose gate is not listed here.
+  "static_display",
+  "personal_local_tool",
+  "multi_user_collaboration",
+  "content_marketing_site",
+  "data_visualization_site",
+  "transaction_workflow",
+  "content_knowledge",
+  "ai_automation",
+  "unknown",
+];
+const usageScopes = ["self", "fixed_group", "public_audience", "unknown"]; // Allowed `usageScope` values.
+const maintenanceModes = ["agent_assisted", "manual_files", "web_admin", "visitor_submission", "runtime_collaboration", "unknown"]; // Allowed `maintenanceMode` values.
+const accessTopologies = ["single_device", "lan_only", "internet_ip", "public_domain", "unknown"]; // Allowed `accessTopology` values.
+const confidences = ["high", "medium", "low"]; // Allowed `confidence` values.

package/workers/schema.sql ADDED Viewed

@@ -0,0 +1,24 @@
+CREATE TABLE IF NOT EXISTS prompt_samples ( -- One row per gate request recorded while telemetry is not "off".
+  id TEXT PRIMARY KEY, -- Random UUID generated by the worker.
+  created_at TEXT NOT NULL, -- ISO-8601 timestamp taken at insert time.
+  package_version TEXT, -- Client-reported package version, if sent.
+  client TEXT, -- Client-reported client identifier, if sent.
+  telemetry_mode TEXT NOT NULL, -- "minimal" or "sample".
+  message_hash TEXT NOT NULL, -- Client-supplied hash, or SHA-256 of the normalized message.
+  message_sample TEXT, -- Redacted message text; filled only in "sample" mode.
+  rule_decision_json TEXT NOT NULL, -- Local rule decision sent by the client, as JSON.
+  llm_decision_json TEXT, -- Sanitized LLM decision as JSON; NULL when none was available.
+  final_decision_json TEXT NOT NULL, -- Decision recorded for the request, as JSON.
+  llm_used INTEGER NOT NULL, -- 1 when a valid LLM decision was produced for this request, else 0.
+  cache_hit INTEGER NOT NULL, -- 1 when the decision came from the prompt cache, else 0.
+  prompt_tokens_approx INTEGER, -- Approximate prompt size (characters / 4).
+  completion_tokens_approx INTEGER, -- Approximate completion size (characters / 4).
+  rate_limit_status TEXT, -- "cache_hit", "limited" or "allowed".
+  fallback_reason TEXT -- Why the LLM decision was not used, when applicable.
+);
+CREATE INDEX IF NOT EXISTS idx_prompt_samples_created_at -- Index on the insert timestamp.
+ON prompt_samples(created_at);
+CREATE INDEX IF NOT EXISTS idx_prompt_samples_message_hash -- Index on the message hash.
+ON prompt_samples(message_hash);

package/workers/wrangler.toml.example ADDED Viewed

@@ -0,0 +1,19 @@
+name = "product-spec-pm-intent-gate"
+main = "pm-intent-gate.mjs" # Worker entry module.
+compatibility_date = "2026-06-23"
+kv_namespaces = [ # The worker reads this binding as env.PROMPT_CACHE (decision cache and rate-limit counters).
+  { binding = "PROMPT_CACHE", id = "replace-with-kv-namespace-id" }
+]
+d1_databases = [ # The worker reads this binding as env.PROMPT_SAMPLES (telemetry rows).
+  { binding = "PROMPT_SAMPLES", database_name = "product-spec-prompt-samples", database_id = "replace-with-d1-database-id" }
+]
+[vars]
+DEEPSEEK_MODEL = "deepseek-chat" # Read as env.DEEPSEEK_MODEL; the worker falls back to "deepseek-chat" when unset.
+# Secrets to set with wrangler:
+# wrangler secret put GATE_TOKEN
+# wrangler secret put DEEPSEEK_API_KEY
+# wrangler secret put RATE_LIMIT_SALT