npm - local-model-suitability-mcp - Versions diffs - 1.1.22 → 1.1.24 - Mend

local-model-suitability-mcp 1.1.22 → 1.1.24

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions exactly as they appear in their respective public registries.

Files changed (4)

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,13 @@
 # Changelog
+## [1.1.24] - 2026-06-26
+- fix: trial extension requests now written to Redis (lms:trial:{email}) on grant -- permanent audit trail that survives redeploys; previously in-memory only
+## [1.1.23] - 2026-06-25
+- feat: calls_remaining field added to check_local_viability response -- "unlimited" for paid keys, numeric free-tier headroom otherwise (HTTP POST and stdio transports)
+- feat: verdict_ttl field added (86400s/24h)
+- feat: data_source_status field added (full/degraded) -- "degraded" when Anthropic responds but returns unparseable output and a fallback verdict is used; "full" otherwise, including the CONFIDENTIAL local-rule shortcut which never calls Anthropic
 ## [1.1.22] - 2026-06-24
 - feat: unauthenticated /public-stats endpoint -- first_deployed, lifetime tool calls, uptime %, version, for agent orchestrators evaluating server trustworthiness
 - feat: /process-trial-followups endpoint + 24h follow-up record on trial-extension grant

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "local-model-suitability-mcp",
   "mcpName": "io.github.OjasKord/local-model-suitability-mcp",
-  "version": "1.1.22",
+  "version": "1.1.24",
   "description": "AI model router for agents. Checks whether a local model can handle the task before calling cloud inference. LOCAL/CLOUD verdict saves cost on every call.",
   "main": "src/server.js",
   "type": "module",

package/server.json CHANGED Viewed

@@ -1,36 +1,36 @@
-{
-  "$schema": "https://static.modelcontextprotocol.io/schemas/2025-12-11/server.schema.json",
-  "name": "io.github.OjasKord/local-model-suitability-mcp",
-  "title": "Local Model Suitability MCP",
-  "description": "Check if a task runs locally vs cloud. Save money on calls that don't need cloud inference.",
-  "version": "1.1.16",
-  "websiteUrl": "https://kordagencies.com",
-  "repository": {
-    "url": "https://github.com/OjasKord/local-model-suitability-mcp",
-    "source": "github"
-  },
-  "packages": [
-    {
-      "registryType": "npm",
-      "identifier": "local-model-suitability-mcp",
-      "version": "1.1.16",
-      "transport": {
-        "type": "stdio"
-      },
-      "environmentVariables": [
-        {
-          "name": "ANTHROPIC_API_KEY",
-          "description": "Anthropic API key for Claude routing analysis",
-          "isRequired": true,
-          "isSecret": true
-        }
-      ]
-    }
-  ],
-  "remotes": [
-    {
-      "type": "streamable-http",
-      "url": "https://local-model-suitability-mcp-production.up.railway.app"
-    }
-  ]
-}
+{
+  "$schema": "https://static.modelcontextprotocol.io/schemas/2025-12-11/server.schema.json",
+  "name": "io.github.OjasKord/local-model-suitability-mcp",
+  "title": "Local Model Suitability MCP",
+  "description": "Check if a task runs locally vs cloud. Save money on calls that don't need cloud inference.",
+  "version": "1.1.23",
+  "websiteUrl": "https://kordagencies.com",
+  "repository": {
+    "url": "https://github.com/OjasKord/local-model-suitability-mcp",
+    "source": "github"
+  },
+  "packages": [
+    {
+      "registryType": "npm",
+      "identifier": "local-model-suitability-mcp",
+      "version": "1.1.23",
+      "transport": {
+        "type": "stdio"
+      },
+      "environmentVariables": [
+        {
+          "name": "ANTHROPIC_API_KEY",
+          "description": "Anthropic API key for Claude routing analysis",
+          "isRequired": true,
+          "isSecret": true
+        }
+      ]
+    }
+  ],
+  "remotes": [
+    {
+      "type": "streamable-http",
+      "url": "https://local-model-suitability-mcp-production.up.railway.app"
+    }
+  ]
+}

package/src/server.js CHANGED Viewed

@@ -3,7 +3,7 @@ import { createHmac, timingSafeEqual } from 'crypto';
 import { readFileSync, writeFileSync } from 'fs';
 import Anthropic from '@anthropic-ai/sdk';
-const VERSION = '1.1.22';
+const VERSION = '1.1.24';
 const FIRST_DEPLOYED = '2026-04-13T06:41:38Z';
 const LIFETIME_CALLS_REDIS_KEY = 'lms:lifetime_calls';
 const UPTIME_HEARTBEAT_KEY = 'lms:uptime:heartbeat_count';
@@ -16,6 +16,8 @@ const ENTERPRISE_UPGRADE_URL = 'https://buy.stripe.com/28E9AS27PbPvfkoe7Sebu0q';
 const ALLOWED_PAYMENT_LINK_IDS = ['plink_1TQzCBD6WvRe6sn3H1q5t2LF', 'plink_1TQzDSD6WvRe6sn3UM2G1EgX'];
 const PERSIST_FILE = '/tmp/lms_stats.json';
 const LEGAL_DISCLAIMER = 'AI-powered routing analysis. We do not log or store your task content. Results are for cost-optimisation guidance only. Provider maximum liability is limited to subscription fees paid in the preceding 3 months. Full terms: kordagencies.com/terms.html';
+// Caching/staleness policy per tool, in seconds.
+const VERDICT_TTL = { check_local_viability: 86400 };
 function nowISO() { return new Date().toISOString(); }
@@ -382,6 +384,8 @@ async function checkLocalViability(task, qualityThreshold, dataSensitivity) {
       cloud_justified_reason: null,
       data_sensitivity_override: true,
       analysis_type: 'AI-powered cost routing — NOT a simple lookup',
+      verdict_ttl: VERDICT_TTL.check_local_viability,
+      data_source_status: 'full',
       _disclaimer: LEGAL_DISCLAIMER
     };
   }
@@ -429,6 +433,7 @@ Respond ONLY with a JSON object — no markdown, no explanation outside the JSON
   const raw = response.content[0].text.trim();
   let parsed;
+  let aiDegraded = false;
   try {
     parsed = JSON.parse(raw);
   } catch(e) {
@@ -441,6 +446,7 @@ Respond ONLY with a JSON object — no markdown, no explanation outside the JSON
       recommended_local_models: ['llama3.2:8b', 'mistral-7b'],
       cloud_justified_reason: null
     };
+    aiDegraded = true;
   }
   const _rLms = {
@@ -448,6 +454,8 @@ Respond ONLY with a JSON object — no markdown, no explanation outside the JSON
     task_quality_threshold: quality,
     data_sensitivity: sensitivity,
     analysis_type: 'AI-powered cost routing — NOT a simple lookup',
+    verdict_ttl: VERDICT_TTL.check_local_viability,
+    data_source_status: aiDegraded ? 'degraded' : 'full',
     checked_at: nowISO(),
     _disclaimer: LEGAL_DISCLAIMER
   };
@@ -707,6 +715,7 @@ const server = createServer(async (req, res) => {
         stats.free_tier_calls_by_ip[clientIp][month] = Math.max(0, current - TRIAL_EXTENSION_CALLS);
         trialExtensions.set(emailKey, { name, email, use_case: use_case || '', ip: clientIp, granted_at: nowISO() });
         saveStats();
+        await redisSet(REDIS_PREFIX + ':trial:' + email.toLowerCase().trim(), { name, email, use_case: use_case || '', ip: clientIp, timestamp: nowISO(), server: 'local-model-suitability-mcp' });
         // 24h follow-up record -- processed by /process-trial-followups (fleet cron)
         await redisSet(REDIS_PREFIX + ':followup:' + email.toLowerCase().trim(), { email, name, server: 'local-model-suitability-mcp', granted_at: nowISO(), sent: false });
         const sendTrialEmail = async (to, subject, html) => {
@@ -890,9 +899,11 @@ const server = createServer(async (req, res) => {
               redisIncr(LIFETIME_CALLS_REDIS_KEY).catch(() => {});
               logCall('check_local_viability', access.tier, clientIp);
               appendSessionLog(clientIp, 'check_local_viability').catch((e) => console.error('[SessionLog] appendSessionLog failed:', e));
+              const callsRemaining = access.tier === 'free' ? Math.max(0, FREE_TIER_LIMIT - getFreeTierCount(clientIp)) : 'unlimited';
               try {
                 const result = await checkLocalViability(task, quality_threshold, data_sensitivity);
+                result.calls_remaining = callsRemaining;
                 // Partial response for free tier
                 if (access.tier === 'free') {
@@ -902,6 +913,7 @@ const server = createServer(async (req, res) => {
                     reason: result.reason,
                     analysis_type: result.analysis_type,
                     checked_at: result.checked_at,
+                    calls_remaining: result.calls_remaining,
                     _disclaimer: result._disclaimer,
                     upgrade_url: PRO_UPGRADE_URL
                   };
@@ -977,6 +989,7 @@ function setupStdio() {
         } else {
           try {
             const result = await checkLocalViability(task, quality_threshold, data_sensitivity);
+            result.calls_remaining = 'unlimited';
             response = { jsonrpc: '2.0', id: req.id, result: { content: [{ type: 'text', text: JSON.stringify(result) }] } };
           } catch(e) {
             response = { jsonrpc: '2.0', id: req.id, result: { content: [{ type: 'text', text: JSON.stringify({ error: e.message, likely_cause: 'AI routing analysis failed — transient Anthropic API issue', retryable: true, retry_after_ms: 120000, fallback_tool: null, agent_action: 'RETRY_IN_2_MIN', category: 'ai_failure', trace_id: nowISO(), _disclaimer: LEGAL_DISCLAIMER }) }] } };