npm - shellward - Versions diffs - 0.5.16 → 0.6.0 - Mend

shellward 0.5.16 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

package/README.md +95 -30
package/dist/auto-check.d.ts +1 -0
package/dist/auto-check.js +12 -1
package/dist/commands/index.d.ts +2 -1
package/dist/commands/index.js +7 -0
package/dist/commands/scan-mcp.d.ts +2 -0
package/dist/commands/scan-mcp.js +105 -0
package/dist/core/engine.d.ts +35 -0
package/dist/core/engine.js +225 -30
package/dist/index.d.ts +4 -2
package/dist/index.js +18 -3
package/dist/mcp-baseline.d.ts +27 -0
package/dist/mcp-baseline.js +73 -0
package/dist/mcp-client.d.ts +29 -0
package/dist/mcp-client.js +264 -0
package/dist/mcp-server.js +64 -9
package/dist/rules/dangerous-commands.js +6 -2
package/dist/rules/injection-en.js +27 -2
package/dist/rules/injection-zh.js +27 -4
package/dist/rules/sensitive-patterns.d.ts +13 -1
package/dist/rules/sensitive-patterns.js +32 -5
package/dist/rules/tool-poisoning.d.ts +8 -0
package/dist/rules/tool-poisoning.js +96 -0
package/dist/types.d.ts +32 -0
package/dist/types.js +3 -1
package/package.json +4 -2
package/server.json +2 -2
package/src/auto-check.ts +11 -1
package/src/commands/index.ts +9 -1
package/src/commands/scan-mcp.ts +118 -0
package/src/core/engine.ts +250 -31
package/src/index.ts +25 -5
package/src/mcp-baseline.ts +97 -0
package/src/mcp-client.ts +268 -0
package/src/mcp-server.ts +71 -9
package/src/rules/dangerous-commands.ts +6 -2
package/src/rules/injection-en.ts +27 -2
package/src/rules/injection-zh.ts +27 -4
package/src/rules/sensitive-patterns.ts +37 -5
package/src/rules/tool-poisoning.ts +108 -0
package/src/types.ts +38 -1

package/src/rules/tool-poisoning.ts ADDED Viewed

@@ -0,0 +1,108 @@
+// src/rules/tool-poisoning.ts — MCP tool-poisoning detection rules
+//
+// Tool poisoning = malicious instructions hidden in an MCP tool's *metadata*
+// (description / parameter descriptions) that the LLM reads but the human never
+// sees in the UI. These are distinct from generic prompt-injection in user text:
+// they target the agent at tool-discovery time. Patterns below are tuned for the
+// common public PoCs (Invariant Labs, MCP-Shield, Snyk agent-scan).
+export interface ToolPoisonRule { // shape of one entry in TOOL_POISONING_RULES
+  id: string // rule identifier; every built-in entry in this file uses a `tp_` prefix
+  name: string // human-readable label (the built-in entries use English or Chinese text)
+  pattern: RegExp // expression that flags suspicious text; presumably tested against tool/parameter descriptions — confirm in the engine
+  riskScore: number // weight of a match; built-ins range 25-45, and the entries scored 25 are described as "below threshold"
+  category: 'hidden_instruction' | 'data_access' | 'exfiltration' | 'concealment' | 'shadowing' // coarse grouping; NOTE(review): no built-in rule in this file uses 'shadowing'
+}
+/**
+ * Built-in rules for detecting tool poisoning in MCP tool metadata.
+ *
+ * Every rule carries its own `riskScore`. Rules scored 25 are intentionally
+ * weak (see the per-rule notes): a bare sensitive path or side-channel hostname
+ * is meant to corroborate another signal rather than decide on its own.
+ *
+ * Patterns are grouped by category in the order: hidden instructions,
+ * concealment, sensitive data access, exfiltration.
+ */
+export const TOOL_POISONING_RULES: ToolPoisonRule[] = [
+  // ===== Hidden instruction markup =====
+  {
+    id: 'tp_important_tag',
+    name: 'Hidden <IMPORTANT>/<system> directive in description',
+    // Opening pseudo-tag only; whitespace inside the angle brackets is tolerated.
+    pattern: /<\s*(?:important|system|secret|instructions?|admin)\s*>/i,
+    riskScore: 45,
+    category: 'hidden_instruction',
+  },
+  {
+    id: 'tp_before_using',
+    name: 'Pre-tool instruction injection',
+    pattern: /before\s+(?:using|calling|invoking|running)\s+(?:any\s+other|this|the|another)\s+tool/i,
+    riskScore: 40,
+    category: 'hidden_instruction',
+  },
+  {
+    id: 'tp_zh_before_using',
+    name: '工具描述内前置指令注入',
+    // Chinese counterpart of tp_before_using ("before using/calling/running ... tool").
+    pattern: /(?:在使用|调用|执行)(?:任何)?(?:其他|这个|该)?工具(?:之前|前)/,
+    riskScore: 40,
+    category: 'hidden_instruction',
+  },
+  // ===== Concealment ("don't tell the user") =====
+  {
+    id: 'tp_do_not_tell',
+    name: 'Instruction to hide activity from user',
+    // Accepts both the ASCII apostrophe and the typographic one (U+2019) so that
+    // "don’t tell the user" cannot slip past the rule.
+    pattern: /(?:do\s+not|don['\u2019]?t|never)\s+(?:tell|inform|mention|notify|reveal|show)\s+(?:to\s+)?(?:the\s+)?(?:user|human|operator)/i,
+    riskScore: 45,
+    category: 'concealment',
+  },
+  {
+    id: 'tp_zh_do_not_tell',
+    name: '指示对用户隐藏行为',
+    // `别` counts as the prohibition "don't" only when it does not close a common
+    // compound (识别, 区别, 特别, 分别, 类别, 级别, 性别, 个别, ...). Without the
+    // lookbehind, benign text such as "识别用户身份" or "分别通知用户" matched as
+    // concealment and, at this score, was enough to trip the rule on its own.
+    pattern: /(?:不要|不得|切勿|(?<![识区特分类级性个辨鉴判差甄组])别)(?:告诉|告知|提示|通知|让)?(?:用户|使用者)(?:知道|看到|发现)?/,
+    riskScore: 45,
+    category: 'concealment',
+  },
+  {
+    id: 'tp_without_user',
+    name: 'Act without user knowledge/consent',
+    // Possessive apostrophe may be ASCII or typographic (U+2019).
+    pattern: /without\s+(?:the\s+)?(?:user['\u2019]?s?\s+)?(?:knowledge|consent|awareness|noticing|telling)/i,
+    riskScore: 40,
+    category: 'concealment',
+  },
+  // ===== Sensitive data access from a tool description =====
+  {
+    id: 'tp_read_secrets',
+    // Bare mention of a sensitive path is only weakly suspicious — legitimate
+    // tools (dotenv loaders, ssh managers) and security tools name these too.
+    // Scored below threshold so it must corroborate another signal to block.
+    name: 'Description references sensitive files',
+    pattern: /(?:~\/\.ssh|id_rsa|\.aws\/credentials|\.env\b|\.cursor\/mcp\.json|\.npmrc|\/etc\/passwd|\.config\/.*(?:token|secret|credential))/i,
+    riskScore: 25,
+    category: 'data_access',
+  },
+  {
+    id: 'tp_pass_file_contents',
+    name: 'Description asks to pass file/secret contents as a parameter',
+    pattern: /(?:pass|include|read|send|provide|attach)\s+(?:the\s+)?(?:full\s+)?(?:contents?|content|value)\s+of\s+(?:the\s+)?(?:file|\S*(?:key|token|secret|password|credential))/i,
+    riskScore: 35,
+    category: 'data_access',
+  },
+  // ===== Exfiltration hints =====
+  {
+    id: 'tp_exfil_url',
+    name: 'Description instructs sending data to a URL',
+    // Verb + optional object + "to"/"via" + either a literal http(s) URL or a
+    // generic destination noun ("the webhook", "the endpoint", ...).
+    pattern: /(?:send|transmit|upload|post|exfiltrate|forward)\s+(?:it|this|the\s+\w+|data|results?)?\s*(?:to|via)\s+(?:https?:\/\/|the\s+(?:webhook|endpoint|server|url))/i,
+    riskScore: 40,
+    category: 'exfiltration',
+  },
+  {
+    id: 'tp_exfiltrate_verb',
+    // "exfiltrate" in a tool description is almost never benign.
+    name: 'Exfiltration verb in description',
+    pattern: /\bexfiltrat(?:e|ion|ing)\b/i,
+    riskScore: 35,
+    category: 'exfiltration',
+  },
+  {
+    id: 'tp_sidechannel',
+    // A bare side-channel hostname is weak on its own (could be documentation);
+    // scored below threshold so it must accompany another signal to block.
+    name: 'Known exfiltration side-channel keyword',
+    pattern: /\b(?:webhook\.site|requestbin|pastebin|ngrok\.io|burpcollaborator|interact\.sh|oast\b)/i,
+    riskScore: 25,
+    category: 'exfiltration',
+  },
+]

package/src/types.ts CHANGED Viewed

@@ -16,6 +16,41 @@ export interface ShellWardConfig {
     sessionGuard: boolean
   }
   injectionThreshold: number
+  /** User-supplied rules merged on top of the built-ins (additive; allowedTools wins). */
+  customRules?: CustomRules
+}
+/** A user-defined PII/secret pattern. The regex is carried as source text (not a RegExp) so the rule can live in JSON. */
+export interface CustomSensitivePattern {
+  id: string // identifier for this custom pattern
+  name: string // human-readable label
+  pattern: string // regular-expression source text
+  flags?: string // presumably RegExp flags applied together with `pattern` — confirm against the engine
+  replacement?: string // presumably the text substituted for a match when redacting — confirm against the engine
+}
+/** A user-defined dangerous-command pattern, supplied through `CustomRules.dangerousCommands`. */
+export interface CustomCommandRule {
+  id: string // identifier for this custom rule
+  pattern: string // presumably regular-expression source text, as in CustomSensitivePattern — confirm
+  flags?: string // presumably RegExp flags applied together with `pattern` — confirm against the engine
+  description?: string // optional free-text explanation of the rule
+}
+/**
+ * Extension points for any platform embedding ShellWard. All fields are optional
+ * and ADDITIVE on top of the built-in rules — except `allowedTools`, which always
+ * wins (a tool listed there is never blocked and is treated as low-risk).
+ */
+export interface CustomRules {
+  blockedTools?: string[] // presumably tool names that should always be blocked — confirm against the engine
+  allowedTools?: string[] // tool names that are never blocked and are treated as low-risk; takes precedence over the other lists
+  sensitiveTools?: string[] // NOTE(review): semantics not visible in this hunk — presumably tools that touch sensitive data
+  outboundTools?: string[] // NOTE(review): semantics not visible in this hunk — presumably tools that can send data out
+  honeypotPaths?: string[] // NOTE(review): semantics not visible in this hunk — presumably decoy paths whose access is flagged
+  sensitivePatterns?: CustomSensitivePattern[] // extra PII/secret patterns added to the built-ins
+  dangerousCommands?: CustomCommandRule[] // extra dangerous-command patterns added to the built-ins
+  injectionRules?: InjectionRule[] // extra injection rules; InjectionRule is declared outside this hunk
 }
 export type ResolvedLocale = 'zh' | 'en'
@@ -80,7 +115,9 @@ export const DEFAULT_CONFIG: ShellWardConfig = {
     dataFlowGuard: true,
     sessionGuard: true,
   },
-  injectionThreshold: 60,
+  // 40 catches single high-confidence signals (one strong rule = a block) while
+  // keeping benign "act as…"-style phrasing (≤35) safe. Calibrated against bench/.
+  injectionThreshold: 40,
 }
 /**