npm - security-mcp - Versions diffs - 1.1.4 → 1.3.3 - Mend

security-mcp 1.1.4 → 1.3.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (158) hide show

package/README.md +341 -1018
package/defaults/checklists/ai.json +20 -1
package/defaults/checklists/api.json +35 -1
package/defaults/checklists/infra.json +34 -1
package/defaults/checklists/mobile.json +23 -1
package/defaults/checklists/payments.json +15 -1
package/defaults/checklists/web.json +11 -1
package/defaults/cloud-controls/aws.json +10712 -0
package/defaults/cloud-controls/azure.json +7201 -0
package/defaults/cloud-controls/gcp.json +4061 -0
package/defaults/control-catalog.json +24 -0
package/defaults/security-policy.json +2 -2
package/dist/ci/pr-gate.js +22 -5
package/dist/cli/index.js +73 -2
package/dist/cli/install.js +4 -55
package/dist/cli/onboarding.js +18 -10
package/dist/gate/baseline.js +82 -7
package/dist/gate/catalog.js +10 -2
package/dist/gate/checks/agentic-instructions.js +515 -0
package/dist/gate/checks/ai-governance.js +132 -0
package/dist/gate/checks/ai.js +757 -39
package/dist/gate/checks/auth-deep.js +920 -216
package/dist/gate/checks/business-logic.js +751 -0
package/dist/gate/checks/ci-pipeline.js +399 -4
package/dist/gate/checks/cloud-controls.js +69 -0
package/dist/gate/checks/crypto.js +423 -2
package/dist/gate/checks/data-platform.js +954 -0
package/dist/gate/checks/dependencies.js +582 -15
package/dist/gate/checks/docker-deep.js +1236 -0
package/dist/gate/checks/gitops.js +724 -0
package/dist/gate/checks/graphql.js +201 -19
package/dist/gate/checks/iac.js +1230 -0
package/dist/gate/checks/infra.js +246 -1
package/dist/gate/checks/injection-deep.js +827 -184
package/dist/gate/checks/k8s.js +955 -2
package/dist/gate/checks/mobile-android.js +917 -3
package/dist/gate/checks/mobile-ios.js +797 -5
package/dist/gate/checks/required-artifacts.js +194 -0
package/dist/gate/checks/runtime.js +178 -0
package/dist/gate/checks/secrets.js +256 -13
package/dist/gate/checks/supply-chain-deep.js +787 -0
package/dist/gate/checks/web-nextjs.js +572 -48
package/dist/gate/cloud-controls/apply.js +115 -0
package/dist/gate/cloud-controls/bicep.js +36 -0
package/dist/gate/cloud-controls/cfn.js +125 -0
package/dist/gate/cloud-controls/detect.js +104 -0
package/dist/gate/cloud-controls/hcl.js +140 -0
package/dist/gate/cloud-controls/types.js +87 -0
package/dist/gate/diff.js +17 -5
package/dist/gate/evidence.js +8 -1
package/dist/gate/exceptions.js +202 -9
package/dist/gate/findings.js +15 -2
package/dist/gate/policy.js +316 -130
package/dist/gate/threat-intel.js +6 -0
package/dist/mcp/audit-chain.js +131 -28
package/dist/mcp/auth.js +169 -0
package/dist/mcp/learning.js +129 -4
package/dist/mcp/model-router.js +161 -24
package/dist/mcp/orchestration.js +377 -89
package/dist/mcp/server.js +460 -69
package/dist/mcp/tool-audit.js +193 -0
package/dist/repo/fs.js +37 -1
package/dist/repo/search.js +31 -6
package/dist/review/store.js +56 -3
package/dist/tests/run.js +124 -1
package/package.json +9 -9
package/skills/_TEMPLATE/SKILL.md +99 -0
package/skills/advanced-dos-tester/SKILL.md +118 -0
package/skills/agentic-instruction-auditor/SKILL.md +111 -0
package/skills/agentic-loop-exploiter/SKILL.md +377 -0
package/skills/ai-llm-redteam/SKILL.md +113 -0
package/skills/ai-model-supply-chain-agent/SKILL.md +112 -0
package/skills/algorithm-implementation-reviewer/SKILL.md +107 -0
package/skills/android-penetration-tester/SKILL.md +464 -46
package/skills/anti-replay-tester/SKILL.md +115 -0
package/skills/appsec-code-auditor/SKILL.md +94 -0
package/skills/artifact-integrity-analyst/SKILL.md +450 -0
package/skills/attack-navigator/SKILL.md +476 -8
package/skills/auth-session-hacker/SKILL.md +111 -0
package/skills/aws-penetration-tester/SKILL.md +510 -0
package/skills/azure-penetration-tester/SKILL.md +542 -3
package/skills/binary-auth-validator/SKILL.md +120 -0
package/skills/bot-detection-specialist/SKILL.md +118 -0
package/skills/business-logic-attacker/SKILL.md +240 -0
package/skills/capec-code-mapper/SKILL.md +93 -0
package/skills/cert-pin-rotation-specialist/SKILL.md +121 -0
package/skills/cicd-pipeline-hijacker/SKILL.md +414 -0
package/skills/ciso-orchestrator/SKILL.md +465 -43
package/skills/cloud-infra-specialist/SKILL.md +127 -0
package/skills/compliance-gap-analyst/SKILL.md +431 -0
package/skills/compliance-grc/SKILL.md +94 -0
package/skills/compliance-lifecycle-tracker/SKILL.md +93 -0
package/skills/container-hardening-auditor/SKILL.md +125 -0
package/skills/credential-stuffing-specialist/SKILL.md +111 -0
package/skills/crypto-pki-specialist/SKILL.md +96 -0
package/skills/csa-ccm-mapper/SKILL.md +93 -0
package/skills/csf2-governance-mapper/SKILL.md +93 -0
package/skills/data-platform-auditor/SKILL.md +125 -0
package/skills/deep-link-fuzzer/SKILL.md +118 -0
package/skills/dependency-confusion-attacker/SKILL.md +424 -0
package/skills/device-integrity-aggregator/SKILL.md +117 -0
package/skills/dos-resilience-tester/SKILL.md +106 -0
package/skills/dread-scorer/SKILL.md +93 -0
package/skills/egress-policy-enforcer/SKILL.md +108 -0
package/skills/evidence-collector/SKILL.md +107 -0
package/skills/file-upload-attacker/SKILL.md +118 -0
package/skills/gcp-penetration-tester/SKILL.md +510 -2
package/skills/git-history-secret-scanner/SKILL.md +115 -0
package/skills/gitops-delivery-auditor/SKILL.md +120 -0
package/skills/iac-security-auditor/SKILL.md +125 -0
package/skills/iam-privesc-graph-builder/SKILL.md +161 -0
package/skills/incident-responder/SKILL.md +120 -0
package/skills/injection-specialist/SKILL.md +111 -0
package/skills/ios-security-auditor/SKILL.md +291 -0
package/skills/json-ambiguity-tester/SKILL.md +145 -0
package/skills/k8s-container-escaper/SKILL.md +406 -0
package/skills/key-management-lifecycle-analyst/SKILL.md +107 -0
package/skills/kill-switch-engineer/SKILL.md +111 -0
package/skills/linddun-privacy-analyst/SKILL.md +111 -0
package/skills/logic-race-fuzzer/SKILL.md +452 -0
package/skills/mobile-api-network-attacker/SKILL.md +430 -0
package/skills/mobile-binary-hardener/SKILL.md +111 -0
package/skills/mobile-security-specialist/SKILL.md +94 -0
package/skills/mobile-webview-auditor/SKILL.md +105 -0
package/skills/model-extraction-attacker/SKILL.md +228 -0
package/skills/multipart-abuse-tester/SKILL.md +93 -0
package/skills/oauth-pkce-specialist/SKILL.md +113 -0
package/skills/parser-exhaustion-tester/SKILL.md +151 -0
package/skills/pentest-infra/SKILL.md +107 -0
package/skills/pentest-social/SKILL.md +210 -0
package/skills/pentest-team/SKILL.md +96 -0
package/skills/pentest-web-api/SKILL.md +107 -0
package/skills/privacy-flow-analyst/SKILL.md +243 -0
package/skills/prompt-injection-specialist/SKILL.md +403 -0
package/skills/quantum-migration-planner/SKILL.md +105 -0
package/skills/rag-poisoning-specialist/SKILL.md +367 -0
package/skills/registry-mirror-enforcer/SKILL.md +93 -0
package/skills/rotation-validation-agent/SKILL.md +121 -0
package/skills/samm-assessor/SKILL.md +94 -0
package/skills/secrets-mask-bypass-tester/SKILL.md +109 -0
package/skills/senior-security-engineer/SKILL.md +178 -0
package/skills/serialization-memory-attacker/SKILL.md +341 -0
package/skills/session-timeout-tester/SKILL.md +170 -0
package/skills/slsa-level3-enforcer/SKILL.md +121 -0
package/skills/slsa-provenance-enforcer/SKILL.md +111 -0
package/skills/ssrf-detection-validator/SKILL.md +117 -0
package/skills/step-up-auth-enforcer/SKILL.md +93 -0
package/skills/stride-pasta-analyst/SKILL.md +429 -0
package/skills/supply-chain-devsecops/SKILL.md +107 -0
package/skills/threat-infrastructure-analyst/SKILL.md +93 -0
package/skills/threat-modeler/SKILL.md +94 -0
package/skills/tls-certificate-auditor/SKILL.md +582 -18
package/skills/token-reuse-detector/SKILL.md +104 -0
package/skills/trike-risk-modeler/SKILL.md +93 -0
package/skills/unicode-homograph-tester/SKILL.md +93 -0
package/skills/waf-rule-lifecycle-agent/SKILL.md +106 -0
package/skills/webhook-security-tester/SKILL.md +111 -0
package/skills/zero-trust-architect/SKILL.md +118 -0

package/dist/mcp/model-router.js CHANGED Viewed

@@ -35,9 +35,28 @@ const MEMORY_DIR = join(".mcp", "memory");
 const USAGE_FILE = join(MEMORY_DIR, "model-usage.json");
 const HEALTH_FILE = join(MEMORY_DIR, "provider-health.json");
 const POLICY_FILE = join(".mcp", "policies", "security-policy.json");
-const DEFAULT_BUDGET_USD = 5.0;
+const DEFAULT_BUDGET_USD = 5;
 const CIRCUIT_BREAKER_THRESHOLD = 3; // failures before circuit opens
 const CIRCUIT_BREAKER_COOLDOWN_MS = 60_000; // 60 seconds
+// ---------------------------------------------------------------------------
+// Rate limiting for recordProviderFailure, to prevent circuit-breaker manipulation
+// ---------------------------------------------------------------------------
+const _providerFailureSubmissions = new Map(); // providerName -> { count, windowStart } for that provider's current window
+const FAILURE_RATE_LIMIT = 5; // max 5 failure reports per provider per window
+const FAILURE_WINDOW_MS = 300_000; // 5 minute window
+export function recordProviderFailureRateLimited(providerName) { // Counts one failure report for providerName; returns { allowed: true } or { allowed: false, reason }
+    const now = Date.now();
+    const entry = _providerFailureSubmissions.get(providerName);
+    if (!entry || now - entry.windowStart > FAILURE_WINDOW_MS) { // no window yet, or the previous one is older than FAILURE_WINDOW_MS
+        _providerFailureSubmissions.set(providerName, { count: 1, windowStart: now }); // NOTE(review): entries are only overwritten, never removed in the visible code, so the Map grows with each distinct providerName
+        return { allowed: true };
+    }
+    if (entry.count >= FAILURE_RATE_LIMIT) { // quota for the open window is used up: reject without incrementing
+        return { allowed: false, reason: `Rate limit exceeded: max ${FAILURE_RATE_LIMIT} failure reports per provider per 5 minutes` }; // NOTE(review): "5 minutes" is hard-coded here and is not derived from FAILURE_WINDOW_MS
+    }
+    entry.count++; // mutates the stored entry in place, so no set() is needed
+    return { allowed: true };
+}
 /**
  * Full model registry across all providers.
  * Pricing sourced from public pricing pages (approximate, for routing decisions only).
@@ -57,8 +76,8 @@ export const MODEL_REGISTRY = [
         modelId: "claude-sonnet-4-6",
         provider: "anthropic",
         capabilityTier: "standard",
-        inputPer1M: 3.0,
-        outputPer1M: 15.0,
+        inputPer1M: 3,
+        outputPer1M: 15,
         label: "Claude Sonnet 4.6"
     },
     // OpenAI — GPT
@@ -67,15 +86,15 @@ export const MODEL_REGISTRY = [
         provider: "openai",
         capabilityTier: "light",
         inputPer1M: 0.15,
-        outputPer1M: 0.60,
+        outputPer1M: 0.6,
         label: "GPT-4o Mini"
     },
     {
         modelId: "gpt-4o",
         provider: "openai",
         capabilityTier: "standard",
-        inputPer1M: 2.50,
-        outputPer1M: 10.0,
+        inputPer1M: 2.5,
+        outputPer1M: 10,
         label: "GPT-4o"
     },
     // Google — Gemini
@@ -84,7 +103,7 @@ export const MODEL_REGISTRY = [
         provider: "google",
         capabilityTier: "light",
         inputPer1M: 0.075,
-        outputPer1M: 0.30,
+        outputPer1M: 0.3,
         label: "Gemini 1.5 Flash"
     },
     {
@@ -92,7 +111,7 @@ export const MODEL_REGISTRY = [
         provider: "google",
         capabilityTier: "standard",
         inputPer1M: 1.25,
-        outputPer1M: 5.0,
+        outputPer1M: 5,
         label: "Gemini 1.5 Pro"
     },
     // Cohere — Command R
@@ -101,17 +120,44 @@ export const MODEL_REGISTRY = [
         provider: "cohere",
         capabilityTier: "light",
         inputPer1M: 0.15,
-        outputPer1M: 0.60,
+        outputPer1M: 0.6,
         label: "Command R"
     },
     {
         modelId: "command-r-plus",
         provider: "cohere",
         capabilityTier: "standard",
-        inputPer1M: 2.50,
-        outputPer1M: 10.0,
+        inputPer1M: 2.5,
+        outputPer1M: 10,
         label: "Command R+"
     },
+    // Anthropic — Claude Opus (advanced tier, opt-in via advanced_task_preference in policy)
+    {
+        modelId: "claude-opus-4-8",
+        provider: "anthropic",
+        capabilityTier: "advanced",
+        inputPer1M: 15,
+        outputPer1M: 75,
+        label: "Claude Opus 4.8"
+    },
+    // OpenAI — o1 (advanced tier)
+    {
+        modelId: "o1",
+        provider: "openai",
+        capabilityTier: "advanced",
+        inputPer1M: 15,
+        outputPer1M: 60,
+        label: "OpenAI o1"
+    },
+    // Google — Gemini 2.0 Flash Thinking (experimental; advanced tier)
+    {
+        modelId: "gemini-2.0-flash-thinking-exp",
+        provider: "google",
+        capabilityTier: "advanced",
+        inputPer1M: 0,
+        outputPer1M: 0,
+        label: "Gemini 2.0 Flash Thinking (experimental)"
+    },
     // Local — Ollama (zero cost, requires Ollama at localhost:11434)
     {
         modelId: "llama3",
@@ -185,7 +231,7 @@ export const TASK_TIER_MAP = {
 // Storage helpers
 // ---------------------------------------------------------------------------
 async function ensureMemoryDir() {
-    await mkdir(MEMORY_DIR, { recursive: true });
+    await mkdir(MEMORY_DIR, { recursive: true, mode: 0o700 }); // 0o700 requests owner-only access (rwx------) for directories this call creates; NOTE(review): an already-existing directory presumably keeps its current mode — confirm
 }
 async function loadUsageStore() {
     try {
@@ -199,7 +245,7 @@ async function loadUsageStore() {
 async function saveUsageStore(store) {
     await ensureMemoryDir();
     store.updatedAt = new Date().toISOString();
-    await writeFile(USAGE_FILE, JSON.stringify(store, null, 2) + "\n", "utf-8");
+    await writeFile(USAGE_FILE, JSON.stringify(store, null, 2) + "\n", { encoding: "utf-8", mode: 0o600 }); // options object replaces the bare "utf-8" argument so mode 0o600 (owner read/write) can be passed; NOTE(review): mode presumably applies only when the file is newly created — confirm
 }
 async function loadHealthStore() {
     try {
@@ -213,7 +259,7 @@ async function loadHealthStore() {
 async function saveHealthStore(store) {
     await ensureMemoryDir();
     store.updatedAt = new Date().toISOString();
-    await writeFile(HEALTH_FILE, JSON.stringify(store, null, 2) + "\n", "utf-8");
+    await writeFile(HEALTH_FILE, JSON.stringify(store, null, 2) + "\n", { encoding: "utf-8", mode: 0o600 }); // options object replaces the bare "utf-8" argument so mode 0o600 (owner read/write) can be passed; NOTE(review): mode presumably applies only when the file is newly created — confirm
 }
 async function loadMaxBudget() {
     try {
@@ -235,6 +281,16 @@ async function loadPreferredProviders() {
         return null;
     }
 }
+async function loadAdvancedTaskPreferences() { // Reads model_budget.advanced_task_preference from POLICY_FILE; resolves to [] when it is missing or the file cannot be read or parsed
+    try {
+        const raw = await readFile(POLICY_FILE, "utf-8");
+        const policy = JSON.parse(raw);
+        return policy.model_budget?.advanced_task_preference ?? []; // NOTE(review): returned unvalidated; getModelForTask calls .includes() on it, so a non-array policy value would misbehave
+    }
+    catch { // any read or JSON.parse failure is swallowed and treated as "no advanced preferences"
+        return [];
+    }
+}
 // ---------------------------------------------------------------------------
 // Circuit breaker helpers
 // ---------------------------------------------------------------------------
@@ -265,12 +321,31 @@ function legacyTier(capTier) {
  * Select the cheapest healthy model that meets the capability requirement for
  * the given task type. Respects preferred_providers policy and circuit breakers.
  *
- * @param requiredTier  Minimum capability tier for the task.
- * @param health        Current provider health store.
- * @param preferred     Optional ordered list of preferred providers.
- * @returns             [chosen model, failoverUsed]
+ * @param requiredTier    Minimum capability tier for the task.
+ * @param health          Current provider health store.
+ * @param preferred       Optional ordered list of preferred providers.
+ * @param preferAdvanced  If true, try advanced-tier models first, fall back to standard.
+ * @returns               [chosen model, failoverUsed]
  */
-function selectModel(requiredTier, health, preferred) {
+function selectModel(requiredTier, health, preferred, preferAdvanced = false) {
+    // If advanced is preferred, try advanced-tier models first. Fall back gracefully to
+    // standard if none are healthy or registered — zero impact for users without Opus/o1.
+    if (preferAdvanced) {
+        const advancedCandidates = MODEL_REGISTRY.filter((m) => m.capabilityTier === "advanced");
+        const healthyAdvanced = advancedCandidates.filter((m) => !isCircuitOpen(health.providers[m.provider]));
+        if (healthyAdvanced.length > 0) {
+            const pool = preferred
+                ? [
+                    ...healthyAdvanced.filter((m) => preferred.includes(m.provider)),
+                    ...healthyAdvanced.filter((m) => !preferred.includes(m.provider))
+                ]
+                : healthyAdvanced;
+            pool.sort((a, b) => combinedCost(a) - combinedCost(b));
+            if (pool.length > 0)
+                return [pool[0], false];
+        }
+        // No advanced model available — fall through to standard selection silently.
+    }
     // Candidates: all models meeting the capability floor.
     const candidates = MODEL_REGISTRY.filter((m) => meetsCapabilityFloor(m, requiredTier));
     // Separate healthy vs. circuit-open providers.
@@ -304,14 +379,16 @@ function selectModel(requiredTier, health, preferred) {
  * Falls back to next-cheapest provider on circuit breaker open.
  */
 export async function getModelForTask(taskType, _opts) {
-    const [store, health, maxBudget, preferred] = await Promise.all([
+    const [store, health, maxBudget, preferred, advancedPrefs] = await Promise.all([
         loadUsageStore(),
         loadHealthStore(),
         loadMaxBudget(),
-        loadPreferredProviders()
+        loadPreferredProviders(),
+        loadAdvancedTaskPreferences()
     ]);
     const requiredTier = TASK_CAPABILITY_MAP[taskType];
-    const [chosen, failoverUsed] = selectModel(requiredTier, health, preferred);
+    const preferAdvanced = advancedPrefs.includes(taskType);
+    const [chosen, failoverUsed] = selectModel(requiredTier, health, preferred, preferAdvanced);
     const spent = store.totalSpentUsd;
     const remaining = maxBudget - spent;
     const utilizationPct = maxBudget > 0 ? (spent / maxBudget) * 100 : 0;
@@ -326,6 +403,39 @@ export async function getModelForTask(taskType, _opts) {
         budgetStatus = "ok";
     }
     const rationale = buildRationale(taskType, requiredTier, chosen, failoverUsed, preferred);
+    // Determine whether all providers were circuit-open (best-effort fallback path).
+    const allProviders = ["anthropic", "openai", "google", "cohere", "local"];
+    const allCircuitsOpen = allProviders.every((p) => isCircuitOpen(health.providers[p]));
+    // ISO 42001 §9.1 — emit structured audit log for every routing decision.
+    let routingReason;
+    if (allCircuitsOpen) {
+        routingReason = "circuit_open_fallback";
+    }
+    else if (failoverUsed) {
+        routingReason = "capability_match";
+    }
+    else {
+        routingReason = "cost_optimized";
+    }
+    console.log(JSON.stringify({
+        event: "MODEL_ROUTING_DECISION",
+        timestamp: new Date().toISOString(),
+        taskType,
+        selectedModel: chosen.modelId,
+        selectedProvider: chosen.provider,
+        reason: routingReason,
+        circuitState: allCircuitsOpen ? "FALLBACK" : "NORMAL",
+    }));
+    // Additional high-severity audit entry for the circuit-breaker fallback path.
+    if (allCircuitsOpen) {
+        console.warn(JSON.stringify({
+            event: "MODEL_ROUTING_CIRCUIT_FALLBACK",
+            timestamp: new Date().toISOString(),
+            reason: "ALL_PROVIDERS_CIRCUIT_OPEN",
+            fallbackModel: chosen.modelId,
+            severity: "HIGH",
+        }));
+    }
     return {
         model: chosen.modelId,
         provider: chosen.provider,
@@ -358,8 +468,8 @@ function buildRationale(taskType, required, chosen, failoverUsed, preferred) {
 export async function trackUsage(usage) {
     const [store, health] = await Promise.all([loadUsageStore(), loadHealthStore()]);
     const model = MODEL_REGISTRY.find((m) => m.modelId === usage.model);
-    const inputRate = model?.inputPer1M ?? (usage.tier === "haiku" ? 0.25 : 3.0);
-    const outputRate = model?.outputPer1M ?? (usage.tier === "haiku" ? 1.25 : 15.0);
+    const inputRate = model?.inputPer1M ?? (usage.tier === "haiku" ? 0.25 : 3);
+    const outputRate = model?.outputPer1M ?? (usage.tier === "haiku" ? 1.25 : 15);
     const estimatedCost = (usage.inputTokens / 1_000_000) * inputRate +
         (usage.outputTokens / 1_000_000) * outputRate;
     const record = {
@@ -389,8 +499,13 @@ export async function trackUsage(usage) {
 /**
  * Record a provider failure (connection error, rate limit, auth failure).
  * Opens circuit breaker after CIRCUIT_BREAKER_THRESHOLD consecutive failures.
+ * Rate-limited to prevent deliberate circuit-breaker manipulation (max 5 per provider per 5 min).
  */
 export async function recordProviderFailure(provider) {
+    const rateCheck = recordProviderFailureRateLimited(provider);
+    if (!rateCheck.allowed) {
+        return { recorded: false, reason: rateCheck.reason };
+    }
     const health = await loadHealthStore();
     const now = new Date();
     const state = health.providers[provider] ?? {
@@ -407,6 +522,28 @@ export async function recordProviderFailure(provider) {
     }
     health.providers[provider] = state;
     await saveHealthStore(health);
+    // Circuit-state audit: warn and emit structured audit record if all known providers are circuit-open.
+    // Deliberate manipulation requires only CIRCUIT_BREAKER_THRESHOLD (3) failures per provider × 5 providers
+    // = 15 calls, constrained to max 5 per provider per 5-min window. Log at ERROR level so SIEM picks this up.
+    // MITRE ATLAS AML.T0040 (ML Model Inference API) — circuit-breaker exhaustion attack.
+    const allProviders = ["anthropic", "openai", "google", "cohere", "local"];
+    const allProvidersDown = allProviders.every((p) => isCircuitOpen(health.providers[p]));
+    if (allProvidersDown) {
+        // Determine which fallback model to report: the first Anthropic standard-tier entry in the registry (circuit state ignored).
+        const fallbackCandidates = MODEL_REGISTRY.filter((m) => m.provider === "anthropic" && m.capabilityTier === "standard");
+        const fallbackModel = fallbackCandidates[0]?.modelId ?? "unknown";
+        console.error(JSON.stringify({
+            severity: "CRITICAL",
+            event: "ALL_PROVIDERS_CIRCUIT_OPEN",
+            message: "All AI providers are circuit-open. Routing to fallback model. This may indicate deliberate circuit-breaker manipulation.",
+            fallbackModel,
+            timestamp: new Date().toISOString(),
+            failingProvider: provider,
+            mitre: "AML.T0040",
+            action: "Manual investigation required. Call security.reset_provider_circuit after confirming provider health."
+        }));
+    }
+    return { recorded: true };
 }
 /**
  * Return health status for all providers — circuit breaker state and call counts.