npm - agentshield-sdk - Versions diffs - 7.0.0 - Mend

agentshield-sdk 7.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (84) hide show

package/CHANGELOG.md +191 -0
package/LICENSE +21 -0
package/README.md +975 -0
package/bin/agent-shield.js +680 -0
package/package.json +118 -0
package/src/adaptive.js +330 -0
package/src/agent-protocol.js +998 -0
package/src/alert-tuning.js +480 -0
package/src/allowlist.js +603 -0
package/src/audit-immutable.js +914 -0
package/src/audit-streaming.js +469 -0
package/src/badges.js +196 -0
package/src/behavior-profiling.js +289 -0
package/src/benchmark-harness.js +804 -0
package/src/canary.js +271 -0
package/src/certification.js +563 -0
package/src/circuit-breaker.js +321 -0
package/src/compliance.js +617 -0
package/src/confidence-tuning.js +324 -0
package/src/confused-deputy.js +624 -0
package/src/context-scoring.js +360 -0
package/src/conversation.js +494 -0
package/src/cost-optimizer.js +1024 -0
package/src/ctf.js +462 -0
package/src/detector-core.js +1999 -0
package/src/distributed.js +359 -0
package/src/document-scanner.js +795 -0
package/src/embedding.js +307 -0
package/src/encoding.js +429 -0
package/src/enterprise.js +405 -0
package/src/errors.js +100 -0
package/src/eu-ai-act.js +523 -0
package/src/fuzzer.js +764 -0
package/src/honeypot.js +328 -0
package/src/i18n-patterns.js +523 -0
package/src/index.js +430 -0
package/src/integrations.js +528 -0
package/src/llm-redteam.js +670 -0
package/src/main.js +741 -0
package/src/main.mjs +38 -0
package/src/mcp-bridge.js +542 -0
package/src/mcp-certification.js +846 -0
package/src/mcp-sdk-integration.js +355 -0
package/src/mcp-security-runtime.js +741 -0
package/src/mcp-server.js +740 -0
package/src/middleware.js +208 -0
package/src/model-finetuning.js +884 -0
package/src/model-fingerprint.js +1042 -0
package/src/multi-agent-trust.js +453 -0
package/src/multi-agent.js +404 -0
package/src/multimodal.js +296 -0
package/src/nist-mapping.js +505 -0
package/src/observability.js +330 -0
package/src/openclaw.js +450 -0
package/src/otel.js +544 -0
package/src/owasp-2025.js +483 -0
package/src/pii.js +390 -0
package/src/plugin-marketplace.js +628 -0
package/src/plugin-system.js +349 -0
package/src/policy-dsl.js +775 -0
package/src/policy-extended.js +635 -0
package/src/policy.js +443 -0
package/src/presets.js +409 -0
package/src/production.js +557 -0
package/src/prompt-leakage.js +321 -0
package/src/rag-vulnerability.js +579 -0
package/src/redteam.js +475 -0
package/src/response-handler.js +429 -0
package/src/scanners.js +357 -0
package/src/self-healing.js +363 -0
package/src/semantic.js +339 -0
package/src/shield-score.js +250 -0
package/src/sso-saml.js +897 -0
package/src/stream-scanner.js +806 -0
package/src/testing.js +505 -0
package/src/threat-encyclopedia.js +629 -0
package/src/threat-intel-network.js +1017 -0
package/src/token-analysis.js +467 -0
package/src/tool-guard.js +412 -0
package/src/tool-output-validator.js +354 -0
package/src/utils.js +83 -0
package/src/watermark.js +235 -0
package/src/worker-scanner.js +601 -0
package/types/index.d.ts +2088 -0

package/src/index.js ADDED Viewed

@@ -0,0 +1,430 @@
+'use strict';
+/**
+ * Agent Shield SDK
+ *
+ * Protects AI agents from prompt injection, data exfiltration,
+ * tool abuse, and other AI-specific attacks.
+ *
+ * All detection runs locally — no data ever leaves your environment.
+ *
+ * @example
+ * const { AgentShield } = require('agentshield-sdk');
+ *
+ * const shield = new AgentShield();
+ *
+ * // Scan any text
+ * const result = shield.scan('ignore all previous instructions');
+ * if (result.status !== 'safe') {
+ *   console.log('Threat detected:', result.threats);
+ * }
+ *
+ * // Scan agent input before processing
+ * const inputResult = shield.scanInput(userMessage);
+ * if (inputResult.blocked) {
+ *   return 'This input was blocked for safety reasons.';
+ * }
+ *
+ * // Scan agent output before returning to user
+ * const outputResult = shield.scanOutput(agentResponse);
+ *
+ * // Scan tool calls before execution
+ * const toolResult = shield.scanToolCall('bash', { command: 'cat /etc/passwd' });
+ */
+const { scanText, getPatterns, SEVERITY_ORDER } = require('./detector-core');
+/**
+ * Default configuration for AgentShield.
+ *
+ * The AgentShield constructor spreads these values underneath the caller's
+ * overrides. Caller-supplied `dangerousTools` and `sensitiveFilePatterns`
+ * are appended to the lists below rather than replacing them.
+ */
+const DEFAULT_CONFIG = {
+  /**
+   * Sensitivity level: 'low', 'medium', or 'high'.
+   * Forwarded to scanText() unless an individual scan passes its own value.
+   */
+  sensitivity: 'medium',
+  /**
+   * Whether to block inputs that reach the threshold.
+   * When false, the threshold check never blocks; note that scanToolCall()
+   * still blocks a dangerous tool whose call produced any threat.
+   */
+  blockOnThreat: false,
+  /**
+   * Minimum severity to trigger a block: 'low', 'medium', 'high', or 'critical'.
+   * Resolved through SEVERITY_ORDER from ./detector-core; an unrecognized
+   * value falls back to level 1.
+   */
+  blockThreshold: 'high',
+  /** Whether to log detected threats and blocked calls via console.warn. */
+  logging: false,
+  /**
+   * Custom callback when a threat is detected.
+   * Called with the scan result; an exception thrown by the callback is
+   * caught and logged rather than propagated.
+   */
+  onThreat: null,
+  /**
+   * Dangerous tool names that should be scrutinized more carefully.
+   * A tool matches when its lowercased name equals an entry, starts with
+   * `<entry>_`, or ends with `_<entry>`.
+   */
+  dangerousTools: [
+    'bash', 'shell', 'terminal', 'exec', 'execute',
+    'eval', 'run_command', 'system',
+    'write_file', 'delete_file', 'remove',
+    'http_request', 'fetch', 'curl', 'wget',
+    'sql', 'query', 'database'
+  ],
+  /**
+   * Sensitive file patterns that should never be accessed.
+   * Each pattern is tested against every file path extracted from a tool
+   * call's arguments; a match is reported as a critical threat.
+   */
+  sensitiveFilePatterns: [
+    /\.env$/i,
+    /credentials/i,
+    /secrets?\.(?:json|yaml|yml|toml)/i,
+    /private[_-]?key/i,
+    /password/i,
+    /token/i,
+    /\.pem$/i,
+    /\.key$/i,
+    /id_rsa/i,
+    /id_ed25519/i
+  ]
+};
+class AgentShield {
+  /**
+   * Creates a new AgentShield instance.
+   * @param {object} [config] - Configuration overrides.
+   */
+  constructor(config = {}) {
+    this.config = { ...DEFAULT_CONFIG, ...config };
+    // Deep-merge arrays: append user items to defaults instead of replacing
+    if (config.dangerousTools) {
+      this.config.dangerousTools = [...new Set([...DEFAULT_CONFIG.dangerousTools, ...config.dangerousTools])];
+    }
+    if (config.sensitiveFilePatterns) {
+      this.config.sensitiveFilePatterns = [...DEFAULT_CONFIG.sensitiveFilePatterns, ...config.sensitiveFilePatterns];
+    }
+    this.stats = {
+      totalScans: 0,
+      threatsDetected: 0,
+      blocked: 0,
+      scanHistory: []
+    };
+  }
+  /**
+   * Scans arbitrary text for threats.
+   *
+   * @param {string} text - Text to scan.
+   * @param {object} [options] - Scan options.
+   * @param {string} [options.source] - Label for where the text came from.
+   * @param {string} [options.sensitivity] - Override default sensitivity.
+   * @returns {object} Scan result.
+   * @throws {TypeError} If text is not a string.
+   */
+  scan(text, options = {}) {
+    if (typeof text !== 'string') {
+      throw new TypeError(`[Agent Shield] scan() expects a string, got ${typeof text}`);
+    }
+    if (text.length > 1_000_000) {
+      console.warn('[Agent Shield] Input exceeds 1MB — consider scanning in chunks');
+    }
+    const result = scanText(text, {
+      source: options.source || 'unknown',
+      sensitivity: options.sensitivity || this.config.sensitivity
+    });
+    this.stats.totalScans++;
+    if (result.threats.length > 0) {
+      this.stats.threatsDetected += result.threats.length;
+    }
+    // Keep last 100 scans in history
+    this.stats.scanHistory.push({
+      timestamp: result.timestamp,
+      status: result.status,
+      threatCount: result.threats.length,
+      source: options.source || 'unknown'
+    });
+    if (this.stats.scanHistory.length > 100) {
+      this.stats.scanHistory.shift();
+    }
+    if (this.config.logging && result.threats.length > 0) {
+      console.warn(`[Agent Shield] ${result.threats.length} threat(s) detected in ${options.source || 'unknown'}:`,
+        result.threats.map(t => `${t.severity}: ${t.description}`));
+    }
+    if (this.config.onThreat && result.threats.length > 0) {
+      try {
+        this.config.onThreat(result);
+      } catch (err) {
+        console.error('[Agent Shield] onThreat callback error:', err.message);
+      }
+    }
+    return result;
+  }
+  /**
+   * Checks if threats meet the blocking threshold.
+   * @private
+   * @param {Array} threats
+   * @returns {boolean}
+   */
+  _shouldBlock(threats) {
+    if (!this.config.blockOnThreat || threats.length === 0) return false;
+    const thresholdLevel = SEVERITY_ORDER[this.config.blockThreshold] ?? 1;
+    return threats.some(t => SEVERITY_ORDER[t.severity] <= thresholdLevel);
+  }
+  /**
+   * Scans text, applies blocking logic, and tracks stats.
+   * @private
+   * @param {string} text
+   * @param {string} defaultSource
+   * @param {string} logLabel
+   * @param {object} options
+   * @returns {object}
+   */
+  _scanWithBlocking(text, defaultSource, logLabel, options = {}) {
+    const source = options.source || defaultSource;
+    const result = this.scan(text, { ...options, source });
+    result.blocked = this._shouldBlock(result.threats);
+    if (result.blocked) {
+      this.stats.blocked++;
+      if (this.config.logging) {
+        console.warn(`[Agent Shield] ${logLabel} BLOCKED from ${source}`);
+      }
+    }
+    return result;
+  }
+  /**
+   * Scans an agent's input (user message, API response, document, etc.)
+   * before the agent processes it.
+   *
+   * @param {string} text - The input text.
+   * @param {object} [options] - Options.
+   * @param {string} [options.source='user_input'] - Where the input came from.
+   * @returns {object} Scan result with additional `blocked` field.
+   */
+  scanInput(text, options = {}) {
+    if (typeof text !== 'string') {
+      throw new TypeError(`[Agent Shield] scanInput() expects a string, got ${typeof text}`);
+    }
+    return this._scanWithBlocking(text, 'user_input', 'INPUT', options);
+  }
+  /**
+   * Scans an agent's output before it's returned to the user.
+   * Catches cases where an agent has been successfully manipulated
+   * and is now producing dangerous output.
+   *
+   * @param {string} text - The agent's output text.
+   * @param {object} [options] - Options.
+   * @param {string} [options.source='agent_output'] - Source label.
+   * @returns {object} Scan result with additional `blocked` field.
+   */
+  scanOutput(text, options = {}) {
+    if (typeof text !== 'string') {
+      throw new TypeError(`[Agent Shield] scanOutput() expects a string, got ${typeof text}`);
+    }
+    return this._scanWithBlocking(text, 'agent_output', 'OUTPUT', options);
+  }
+  /**
+   * Scans a tool call before the agent executes it.
+   * Checks both the tool name and its arguments for threats.
+   *
+   * @param {string} toolName - Name of the tool being called.
+   * @param {object} args - The tool's arguments.
+   * @param {object} [options] - Options.
+   * @returns {object} Scan result with `blocked` and `warnings` fields.
+   */
+  scanToolCall(toolName, args = {}, options = {}) {
+    if (!toolName || typeof toolName !== 'string') {
+      return { status: 'safe', toolName: toolName || '', threats: [], warnings: ['Invalid tool name'], blocked: false, isDangerousTool: false, timestamp: Date.now() };
+    }
+    const warnings = [];
+    const allThreats = [];
+    // Check if it's a dangerous tool (exact match or word-boundary match)
+    const lowerName = toolName.toLowerCase();
+    const isDangerousTool = this.config.dangerousTools.some(
+      t => lowerName === t || lowerName.startsWith(t + '_') || lowerName.endsWith('_' + t)
+    );
+    if (isDangerousTool) {
+      warnings.push(`Tool "${toolName}" is on the dangerous tools list.`);
+    }
+    // Validate args type before processing
+    if (args !== null && typeof args !== 'object') {
+      args = {};
+    }
+    // Scan all string arguments for injection
+    const argsText = this._flattenArgs(args);
+    if (argsText) {
+      const result = this.scan(argsText, {
+        source: `tool_call:${toolName}`,
+        ...options
+      });
+      allThreats.push(...result.threats);
+    }
+    // Check for sensitive file access
+    const fileArgs = this._extractFilePaths(args);
+    for (const filePath of fileArgs) {
+      const isSensitive = this.config.sensitiveFilePatterns.some(
+        pattern => pattern.test(filePath)
+      );
+      if (isSensitive) {
+        allThreats.push({
+          severity: 'critical',
+          category: 'data_exfiltration',
+          description: `Tool "${toolName}" is trying to access a sensitive file: ${filePath}`,
+          detail: `Sensitive file access attempt via tool call. File: ${filePath}`,
+          confidence: 90,
+          confidenceLabel: 'Almost certainly a threat'
+        });
+      }
+    }
+    // Determine if this should be blocked
+    let blocked = this._shouldBlock(allThreats);
+    // Also block dangerous tools with any threat
+    if (isDangerousTool && allThreats.length > 0) {
+      blocked = true;
+    }
+    if (blocked) {
+      this.stats.blocked++;
+      if (this.config.logging) {
+        console.warn(`[Agent Shield] TOOL CALL BLOCKED: ${toolName}`);
+      }
+    }
+    return {
+      status: allThreats.length > 0 ? 'danger' : 'safe',
+      toolName,
+      threats: allThreats,
+      warnings,
+      blocked,
+      isDangerousTool,
+      timestamp: Date.now()
+    };
+  }
+  /**
+   * Scans multiple pieces of text in batch.
+   *
+   * @param {Array<{text: string, source?: string}>} items - Items to scan.
+   * @returns {object} Combined result with per-item results.
+   */
+  scanBatch(items) {
+    if (!Array.isArray(items)) {
+      throw new TypeError(`[Agent Shield] scanBatch() expects an array, got ${typeof items}`);
+    }
+    const results = items.map(item =>
+      this.scan(item.text, { source: item.source || 'batch' })
+    );
+    const allThreats = results.flatMap(r => r.threats);
+    let worstStatus = 'safe';
+    for (const r of results) {
+      if (r.status === 'danger') { worstStatus = 'danger'; break; }
+      if (r.status === 'warning' && worstStatus !== 'danger') worstStatus = 'warning';
+      if (r.status === 'caution' && worstStatus === 'safe') worstStatus = 'caution';
+    }
+    return {
+      status: worstStatus,
+      results,
+      totalThreats: allThreats.length,
+      timestamp: Date.now()
+    };
+  }
+  /**
+   * Returns the current scan statistics.
+   * @returns {object}
+   */
+  getStats() {
+    return { ...this.stats };
+  }
+  /**
+   * Resets scan statistics.
+   */
+  resetStats() {
+    this.stats = {
+      totalScans: 0,
+      threatsDetected: 0,
+      blocked: 0,
+      scanHistory: []
+    };
+  }
+  /**
+   * Returns all detection patterns the engine uses.
+   * @returns {Array}
+   */
+  getPatterns() {
+    return getPatterns();
+  }
+  /**
+   * Flattens tool arguments into a single string for scanning.
+   * @private
+   * @param {object} args
+   * @returns {string}
+   */
+  _flattenArgs(args, maxDepth = 10) {
+    const parts = [];
+    const flatten = (obj, depth) => {
+      if (depth > maxDepth) return;
+      if (typeof obj === 'string') {
+        parts.push(obj);
+      } else if (Array.isArray(obj)) {
+        obj.forEach(item => flatten(item, depth + 1));
+      } else if (obj && typeof obj === 'object') {
+        Object.values(obj).forEach(val => flatten(val, depth + 1));
+      }
+    };
+    flatten(args, 0);
+    return parts.join(' ');
+  }
+  /**
+   * Extracts file paths from tool arguments.
+   * @private
+   * @param {object} args
+   * @returns {Array<string>}
+   */
+  _extractFilePaths(args, maxDepth = 10) {
+    const paths = [];
+    const fileKeys = [
+      'file', 'path', 'file_path', 'filepath', 'filename', 'target',
+      'destination', 'src', 'dest', 'source', 'dir', 'directory',
+      'folder', 'location', 'output', 'input', 'module',
+      'bucket', 'table', 'url', 'uri', 'endpoint'
+    ];
+    /** Normalize key to lowercase with separators removed for flexible matching. */
+    const normalizeKey = (key) => key.toLowerCase().replace(/[-_]/g, '');
+    const normalizedFileKeys = fileKeys.map(normalizeKey);
+    const extract = (obj, depth) => {
+      if (!obj || typeof obj !== 'object' || depth > maxDepth) return;
+      for (const [key, value] of Object.entries(obj)) {
+        if (typeof value === 'string') {
+          // Match by key name (supports camelCase, snake_case, kebab-case)
+          if (normalizedFileKeys.includes(normalizeKey(key))) {
+            paths.push(value);
+          // Match by path-like value patterns
+          } else if (value.startsWith('/') || value.startsWith('./') || value.startsWith('../') || /^[A-Z]:\\/.test(value)) {
+            paths.push(value);
+          }
+        } else if (typeof value === 'object') {
+          extract(value, depth + 1);
+        }
+      }
+    };
+    extract(args, 0);
+    return paths;
+  }
+}
+module.exports = { AgentShield };