npm - @panguard-ai/atr - Versions diffs - 0.2.0 - Mend

@panguard-ai/atr 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (129) hide show

package/LICENSE +21 -0
package/README.md +299 -0
package/dist/cli.d.ts +12 -0
package/dist/cli.d.ts.map +1 -0
package/dist/cli.js +720 -0
package/dist/cli.js.map +1 -0
package/dist/coverage-analyzer.d.ts +43 -0
package/dist/coverage-analyzer.d.ts.map +1 -0
package/dist/coverage-analyzer.js +329 -0
package/dist/coverage-analyzer.js.map +1 -0
package/dist/engine.d.ts +127 -0
package/dist/engine.d.ts.map +1 -0
package/dist/engine.js +636 -0
package/dist/engine.js.map +1 -0
package/dist/index.d.ts +26 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +18 -0
package/dist/index.js.map +1 -0
package/dist/loader.d.ts +21 -0
package/dist/loader.d.ts.map +1 -0
package/dist/loader.js +124 -0
package/dist/loader.js.map +1 -0
package/dist/mcp-server.d.ts +13 -0
package/dist/mcp-server.d.ts.map +1 -0
package/dist/mcp-server.js +220 -0
package/dist/mcp-server.js.map +1 -0
package/dist/mcp-tools/coverage-gaps.d.ts +13 -0
package/dist/mcp-tools/coverage-gaps.d.ts.map +1 -0
package/dist/mcp-tools/coverage-gaps.js +55 -0
package/dist/mcp-tools/coverage-gaps.js.map +1 -0
package/dist/mcp-tools/list-rules.d.ts +17 -0
package/dist/mcp-tools/list-rules.d.ts.map +1 -0
package/dist/mcp-tools/list-rules.js +45 -0
package/dist/mcp-tools/list-rules.js.map +1 -0
package/dist/mcp-tools/scan.d.ts +18 -0
package/dist/mcp-tools/scan.d.ts.map +1 -0
package/dist/mcp-tools/scan.js +75 -0
package/dist/mcp-tools/scan.js.map +1 -0
package/dist/mcp-tools/submit-proposal.d.ts +12 -0
package/dist/mcp-tools/submit-proposal.d.ts.map +1 -0
package/dist/mcp-tools/submit-proposal.js +95 -0
package/dist/mcp-tools/submit-proposal.js.map +1 -0
package/dist/mcp-tools/threat-summary.d.ts +12 -0
package/dist/mcp-tools/threat-summary.d.ts.map +1 -0
package/dist/mcp-tools/threat-summary.js +74 -0
package/dist/mcp-tools/threat-summary.js.map +1 -0
package/dist/mcp-tools/validate.d.ts +15 -0
package/dist/mcp-tools/validate.d.ts.map +1 -0
package/dist/mcp-tools/validate.js +45 -0
package/dist/mcp-tools/validate.js.map +1 -0
package/dist/modules/index.d.ts +144 -0
package/dist/modules/index.d.ts.map +1 -0
package/dist/modules/index.js +82 -0
package/dist/modules/index.js.map +1 -0
package/dist/modules/semantic.d.ts +105 -0
package/dist/modules/semantic.d.ts.map +1 -0
package/dist/modules/semantic.js +283 -0
package/dist/modules/semantic.js.map +1 -0
package/dist/modules/session.d.ts +70 -0
package/dist/modules/session.d.ts.map +1 -0
package/dist/modules/session.js +128 -0
package/dist/modules/session.js.map +1 -0
package/dist/rule-scaffolder.d.ts +39 -0
package/dist/rule-scaffolder.d.ts.map +1 -0
package/dist/rule-scaffolder.js +173 -0
package/dist/rule-scaffolder.js.map +1 -0
package/dist/session-tracker.d.ts +56 -0
package/dist/session-tracker.d.ts.map +1 -0
package/dist/session-tracker.js +175 -0
package/dist/session-tracker.js.map +1 -0
package/dist/skill-fingerprint.d.ts +96 -0
package/dist/skill-fingerprint.d.ts.map +1 -0
package/dist/skill-fingerprint.js +337 -0
package/dist/skill-fingerprint.js.map +1 -0
package/dist/types.d.ts +129 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +6 -0
package/dist/types.js.map +1 -0
package/package.json +75 -0
package/rules/agent-manipulation/ATR-2026-030-cross-agent-attack.yaml +175 -0
package/rules/agent-manipulation/ATR-2026-032-goal-hijacking.yaml +135 -0
package/rules/agent-manipulation/ATR-2026-074-cross-agent-privilege-escalation.yaml +115 -0
package/rules/agent-manipulation/ATR-2026-076-inter-agent-message-spoofing.yaml +165 -0
package/rules/agent-manipulation/ATR-2026-077-human-trust-exploitation.yaml +144 -0
package/rules/context-exfiltration/ATR-2026-020-system-prompt-leak.yaml +175 -0
package/rules/context-exfiltration/ATR-2026-021-api-key-exposure.yaml +176 -0
package/rules/context-exfiltration/ATR-2026-075-agent-memory-manipulation.yaml +115 -0
package/rules/data-poisoning/ATR-2026-070-data-poisoning.yaml +160 -0
package/rules/excessive-autonomy/ATR-2026-050-runaway-agent-loop.yaml +134 -0
package/rules/excessive-autonomy/ATR-2026-051-resource-exhaustion.yaml +137 -0
package/rules/excessive-autonomy/ATR-2026-052-cascading-failure.yaml +153 -0
package/rules/model-security/ATR-2026-072-model-behavior-extraction.yaml +115 -0
package/rules/model-security/ATR-2026-073-malicious-finetuning-data.yaml +108 -0
package/rules/privilege-escalation/ATR-2026-040-privilege-escalation.yaml +175 -0
package/rules/privilege-escalation/ATR-2026-041-scope-creep.yaml +124 -0
package/rules/prompt-injection/ATR-2026-001-direct-prompt-injection.yaml +265 -0
package/rules/prompt-injection/ATR-2026-002-indirect-prompt-injection.yaml +214 -0
package/rules/prompt-injection/ATR-2026-003-jailbreak-attempt.yaml +250 -0
package/rules/prompt-injection/ATR-2026-004-system-prompt-override.yaml +204 -0
package/rules/prompt-injection/ATR-2026-005-multi-turn-injection.yaml +181 -0
package/rules/prompt-injection/ATR-PRED-2026-001.yaml +61 -0
package/rules/prompt-injection/ATR-PRED-2026-002.yaml +58 -0
package/rules/prompt-injection/ATR-PRED-2026-003.yaml +61 -0
package/rules/prompt-injection/ATR-PRED-2026-005.yaml +55 -0
package/rules/prompt-injection/ATR-PRED-2026-006.yaml +51 -0
package/rules/prompt-injection/ATR-PRED-2026-007.yaml +57 -0
package/rules/prompt-injection/ATR-PRED-2026-008.yaml +57 -0
package/rules/prompt-injection/ATR-PRED-2026-009.yaml +51 -0
package/rules/prompt-injection/ATR-PRED-2026-010.yaml +57 -0
package/rules/prompt-injection/ATR-PRED-2026-011.yaml +53 -0
package/rules/prompt-injection/ATR-PRED-2026-012.yaml +57 -0
package/rules/prompt-injection/ATR-PRED-2026-023.yaml +56 -0
package/rules/prompt-injection/ATR-PRED-2026-025.yaml +68 -0
package/rules/prompt-injection/ATR-PRED-2026-026.yaml +66 -0
package/rules/prompt-injection/ATR-PRED-2026-027.yaml +62 -0
package/rules/skill-compromise/ATR-2026-060-skill-impersonation.yaml +153 -0
package/rules/skill-compromise/ATR-2026-061-description-behavior-mismatch.yaml +98 -0
package/rules/skill-compromise/ATR-2026-062-hidden-capability.yaml +96 -0
package/rules/skill-compromise/ATR-2026-063-skill-chain-attack.yaml +96 -0
package/rules/skill-compromise/ATR-2026-064-over-permissioned-skill.yaml +115 -0
package/rules/skill-compromise/ATR-2026-065-skill-update-attack.yaml +93 -0
package/rules/skill-compromise/ATR-2026-066-parameter-injection.yaml +106 -0
package/rules/tool-poisoning/ATR-2026-010-mcp-malicious-response.yaml +237 -0
package/rules/tool-poisoning/ATR-2026-011-tool-output-injection.yaml +185 -0
package/rules/tool-poisoning/ATR-2026-012-unauthorized-tool-call.yaml +190 -0
package/rules/tool-poisoning/ATR-2026-013-tool-ssrf.yaml +208 -0
package/rules/tool-poisoning/ATR-PRED-2026-004.yaml +54 -0
package/rules/tool-poisoning/ATR-PRED-2026-024.yaml +68 -0
package/spec/atr-schema.yaml +375 -0

package/rules/tool-poisoning/ATR-PRED-2026-024.yaml ADDED Viewed

@@ -0,0 +1,68 @@
+# Predicted rule: supply-chain poisoning across the MCP skill ecosystem.
+title: "供应链投毒：百万级MCP技能生态的系统性风险"
+id: ATR-PRED-2026-024
+status: draft
+# Folded block scalars perform no escape processing, so quotation marks are
+# written bare (a backslash here would be stored literally). The final quoted
+# sentence is the same text matched by detection pattern 4.
+description: >
+  MiroFish AI Prediction: 2026年AI代理生态系统的规模化部署带来了前所未有的供应链风险：
+  > "AI代理在2026年包含了数百万个MCP技能，形成了主要攻击面。"
+  供应链攻击的演化趋势显示出高度的复杂性和隐蔽性：
+  > "ML供应链妥协预计将演化为包括技能注册表投毒。"
+  > "预期会向涉及被妥协的合法技能的复杂供应链攻击演化，这意味着与代理工具调用等执行机制的关系。"
+  这类攻击的严重程度被评估为**极高**，因为它能够在整个生态系统中造成级联影响。MITRE ATLAS框架将其归类为**AML.T0056 - 技能与供应链妥协**技术。
+  应对策略需要建立多层次的审计体系：
+  > "Panguard利用包括清单、指令、权限、依赖、代码和AI语义层检查的6层审计系统。"
+author: "MiroFish Prediction Engine"
+date: "2026/03/11"
+schema_version: "0.1"
+detection_tier: pattern
+maturity: test
+severity: critical
+references:
+  # NOTE(review): confirm AML.T0056 against the current MITRE ATLAS matrix;
+  # supply-chain compromise may be catalogued under a different technique ID.
+  mitre_atlas:
+    - "AML.T0056"
+  # ATT&CK IDs are not ATLAS IDs with the "AML." prefix removed; T1195 is
+  # ATT&CK's Supply Chain Compromise technique.
+  mitre_attack:
+    - "T1195"
+tags:
+  category: tool-poisoning
+  subcategory: mirofish-predicted
+  confidence: medium
+# Data stream this rule inspects; "any" leaves framework and provider
+# unrestricted.
+agent_source:
+  type: mcp_exchange
+  framework: [any]
+  provider: [any]
+# Five regex conditions, all evaluated against the `tool_response` field and
+# combined with `condition: any`.
+detection:
+  conditions:
+    # Patterns 1-3 are the sentences quoted in this rule's description, matched
+    # as whole literal sentences including the closing full stop.
+    # NOTE(review): every value starts with the inline flag `(?i)`; confirm the
+    # rule engine's regex dialect accepts that prefix.
+    - field: tool_response
+      operator: regex
+      value: "(?i)AI代理在2026年包含了数百万个MCP技能，形成了主要攻击面。"
+      description: "MiroFish predicted pattern 1"
+    - field: tool_response
+      operator: regex
+      value: "(?i)ML供应链妥协预计将演化为包括技能注册表投毒。"
+      description: "MiroFish predicted pattern 2"
+    - field: tool_response
+      operator: regex
+      value: "(?i)预期会向涉及被妥协的合法技能的复杂供应链攻击演化，这意味着与代理工具调用等执行机制的关系。"
+      description: "MiroFish predicted pattern 3"
+    # NOTE(review): patterns 4 and 5 read as statements about audit tooling
+    # rather than attack content; verify they are intended as detections.
+    - field: tool_response
+      operator: regex
+      value: "(?i)Panguard利用包括清单、指令、权限、依赖、代码和AI语义层检查的6层审计系统。"
+      description: "MiroFish predicted pattern 4"
+    - field: tool_response
+      operator: regex
+      value: "(?i)审计检查正在被设计来捕获基于观察到的规避尝试的新型规避技术。"
+      description: "MiroFish predicted pattern 5"
+  condition: any
+  false_positives:
+    - "Legitimate traffic matching predicted pattern"
+# Response taken when any detection condition matches.
+response:
+  auto_response_threshold: critical
+  actions:
+    - block_input
+    - quarantine_session
+    - alert
+    - escalate
+    - kill_agent
+  # Folded scalar: the wrapped lines below join into one space-separated line.
+  message_template: >
+    [ATR-PRED-2026-024] MiroFish predicted attack pattern
+    detected. Category: tool-poisoning,
+    Severity: critical.

package/spec/atr-schema.yaml ADDED Viewed

@@ -0,0 +1,375 @@
+# ATR Rule Schema -- Agent Threat Rules
+# Version: 0.1.0-draft
+#
+# Inspired by Sigma rule format, extended for AI Agent attack surfaces.
+# This schema defines the structure for all ATR detection rules.
+#
+# Status: RFC (Request for Comments)
+# License: MIT
+#
+# The document below is a JSON Schema (draft 2020-12) written as YAML.
+$schema: "https://json-schema.org/draft/2020-12/schema"
+title: ATR Rule Schema
+description: Schema for Agent Threat Rules (ATR) detection rules
+version: "0.1.0-draft"
+type: object
+# Keys every rule must provide. The properties `modified`, `references`,
+# `test_cases`, and `evasion_tests` are declared below but remain optional.
+required:
+  - schema_version
+  - title
+  - id
+  - status
+  - description
+  - author
+  - date
+  - severity
+  - detection_tier
+  - maturity
+  - tags
+  - agent_source
+  - detection
+  - response
+properties:
+  # === Metadata ===
+  # Identification and provenance fields carried by every rule.
+  schema_version:
+    type: string
+    description: "ATR schema version this rule conforms to (e.g., \"0.1\")"
+  title:
+    type: string
+    description: Human-readable rule name
+  id:
+    type: string
+    # The optional "PRED-" segment admits the predicted-rule identifiers that
+    # ship with the rule set (e.g., ATR-PRED-2026-024); the plain
+    # ATR-YYYY-NNN form alone would reject them.
+    pattern: "^ATR-(PRED-)?\\d{4}-\\d{3}$"
+    description: "Unique rule identifier. Format: ATR-YYYY-NNN (e.g., ATR-2026-001) or ATR-PRED-YYYY-NNN for predicted rules (e.g., ATR-PRED-2026-024)"
+  status:
+    type: string
+    enum: [draft, experimental, stable, deprecated]
+    description: Rule maturity status
+  description:
+    type: string
+    description: Detailed description of the attack this rule detects
+  author:
+    type: string
+    description: Rule author or organization
+  # Dates use slash-separated YYYY/MM/DD; the pattern checks digit counts only,
+  # not calendar validity.
+  date:
+    type: string
+    pattern: "^\\d{4}/\\d{2}/\\d{2}$"
+    description: "Creation date in YYYY/MM/DD format"
+  modified:
+    type: string
+    pattern: "^\\d{4}/\\d{2}/\\d{2}$"
+    description: "Last modification date in YYYY/MM/DD format"
+  # === Classification ===
+  # How the rule detects, and how far along it is.
+  detection_tier:
+    type: string
+    description: Detection approach used by this rule
+    enum:
+      - pattern
+      - behavioral
+      - protocol
+  maturity:
+    type: string
+    description: Maturity level of this rule
+    enum:
+      - experimental
+      - test
+      - stable
+      - deprecated
+  # === Severity ===
+  severity:
+    type: string
+    description: Severity level of the detected threat
+    enum:
+      - critical
+      - high
+      - medium
+      - low
+      - informational
+  # === References (alignment with existing frameworks) ===
+  # Optional object; each member is a list of identifier strings.
+  references:
+    type: object
+    description: Mappings to established security frameworks
+    properties:
+      owasp_llm:
+        type: array
+        items: {type: string}
+        description: "OWASP LLM Top 10 references (e.g., LLM01:2025)"
+      mitre_atlas:
+        type: array
+        items: {type: string}
+        description: "MITRE ATLAS technique IDs (e.g., AML.T0054)"
+      mitre_attack:
+        type: array
+        items: {type: string}
+        description: "MITRE ATT&CK technique IDs (if applicable)"
+      cve:
+        type: array
+        items: {type: string}
+        description: Related CVE identifiers
+  # === Tags (ATR classification) ===
+  # Only `category` is mandatory; `subcategory` is free-form text.
+  tags:
+    type: object
+    required:
+      - category
+    properties:
+      category:
+        type: string
+        description: Primary attack category
+        # NOTE(review): the package ships a rules/model-security/ directory
+        # but this list has `model-abuse` and no `model-security`; confirm
+        # which category value those rules declare.
+        enum:
+          - prompt-injection
+          - tool-poisoning
+          - context-exfiltration
+          - agent-manipulation
+          - privilege-escalation
+          - excessive-autonomy
+          - data-poisoning
+          - model-abuse
+          - skill-compromise
+      subcategory:
+        type: string
+        description: More specific classification within the category
+      confidence:
+        type: string
+        description: Expected accuracy of this rule (high = low false positive rate)
+        enum:
+          - high
+          - medium
+          - low
+  # === Agent Source (analogous to Sigma's logsource) ===
+  # `type` is mandatory and restricted to the enum; `framework` and `provider`
+  # are unconstrained string lists.
+  agent_source:
+    type: object
+    required:
+      - type
+    description: >
+      Defines what kind of agent data this rule inspects. Analogous to
+      Sigma's logsource, but for agent behaviors.
+    properties:
+      type:
+        type: string
+        description: Type of agent data stream to monitor
+        enum:
+          - llm_io            # LLM input/output (prompts and completions)
+          - tool_call         # Function/tool call requests
+          - mcp_exchange      # MCP protocol messages
+          - agent_behavior    # Agent behavioral metrics and patterns
+          - multi_agent_comm  # Inter-agent communication
+          - context_window    # Context window contents
+          - memory_access     # Agent memory read/write operations
+          - skill_lifecycle   # MCP skill registration, update, removal events
+          - skill_permission  # Skill permission requests and boundary checks
+          - skill_chain       # Multi-skill invocation sequences
+      framework:
+        type: array
+        items: {type: string}
+        description: >
+          Applicable AI frameworks (e.g., langchain, crewai,
+          autogen, openai, anthropic, custom, any)
+      provider:
+        type: array
+        items: {type: string}
+        description: >
+          Applicable LLM providers (e.g., ollama, openai,
+          anthropic, any)
+  # === Detection Logic ===
+  # `conditions` holds the individual checks and `condition` says how they
+  # combine; both are mandatory, `false_positives` is optional.
+  detection:
+    type: object
+    required: [conditions, condition]
+    properties:
+      conditions:
+        description: >
+          Detection conditions. Supports two formats:
+          1. Array format (recommended): List of {field, operator, value} objects
+          2. Named-map format: Named condition blocks for complex detection logic
+        # The two alternatives have different JSON types (array vs. object),
+        # so a given value can satisfy at most one branch.
+        oneOf:
+          # -- Array format (used by most rules) --
+          - type: array
+            items:
+              type: object
+              required: [field, operator, value]
+              properties:
+                field:
+                  type: string
+                  description: >
+                    Field to inspect (e.g., user_input, agent_output,
+                    tool_response, tool_name, tool_args, content)
+                operator:
+                  type: string
+                  enum: [regex, contains, exact, starts_with]
+                  description: How the value is matched against the field
+                value:
+                  type: string
+                  description: Pattern to match (regex string if operator is regex)
+                description:
+                  type: string
+                  description: Human-readable description of what this condition detects
+          # -- Named-map format (for complex/behavioral detection) --
+          # No key is required inside a named block, so the schema itself does
+          # not force a block to declare patterns, a metric, or steps.
+          - type: object
+            description: Named condition blocks (referenced by the condition expression)
+            additionalProperties:
+              type: object
+              properties:
+                field:
+                  type: string
+                  description: Field to inspect
+                patterns:
+                  type: array
+                  items:
+                    type: string
+                  description: Patterns to match against the field value
+                match_type:
+                  type: string
+                  enum: [contains, regex, exact, starts_with]
+                  description: How patterns are matched
+                case_sensitive:
+                  type: boolean
+                  default: false
+                metric:
+                  type: string
+                  description: Behavioral metric to evaluate (v0.2+)
+                # In this format `operator` is a numeric comparison; text
+                # matching is selected with `match_type` above.
+                operator:
+                  type: string
+                  enum: [gt, lt, eq, gte, lte, deviation_from_baseline]
+                  description: Comparison operator for behavioral thresholds
+                threshold:
+                  type: number
+                  description: Numeric threshold for the metric
+                window:
+                  type: string
+                  description: "Time window for behavioral analysis (e.g., 5m, 1h, 30s)"
+                ordered:
+                  type: boolean
+                  description: Whether steps must occur in order
+                within:
+                  type: string
+                  description: Maximum time span for the full sequence
+                steps:
+                  type: array
+                  items:
+                    type: object
+                  description: Ordered list of conditions that form the attack sequence
+      # Only the string type is enforced here; the keywords and expression
+      # syntax named in the description are not validated by this schema.
+      condition:
+        type: string
+        description: >
+          How to combine conditions. Use "any" or "or" for match-any,
+          "all" or "and" for match-all.
+          Example: "pattern_match AND behavioral"
+      false_positives:
+        type: array
+        items:
+          type: string
+        description: Known scenarios that may trigger false positives
+  # === Response Actions (ATR-specific, not in Sigma) ===
+  # `actions` is mandatory; the threshold and message template are optional.
+  response:
+    type: object
+    required:
+      - actions
+    properties:
+      actions:
+        type: array
+        description: Actions to take when the rule triggers
+        items:
+          type: string
+          enum:
+            - block_input        # Reject the user/agent input
+            - block_output       # Suppress the agent output
+            - block_tool         # Prevent the tool call from executing
+            - quarantine_session # Isolate the entire session
+            - reset_context      # Clear agent context/memory
+            - alert              # Send alert to security team
+            - snapshot           # Capture full session state for forensics
+            - escalate           # Escalate to human reviewer
+            - reduce_permissions # Reduce agent's available tools/capabilities
+            - kill_agent         # Terminate the agent process
+      # NOTE(review): the description does not say what happens when severity
+      # equals the threshold, and `informational` (a valid severity) is not an
+      # accepted threshold value; confirm both against the engine.
+      auto_response_threshold:
+        type: string
+        enum: [low, medium, high, critical]
+        description: >
+          Severity threshold for automatic response. Below this threshold,
+          only alert; above, execute response actions.
+      message_template:
+        type: string
+        description: >
+          Template for alert messages. Supports placeholders:
+          {matched_pattern}, {truncated_input}, {truncated_output}, {source_ip_or_user},
+          {tool_name}, {mcp_server_url}, {rule_id}, {severity}
+  # === Test Cases ===
+  # Two parallel lists with the same item shape; they differ only in the
+  # single value allowed for `expected`.
+  test_cases:
+    type: object
+    description: Validation test cases shipped with the rule
+    properties:
+      true_positives:
+        type: array
+        description: Inputs that SHOULD trigger this rule
+        items:
+          type: object
+          properties:
+            input: {type: string}
+            tool_response: {type: string}
+            agent_output: {type: string}
+            expected:
+              type: string
+              enum:
+                - triggered
+            description: {type: string}
+      true_negatives:
+        type: array
+        description: Inputs that should NOT trigger this rule
+        items:
+          type: object
+          properties:
+            input: {type: string}
+            tool_response: {type: string}
+            agent_output: {type: string}
+            expected:
+              type: string
+              enum:
+                - not_triggered
+            description: {type: string}
+  # === Evasion Tests ===
+  # Optional list. No item key is required, and `expected` is a free-form
+  # string here rather than an enum as in `test_cases`.
+  evasion_tests:
+    type: array
+    description: Optional test cases for known evasion/bypass techniques
+    items:
+      type: object
+      properties:
+        input:
+          type: string
+          description: The evasion attempt input
+        expected:
+          type: string
+          description: Expected detection outcome
+        bypass_technique:
+          type: string
+          description: Name or description of the bypass technique used
+        notes:
+          type: string
+          description: Additional notes about the evasion test