cisco-ai-skill-scanner 1.0.0 py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (100)
  1. cisco_ai_skill_scanner-1.0.0.dist-info/METADATA +253 -0
  2. cisco_ai_skill_scanner-1.0.0.dist-info/RECORD +100 -0
  3. cisco_ai_skill_scanner-1.0.0.dist-info/WHEEL +4 -0
  4. cisco_ai_skill_scanner-1.0.0.dist-info/entry_points.txt +4 -0
  5. cisco_ai_skill_scanner-1.0.0.dist-info/licenses/LICENSE +17 -0
  6. skillanalyzer/__init__.py +45 -0
  7. skillanalyzer/_version.py +34 -0
  8. skillanalyzer/api/__init__.py +25 -0
  9. skillanalyzer/api/api.py +34 -0
  10. skillanalyzer/api/api_cli.py +78 -0
  11. skillanalyzer/api/api_server.py +634 -0
  12. skillanalyzer/api/router.py +527 -0
  13. skillanalyzer/cli/__init__.py +25 -0
  14. skillanalyzer/cli/cli.py +816 -0
  15. skillanalyzer/config/__init__.py +26 -0
  16. skillanalyzer/config/config.py +149 -0
  17. skillanalyzer/config/config_parser.py +122 -0
  18. skillanalyzer/config/constants.py +85 -0
  19. skillanalyzer/core/__init__.py +24 -0
  20. skillanalyzer/core/analyzers/__init__.py +75 -0
  21. skillanalyzer/core/analyzers/aidefense_analyzer.py +872 -0
  22. skillanalyzer/core/analyzers/base.py +53 -0
  23. skillanalyzer/core/analyzers/behavioral/__init__.py +30 -0
  24. skillanalyzer/core/analyzers/behavioral/alignment/__init__.py +45 -0
  25. skillanalyzer/core/analyzers/behavioral/alignment/alignment_llm_client.py +240 -0
  26. skillanalyzer/core/analyzers/behavioral/alignment/alignment_orchestrator.py +216 -0
  27. skillanalyzer/core/analyzers/behavioral/alignment/alignment_prompt_builder.py +422 -0
  28. skillanalyzer/core/analyzers/behavioral/alignment/alignment_response_validator.py +136 -0
  29. skillanalyzer/core/analyzers/behavioral/alignment/threat_vulnerability_classifier.py +198 -0
  30. skillanalyzer/core/analyzers/behavioral_analyzer.py +453 -0
  31. skillanalyzer/core/analyzers/cross_skill_analyzer.py +490 -0
  32. skillanalyzer/core/analyzers/llm_analyzer.py +440 -0
  33. skillanalyzer/core/analyzers/llm_prompt_builder.py +270 -0
  34. skillanalyzer/core/analyzers/llm_provider_config.py +215 -0
  35. skillanalyzer/core/analyzers/llm_request_handler.py +284 -0
  36. skillanalyzer/core/analyzers/llm_response_parser.py +81 -0
  37. skillanalyzer/core/analyzers/meta_analyzer.py +845 -0
  38. skillanalyzer/core/analyzers/static.py +1105 -0
  39. skillanalyzer/core/analyzers/trigger_analyzer.py +341 -0
  40. skillanalyzer/core/analyzers/virustotal_analyzer.py +463 -0
  41. skillanalyzer/core/exceptions.py +77 -0
  42. skillanalyzer/core/loader.py +377 -0
  43. skillanalyzer/core/models.py +300 -0
  44. skillanalyzer/core/reporters/__init__.py +26 -0
  45. skillanalyzer/core/reporters/json_reporter.py +65 -0
  46. skillanalyzer/core/reporters/markdown_reporter.py +209 -0
  47. skillanalyzer/core/reporters/sarif_reporter.py +246 -0
  48. skillanalyzer/core/reporters/table_reporter.py +195 -0
  49. skillanalyzer/core/rules/__init__.py +19 -0
  50. skillanalyzer/core/rules/patterns.py +165 -0
  51. skillanalyzer/core/rules/yara_scanner.py +157 -0
  52. skillanalyzer/core/scanner.py +437 -0
  53. skillanalyzer/core/static_analysis/__init__.py +27 -0
  54. skillanalyzer/core/static_analysis/cfg/__init__.py +21 -0
  55. skillanalyzer/core/static_analysis/cfg/builder.py +439 -0
  56. skillanalyzer/core/static_analysis/context_extractor.py +742 -0
  57. skillanalyzer/core/static_analysis/dataflow/__init__.py +25 -0
  58. skillanalyzer/core/static_analysis/dataflow/forward_analysis.py +715 -0
  59. skillanalyzer/core/static_analysis/interprocedural/__init__.py +21 -0
  60. skillanalyzer/core/static_analysis/interprocedural/call_graph_analyzer.py +406 -0
  61. skillanalyzer/core/static_analysis/interprocedural/cross_file_analyzer.py +190 -0
  62. skillanalyzer/core/static_analysis/parser/__init__.py +21 -0
  63. skillanalyzer/core/static_analysis/parser/python_parser.py +380 -0
  64. skillanalyzer/core/static_analysis/semantic/__init__.py +28 -0
  65. skillanalyzer/core/static_analysis/semantic/name_resolver.py +206 -0
  66. skillanalyzer/core/static_analysis/semantic/type_analyzer.py +200 -0
  67. skillanalyzer/core/static_analysis/taint/__init__.py +21 -0
  68. skillanalyzer/core/static_analysis/taint/tracker.py +252 -0
  69. skillanalyzer/core/static_analysis/types/__init__.py +36 -0
  70. skillanalyzer/data/__init__.py +30 -0
  71. skillanalyzer/data/prompts/boilerplate_protection_rule_prompt.md +26 -0
  72. skillanalyzer/data/prompts/code_alignment_threat_analysis_prompt.md +901 -0
  73. skillanalyzer/data/prompts/llm_response_schema.json +71 -0
  74. skillanalyzer/data/prompts/skill_meta_analysis_prompt.md +303 -0
  75. skillanalyzer/data/prompts/skill_threat_analysis_prompt.md +263 -0
  76. skillanalyzer/data/prompts/unified_response_schema.md +97 -0
  77. skillanalyzer/data/rules/signatures.yaml +440 -0
  78. skillanalyzer/data/yara_rules/autonomy_abuse.yara +66 -0
  79. skillanalyzer/data/yara_rules/code_execution.yara +61 -0
  80. skillanalyzer/data/yara_rules/coercive_injection.yara +115 -0
  81. skillanalyzer/data/yara_rules/command_injection.yara +54 -0
  82. skillanalyzer/data/yara_rules/credential_harvesting.yara +115 -0
  83. skillanalyzer/data/yara_rules/prompt_injection.yara +71 -0
  84. skillanalyzer/data/yara_rules/script_injection.yara +83 -0
  85. skillanalyzer/data/yara_rules/skill_discovery_abuse.yara +57 -0
  86. skillanalyzer/data/yara_rules/sql_injection.yara +73 -0
  87. skillanalyzer/data/yara_rules/system_manipulation.yara +65 -0
  88. skillanalyzer/data/yara_rules/tool_chaining_abuse.yara +60 -0
  89. skillanalyzer/data/yara_rules/transitive_trust_abuse.yara +73 -0
  90. skillanalyzer/data/yara_rules/unicode_steganography.yara +65 -0
  91. skillanalyzer/hooks/__init__.py +21 -0
  92. skillanalyzer/hooks/pre_commit.py +450 -0
  93. skillanalyzer/threats/__init__.py +25 -0
  94. skillanalyzer/threats/threats.py +480 -0
  95. skillanalyzer/utils/__init__.py +28 -0
  96. skillanalyzer/utils/command_utils.py +129 -0
  97. skillanalyzer/utils/di_container.py +154 -0
  98. skillanalyzer/utils/file_utils.py +86 -0
  99. skillanalyzer/utils/logging_config.py +96 -0
  100. skillanalyzer/utils/logging_utils.py +71 -0
@@ -0,0 +1,341 @@
+ # Copyright 2026 Cisco Systems, Inc.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ #     http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ #
+ # SPDX-License-Identifier: Apache-2.0
+
+ """
+ Trigger analyzer for detecting overly generic skill descriptions.
+
+ Claude uses skill descriptions to decide when to activate a skill.
+ Overly generic descriptions can cause trigger hijacking where a skill
+ activates for unrelated user requests.
+ """
+
+ import re
+
+ from ..models import Finding, Severity, Skill, ThreatCategory
+ from .base import BaseAnalyzer
+
+
+ class TriggerAnalyzer(BaseAnalyzer):
+     """Analyzes skill descriptions for trigger specificity issues."""
+
+     # Generic patterns that are too broad for skill descriptions
+     # Only match truly generic descriptions that could hijack any query
+     # "Toolkit for X" is specific if X is specific, so we don't flag it
+     GENERIC_PATTERNS = [
+         r"^help\s*(me|you|with\s+anything)?\s*$",  # Just "help" or "help me"
+         r"^(a|an|the)?\s*assistant\s*$",  # Just "assistant" with no context
+         r"^(a|an|the)?\s*helper\s*$",  # Just "helper" with no context
+         r"^(I |this )?(can |will )?do\s+(anything|everything)\s*(for you)?\.?$",
+         r"^general\s+purpose\s+(assistant|tool|skill)\s*$",
+         r"^universal\s+(assistant|tool|skill)\s*$",
+         r"^default\s+(assistant|tool|skill)\s*$",
+         r"^use\s+(this|me)\s+for\s+(everything|anything)\s*$",
+     ]
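+     # Illustrative (editor's note, not part of the packaged rules): "help me"
+     # and "general purpose assistant" match the patterns above, while
+     # "Convert CSV files to JSON" matches none of them.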
+
+     # Vague/generic words that shouldn't dominate a description
+     GENERIC_WORDS = {
+         "help",
+         "helper",
+         "helps",
+         "helping",
+         "assist",
+         "assistant",
+         "assists",
+         "assisting",
+         "do",
+         "does",
+         "doing",
+         "thing",
+         "things",
+         "stuff",
+         "general",
+         "generic",
+         "universal",
+         "any",
+         "anything",
+         "everything",
+         "something",
+         "all",
+         "various",
+         "multiple",
+         "many",
+         "useful",
+         "handy",
+         "convenient",
+         "tool",
+         "utility",
+     }
+
+     # Words that indicate specificity (good)
+     SPECIFIC_INDICATORS = {
+         # Actions
+         "convert",
+         "parse",
+         "format",
+         "validate",
+         "generate",
+         "analyze",
+         "create",
+         "build",
+         "compile",
+         "transform",
+         "extract",
+         "process",
+         "calculate",
+         "compute",
+         "summarize",
+         "translate",
+         "encode",
+         "decode",
+         # Domains
+         "json",
+         "yaml",
+         "xml",
+         "csv",
+         "markdown",
+         "html",
+         "css",
+         "sql",
+         "python",
+         "javascript",
+         "typescript",
+         "rust",
+         "go",
+         "java",
+         "api",
+         "database",
+         "file",
+         "image",
+         "pdf",
+         "document",
+         "git",
+         "docker",
+         "kubernetes",
+         "aws",
+         "azure",
+         "gcp",
+         # Specific nouns
+         "code",
+         "test",
+         "documentation",
+         "report",
+         "log",
+         "config",
+         "user",
+         "data",
+         "request",
+         "response",
+         "error",
+         "exception",
+     }
+
+     def __init__(self):
+         """Initialize trigger analyzer."""
+         super().__init__("trigger_analyzer")
+         self._compiled_patterns = [re.compile(p, re.IGNORECASE) for p in self.GENERIC_PATTERNS]
+
+     def analyze(self, skill: Skill) -> list[Finding]:
+         """
+         Analyze skill for trigger specificity issues.
+
+         Args:
+             skill: Skill to analyze
+
+         Returns:
+             List of findings related to trigger issues
+         """
+         findings = []
+
+         # Check for generic patterns in description
+         findings.extend(self._check_generic_patterns(skill))
+
+         # Check description word count and specificity
+         findings.extend(self._check_description_specificity(skill))
+
+         # Check for keyword baiting (SEO-style stuffing)
+         findings.extend(self._check_keyword_baiting(skill))
+
+         return findings
+
+     def _check_generic_patterns(self, skill: Skill) -> list[Finding]:
+         """Check if description matches known generic patterns."""
+         findings = []
+         description = skill.description.strip()
+
+         for pattern in self._compiled_patterns:
+             if pattern.match(description):
+                 findings.append(
+                     Finding(
+                         id=f"TRIGGER_GENERIC_{hash(description) & 0xFFFFFFFF:08x}",
+                         rule_id="TRIGGER_OVERLY_GENERIC",
+                         category=ThreatCategory.SOCIAL_ENGINEERING,
+                         severity=Severity.MEDIUM,
+                         title="Skill description is overly generic",
+                         description=(
+                             f"Description '{description[:50]}...' matches a generic pattern. "
+                             f"This may cause the skill to trigger for unrelated user requests, "
+                             f"potentially hijacking conversations."
+                         ),
+                         file_path="SKILL.md",
+                         remediation=(
+                             "Make the description more specific by describing exactly what the skill does, "
+                             "what inputs it accepts, and what outputs it produces."
+                         ),
+                         analyzer="trigger",
+                     )
+                 )
+                 break  # One finding per skill is enough
+
+         return findings
+
+     def _check_description_specificity(self, skill: Skill) -> list[Finding]:
+         """Check if description has sufficient specificity."""
+         findings = []
+         description = skill.description.strip()
+
+         # Tokenize description
+         words = re.findall(r"\b[a-zA-Z]+\b", description.lower())
+
+         # Check word count
+         if len(words) < 5:
+             findings.append(
+                 Finding(
+                     id=f"TRIGGER_SHORT_{hash(description) & 0xFFFFFFFF:08x}",
+                     rule_id="TRIGGER_DESCRIPTION_TOO_SHORT",
+                     category=ThreatCategory.SOCIAL_ENGINEERING,
+                     severity=Severity.LOW,
+                     title="Skill description is too short",
+                     description=(
+                         f"Description has only {len(words)} words. "
+                         f"Short descriptions may not provide enough context for Claude to determine "
+                         f"when this skill should be used."
+                     ),
+                     file_path="SKILL.md",
+                     remediation=(
+                         "Expand the description to at least 10-20 words explaining the skill's "
+                         "purpose, capabilities, and appropriate use cases."
+                     ),
+                     analyzer="trigger",
+                 )
+             )
+             return findings  # Don't check further for very short descriptions
+
+         # Calculate specificity ratio
+         generic_count = sum(1 for w in words if w in self.GENERIC_WORDS)
+         specific_count = sum(1 for w in words if w in self.SPECIFIC_INDICATORS)
+
+         generic_ratio = generic_count / len(words) if words else 0
+
+         # If more than 40% of words are generic, flag it
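+         # Illustrative (editor's note): for "helps with various things and
+         # stuff", 4 of the 6 words are in GENERIC_WORDS (~67%) and none are
+         # specific indicators, so the description is flagged.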
+         if generic_ratio > 0.4 and specific_count < 2:
+             findings.append(
+                 Finding(
+                     id=f"TRIGGER_VAGUE_{hash(description) & 0xFFFFFFFF:08x}",
+                     rule_id="TRIGGER_VAGUE_DESCRIPTION",
+                     category=ThreatCategory.SOCIAL_ENGINEERING,
+                     severity=Severity.LOW,
+                     title="Skill description lacks specificity",
+                     description=(
+                         f"Description contains {generic_count} generic words ({generic_ratio:.0%}) "
+                         f"and only {specific_count} specific indicators. "
+                         f"This may cause imprecise skill matching."
+                     ),
+                     file_path="SKILL.md",
+                     remediation=(
+                         "Replace generic terms with specific technical terms that describe "
+                         "exactly what file types, technologies, or operations this skill handles."
+                     ),
+                     analyzer="trigger",
+                 )
+             )
+
+         return findings
+
+     def _check_keyword_baiting(self, skill: Skill) -> list[Finding]:
+         """Check for keyword stuffing / SEO-style baiting."""
+         findings = []
+         description = skill.description.strip()
+
+         # Look for comma-separated lists of 8+ keywords (not just 5)
+         # Also require the list to be at the START of description (SEO style)
+         # or contain repeated/similar words
+         keyword_lists = re.findall(r"[a-zA-Z]+(?:\s*,\s*[a-zA-Z]+){7,}", description)
+
+         # Only flag if the list is suspiciously long AND at the start
+         # OR contains repetitive patterns
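+         # Illustrative (editor's note): a description opening with
+         # "json, yaml, xml, csv, html, css, sql, pdf, git" (eight or more
+         # comma-separated terms at the very start) would be treated as a
+         # baiting candidate by the checks below.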
+         if keyword_lists:
+             # Check if this is a legitimate "examples include" list
+             context_before = description[: description.find(keyword_lists[0])].lower()
+             if "example" in context_before or "such as" in context_before or "including" in context_before:
+                 # This is likely a legitimate examples list, not keyword baiting
+                 return findings
+
+             # Check for repetitive words in the list
+             words = [w.strip().lower() for w in keyword_lists[0].split(",")]
+             unique_ratio = len(set(words)) / len(words) if words else 1
+
+             # Only flag if many repeated words (ratio < 0.7) or list is at very start
+             if unique_ratio < 0.7 or description.strip().startswith(keyword_lists[0][:20]):
+                 findings.append(
+                     Finding(
+                         id=f"TRIGGER_KEYWORD_BAIT_{hash(description) & 0xFFFFFFFF:08x}",
+                         rule_id="TRIGGER_KEYWORD_BAITING",
+                         category=ThreatCategory.SOCIAL_ENGINEERING,
+                         severity=Severity.MEDIUM,
+                         title="Skill description may contain keyword baiting",
+                         description=(
+                             "Description contains suspiciously long keyword list "
+                             "that may be an attempt to trigger the skill for many unrelated queries."
+                         ),
+                         file_path="SKILL.md",
+                         remediation=(
+                             "Replace keyword lists with natural language sentences that describe "
+                             "the skill's actual capabilities."
+                         ),
+                         analyzer="trigger",
+                     )
+                 )
+
+         return findings
+
+     def get_specificity_score(self, description: str) -> float:
+         """
+         Calculate a specificity score for a description.
+
+         Args:
+             description: The skill description text
+
+         Returns:
+             Score from 0.0 (very generic) to 1.0 (very specific)
+         """
+         words = re.findall(r"\b[a-zA-Z]+\b", description.lower())
+         if not words:
+             return 0.0
+
+         generic_count = sum(1 for w in words if w in self.GENERIC_WORDS)
+         specific_count = sum(1 for w in words if w in self.SPECIFIC_INDICATORS)
+
+         # Base score from word count (more words = more specific, up to a point)
+         word_score = min(len(words) / 20, 1.0)
+
+         # Penalty for generic words
+         generic_penalty = generic_count / len(words) if words else 0
+
+         # Bonus for specific words
+         specific_bonus = min(specific_count / 5, 0.5)
+
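+         # Illustrative (editor's note): "Convert CSV files to JSON" gives
+         # word_score 0.25, generic_penalty 0.0, and specific_bonus 0.5,
+         # for a final score of 0.75.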
+         score = word_score - generic_penalty + specific_bonus
+         return max(0.0, min(1.0, score))
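
A minimal usage sketch (an editor's illustration, not part of the packaged file): it assumes the import path implied by the file listing above and that BaseAnalyzer needs no setup beyond the analyzer name passed in __init__; the example descriptions are hypothetical.

    from skillanalyzer.core.analyzers.trigger_analyzer import TriggerAnalyzer

    analyzer = TriggerAnalyzer()

    # get_specificity_score() takes raw description text and returns a value
    # between 0.0 (very generic) and 1.0 (very specific).
    print(analyzer.get_specificity_score("help me"))                    # clamps to 0.0
    print(analyzer.get_specificity_score("Convert CSV files to JSON"))  # 0.75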