npm - @vigolium/piolium - Versions diffs - 0.0.1 - Mend

@vigolium/piolium 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (271) hide show

package/LICENSE +21 -0
package/README.md +117 -0
package/agents/access-auditor.md +300 -0
package/agents/assumption-breaker.md +154 -0
package/agents/attack-designer.md +116 -0
package/agents/code-scanner.md +139 -0
package/agents/concurrency-auditor.md +238 -0
package/agents/confirm-writer.md +257 -0
package/agents/context-reviewer.md +274 -0
package/agents/cross-verifier.md +165 -0
package/agents/cve-scout.md +381 -0
package/agents/env-builder.md +282 -0
package/agents/env-profiler.md +205 -0
package/agents/evidence-collector.md +140 -0
package/agents/finding-grader.md +142 -0
package/agents/finding-writer.md +148 -0
package/agents/flow-tracer.md +106 -0
package/agents/goal-backtracer.md +146 -0
package/agents/history-miner.md +467 -0
package/agents/independent-verifier.md +118 -0
package/agents/intent-mapper.md +183 -0
package/agents/longshot-collector.md +128 -0
package/agents/longshot-prober.md +126 -0
package/agents/patch-auditor.md +73 -0
package/agents/poc-author.md +124 -0
package/agents/poc-runner.md +194 -0
package/agents/probe-lead.md +269 -0
package/agents/red-challenger.md +101 -0
package/agents/report-composer.md +208 -0
package/agents/review-adjudicator.md +216 -0
package/agents/spec-auditor.md +155 -0
package/agents/taint-tracer.md +265 -0
package/agents/test-locator.md +209 -0
package/agents/threat-modeler.md +132 -0
package/agents/variant-scanner.md +108 -0
package/agents/variant-spotter.md +110 -0
package/bin/piolium.mjs +376 -0
package/extensions/piolium/_vendor/yaml.bundle.d.mts +6 -0
package/extensions/piolium/_vendor/yaml.bundle.mjs +139 -0
package/extensions/piolium/agent-runner.ts +322 -0
package/extensions/piolium/agents.ts +266 -0
package/extensions/piolium/audit-state.ts +522 -0
package/extensions/piolium/bundled-resources.ts +97 -0
package/extensions/piolium/candidate-scan.ts +966 -0
package/extensions/piolium/command-target.ts +177 -0
package/extensions/piolium/console-stream.ts +57 -0
package/extensions/piolium/export-results.ts +380 -0
package/extensions/piolium/findings.ts +448 -0
package/extensions/piolium/heartbeat.ts +182 -0
package/extensions/piolium/help.ts +234 -0
package/extensions/piolium/index.ts +1865 -0
package/extensions/piolium/longshot.ts +530 -0
package/extensions/piolium/matcher-suggestions.ts +196 -0
package/extensions/piolium/matcher-utils.ts +83 -0
package/extensions/piolium/modes/balanced.ts +750 -0
package/extensions/piolium/modes/confirm-bootstrap.ts +186 -0
package/extensions/piolium/modes/confirm.ts +697 -0
package/extensions/piolium/modes/deep.ts +917 -0
package/extensions/piolium/modes/diff.ts +177 -0
package/extensions/piolium/modes/lite.ts +540 -0
package/extensions/piolium/modes/longshot.ts +595 -0
package/extensions/piolium/modes/merge.ts +204 -0
package/extensions/piolium/modes/phase-runner.ts +267 -0
package/extensions/piolium/modes/reinvest.ts +546 -0
package/extensions/piolium/modes/revisit.ts +279 -0
package/extensions/piolium/modes.ts +48 -0
package/extensions/piolium/phase-labels.ts +123 -0
package/extensions/piolium/phase-status-strip.ts +92 -0
package/extensions/piolium/prompt-prefix-editor.ts +39 -0
package/extensions/piolium/providers/anthropic-vertex.ts +836 -0
package/extensions/piolium/recon.ts +409 -0
package/extensions/piolium/result-stats.ts +105 -0
package/extensions/piolium/retry.ts +120 -0
package/extensions/piolium/scheduler.ts +212 -0
package/extensions/piolium/secrets.ts +368 -0
package/extensions/piolium/tools/web-tools.ts +148 -0
package/package.json +77 -0
package/skills/agentic-actions-auditor/SKILL.md +327 -0
package/skills/agentic-actions-auditor/references/action-profiles.md +186 -0
package/skills/agentic-actions-auditor/references/cross-file-resolution.md +209 -0
package/skills/agentic-actions-auditor/references/foundations.md +94 -0
package/skills/agentic-actions-auditor/references/vector-a-env-var-intermediary.md +77 -0
package/skills/agentic-actions-auditor/references/vector-b-direct-expression-injection.md +83 -0
package/skills/agentic-actions-auditor/references/vector-c-cli-data-fetch.md +83 -0
package/skills/agentic-actions-auditor/references/vector-d-pr-target-checkout.md +88 -0
package/skills/agentic-actions-auditor/references/vector-e-error-log-injection.md +88 -0
package/skills/agentic-actions-auditor/references/vector-f-subshell-expansion.md +82 -0
package/skills/agentic-actions-auditor/references/vector-g-eval-of-ai-output.md +91 -0
package/skills/agentic-actions-auditor/references/vector-h-dangerous-sandbox-configs.md +102 -0
package/skills/agentic-actions-auditor/references/vector-i-wildcard-allowlists.md +88 -0
package/skills/audit/SKILL.md +562 -0
package/skills/audit/assets/icon.svg +7 -0
package/skills/audit/hooks/scripts/validate_phase_output.py +550 -0
package/skills/audit/references/adversarial-review.md +148 -0
package/skills/audit/references/architecture-aware-sast.md +306 -0
package/skills/audit/references/audit-workflow.md +737 -0
package/skills/audit/references/chamber-protocol.md +384 -0
package/skills/audit/references/creative-attack-modes.md +221 -0
package/skills/audit/references/deep-analysis.md +273 -0
package/skills/audit/references/domain-attack-playbooks.md +1129 -0
package/skills/audit/references/knowledge-base-template.md +513 -0
package/skills/audit/references/real-env-validation.md +191 -0
package/skills/audit/references/report-templates.md +417 -0
package/skills/audit/references/triage-and-prereqs.md +134 -0
package/skills/audit/scripts/consolidate_drafts.py +554 -0
package/skills/audit/scripts/partition_findings.py +152 -0
package/skills/audit/scripts/rg-hotspots.sh +121 -0
package/skills/audit/scripts/stamp_file_state.py +349 -0
package/skills/code-reviewer/SKILL.md +65 -0
package/skills/codeql/SKILL.md +281 -0
package/skills/codeql/references/build-fixes.md +90 -0
package/skills/codeql/references/diagnostic-query-templates.md +339 -0
package/skills/codeql/references/extension-yaml-format.md +209 -0
package/skills/codeql/references/important-only-suite.md +153 -0
package/skills/codeql/references/language-details.md +207 -0
package/skills/codeql/references/macos-arm64e-workaround.md +179 -0
package/skills/codeql/references/performance-tuning.md +111 -0
package/skills/codeql/references/quality-assessment.md +172 -0
package/skills/codeql/references/ruleset-catalog.md +63 -0
package/skills/codeql/references/run-all-suite.md +92 -0
package/skills/codeql/references/sarif-processing.md +79 -0
package/skills/codeql/references/threat-models.md +51 -0
package/skills/codeql/workflows/build-database.md +280 -0
package/skills/codeql/workflows/create-data-extensions.md +261 -0
package/skills/codeql/workflows/run-analysis.md +301 -0
package/skills/differential-review/SKILL.md +220 -0
package/skills/differential-review/adversarial.md +203 -0
package/skills/differential-review/methodology.md +234 -0
package/skills/differential-review/patterns.md +300 -0
package/skills/differential-review/reporting.md +369 -0
package/skills/fp-check/SKILL.md +125 -0
package/skills/fp-check/references/bug-class-verification.md +114 -0
package/skills/fp-check/references/deep-verification.md +143 -0
package/skills/fp-check/references/evidence-templates.md +91 -0
package/skills/fp-check/references/false-positive-patterns.md +115 -0
package/skills/fp-check/references/gate-reviews.md +27 -0
package/skills/fp-check/references/standard-verification.md +78 -0
package/skills/insecure-defaults/SKILL.md +117 -0
package/skills/insecure-defaults/references/examples.md +409 -0
package/skills/last30days/SKILL.md +444 -0
package/skills/sarif-parsing/SKILL.md +483 -0
package/skills/sarif-parsing/resources/jq-queries.md +162 -0
package/skills/sarif-parsing/resources/sarif_helpers.py +331 -0
package/skills/security-threat-model/LICENSE.txt +201 -0
package/skills/security-threat-model/SKILL.md +81 -0
package/skills/security-threat-model/agents/openai.yaml +4 -0
package/skills/security-threat-model/references/prompt-template.md +255 -0
package/skills/security-threat-model/references/security-controls-and-assets.md +32 -0
package/skills/semgrep/SKILL.md +212 -0
package/skills/semgrep/references/rulesets.md +162 -0
package/skills/semgrep/references/scan-modes.md +110 -0
package/skills/semgrep/references/scanner-task-prompt.md +140 -0
package/skills/semgrep/scripts/merge_sarif.py +203 -0
package/skills/semgrep/workflows/scan-workflow.md +311 -0
package/skills/semgrep-rule-creator/SKILL.md +168 -0
package/skills/semgrep-rule-creator/references/quick-reference.md +202 -0
package/skills/semgrep-rule-creator/references/workflow.md +240 -0
package/skills/semgrep-rule-variant-creator/SKILL.md +205 -0
package/skills/semgrep-rule-variant-creator/references/applicability-analysis.md +250 -0
package/skills/semgrep-rule-variant-creator/references/language-syntax-guide.md +324 -0
package/skills/semgrep-rule-variant-creator/references/workflow.md +518 -0
package/skills/sharp-edges/SKILL.md +292 -0
package/skills/sharp-edges/references/auth-patterns.md +252 -0
package/skills/sharp-edges/references/case-studies.md +274 -0
package/skills/sharp-edges/references/config-patterns.md +333 -0
package/skills/sharp-edges/references/crypto-apis.md +190 -0
package/skills/sharp-edges/references/lang-c.md +205 -0
package/skills/sharp-edges/references/lang-csharp.md +285 -0
package/skills/sharp-edges/references/lang-go.md +270 -0
package/skills/sharp-edges/references/lang-java.md +263 -0
package/skills/sharp-edges/references/lang-javascript.md +269 -0
package/skills/sharp-edges/references/lang-kotlin.md +265 -0
package/skills/sharp-edges/references/lang-php.md +245 -0
package/skills/sharp-edges/references/lang-python.md +274 -0
package/skills/sharp-edges/references/lang-ruby.md +273 -0
package/skills/sharp-edges/references/lang-rust.md +272 -0
package/skills/sharp-edges/references/lang-swift.md +287 -0
package/skills/sharp-edges/references/language-specific.md +588 -0
package/skills/spec-to-code-compliance/SKILL.md +357 -0
package/skills/spec-to-code-compliance/resources/COMPLETENESS_CHECKLIST.md +69 -0
package/skills/spec-to-code-compliance/resources/IR_EXAMPLES.md +417 -0
package/skills/spec-to-code-compliance/resources/OUTPUT_REQUIREMENTS.md +105 -0
package/skills/supply-chain-risk-auditor/SKILL.md +67 -0
package/skills/supply-chain-risk-auditor/resources/results-template.md +41 -0
package/skills/variant-analysis/METHODOLOGY.md +327 -0
package/skills/variant-analysis/SKILL.md +142 -0
package/skills/variant-analysis/resources/codeql/cpp.ql +119 -0
package/skills/variant-analysis/resources/codeql/go.ql +69 -0
package/skills/variant-analysis/resources/codeql/java.ql +71 -0
package/skills/variant-analysis/resources/codeql/javascript.ql +63 -0
package/skills/variant-analysis/resources/codeql/python.ql +80 -0
package/skills/variant-analysis/resources/semgrep/cpp.yaml +98 -0
package/skills/variant-analysis/resources/semgrep/go.yaml +63 -0
package/skills/variant-analysis/resources/semgrep/java.yaml +61 -0
package/skills/variant-analysis/resources/semgrep/javascript.yaml +60 -0
package/skills/variant-analysis/resources/semgrep/python.yaml +72 -0
package/skills/variant-analysis/resources/variant-report-template.md +75 -0
package/skills/vuln-report/SKILL.md +137 -0
package/skills/vuln-report/agents/openai.yaml +4 -0
package/skills/vuln-report/references/report-template.md +135 -0
package/skills/wooyun-legacy/SKILL.md +367 -0
package/skills/wooyun-legacy/references/bank-penetration.md +222 -0
package/skills/wooyun-legacy/references/checklists/command-execution-checklist.md +119 -0
package/skills/wooyun-legacy/references/checklists/csrf-checklist.md +74 -0
package/skills/wooyun-legacy/references/checklists/file-upload-checklist.md +108 -0
package/skills/wooyun-legacy/references/checklists/info-disclosure-checklist.md +114 -0
package/skills/wooyun-legacy/references/checklists/logic-flaws-checklist.md +95 -0
package/skills/wooyun-legacy/references/checklists/misconfig-checklist.md +124 -0
package/skills/wooyun-legacy/references/checklists/path-traversal-checklist.md +87 -0
package/skills/wooyun-legacy/references/checklists/rce-checklist.md +93 -0
package/skills/wooyun-legacy/references/checklists/sql-injection-checklist.md +97 -0
package/skills/wooyun-legacy/references/checklists/ssrf-checklist.md +99 -0
package/skills/wooyun-legacy/references/checklists/unauthorized-access-checklist.md +89 -0
package/skills/wooyun-legacy/references/checklists/weak-password-checklist.md +115 -0
package/skills/wooyun-legacy/references/checklists/xss-checklist.md +103 -0
package/skills/wooyun-legacy/references/checklists/xxe-checklist.md +130 -0
package/skills/wooyun-legacy/references/info-disclosure.md +975 -0
package/skills/wooyun-legacy/references/logic-flaws.md +721 -0
package/skills/wooyun-legacy/references/path-traversal.md +1191 -0
package/skills/wooyun-legacy/references/telecom-penetration.md +156 -0
package/skills/wooyun-legacy/references/unauthorized-access.md +980 -0
package/skills/wooyun-legacy/references/xss.md +746 -0
package/skills/zeroize-audit/SKILL.md +371 -0
package/skills/zeroize-audit/configs/c.yaml +21 -0
package/skills/zeroize-audit/configs/default.yaml +128 -0
package/skills/zeroize-audit/configs/rust.yaml +83 -0
package/skills/zeroize-audit/prompts/report_template.md +238 -0
package/skills/zeroize-audit/prompts/system.md +163 -0
package/skills/zeroize-audit/prompts/task.md +97 -0
package/skills/zeroize-audit/references/compile-commands.md +231 -0
package/skills/zeroize-audit/references/detection-strategy.md +191 -0
package/skills/zeroize-audit/references/ir-analysis.md +252 -0
package/skills/zeroize-audit/references/mcp-analysis.md +221 -0
package/skills/zeroize-audit/references/poc-generation.md +470 -0
package/skills/zeroize-audit/references/rust-zeroization-patterns.md +867 -0
package/skills/zeroize-audit/schemas/input.json +83 -0
package/skills/zeroize-audit/schemas/output.json +140 -0
package/skills/zeroize-audit/tools/analyze_asm.sh +202 -0
package/skills/zeroize-audit/tools/analyze_cfg.py +381 -0
package/skills/zeroize-audit/tools/analyze_heap.sh +211 -0
package/skills/zeroize-audit/tools/analyze_ir_semantic.py +429 -0
package/skills/zeroize-audit/tools/diff_ir.sh +135 -0
package/skills/zeroize-audit/tools/diff_rust_mir.sh +189 -0
package/skills/zeroize-audit/tools/emit_asm.sh +67 -0
package/skills/zeroize-audit/tools/emit_ir.sh +77 -0
package/skills/zeroize-audit/tools/emit_rust_asm.sh +178 -0
package/skills/zeroize-audit/tools/emit_rust_ir.sh +150 -0
package/skills/zeroize-audit/tools/emit_rust_mir.sh +158 -0
package/skills/zeroize-audit/tools/extract_compile_flags.py +284 -0
package/skills/zeroize-audit/tools/generate_poc.py +1329 -0
package/skills/zeroize-audit/tools/mcp/apply_confidence_gates.py +113 -0
package/skills/zeroize-audit/tools/mcp/check_mcp.sh +68 -0
package/skills/zeroize-audit/tools/mcp/normalize_mcp_evidence.py +125 -0
package/skills/zeroize-audit/tools/scripts/check_llvm_patterns.py +481 -0
package/skills/zeroize-audit/tools/scripts/check_mir_patterns.py +554 -0
package/skills/zeroize-audit/tools/scripts/check_rust_asm.py +424 -0
package/skills/zeroize-audit/tools/scripts/check_rust_asm_aarch64.py +300 -0
package/skills/zeroize-audit/tools/scripts/check_rust_asm_x86.py +283 -0
package/skills/zeroize-audit/tools/scripts/find_dangerous_apis.py +375 -0
package/skills/zeroize-audit/tools/scripts/semantic_audit.py +923 -0
package/skills/zeroize-audit/tools/track_dataflow.sh +196 -0
package/skills/zeroize-audit/tools/validate_rust_toolchain.sh +298 -0
package/skills/zeroize-audit/workflows/phase-0-preflight.md +150 -0
package/skills/zeroize-audit/workflows/phase-1-source-analysis.md +144 -0
package/skills/zeroize-audit/workflows/phase-2-compiler-analysis.md +139 -0
package/skills/zeroize-audit/workflows/phase-3-interim-report.md +46 -0
package/skills/zeroize-audit/workflows/phase-4-poc-generation.md +46 -0
package/skills/zeroize-audit/workflows/phase-5-poc-validation.md +136 -0
package/skills/zeroize-audit/workflows/phase-6-final-report.md +44 -0
package/skills/zeroize-audit/workflows/phase-7-test-generation.md +42 -0
package/themes/piolium-srcery.json +94 -0

package/skills/sarif-parsing/SKILL.md ADDED Viewed

@@ -0,0 +1,483 @@
+---
+name: sarif-parsing
+description: >-
+  Parses and processes SARIF files from static analysis tools like CodeQL, Semgrep, or other
+  scanners. Triggers on "parse sarif", "read scan results", "aggregate findings", "deduplicate
+  alerts", or "process sarif output". Handles filtering, deduplication, format conversion, and
+  CI/CD integration of SARIF data. Does NOT run scans — use the Semgrep or CodeQL skills for that.
+allowed-tools:
+  - Bash
+  - Read
+  - Glob
+  - Grep
+---
+# SARIF Parsing Best Practices
+You are a SARIF parsing expert. Your role is to help users effectively read, analyze, and process SARIF files from static analysis tools.
+## When to Use
+Use this skill when:
+- Reading or interpreting static analysis scan results in SARIF format
+- Aggregating findings from multiple security tools
+- Deduplicating or filtering security alerts
+- Extracting specific vulnerabilities from SARIF files
+- Integrating SARIF data into CI/CD pipelines
+- Converting SARIF output to other formats
+## When NOT to Use
+Do NOT use this skill for:
+- Running static analysis scans (use CodeQL or Semgrep skills instead)
+- Writing CodeQL or Semgrep rules (use their respective skills)
+- Analyzing source code directly (SARIF is for processing existing scan results)
+- Triaging findings without SARIF input (use variant-analysis or audit skills)
+## SARIF Structure Overview
+SARIF 2.1.0 is the current OASIS standard. Every SARIF file has this hierarchical structure:
+```
+sarifLog
+├── version: "2.1.0"
+├── $schema: (optional, enables IDE validation)
+└── runs[] (array of analysis runs)
+    ├── tool
+    │   ├── driver
+    │   │   ├── name (required)
+    │   │   ├── version
+    │   │   └── rules[] (rule definitions)
+    │   └── extensions[] (plugins)
+    ├── results[] (findings)
+    │   ├── ruleId
+    │   ├── level (error/warning/note)
+    │   ├── message.text
+    │   ├── locations[]
+    │   │   └── physicalLocation
+    │   │       ├── artifactLocation.uri
+    │   │       └── region (startLine, startColumn, etc.)
+    │   ├── fingerprints{}
+    │   └── partialFingerprints{}
+    └── artifacts[] (scanned files metadata)
+```
+### Why Fingerprinting Matters
+Without stable fingerprints, you can't track findings across runs:
+- **Baseline comparison**: "Is this a new finding or did we see it before?"
+- **Regression detection**: "Did this PR introduce new vulnerabilities?"
+- **Suppression**: "Ignore this known false positive in future runs"
+Tools report different paths (`/path/to/project/` vs `/github/workspace/`), so path-based matching fails. Fingerprints hash the *content* (code snippet, rule ID, relative location) to create stable identifiers regardless of environment.
+## Tool Selection Guide
+| Use Case | Tool | Installation |
+|----------|------|--------------|
+| Quick CLI queries | jq | `brew install jq` / `apt install jq` |
+| Python scripting (simple) | pysarif | `pip install pysarif` |
+| Python scripting (advanced) | sarif-tools | `pip install sarif-tools` |
+| .NET applications | SARIF SDK | NuGet package |
+| JavaScript/Node.js | sarif-js | npm package |
+| Go applications | garif | `go get github.com/chavacava/garif` |
+| Validation | SARIF Validator | sarifweb.azurewebsites.net |
+## Strategy 1: Quick Analysis with jq
+For rapid exploration and one-off queries:
+```bash
+# Pretty print the file
+jq '.' results.sarif
+# Count total findings
+jq '[.runs[].results[]] | length' results.sarif
+# List all rule IDs triggered
+jq '[.runs[].results[].ruleId] | unique' results.sarif
+# Extract errors only
+jq '.runs[].results[] | select(.level == "error")' results.sarif
+# Get findings with file locations
+jq '.runs[].results[] | {
+  rule: .ruleId,
+  message: .message.text,
+  file: .locations[0].physicalLocation.artifactLocation.uri,
+  line: .locations[0].physicalLocation.region.startLine
+}' results.sarif
+# Filter by severity and get count per rule
+jq '[.runs[].results[] | select(.level == "error")] | group_by(.ruleId) | map({rule: .[0].ruleId, count: length})' results.sarif
+# Extract findings for a specific file
+jq --arg file "src/auth.py" '.runs[].results[] | select(any(.locations[]?.physicalLocation.artifactLocation.uri // ""; contains($file)))' results.sarif
+```
+## Strategy 2: Python with pysarif
+For programmatic access with full object model:
+```python
+from pysarif import load_from_file, save_to_file
+# Load SARIF file
+sarif = load_from_file("results.sarif")
+# Iterate through runs and results
+for run in sarif.runs:
+    tool_name = run.tool.driver.name
+    print(f"Tool: {tool_name}")
+    for result in run.results:
+        print(f"  [{result.level}] {result.rule_id}: {result.message.text}")
+        if result.locations:
+            loc = result.locations[0].physical_location
+            if loc and loc.artifact_location:
+                print(f"    File: {loc.artifact_location.uri}")
+                if loc.region:
+                    print(f"    Line: {loc.region.start_line}")
+# Save modified SARIF
+save_to_file(sarif, "modified.sarif")
+```
+## Strategy 3: Python with sarif-tools
+For aggregation, reporting, and CI/CD integration:
+```python
+from sarif import loader
+# Load single file
+sarif_data = loader.load_sarif_file("results.sarif")
+# Or load multiple files
+sarif_set = loader.load_sarif_files(["tool1.sarif", "tool2.sarif"])
+# Get summary report
+report = sarif_data.get_report()
+# Get histogram by severity
+errors = report.get_issue_type_histogram_for_severity("error")
+warnings = report.get_issue_type_histogram_for_severity("warning")
+# Filter results
+high_severity = [r for r in sarif_data.get_results()
+                 if r.get("level") == "error"]
+```
+**sarif-tools CLI commands:**
+```bash
+# Summary of findings
+sarif summary results.sarif
+# List all results with details
+sarif ls results.sarif
+# Get results by severity
+sarif ls --level error results.sarif
+# Diff two SARIF files (find new/fixed issues)
+sarif diff baseline.sarif current.sarif
+# Convert to other formats
+sarif csv -o results.csv results.sarif
+sarif html -o report.html results.sarif
+```
+## Strategy 4: Aggregating Multiple SARIF Files
+When combining results from multiple tools:
+```python
+import json
+from pathlib import Path
+def aggregate_sarif_files(sarif_paths: list[str]) -> dict:
+    """Combine multiple SARIF files into one."""
+    aggregated = {
+        "version": "2.1.0",
+        "$schema": "https://json.schemastore.org/sarif-2.1.0.json",
+        "runs": []
+    }
+    for path in sarif_paths:
+        with open(path) as f:
+            sarif = json.load(f)
+            aggregated["runs"].extend(sarif.get("runs", []))
+    return aggregated
+def deduplicate_results(sarif: dict) -> dict:
+    """Remove duplicate findings based on fingerprints."""
+    seen_fingerprints = set()
+    for run in sarif["runs"]:
+        unique_results = []
+        for result in run.get("results", []):
+            # Use partialFingerprints or create key from location
+            fp = None
+            if result.get("partialFingerprints"):
+                fp = tuple(sorted(result["partialFingerprints"].items()))
+            elif result.get("fingerprints"):
+                fp = tuple(sorted(result["fingerprints"].items()))
+            else:
+                # Fallback: create fingerprint from rule + location
+                loc = (result.get("locations") or [{}])[0]  # tolerate missing or empty locations
+                phys = loc.get("physicalLocation", {})
+                fp = (
+                    result.get("ruleId"),
+                    phys.get("artifactLocation", {}).get("uri"),
+                    phys.get("region", {}).get("startLine")
+                )
+            if fp not in seen_fingerprints:
+                seen_fingerprints.add(fp)
+                unique_results.append(result)
+        run["results"] = unique_results
+    return sarif
+```
+## Strategy 5: Extracting Actionable Data
+```python
+import json
+from dataclasses import dataclass
+from typing import Optional
+@dataclass
+class Finding:
+    rule_id: str
+    level: str
+    message: str
+    file_path: Optional[str]
+    start_line: Optional[int]
+    end_line: Optional[int]
+    fingerprint: Optional[str]
+def extract_findings(sarif_path: str) -> list[Finding]:
+    """Extract structured findings from SARIF file."""
+    with open(sarif_path) as f:
+        sarif = json.load(f)
+    findings = []
+    for run in sarif.get("runs", []):
+        for result in run.get("results", []):
+            loc = (result.get("locations") or [{}])[0]  # tolerate missing or empty locations
+            phys = loc.get("physicalLocation", {})
+            region = phys.get("region", {})
+            findings.append(Finding(
+                rule_id=result.get("ruleId", "unknown"),
+                level=result.get("level", "warning"),
+                message=result.get("message", {}).get("text", ""),
+                file_path=phys.get("artifactLocation", {}).get("uri"),
+                start_line=region.get("startLine"),
+                end_line=region.get("endLine"),
+                fingerprint=next(iter(result.get("partialFingerprints", {}).values()), None)
+            ))
+    return findings
+# Filter and prioritize
+def prioritize_findings(findings: list[Finding]) -> list[Finding]:
+    """Sort findings by severity."""
+    severity_order = {"error": 0, "warning": 1, "note": 2, "none": 3}
+    return sorted(findings, key=lambda f: severity_order.get(f.level, 99))
+```
+## Common Pitfalls and Solutions
+### 1. Path Normalization Issues
+Different tools report paths differently (absolute, relative, URI-encoded):
+```python
+from urllib.parse import unquote
+from pathlib import Path
+def normalize_path(uri: str, base_path: str = "") -> str:
+    """Normalize SARIF artifact URI to consistent path."""
+    # Remove file:// prefix if present
+    if uri.startswith("file://"):
+        uri = uri[7:]
+    # URL decode
+    uri = unquote(uri)
+    # Handle relative paths
+    if not Path(uri).is_absolute() and base_path:
+        uri = str(Path(base_path) / uri)
+    # Normalize separators
+    return str(Path(uri))
+```
+### 2. Fingerprint Mismatch Across Runs
+Fingerprints may not match if:
+- File paths differ between environments
+- Tool versions changed fingerprinting algorithm
+- Code was reformatted (changing line numbers)
+**Solution:** Use multiple fingerprint strategies:
+```python
+def compute_stable_fingerprint(result: dict, file_content: str = None) -> str:
+    """Compute environment-independent fingerprint."""
+    import hashlib
+    components = [
+        result.get("ruleId", ""),
+        result.get("message", {}).get("text", "")[:100],  # First 100 chars
+    ]
+    # Add code snippet if available
+    if file_content and result.get("locations"):
+        region = result["locations"][0].get("physicalLocation", {}).get("region", {})
+        if region.get("startLine"):
+            lines = file_content.split("\n")
+            line_idx = region["startLine"] - 1
+            if 0 <= line_idx < len(lines):
+                # Normalize whitespace
+                components.append(lines[line_idx].strip())
+    # Join with a separator so ("ab", "c") and ("a", "bc") do not hash identically
+    return hashlib.sha256("\x00".join(components).encode()).hexdigest()[:16]
+```
+### 3. Missing or Incomplete Data
+SARIF allows many optional fields. Always use defensive access:
+```python
+def safe_get_location(result: dict) -> tuple[str, int]:
+    """Safely extract file and line from result."""
+    try:
+        loc = result.get("locations", [{}])[0]
+        phys = loc.get("physicalLocation", {})
+        file_path = phys.get("artifactLocation", {}).get("uri", "unknown")
+        line = phys.get("region", {}).get("startLine", 0)
+        return file_path, line
+    except (IndexError, KeyError, TypeError):
+        return "unknown", 0
+```
+### 4. Large File Performance
+For very large SARIF files (100MB+):
+```python
+import ijson  # pip install ijson
+def stream_results(sarif_path: str):
+    """Stream results without loading entire file."""
+    with open(sarif_path, "rb") as f:
+        # Stream through results arrays
+        for result in ijson.items(f, "runs.item.results.item"):
+            yield result
+```
+### 5. Schema Validation
+Validate before processing to catch malformed files:
+```bash
+# Using ajv-cli
+npm install -g ajv-cli
+ajv validate -s sarif-schema-2.1.0.json -d results.sarif
+# Using Python jsonschema
+pip install jsonschema
+```
+```python
+from jsonschema import validate, ValidationError
+import json
+def validate_sarif(sarif_path: str, schema_path: str) -> bool:
+    """Validate SARIF file against schema."""
+    with open(sarif_path) as f:
+        sarif = json.load(f)
+    with open(schema_path) as f:
+        schema = json.load(f)
+    try:
+        validate(sarif, schema)
+        return True
+    except ValidationError as e:
+        print(f"Validation error: {e.message}")
+        return False
+```
+## CI/CD Integration Patterns
+### GitHub Actions
+```yaml
+- name: Upload SARIF
+  uses: github/codeql-action/upload-sarif@v3
+  with:
+    sarif_file: results.sarif
+- name: Check for high severity
+  run: |
+    HIGH_COUNT=$(jq '[.runs[].results[] | select(.level == "error")] | length' results.sarif)
+    if [ "$HIGH_COUNT" -gt 0 ]; then
+      echo "Found $HIGH_COUNT high severity issues"
+      exit 1
+    fi
+```
+### Fail on New Issues
+```python
+from sarif import loader
+def check_for_regressions(baseline: str, current: str) -> int:
+    """Return count of new issues not in baseline."""
+    baseline_data = loader.load_sarif_file(baseline)
+    current_data = loader.load_sarif_file(current)
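+    # get_fingerprint is a placeholder: supply your own fingerprint function
+    # (for example, compute_stable_fingerprint from "Fingerprint Mismatch Across Runs")
+    baseline_fps = {get_fingerprint(r) for r in baseline_data.get_results()}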
+    new_issues = [r for r in current_data.get_results()
+                  if get_fingerprint(r) not in baseline_fps]
+    return len(new_issues)
+```
+## Key Principles
+1. **Validate first**: Check SARIF structure before processing
+2. **Handle optionals**: Many fields are optional; use defensive access
+3. **Normalize paths**: Tools report paths differently; normalize early
+4. **Fingerprint wisely**: Combine multiple strategies for stable deduplication
+5. **Stream large files**: Use ijson or similar for 100MB+ files
+6. **Aggregate thoughtfully**: Preserve tool metadata when combining files
+## Skill Resources
+For ready-to-use query templates, see [{baseDir}/resources/jq-queries.md]({baseDir}/resources/jq-queries.md):
+- 40+ jq queries for common SARIF operations
+- Severity filtering, rule extraction, aggregation patterns
+For Python utilities, see [{baseDir}/resources/sarif_helpers.py]({baseDir}/resources/sarif_helpers.py):
+- `normalize_path()` - Handle tool-specific path formats
+- `compute_fingerprint()` - Stable fingerprinting ignoring paths
+- `deduplicate_results()` - Remove duplicates across runs
+## Reference Links
+- [OASIS SARIF 2.1.0 Specification](https://docs.oasis-open.org/sarif/sarif/v2.1.0/sarif-v2.1.0.html)
+- [Microsoft SARIF Tutorials](https://github.com/microsoft/sarif-tutorials)
+- [SARIF SDK (.NET)](https://github.com/microsoft/sarif-sdk)
+- [sarif-tools (Python)](https://github.com/microsoft/sarif-tools)
+- [pysarif (Python)](https://github.com/Kjeld-P/pysarif)
+- [GitHub SARIF Support](https://docs.github.com/en/code-security/code-scanning/integrating-with-code-scanning/sarif-support-for-code-scanning)
+- [SARIF Validator](https://sarifweb.azurewebsites.net/)

package/skills/sarif-parsing/resources/jq-queries.md ADDED Viewed

@@ -0,0 +1,162 @@
+# SARIF jq Query Reference
+Ready-to-use jq queries for common SARIF parsing tasks.
+## Basic Exploration
+```bash
+# Pretty print
+jq '.' results.sarif
+# Get SARIF version
+jq '.version' results.sarif
+# List tool names from all runs
+jq '.runs[].tool.driver.name' results.sarif
+# Count runs
+jq '.runs | length' results.sarif
+```
+## Result Queries
+```bash
+# Total result count
+jq '[.runs[].results[]] | length' results.sarif
+# Count by severity level (results without an explicit level count as "warning", the SARIF default)
+jq 'reduce .runs[].results[] as $r ({}; .[$r.level // "warning"] += 1)' results.sarif
+# List unique rule IDs (unique already returns a sorted array)
+jq '[.runs[].results[].ruleId] | unique' results.sarif
+# Count per rule
+jq '[.runs[].results[]] | group_by(.ruleId) | map({rule: .[0].ruleId, count: length}) | sort_by(-.count)' results.sarif
+```
+## Filtering Results
+```bash
+# Only errors
+jq '.runs[].results[] | select(.level == "error")' results.sarif
+# Only warnings
+jq '.runs[].results[] | select(.level == "warning")' results.sarif
+# By specific rule ID
+jq --arg rule "SQL_INJECTION" '.runs[].results[] | select(.ruleId == $rule)' results.sarif
+# By file path (contains); each result is emitted once even if several locations match
+jq --arg file "auth" '.runs[].results[] | select(any(.locations[]?; (.physicalLocation.artifactLocation.uri // "") | contains($file)))' results.sarif
+# By file extension; each result is emitted once even if several locations match
+jq '.runs[].results[] | select(any(.locations[]?; (.physicalLocation.artifactLocation.uri // "") | test("\\.py$")))' results.sarif
+# Multiple conditions
+jq '.runs[].results[] | select(.level == "error" and (.ruleId | startswith("SEC")))' results.sarif
+```
+## Extracting Locations
+```bash
+# File and line for each result
+jq '.runs[].results[] | {
+  rule: .ruleId,
+  file: .locations[0].physicalLocation.artifactLocation.uri,
+  line: .locations[0].physicalLocation.region.startLine
+}' results.sarif
+# Unique affected files
+jq '[.runs[].results[].locations[].physicalLocation.artifactLocation.uri] | unique | sort' results.sarif
+# Results grouped by file
+jq '[.runs[].results[] | {file: .locations[0].physicalLocation.artifactLocation.uri, result: .}] | group_by(.file) | map({file: .[0].file, count: length})' results.sarif
+```
+## Rule Information
+```bash
+# List all rules with severity
+jq '.runs[].tool.driver.rules[] | {id: .id, name: .name, level: .defaultConfiguration.level}' results.sarif
+# Get rule description by ID
+jq --arg id "RULE001" '.runs[].tool.driver.rules[] | select(.id == $id)' results.sarif
+# Rules with help URLs
+jq '.runs[].tool.driver.rules[] | select(.helpUri) | {id: .id, help: .helpUri}' results.sarif
+```
+## Fingerprints
+```bash
+# Results with fingerprints
+jq '.runs[].results[] | select(.fingerprints or .partialFingerprints) | {rule: .ruleId, fp: (.fingerprints // .partialFingerprints)}' results.sarif
+# Extract all partial fingerprints (one object per result; results without any are skipped)
+jq '[.runs[].results[].partialFingerprints | select(. != null)]' results.sarif
+```
+## Aggregation and Reporting
+```bash
+# Summary by severity and rule
+jq '[.runs[].results[]] | group_by(.level) | map({level: .[0].level, rules: (group_by(.ruleId) | map({rule: .[0].ruleId, count: length}))})' results.sarif
+# Top 10 most frequent rules
+jq '[.runs[].results[]] | group_by(.ruleId) | map({rule: .[0].ruleId, count: length}) | sort_by(-.count) | .[0:10]' results.sarif
+# Files with most issues
+jq '[.runs[].results[] | .locations[0].physicalLocation.artifactLocation.uri] | group_by(.) | map({file: .[0], count: length}) | sort_by(-.count) | .[0:10]' results.sarif
+```
+## Output Formatting
+```bash
+# CSV-like output
+jq -r '.runs[].results[] | [.ruleId, .level, .locations[0].physicalLocation.artifactLocation.uri, .locations[0].physicalLocation.region.startLine, .message.text] | @csv' results.sarif
+# Tab-separated
+jq -r '.runs[].results[] | [.ruleId, .level, .locations[0].physicalLocation.artifactLocation.uri // "N/A"] | @tsv' results.sarif
+# Markdown table
+echo "| Rule | Level | File | Line |"
+echo "|------|-------|------|------|"
+jq -r '.runs[].results[] | "| \(.ruleId) | \(.level) | \(.locations[0].physicalLocation.artifactLocation.uri // "N/A") | \(.locations[0].physicalLocation.region.startLine // "N/A") |"' results.sarif
+```
+## Comparison and Diff
+```bash
+# Find rules in file1 not in file2 (LC_ALL=C makes comm's expected ordering match jq's codepoint sort)
+LC_ALL=C comm -23 <(jq -r '[.runs[].results[].ruleId] | unique | .[]' file1.sarif) <(jq -r '[.runs[].results[].ruleId] | unique | .[]' file2.sarif)
+# Compare result counts
+echo "File 1: $(jq '[.runs[].results[]] | length' file1.sarif)"
+echo "File 2: $(jq '[.runs[].results[]] | length' file2.sarif)"
+```
+## Transformation
+```bash
+# Extract minimal SARIF (results only)
+jq '{version: .version, runs: [.runs[] | {tool: {driver: {name: .tool.driver.name}}, results: .results}]}' results.sarif
+# Filter and create new SARIF with only errors (each run keeps only its own error results)
+jq '.runs[].results |= map(select(.level == "error"))' results.sarif > errors-only.sarif
+# Merge multiple SARIF files
+jq -s '{version: "2.1.0", runs: [.[].runs[]]}' file1.sarif file2.sarif > merged.sarif
+```
+## Validation Checks
+```bash
+# Check if version is 2.1.0
+jq -e '.version == "2.1.0"' results.sarif && echo "Valid version" || echo "Invalid version"
+# Check for empty results
+jq -e '[.runs[].results[]] | length > 0' results.sarif && echo "Has results" || echo "No results"
+# Verify all results have locations
+jq '[.runs[].results[] | select(.locations | length == 0)] | length' results.sarif
+```