PyPI - oath-mcp - Versions diffs - 0.1.0__tar.gz - Mend

oath-mcp 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (101) hide show

oath_mcp-0.1.0/.gitignore +89 -0
oath_mcp-0.1.0/CITATION.cff +22 -0
oath_mcp-0.1.0/LICENSE +21 -0
oath_mcp-0.1.0/PKG-INFO +276 -0
oath_mcp-0.1.0/README.md +203 -0
oath_mcp-0.1.0/corpus/.gitkeep +0 -0
oath_mcp-0.1.0/docker/eztools/Dockerfile +42 -0
oath_mcp-0.1.0/docker/eztools/dotnet-tools.json +46 -0
oath_mcp-0.1.0/docker-compose.yml +86 -0
oath_mcp-0.1.0/docs/ACCURACY.md +163 -0
oath_mcp-0.1.0/docs/ARCHITECTURE.md +173 -0
oath_mcp-0.1.0/docs/ARTIFACT.md +48 -0
oath_mcp-0.1.0/docs/DATASETS.md +168 -0
oath_mcp-0.1.0/docs/DEVPOST.md +144 -0
oath_mcp-0.1.0/docs/PUBLICATION.md +44 -0
oath_mcp-0.1.0/docs/RECORDING.md +527 -0
oath_mcp-0.1.0/docs/TRY_IT_OUT.md +149 -0
oath_mcp-0.1.0/docs/demo.svg +460 -0
oath_mcp-0.1.0/logs/.gitkeep +0 -0
oath_mcp-0.1.0/pyproject.toml +119 -0
oath_mcp-0.1.0/scripts/bootstrap-forensic-tools.sh +206 -0
oath_mcp-0.1.0/scripts/demo.py +238 -0
oath_mcp-0.1.0/scripts/dry-run.sh +229 -0
oath_mcp-0.1.0/scripts/export_sample_run.py +342 -0
oath_mcp-0.1.0/scripts/install-on-sift.sh +337 -0
oath_mcp-0.1.0/scripts/install-tools.sh +221 -0
oath_mcp-0.1.0/scripts/nss_baseline.py +509 -0
oath_mcp-0.1.0/scripts/oath-mcp.sh +49 -0
oath_mcp-0.1.0/scripts/prepare-demo.sh +112 -0
oath_mcp-0.1.0/scripts/render_accuracy.py +186 -0
oath_mcp-0.1.0/scripts/show_self_correction.py +342 -0
oath_mcp-0.1.0/src/oath/__init__.py +7 -0
oath_mcp-0.1.0/src/oath/__main__.py +7 -0
oath_mcp-0.1.0/src/oath/agent/__init__.py +0 -0
oath_mcp-0.1.0/src/oath/agent/demo.py +436 -0
oath_mcp-0.1.0/src/oath/agent/runner.py +284 -0
oath_mcp-0.1.0/src/oath/benchmark/__init__.py +62 -0
oath_mcp-0.1.0/src/oath/benchmark/claude_agent.py +391 -0
oath_mcp-0.1.0/src/oath/benchmark/claude_nss_agent.py +293 -0
oath_mcp-0.1.0/src/oath/benchmark/corpus.py +237 -0
oath_mcp-0.1.0/src/oath/benchmark/gemini_nss_agent.py +256 -0
oath_mcp-0.1.0/src/oath/benchmark/harness.py +214 -0
oath_mcp-0.1.0/src/oath/benchmark/question.py +297 -0
oath_mcp-0.1.0/src/oath/benchmark/scorer.py +193 -0
oath_mcp-0.1.0/src/oath/cli.py +617 -0
oath_mcp-0.1.0/src/oath/mcp/__init__.py +0 -0
oath_mcp-0.1.0/src/oath/mcp/evidence_handle.py +182 -0
oath_mcp-0.1.0/src/oath/mcp/persistence.py +181 -0
oath_mcp-0.1.0/src/oath/mcp/server.py +760 -0
oath_mcp-0.1.0/src/oath/mcp/tools/__init__.py +0 -0
oath_mcp-0.1.0/src/oath/mcp/tools/enumerate_credential_artifacts.py +469 -0
oath_mcp-0.1.0/src/oath/mcp/tools/find_strings_on_image.py +567 -0
oath_mcp-0.1.0/src/oath/mcp/tools/parse_amcache.py +308 -0
oath_mcp-0.1.0/src/oath/mcp/tools/parse_evtx.py +474 -0
oath_mcp-0.1.0/src/oath/mcp/tools/parse_mft.py +383 -0
oath_mcp-0.1.0/src/oath/mcp/tools/parse_prefetch.py +266 -0
oath_mcp-0.1.0/src/oath/mcp/tools/parse_registry.py +435 -0
oath_mcp-0.1.0/src/oath/mcp/tools/parse_usnjrnl.py +374 -0
oath_mcp-0.1.0/src/oath/mcp/tools/plaso_supertimeline.py +514 -0
oath_mcp-0.1.0/src/oath/mcp/tools/run_hayabusa.py +441 -0
oath_mcp-0.1.0/src/oath/mcp/tools/vol3_query.py +354 -0
oath_mcp-0.1.0/src/oath/narrator/__init__.py +34 -0
oath_mcp-0.1.0/src/oath/narrator/terminal.py +386 -0
oath_mcp-0.1.0/src/oath/receipt/__init__.py +0 -0
oath_mcp-0.1.0/src/oath/receipt/notarized.py +383 -0
oath_mcp-0.1.0/src/oath/witness/__init__.py +0 -0
oath_mcp-0.1.0/src/oath/witness/claim.py +185 -0
oath_mcp-0.1.0/src/oath/witness/ralph_wiggum.py +276 -0
oath_mcp-0.1.0/src/oath/witness/verifier.py +366 -0
oath_mcp-0.1.0/symbols/.gitkeep +0 -0
oath_mcp-0.1.0/tests/integration/test_mcp_server.py +308 -0
oath_mcp-0.1.0/tests/integration/test_spoliation.py +677 -0
oath_mcp-0.1.0/tests/unit/test_agent_runner.py +279 -0
oath_mcp-0.1.0/tests/unit/test_benchmark.py +436 -0
oath_mcp-0.1.0/tests/unit/test_benchmark_nss.py +336 -0
oath_mcp-0.1.0/tests/unit/test_claude_agent.py +210 -0
oath_mcp-0.1.0/tests/unit/test_claude_nss_agent.py +188 -0
oath_mcp-0.1.0/tests/unit/test_enumerate_credential_artifacts.py +280 -0
oath_mcp-0.1.0/tests/unit/test_find_strings_on_image.py +287 -0
oath_mcp-0.1.0/tests/unit/test_gemini_nss_agent.py +131 -0
oath_mcp-0.1.0/tests/unit/test_narrator.py +221 -0
oath_mcp-0.1.0/tests/unit/test_notarized.py +198 -0
oath_mcp-0.1.0/tests/unit/test_parse_amcache.py +134 -0
oath_mcp-0.1.0/tests/unit/test_parse_evtx.py +299 -0
oath_mcp-0.1.0/tests/unit/test_parse_mft.py +225 -0
oath_mcp-0.1.0/tests/unit/test_parse_prefetch.py +131 -0
oath_mcp-0.1.0/tests/unit/test_parse_registry.py +285 -0
oath_mcp-0.1.0/tests/unit/test_parse_usnjrnl.py +202 -0
oath_mcp-0.1.0/tests/unit/test_plaso_supertimeline.py +290 -0
oath_mcp-0.1.0/tests/unit/test_ralph_wiggum.py +261 -0
oath_mcp-0.1.0/tests/unit/test_run_hayabusa.py +272 -0
oath_mcp-0.1.0/tests/unit/test_vol3_query.py +257 -0
oath_mcp-0.1.0/tests/unit/test_witness_verifier.py +347 -0
oath_mcp-0.1.0/uninstall.sh +115 -0
oath_mcp-0.1.0/verify.sh +40 -0
oath_mcp-0.1.0/web/README.md +42 -0
oath_mcp-0.1.0/web/app.js +199 -0
oath_mcp-0.1.0/web/build-data.sh +71 -0
oath_mcp-0.1.0/web/data.js +497 -0
oath_mcp-0.1.0/web/index.html +188 -0
oath_mcp-0.1.0/web/styles.css +580 -0

oath_mcp-0.1.0/.gitignore ADDED Viewed

@@ -0,0 +1,89 @@
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+.venv/
+venv/
+env/
+*.egg-info/
+.pytest_cache/
+.mypy_cache/
+.ruff_cache/
+# Node
+node_modules/
+.npm/
+# Build artifacts
+dist/
+build/
+*.whl
+# Local secrets / state
+.env
+.env.local
+*.token
+*.key
+# OS
+.DS_Store
+Thumbs.db
+# Editor
+.vscode/
+.idea/
+# Forensic corpora (big binaries — pulled by scripts, never committed)
+# Ignore the directory's contents rather than the directory itself: git cannot
+# re-include a file (the .gitkeep below) once its parent directory is excluded.
+corpus/*
+*.E01
+*.dd
+*.raw
+*.vmem
+*.mem
+*.lime
+*.dmp
+# Volatility 3 symbol packs (contents only, so symbols/.gitkeep can be kept)
+symbols/*
+# Working state
+.pair/
+tmp/
+*.log
+logs/*.jsonl
+# Benchmark intermediate output
+benchmarks/runs/
+benchmarks/cache/
+# Sandboxed local forensic tools (large, machine-specific)
+.oath-tools/
+# Per-run logs / envelope store / signing keys (machine-specific)
+# (contents only, so logs/.gitkeep can be kept)
+logs/*
+.oath/
+keys/
+.claude/
+log2timeline-*.log.gz
+psort-*.log.gz
+# Paper-build artifacts (source + PDF are archived on Zenodo, not in-repo)
+oath.tex
+oath.pdf
+oath.aux
+oath.bbl
+oath.blg
+oath.log
+oath.out
+oath.bib
+oath_*.png
+# Local video composition (the recording lives outside the public repo)
+video/
+# But keep these placeholders. The negations must stay at the very end of the
+# file: the last matching pattern wins, so any later ignore rule would undo them.
+!logs/.gitkeep
+!corpus/.gitkeep
+!symbols/.gitkeep

oath_mcp-0.1.0/CITATION.cff ADDED Viewed

@@ -0,0 +1,22 @@
+cff-version: 1.2.0
+message: "If you use OATH, cite the preprint and the verifier artifact."
+title: "OATH verifier artifact v0.1.0"
+type: software
+authors:
+  - family-names: Gharsallah
+    given-names: Malek
+version: "v0.1.0"
+date-released: "2026-06-05"
+license: MIT
+doi: "10.5281/zenodo.20549626"
+url: "https://doi.org/10.5281/zenodo.20549626"
+repository-code: "https://github.com/GharsallahDev/oath-mcp"
+preferred-citation:
+  type: article
+  authors:
+    - family-names: Gharsallah
+      given-names: Malek
+  title: "OATH: Notarized Evidence Envelopes for LLM-Assisted Forensic Claims"
+  year: 2026
+  doi: "10.5281/zenodo.20549726"
+  url: "https://doi.org/10.5281/zenodo.20549726"

oath_mcp-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Malek Gharsallah
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

oath_mcp-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,276 @@
+Metadata-Version: 2.4
+Name: oath-mcp
+Version: 0.1.0
+Summary: OATH — typed MCP server + verifier-gated evidence receipts for LLM-assisted digital forensics.
+Project-URL: Homepage, https://github.com/GharsallahDev/oath-mcp
+Project-URL: Repository, https://github.com/GharsallahDev/oath-mcp
+Project-URL: Issues, https://github.com/GharsallahDev/oath-mcp/issues
+Project-URL: Preprint (Zenodo), https://doi.org/10.5281/zenodo.20549726
+Project-URL: Artifact (Zenodo), https://doi.org/10.5281/zenodo.20549626
+Author-email: GharsallahDev <email@medsyn.solutions>
+License: MIT
+License-File: LICENSE
+Keywords: claude-code,dfir,evidence,forensics,hayabusa,incident-response,mcp,sigma
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Information Technology
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Operating System :: POSIX :: Linux
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: Security
+Classifier: Topic :: System :: Systems Administration
+Requires-Python: >=3.11
+Requires-Dist: anyio>=4.3.0
+Requires-Dist: blake3>=0.4.0
+Requires-Dist: click>=8.1.0
+Requires-Dist: cryptography>=42.0.0
+Requires-Dist: httpx>=0.27.0
+Requires-Dist: mcp>=1.0.0
+Requires-Dist: pydantic>=2.5.0
+Requires-Dist: pynacl>=1.5.0
+Requires-Dist: rich>=13.7.0
+Requires-Dist: structlog>=24.1.0
+Provides-Extra: all
+Requires-Dist: anthropic>=0.40.0; extra == 'all'
+Requires-Dist: construct>=2.10.0; extra == 'all'
+Requires-Dist: dfir-iris-client>=2.0.0; extra == 'all'
+Requires-Dist: google-cloud-aiplatform>=1.50.0; extra == 'all'
+Requires-Dist: libfwsi-python>=20240315; extra == 'all'
+Requires-Dist: matplotlib>=3.8.0; extra == 'all'
+Requires-Dist: pandas>=2.2.0; extra == 'all'
+Requires-Dist: python-evtx>=0.7.4; extra == 'all'
+Requires-Dist: regipy>=4.0.0; extra == 'all'
+Requires-Dist: scikit-learn>=1.4.0; extra == 'all'
+Requires-Dist: volatility3>=2.7.0; extra == 'all'
+Requires-Dist: yara-python>=4.5.0; extra == 'all'
+Provides-Extra: benchmark
+Requires-Dist: matplotlib>=3.8.0; extra == 'benchmark'
+Requires-Dist: pandas>=2.2.0; extra == 'benchmark'
+Requires-Dist: scikit-learn>=1.4.0; extra == 'benchmark'
+Provides-Extra: claude
+Requires-Dist: anthropic>=0.40.0; extra == 'claude'
+Provides-Extra: dev
+Requires-Dist: hypothesis>=6.100.0; extra == 'dev'
+Requires-Dist: mypy>=1.9.0; extra == 'dev'
+Requires-Dist: pytest-asyncio>=0.23.0; extra == 'dev'
+Requires-Dist: pytest-cov>=4.1.0; extra == 'dev'
+Requires-Dist: pytest>=8.0.0; extra == 'dev'
+Requires-Dist: ruff>=0.4.0; extra == 'dev'
+Provides-Extra: iris
+Requires-Dist: dfir-iris-client>=2.0.0; extra == 'iris'
+Provides-Extra: memory
+Requires-Dist: volatility3>=2.7.0; extra == 'memory'
+Provides-Extra: parsers
+Requires-Dist: construct>=2.10.0; extra == 'parsers'
+Requires-Dist: libfwsi-python>=20240315; extra == 'parsers'
+Requires-Dist: python-evtx>=0.7.4; extra == 'parsers'
+Requires-Dist: regipy>=4.0.0; extra == 'parsers'
+Requires-Dist: yara-python>=4.5.0; extra == 'parsers'
+Provides-Extra: vertex
+Requires-Dist: google-cloud-aiplatform>=1.50.0; extra == 'vertex'
+Description-Content-Type: text/markdown
+# OATH
+Verifier-gated evidence receipts for LLM-assisted digital forensics.
+[![Preprint DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.20549726.svg)](https://doi.org/10.5281/zenodo.20549726)
+[![Artifact DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.20549626.svg)](https://doi.org/10.5281/zenodo.20549626)
+OATH is a research prototype for making forensic claims replayable. It separates
+what an LLM proposes from what the evidence proves: forensic tools produce signed
+`Notarized<T>` envelopes, and the Witness Oath Verifier promotes only claims that
+can be deterministically re-derived from the original evidence bytes.
+This repository supports the published preprint:
+> **OATH: Notarized Evidence Envelopes for LLM-Assisted Forensic Claims**
+> Zenodo DOI: [10.5281/zenodo.20549726](https://doi.org/10.5281/zenodo.20549726)
+The verifier artifact is archived separately at
+[10.5281/zenodo.20549626](https://doi.org/10.5281/zenodo.20549626).
+## Relationship to Protocol SIFT
+OATH extends [Protocol SIFT](https://github.com/teamdfir/protocol-sift) — the
+open-source autonomous-DFIR baseline (Claude Code + five DFIR skill packs +
+PDF reporter, installed under `~/.claude/`). Protocol SIFT provides the agent
+framework; OATH layers a typed MCP-server tool surface, `Notarized<T>`
+envelopes, and a verifier-gated promotion path on top. Both install scripts
+(`scripts/install-tools.sh`, `scripts/install-on-sift.sh`) call Protocol SIFT's
+own installer first, then install OATH. See
+[docs/ARCHITECTURE.md §"How OATH extends Protocol SIFT"](docs/ARCHITECTURE.md#how-oath-extends-protocol-sift)
+for the architectural diff.
+If you already have Protocol SIFT installed (Claude Code present at
+`~/.claude/CLAUDE.md` and the five skill packs at `~/.claude/skills/`), set
+`OATH_SKIP_PROTOCOL_SIFT=1` before running either install script to skip the
+baseline step:
+```bash
+OATH_SKIP_PROTOCOL_SIFT=1 bash scripts/install-on-sift.sh
+```
+## Core Idea
+LLM-assisted investigation fails dangerously when a fluent model summary is
+treated as evidence. OATH treats that as a systems problem. A finding is not
+accepted because the model said it; it is accepted only when it cites a signed
+receipt whose contents replay.
+Each `Notarized<T>` envelope binds:
+- original evidence hash
+- typed tool name and version
+- canonical tool arguments
+- raw tool-output hash
+- parsed-data hash
+- supporting byte offsets when available
+- model identifier and prompt hash when an LLM contributed
+- previous-envelope hash for tamper-evident sequencing
+- Ed25519 signature over the signed header
+The verifier then classifies claims as:
+- `VERIFIED`: the receipt and predicate replay successfully
+- `QUARANTINED`: the receipt is intact, but the cited claim is not supported
+- `RALPH_WIGGUM`: evidence drift or receipt tampering is detected, forcing visible
+  abandonment and re-proposal
+## Results
+The benchmark is DFIR-Metric Module III, using 510 scored string-search
+questions in the local harness and a four-candidate answer budget.
+| System | TUS@4 |
+|---|---:|
+| GPT-4.1 published baseline | 38.5% |
+| OATH deterministic baseline, no LLM | 78.43% |
+| OATH live agent with verifier | 92.75% |
+The architectural result matters more than the model headline: typed tool
+invocation plus deterministic replay removes a large class of free-form
+script-generation failures before any model-specific capability is counted.
+Full methodology and audit notes are in [docs/ACCURACY.md](docs/ACCURACY.md).
+## Artifact Release
+A verifier-focused artifact release is archived on Zenodo:
+- Artifact: [OATH verifier artifact v0.1.0](https://doi.org/10.5281/zenodo.20549626)
+- Preprint: [OATH: Notarized Evidence Envelopes for LLM-Assisted Forensic Claims](https://doi.org/10.5281/zenodo.20549726)
+The release is intended to let an independent reviewer answer the narrow
+question: does the receipt, signature, canonicalization, replay, and
+self-correction design work? It does not include private case data, signing
+secrets, API keys, or operational prompts.
+## Quick Start
+OATH is published as a Python MCP server. Four one-liners on a SANS SIFT
+Workstation get you from cold boot to "Claude Code is driving 13 typed
+forensic tools against your evidence":
+```bash
+# 1. Protocol SIFT baseline (Claude Code + DFIR skill packs)
+curl -fsSL https://raw.githubusercontent.com/teamdfir/protocol-sift/main/install.sh | bash
+# 2. Forensic-binary bootstrap (.NET 9, EZ Tools, Hayabusa — what SIFT lacks)
+curl -fsSL https://raw.githubusercontent.com/GharsallahDev/oath-mcp/main/scripts/bootstrap-forensic-tools.sh | bash
+exec bash    # pick up the new PATH
+# 3. uv (if not already installed)
+curl -LsSf https://astral.sh/uv/install.sh | sh && exec bash
+# 4. Wire OATH into Claude Code (this is what goes on screen in the demo)
+claude mcp add --transport stdio oath -- uvx oath-mcp
+```
+Then start a session and confirm the 13 typed tools are connected:
+```bash
+claude
+# inside Claude:
+/mcp        # → oath: connected · 13 tools
+```
+To use the operator CLI (`oath mount`, `oath verify`, `oath demo`) instead
+of driving via Claude Code, install the package as a tool:
+```bash
+uv tool install oath-mcp
+oath mount path/to/evidence.E01
+oath verify <envelope-id>
+```
+Full forensic workstation setup, including the longer-form
+`install-on-sift.sh` alternative and a non-SIFT Docker path, is documented
+in [docs/TRY_IT_OUT.md](docs/TRY_IT_OUT.md).
+### Developing locally
+For working on `src/oath/`:
+```bash
+git clone https://github.com/GharsallahDev/oath-mcp
+cd oath-mcp
+uv venv && uv pip install -e ".[dev]"
+PYTHONPATH=src python -m pytest tests/integration/test_spoliation.py -q
+```
+## Architecture
+```mermaid
+flowchart LR
+    IMG["Evidence image"] --> HANDLE["Read-only EvidenceHandle"]
+    HANDLE --> TOOLS["Typed forensic tools"]
+    TOOLS --> ENV["Signed Notarized<T> envelope"]
+    LLM["LLM proposes typed arguments and claims"] --> TOOLS
+    LLM --> CLAIM["Claim cites envelope_id"]
+    CLAIM --> VERIFY{"Witness Oath Verifier"}
+    ENV --> VERIFY
+    VERIFY -->|receipt replays + predicate matches| OK["VERIFIED"]
+    VERIFY -->|receipt intact, predicate missing| Q["QUARANTINED"]
+    VERIFY -->|hash/signature/data drift| R["RALPH_WIGGUM"]
+    R --> LLM
+```
+OATH uses a custom MCP-style tool surface with typed functions rather than an
+arbitrary shell. The LLM can propose arguments and hypotheses; it cannot promote
+its own findings. Promotion is reserved for the deterministic verifier.
+Detailed trust-boundary notes are in [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md).
+## Repository Map
+| Path | Purpose |
+|---|---|
+| `src/oath/receipt/` | `Notarized<T>` envelope, canonicalization, signatures, prompt hashing |
+| `src/oath/mcp/` | Typed forensic tool surface and evidence-handle plumbing |
+| `src/oath/witness/` | Verifier, claim predicates, self-correction events |
+| `src/oath/benchmark/` | DFIR-Metric harness and scoring utilities |
+| `tests/integration/test_spoliation.py` | Spoliation, data-integrity, chain, and Daubert-binding tests |
+| `logs/self-correction-demo/` | Re-runnable self-correction artifact |
+| `web/` | Static receipt explorer for signed sample envelopes |
+## What OATH Does Not Claim
+OATH does not prove legal admissibility, certify tool correctness, make wrappers
+honest by magic, prove general DFIR competence, or remove the need for examiner
+review. It provides a concrete receipt and verifier pattern for making
+LLM-assisted forensic claims auditable.
+## Documentation
+- [Architecture](docs/ARCHITECTURE.md)
+- [Artifact release notes](docs/ARTIFACT.md)
+- [Publication and citation notes](docs/PUBLICATION.md)
+- [Accuracy and benchmark notes](docs/ACCURACY.md)
+- [Dataset documentation](docs/DATASETS.md)
+- [Try-it-out instructions](docs/TRY_IT_OUT.md)
+## License
+MIT. See [LICENSE](LICENSE).

oath_mcp-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,203 @@
+# OATH
+Verifier-gated evidence receipts for LLM-assisted digital forensics.
+[![Preprint DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.20549726.svg)](https://doi.org/10.5281/zenodo.20549726)
+[![Artifact DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.20549626.svg)](https://doi.org/10.5281/zenodo.20549626)
+OATH is a research prototype for making forensic claims replayable. It separates
+what an LLM proposes from what the evidence proves: forensic tools produce signed
+`Notarized<T>` envelopes, and the Witness Oath Verifier promotes only claims that
+can be deterministically re-derived from the original evidence bytes.
+This repository supports the published preprint:
+> **OATH: Notarized Evidence Envelopes for LLM-Assisted Forensic Claims**
+> Zenodo DOI: [10.5281/zenodo.20549726](https://doi.org/10.5281/zenodo.20549726)
+The verifier artifact is archived separately at
+[10.5281/zenodo.20549626](https://doi.org/10.5281/zenodo.20549626).
+## Relationship to Protocol SIFT
+OATH extends [Protocol SIFT](https://github.com/teamdfir/protocol-sift) — the
+open-source autonomous-DFIR baseline (Claude Code + five DFIR skill packs +
+PDF reporter, installed under `~/.claude/`). Protocol SIFT provides the agent
+framework; OATH layers a typed MCP-server tool surface, `Notarized<T>`
+envelopes, and a verifier-gated promotion path on top. Both install scripts
+(`scripts/install-tools.sh`, `scripts/install-on-sift.sh`) call Protocol SIFT's
+own installer first, then install OATH. See
+[docs/ARCHITECTURE.md §"How OATH extends Protocol SIFT"](docs/ARCHITECTURE.md#how-oath-extends-protocol-sift)
+for the architectural diff.
+If you already have Protocol SIFT installed (Claude Code present at
+`~/.claude/CLAUDE.md` and the five skill packs at `~/.claude/skills/`), set
+`OATH_SKIP_PROTOCOL_SIFT=1` before running either install script to skip the
+baseline step:
+```bash
+OATH_SKIP_PROTOCOL_SIFT=1 bash scripts/install-on-sift.sh
+```
+## Core Idea
+LLM-assisted investigation fails dangerously when a fluent model summary is
+treated as evidence. OATH treats that as a systems problem. A finding is not
+accepted because the model said it; it is accepted only when it cites a signed
+receipt whose contents replay.
+Each `Notarized<T>` envelope binds:
+- original evidence hash
+- typed tool name and version
+- canonical tool arguments
+- raw tool-output hash
+- parsed-data hash
+- supporting byte offsets when available
+- model identifier and prompt hash when an LLM contributed
+- previous-envelope hash for tamper-evident sequencing
+- Ed25519 signature over the signed header
+The verifier then classifies claims as:
+- `VERIFIED`: the receipt and predicate replay successfully
+- `QUARANTINED`: the receipt is intact, but the cited claim is not supported
+- `RALPH_WIGGUM`: evidence drift or receipt tampering is detected, forcing visible
+  abandonment and re-proposal
+## Results
+The benchmark is DFIR-Metric Module III, using 510 scored string-search
+questions in the local harness and a four-candidate answer budget.
+| System | TUS@4 |
+|---|---:|
+| GPT-4.1 published baseline | 38.5% |
+| OATH deterministic baseline, no LLM | 78.43% |
+| OATH live agent with verifier | 92.75% |
+The architectural result matters more than the model headline: typed tool
+invocation plus deterministic replay removes a large class of free-form
+script-generation failures before any model-specific capability is counted.
+Full methodology and audit notes are in [docs/ACCURACY.md](docs/ACCURACY.md).
+## Artifact Release
+A verifier-focused artifact release is archived on Zenodo:
+- Artifact: [OATH verifier artifact v0.1.0](https://doi.org/10.5281/zenodo.20549626)
+- Preprint: [OATH: Notarized Evidence Envelopes for LLM-Assisted Forensic Claims](https://doi.org/10.5281/zenodo.20549726)
+The release is intended to let an independent reviewer answer the narrow
+question: does the receipt, signature, canonicalization, replay, and
+self-correction design work? It does not include private case data, signing
+secrets, API keys, or operational prompts.
+## Quick Start
+OATH is published as a Python MCP server. Four one-liners on a SANS SIFT
+Workstation get you from cold boot to "Claude Code is driving 13 typed
+forensic tools against your evidence":
+```bash
+# 1. Protocol SIFT baseline (Claude Code + DFIR skill packs)
+curl -fsSL https://raw.githubusercontent.com/teamdfir/protocol-sift/main/install.sh | bash
+# 2. Forensic-binary bootstrap (.NET 9, EZ Tools, Hayabusa — what SIFT lacks)
+curl -fsSL https://raw.githubusercontent.com/GharsallahDev/oath-mcp/main/scripts/bootstrap-forensic-tools.sh | bash
+exec bash    # pick up the new PATH
+# 3. uv (if not already installed)
+curl -LsSf https://astral.sh/uv/install.sh | sh && exec bash
+# 4. Wire OATH into Claude Code (this is what goes on screen in the demo)
+claude mcp add --transport stdio oath -- uvx oath-mcp
+```
+Then start a session and confirm the 13 typed tools are connected:
+```bash
+claude
+# inside Claude:
+/mcp        # → oath: connected · 13 tools
+```
+To use the operator CLI (`oath mount`, `oath verify`, `oath demo`) instead
+of driving via Claude Code, install the package as a tool:
+```bash
+uv tool install oath-mcp
+oath mount path/to/evidence.E01
+oath verify <envelope-id>
+```
+Full forensic workstation setup, including the longer-form
+`install-on-sift.sh` alternative and a non-SIFT Docker path, is documented
+in [docs/TRY_IT_OUT.md](docs/TRY_IT_OUT.md).
+### Developing locally
+For working on `src/oath/`:
+```bash
+git clone https://github.com/GharsallahDev/oath-mcp
+cd oath-mcp
+uv venv && uv pip install -e ".[dev]"
+PYTHONPATH=src python -m pytest tests/integration/test_spoliation.py -q
+```
+## Architecture
+```mermaid
+flowchart LR
+    IMG["Evidence image"] --> HANDLE["Read-only EvidenceHandle"]
+    HANDLE --> TOOLS["Typed forensic tools"]
+    TOOLS --> ENV["Signed Notarized<T> envelope"]
+    LLM["LLM proposes typed arguments and claims"] --> TOOLS
+    LLM --> CLAIM["Claim cites envelope_id"]
+    CLAIM --> VERIFY{"Witness Oath Verifier"}
+    ENV --> VERIFY
+    VERIFY -->|receipt replays + predicate matches| OK["VERIFIED"]
+    VERIFY -->|receipt intact, predicate missing| Q["QUARANTINED"]
+    VERIFY -->|hash/signature/data drift| R["RALPH_WIGGUM"]
+    R --> LLM
+```
+OATH uses a custom MCP-style tool surface with typed functions rather than an
+arbitrary shell. The LLM can propose arguments and hypotheses; it cannot promote
+its own findings. Promotion is reserved for the deterministic verifier.
+Detailed trust-boundary notes are in [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md).
+## Repository Map
+| Path | Purpose |
+|---|---|
+| `src/oath/receipt/` | `Notarized<T>` envelope, canonicalization, signatures, prompt hashing |
+| `src/oath/mcp/` | Typed forensic tool surface and evidence-handle plumbing |
+| `src/oath/witness/` | Verifier, claim predicates, self-correction events |
+| `src/oath/benchmark/` | DFIR-Metric harness and scoring utilities |
+| `tests/integration/test_spoliation.py` | Spoliation, data-integrity, chain, and Daubert-binding tests |
+| `logs/self-correction-demo/` | Re-runnable self-correction artifact |
+| `web/` | Static receipt explorer for signed sample envelopes |
+## What OATH Does Not Claim
+OATH does not prove legal admissibility, certify tool correctness, make wrappers
+honest by magic, prove general DFIR competence, or remove the need for examiner
+review. It provides a concrete receipt and verifier pattern for making
+LLM-assisted forensic claims auditable.
+## Documentation
+- [Architecture](docs/ARCHITECTURE.md)
+- [Artifact release notes](docs/ARTIFACT.md)
+- [Publication and citation notes](docs/PUBLICATION.md)
+- [Accuracy and benchmark notes](docs/ACCURACY.md)
+- [Dataset documentation](docs/DATASETS.md)
+- [Try-it-out instructions](docs/TRY_IT_OUT.md)
+## License
+MIT. See [LICENSE](LICENSE).

oath_mcp-0.1.0/corpus/.gitkeep ADDED Viewed

File without changes

oath_mcp-0.1.0/docker/eztools/Dockerfile ADDED Viewed

@@ -0,0 +1,42 @@
+# OATH — Eric Zimmerman's tools (EZ tools) in a .NET 9 SDK container.
+#
+# Pins:
+#   - Base image tag `sdk:9.0` (EZ tools target net9.0). NOTE: this tag floats
+#     across 9.0.x patch releases; append an @sha256 digest to the FROM line
+#     when a byte-for-byte reproducible image is required.
+#   - dotnet-tools.json controls which tools + which versions get installed.
+#
+# Tools available after build (invoke as `dotnet TOOLNAME` inside the container,
+# from /work or below — that is where the tool manifest lives):
+#   - MFTECmd       — $MFT, $J ($UsnJrnl), $LogFile, $Boot, $SDS, $I30 parser
+#   - EvtxECmd      — Windows Event Log (.evtx) parser with Sigma-style maps
+#   - AmcacheParser — Amcache.hve parser
+#   - PECmd         — Prefetch parser
+#   - SrumECmd      — SRUDB.dat (process / network / energy) parser
+#   - WxTCmd        — Windows Timeline ActivitiesCache.db parser
+#   - RECmd         — Registry hive parser with batch-mode plugins
+#   - SBECmd        — ShellBags parser
+#   - JLECmd        — Jump List parser
+#   - LECmd         — LNK (shortcut) parser
+#
+# All tools accept `--csv-output` or `--json-output` for structured output that
+# the OATH typed-functions layer can deterministically re-derive against.
+FROM mcr.microsoft.com/dotnet/sdk:9.0
+# Opt out of CLI telemetry and the first-run banner. Declared before the first
+# `dotnet` invocation so the settings apply to the build steps below as well as
+# to the running container.
+ENV DOTNET_CLI_TELEMETRY_OPTOUT=1 \
+    DOTNET_NOLOGO=1
+# /root/.dotnet/tools is the *global* tool directory. Tools restored from the
+# local manifest below are NOT placed there; they are resolved through
+# `dotnet TOOLNAME`. The entry is kept so that any globally installed tool
+# remains callable by bare name.
+ENV PATH="/root/.dotnet/tools:${PATH}"
+# Working dir for tool execution. Mounts inbound: /evidence (RO), /output (RW).
+WORKDIR /work
+VOLUME ["/evidence", "/output"]
+# Install EZ tools via dotnet-tools.json manifest (pinned versions).
+COPY dotnet-tools.json /work/.config/dotnet-tools.json
+# WORKDIR is already /work, so the manifest is discovered without a `cd`.
+RUN dotnet tool restore && dotnet tool list
+# Quick self-check of two representative tools — fails the build if either was
+# misnamed or unreleased.
+RUN dotnet EvtxECmd --version || (echo "EvtxECmd not found" && exit 1)
+RUN dotnet MFTECmd --version || (echo "MFTECmd not found" && exit 1)
+# Idle entrypoint; the OATH MCP server `docker exec`s into this container.
+CMD ["tail", "-f", "/dev/null"]