npm - tryassay - Versions diffs - 0.1.0 - Mend

tryassay 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (93) hide show

package/LICENSE +21 -0
package/README.md +553 -0
package/dist/cli.d.ts +2 -0
package/dist/cli.js +80 -0
package/dist/cli.js.map +1 -0
package/dist/commands/assess.d.ts +6 -0
package/dist/commands/assess.js +267 -0
package/dist/commands/assess.js.map +1 -0
package/dist/commands/describe.d.ts +3 -0
package/dist/commands/describe.js +114 -0
package/dist/commands/describe.js.map +1 -0
package/dist/commands/extract.d.ts +4 -0
package/dist/commands/extract.js +144 -0
package/dist/commands/extract.js.map +1 -0
package/dist/commands/hallucinate.d.ts +3 -0
package/dist/commands/hallucinate.js +100 -0
package/dist/commands/hallucinate.js.map +1 -0
package/dist/commands/init.d.ts +1 -0
package/dist/commands/init.js +39 -0
package/dist/commands/init.js.map +1 -0
package/dist/commands/regenerate.d.ts +3 -0
package/dist/commands/regenerate.js +158 -0
package/dist/commands/regenerate.js.map +1 -0
package/dist/commands/remediate.d.ts +5 -0
package/dist/commands/remediate.js +155 -0
package/dist/commands/remediate.js.map +1 -0
package/dist/commands/report.d.ts +3 -0
package/dist/commands/report.js +84 -0
package/dist/commands/report.js.map +1 -0
package/dist/commands/reverse.d.ts +9 -0
package/dist/commands/reverse.js +115 -0
package/dist/commands/reverse.js.map +1 -0
package/dist/commands/verify.d.ts +4 -0
package/dist/commands/verify.js +112 -0
package/dist/commands/verify.js.map +1 -0
package/dist/lib/anthropic.d.ts +13 -0
package/dist/lib/anthropic.js +60 -0
package/dist/lib/anthropic.js.map +1 -0
package/dist/lib/assessment-reporter.d.ts +5 -0
package/dist/lib/assessment-reporter.js +266 -0
package/dist/lib/assessment-reporter.js.map +1 -0
package/dist/lib/claim-extractor.d.ts +6 -0
package/dist/lib/claim-extractor.js +138 -0
package/dist/lib/claim-extractor.js.map +1 -0
package/dist/lib/code-verifier.d.ts +7 -0
package/dist/lib/code-verifier.js +265 -0
package/dist/lib/code-verifier.js.map +1 -0
package/dist/lib/codebase-indexer.d.ts +15 -0
package/dist/lib/codebase-indexer.js +156 -0
package/dist/lib/codebase-indexer.js.map +1 -0
package/dist/lib/config.d.ts +7 -0
package/dist/lib/config.js +38 -0
package/dist/lib/config.js.map +1 -0
package/dist/lib/constraint-engine.d.ts +2 -0
package/dist/lib/constraint-engine.js +337 -0
package/dist/lib/constraint-engine.js.map +1 -0
package/dist/lib/fs-utils.d.ts +1 -0
package/dist/lib/fs-utils.js +11 -0
package/dist/lib/fs-utils.js.map +1 -0
package/dist/lib/guided-generator.d.ts +2 -0
package/dist/lib/guided-generator.js +195 -0
package/dist/lib/guided-generator.js.map +1 -0
package/dist/lib/inventory-extractor.d.ts +7 -0
package/dist/lib/inventory-extractor.js +238 -0
package/dist/lib/inventory-extractor.js.map +1 -0
package/dist/lib/prompts.d.ts +3 -0
package/dist/lib/prompts.js +50 -0
package/dist/lib/prompts.js.map +1 -0
package/dist/lib/publisher.d.ts +2 -0
package/dist/lib/publisher.js +71 -0
package/dist/lib/publisher.js.map +1 -0
package/dist/lib/remediation-generator.d.ts +2 -0
package/dist/lib/remediation-generator.js +136 -0
package/dist/lib/remediation-generator.js.map +1 -0
package/dist/lib/remediator.d.ts +7 -0
package/dist/lib/remediator.js +209 -0
package/dist/lib/remediator.js.map +1 -0
package/dist/lib/report-generator.d.ts +8 -0
package/dist/lib/report-generator.js +190 -0
package/dist/lib/report-generator.js.map +1 -0
package/dist/lib/requirements-generator.d.ts +14 -0
package/dist/lib/requirements-generator.js +311 -0
package/dist/lib/requirements-generator.js.map +1 -0
package/dist/lib/spec-synthesizer.d.ts +2 -0
package/dist/lib/spec-synthesizer.js +136 -0
package/dist/lib/spec-synthesizer.js.map +1 -0
package/dist/lib/system-prompts.d.ts +12 -0
package/dist/lib/system-prompts.js +254 -0
package/dist/lib/system-prompts.js.map +1 -0
package/dist/types.d.ts +243 -0
package/dist/types.js +2 -0
package/dist/types.js.map +1 -0
package/package.json +49 -0

package/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Rock Steady Systems LLC
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

package/README.md ADDED Viewed

@@ -0,0 +1,553 @@
+<div align="center">
+# Assay
+### AI Code Verification
+**Find bugs that tests miss, linters ignore, and code review overlooks.**
+*Built on the LUCID methodology — Leveraging Unverified Claims Into Deliverables.*
+[![MIT License](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE)
+[![GitHub stars](https://img.shields.io/github/stars/gtsbahamas/hallucination-reversing-system?style=social)](https://github.com/gtsbahamas/hallucination-reversing-system/stargazers)
+[![Node.js 20+](https://img.shields.io/badge/Node.js-20%2B-339933?logo=node.js&logoColor=white)](https://nodejs.org/)
+[![TypeScript](https://img.shields.io/badge/TypeScript-5.7-3178C6?logo=typescript&logoColor=white)](https://www.typescriptlang.org/)
+[![Paper](https://img.shields.io/badge/Paper-PDF-red?logo=arxiv)](arxiv-submission/main.pdf)
+[![DOI](https://img.shields.io/badge/DOI-10.5281%2Fzenodo.18522644-blue)](https://doi.org/10.5281/zenodo.18522644)
+[![HumanEval](https://img.shields.io/badge/HumanEval-100%25%20pass%405-brightgreen)](results/)
+[![SWE--bench](https://img.shields.io/badge/SWE--bench-30.3%25%20(%2B65%25)-brightgreen)](results/)
+[Website](https://tryassay.ai) | [Paper](docs/paper.md) | [Methodology Guide](docs/methodology.md) | [Prior Art](docs/prior-art.md) | [CLI Reference](#cli-reference)
+</div>
+---
+> **Patent Notice:** The verification methodology implemented by Assay is the subject of U.S. Provisional Patent Application No. 63/980,048, filed February 11, 2026, assigned to Rock Steady Systems LLC. The software is licensed under the MIT License. Use of the software does not grant any patent license beyond the rights conveyed by the MIT License.
+---
+## Benchmark Results
+Assay was evaluated on two standard code generation benchmarks. All results validated by running real test suites, not LLM judgment.
+| Benchmark | Baseline | Assay | Improvement (relative) |
+|-----------|----------|-------|-------------|
+| **HumanEval** pass@1 | 86.6% | **98.8%** | +14.1% |
+| **HumanEval** pass@5 | -- | **100%** (164/164) | All problems solved |
+| **SWE-bench** resolve@1 | 18.3% | **25.0%** | +36.4% |
+| **SWE-bench** best-of-5 | -- | **30.3%** (91/300) | +65.5% |
+Key finding: LLM-as-judge verification actually **performs worse** at higher k values (97.2% vs 100% for Assay at k=5) because it hallucinates false positives. Structured claim extraction avoids this failure mode.
+Full benchmark data: [`results/`](results/) | [Benchmark report](https://tryassay.ai/report)
+---
+## The Problem
+Every AI development workflow treats hallucination as the enemy. Spec-Driven Development writes precise specs to prevent it. Prompt engineering constrains it. Guardrails filter it out.
+But three independent formal proofs have established that **hallucination cannot be eliminated** from LLMs:
+- **Xu et al. (2024)** -- learning theory proof that LLMs must hallucinate as general problem solvers
+- **Banerjee et al. (2024)** -- Gödel's Incompleteness Theorem applied to LLM architecture
+- **Karpowicz (2025)** -- impossibility theorem via mechanism design and transformer analysis
+If hallucination is mathematically inevitable, suppressing it is fighting thermodynamics. **Assay harnesses it instead.**
+## The Insight
+When you ask an AI to write Terms of Service for an application that doesn't exist, it doesn't say "this application doesn't exist." It **confabulates**. It invents specific capabilities, data handling procedures, user rights, performance guarantees, and limitations -- all in the authoritative, precise language that legal documents demand.
+Every one of those hallucinated claims is a **testable requirement**.
+A single hallucinated ToS produces 80--150 testable claims spanning functionality, security, data privacy, performance, operations, and legal compliance. No human requirements-gathering process generates this breadth in 30 seconds.
+---
+## How Assay Works
+Assay implements the LUCID methodology -- a six-phase iterative cycle that converges hallucinated fiction toward verified reality:
+```
+                        THE ASSAY CYCLE
+    +------------------------------------------------------+
+    |                                                      |
+    |   +-----------+    +--------------+    +----------+  |
+    |   | 1. DESCRIBE|-->|2. HALLUCINATE|-->|3. EXTRACT|  |
+    |   |            |    |              |    |          |  |
+    |   | Loose idea |    | AI writes    |    | Each     |  |
+    |   | of the app |    | ToS as if    |    | claim =  |  |
+    |   |            |    | app is live  |    | testable |  |
+    |   +-----------+    +--------------+    | req      |  |
+    |                                        +----+-----+  |
+    |                                             |        |
+    |   +------------+    +-------------+         |        |
+    |   |5. CONVERGE |<---|  4. BUILD   |<--------+        |
+    |   |            |    |             |                   |
+    |   | Verify ToS |    | Implement   |                   |
+    |   | vs reality |    | until code  |                   |
+    |   |            |    | satisfies   |                   |
+    |   +-----+------+    +-------------+                   |
+    |         |                                            |
+    |    Gap found?                                        |
+    |    YES --> Fix --> Re-verify                         |
+    |    NO  --> Continue                                  |
+    |         |                                            |
+    |   +-----v--------+                                   |
+    |   |6. REGENERATE |   Feed verified reality back.     |
+    |   |              |   AI writes updated ToS.          |
+    |   | New ToS from |   New hallucinations = new reqs.  |
+    |   | updated state|-----------------------------------+
+    |   +--------------+   Loop to step 3
+    |
+    +-- EXIT: Delta between ToS and reality is acceptable
+```
+### Phase Details
+| Phase | What Happens | Output |
+|-------|-------------|--------|
+| **1. Describe** | Give the AI a loose, intentionally incomplete description. The gaps are where hallucination does its best work. | Seed description |
+| **2. Hallucinate** | AI writes Terms of Service as if the app is live in production with paying customers. Legal language forces precision -- no hedging allowed. | 400--600 lines of dense legal text |
+| **3. Extract** | Parse every declarative statement into a structured, testable claim with category, severity, and traceability back to the ToS clause. | 80--150 categorized claims |
+| **4. Build** | Implement the application using any methodology (TDD, agile, etc.). The ToS-derived claims are the acceptance criteria. | Working code |
+| **5. Converge** | Verify every claim against the actual codebase. Assign verdicts: PASS, PARTIAL, FAIL, or N/A. Generate a gap report. | Compliance score + gap report |
+| **6. Regenerate** | Feed verified reality back to the AI. It writes an updated ToS -- keeping what's real, revising what's partial, and hallucinating new features. | Next iteration's specification |
+### Convergence
+With each iteration:
+- The ratio of accurate-to-hallucinated claims increases
+- New hallucinations become more contextually grounded
+- The gap between spec and reality shrinks
+- The application grows in directions the AI deems plausible for the domain
+**Exit condition:** The team decides the delta is acceptable. This is a human judgment call, not an automated threshold.
+---
+## Empirical Results
+Assay was applied to a production Next.js application (~30,000 lines of TypeScript, 200+ files):
+| Iteration | Compliance | PASS | PARTIAL | FAIL | N/A |
+|-----------|-----------|------|---------|------|-----|
+| 1 | ~35% (est.) | -- | -- | -- | -- |
+| 3 | 57.3% | 38 | 15 | 32 | 6 |
+| 4 | 69.8% | 47 | 18 | 20 | 6 |
+| 5 | 83.2% | 61 | 15 | 9 | 6 |
+| **6** | **90.8%** | **68** | **12** | **5** | **6** |
+```
+Compliance Over Iterations:
+100% |
+ 90% |                                          *  90.8%
+ 80% |                              *  83.2%
+ 70% |                  *  69.8%
+ 60% |      *  57.3%
+ 50% |
+ 40% |
+ 35% |  *  ~35%
+     +--+------+------+------+------+------+--
+        1      2      3      4      5      6
+                    Iteration
+```
+**Total cost for 6 iterations: ~$17 in API tokens.**
+The 5 remaining FAIL claims after convergence were all **genuine missing functionality** -- not false positives. The hallucinated ToS correctly identified requirements a production app should have.
+---
+## Why Terms of Service?
+ToS is the ideal hallucination vehicle because the document format forces specificity across every dimension of a software product simultaneously:
+| ToS Section | Produces | Example Claim |
+|-------------|----------|---------------|
+| Service Description | Feature requirements | "The Service allows batch processing of up to 10,000 records" |
+| Acceptable Use | Input validation rules | "Users may not upload files exceeding 50MB" |
+| Data Handling | Privacy & security requirements | "User data is encrypted at rest using AES-256" |
+| Limitations | Performance boundaries | "The Service supports up to 10,000 concurrent users" |
+| SLA / Uptime | Reliability requirements | "The Service maintains 99.9% uptime" |
+| Termination | Account lifecycle requirements | "Data is retained for 30 days post-deletion" |
+| Liability | Error handling requirements | "Graceful degradation on third-party API failure" |
+| Modifications | Versioning requirements | "Users are notified 30 days before changes" |
+Legal language cannot be vague. *"The Service may do things"* is not a valid legal clause. The format forces the AI to hallucinate **precisely**.
+---
+## Quick Start
+### Prerequisites
+- Node.js 20+
+- An [Anthropic API key](https://console.anthropic.com/) (Claude)
+### Installation
+```bash
+# Clone the repository
+git clone https://github.com/gtsbahamas/hallucination-reversing-system.git
+cd hallucination-reversing-system
+# Install dependencies
+npm install
+# Build the CLI
+npm run build
+# Set your API key
+export ANTHROPIC_API_KEY="sk-ant-..."
+```
+### Run Your First Assay Cycle
+```bash
+# 1. Initialize an Assay project
+npx assay init
+# 2. Generate a hallucinated Terms of Service
+npx assay hallucinate
+# 3. Extract testable claims from the hallucination
+npx assay extract
+# 4. Verify claims against your codebase
+npx assay verify --repo /path/to/your/project
+# 5. Generate a gap report
+npx assay report
+# 6. Generate remediation tasks for gaps
+npx assay remediate --repo /path/to/your/project
+# 7. After fixing gaps, regenerate for the next iteration
+npx assay regenerate
+```
+Each iteration stores artifacts in `.assay/iterations/{N}/`, maintaining a complete audit trail.
+---
+## MCP Server (Claude Code, Cursor, Windsurf)
+Add Assay verification as a native tool in your AI editor with one config block.
+```bash
+npm install -g assay-mcp
+```
+**Claude Code** (`~/.claude/settings.json`):
+```json
+{
+  "mcpServers": {
+    "assay": {
+      "command": "npx",
+      "args": ["-y", "assay-mcp"],
+      "env": { "ASSAY_API_KEY": "ak_live_your_key_here" }
+    }
+  }
+}
+```
+Then ask your AI assistant: *"Verify this file with Assay"* or *"Generate a verified function that parses CSV"*
+Assay catches what the AI missed and shows you exactly what would have shipped without verification.
+Get a free API key at [tryassay.ai](https://tryassay.ai). See [mcp-server/README.md](mcp-server/README.md) for full docs.
+---
+## GitHub Action
+Add Assay verification to your CI/CD pipeline. Every PR gets a verification report as a comment.
+```yaml
+- uses: gtsbahamas/hallucination-reversing-system/github-action@v0.1.1
+  with:
+    assay-api-key: ${{ secrets.ASSAY_API_KEY }}
+```
+Two modes: **Assay API** (recommended, uses your Assay key) or **BYOK** (bring your own Anthropic key for self-hosted verification). See [github-action/README.md](github-action/README.md) for full docs.
+---
+## CLI Reference
+| Command | Phase | Description |
+|---------|-------|-------------|
+| `assay init` | Setup | Initialize project configuration (name, description, tech stack, audience) |
+| `assay hallucinate` | Phase 2 | Generate a hallucinated ToS/API docs/user manual from project config |
+| `assay describe` | Alt. input | Fetch an existing ToS from a URL (verify an existing product) |
+| `assay extract` | Phase 3 | Extract testable claims from a hallucinated or fetched document |
+| `assay verify` | Phase 5 | Verify extracted claims against a codebase |
+| `assay report` | Analysis | Generate a gap report from verification results |
+| `assay remediate` | Convergence | Generate code-level fix tasks from gaps |
+| `assay regenerate` | Phase 6 | Feed verified reality back, regenerate spec for next iteration |
+### Options
+```bash
+assay hallucinate --type tos|api-docs|user-manual   # Document type (default: tos)
+assay extract --iteration 3                          # Specify iteration (default: latest)
+assay extract --source my-tos.md                     # Extract from a file in .assay/sources/
+assay verify --repo /path/to/code --iteration 3      # Verify specific iteration
+assay remediate --threshold 95                       # Set compliance target (default: 95%)
+assay regenerate --iteration 3                       # Regenerate from specific iteration
+```
+---
+## Scoring Methodology
+Assay assigns four verdicts to each claim:
+| Verdict | Meaning | Score Weight |
+|---------|---------|-------------|
+| **PASS** | Code fully implements the claim | 1.0 |
+| **PARTIAL** | Code partially implements (some aspects missing) | 0.5 |
+| **FAIL** | Code does not implement or contradicts the claim | 0.0 |
+| **N/A** | Cannot be verified from code (e.g., legal-only claims) | Excluded |
+**Compliance score:**
+```
+Score = (PASS + 0.5 * PARTIAL) / (Total - N/A) * 100
+```
+Claims are categorized by type and severity:
+| Category | Examples |
+|----------|---------|
+| `functionality` | Features, user workflows, UI components |
+| `security` | Encryption, auth, access control |
+| `data-privacy` | Data handling, retention, deletion |
+| `operational` | Performance, uptime, monitoring |
+| `legal` | Terms, disclaimers, compliance |
+| Severity | Meaning |
+|----------|---------|
+| `critical` | Security breach or data loss if false |
+| `high` | Core functionality broken if false |
+| `medium` | Important but not showstopping |
+| `low` | Nice-to-have or cosmetic |
+---
+## The Neuroscience Behind Assay
+Assay is not an arbitrary methodology. It is grounded in three convergent lines of evidence from cognitive neuroscience:
+### 1. Transformers = Hippocampal Pattern Completion
+Ramsauer et al. (2020) proved that transformer self-attention is **mathematically equivalent** to the update rule of modern (continuous-state) Hopfield networks -- the same associative memory computation performed by the hippocampal CA3 network. When an LLM generates text about a nonexistent app, it performs pattern completion from partial cues, filling gaps with plausible details. This is identical to how human memory reconstructs events -- some accurate, some confabulated.
+### 2. Perception as Controlled Hallucination
+The predictive processing framework (Friston, Clark, Seth) holds that the brain is a prediction machine. As Anil Seth states: *"We're all hallucinating all the time; when we agree about our hallucinations, we call it reality."* Hallucination and perception are the same generative process under different constraint levels. Assay deliberately operates unconstrained during the Hallucinate phase, then progressively introduces constraint through Converge and Regenerate.
+### 3. The REBUS Model (Relaxed Beliefs Under Psychedelics)
+Carhart-Harris and Friston (2019) showed that psychedelics relax the brain's top-down constraints, enabling novel associations that rigid priors normally suppress. This maps directly to LLM temperature: higher temperature = more novel (and hallucination-prone) outputs. Assay exploits this by generating freely at "high temperature," then constraining iteratively -- just as the brain reintegrates psychedelic insights under normal conditions.
+### The Naming
+The LUCID methodology is named for **lucid dreaming** -- the state where a dreamer becomes metacognitively aware they are dreaming while remaining in the dream. A lucid dreamer does not fight the dream. They participate with awareness, harvesting creative content while maintaining the ability to distinguish generated from real. Assay applies this principle to AI-generated code: harness the hallucination, don't suppress it.
+---
+## How Assay Differs From Traditional Approaches
+| Approach | Hallucination Stance | Spec Source | Convergence Loop | Verification |
+|----------|---------------------|-------------|------------------|-------------|
+| **Spec-Driven Development** (GitHub, 2025) | Prevents | Human-written | No | Spec compliance |
+| **Readme-Driven Development** (Preston-Werner, 2010) | N/A | Human-written | No | Manual |
+| **Design Fiction** (Sterling, 2005) | Intentional (human) | Human fiction | Loose | Informal |
+| **Vibe Coding** (Karpathy, 2025) | Tolerates | Human prompt | No | Ad hoc |
+| **Protein Hallucination** (Baker, Nobel 2024) | Exploits | Neural network | Validate-only | Lab synthesis |
+| **Assay** | **Exploits** | **AI-hallucinated ToS** | **Yes** | **Codebase verification** |
+Assay is the only methodology that combines AI-generated specification, deliberate hallucination exploitation, and iterative convergence verification against a real codebase.
+The closest analogue is David Baker's protein hallucination -- where neural network "dreams" serve as blueprints for novel biological structures. That insight earned the **2024 Nobel Prize in Chemistry**. Assay applies the identical principle to software engineering.
+---
+## Real-World Application
+Assay was developed and dogfooded on production applications, including an event photography platform and an AI agent platform. The gap analysis from a real Assay iteration looks like this:
+```
+Iteration 1: CrowdPics TV (112 claims extracted)
++----------------------------------+
+|  REAL          36  (32%)  ====   |
+|  PARTIAL       13  (12%)  ==     |
+|  HALLUCINATED  63  (56%)  ====== |
++----------------------------------+
+Each HALLUCINATED claim is a missing feature.
+Each PARTIAL claim is incomplete work.
+The gap IS the backlog.
+```
+After iterative remediation and regeneration, compliance converges toward 90%+. The remaining gaps are genuine missing functionality that serves as a prioritized development roadmap.
+---
+## Project Structure
+```
+hallucination-reversing-system/
+├── src/                        # CLI source (TypeScript)
+│   ├── cli.ts                  # Entry point (Commander.js)
+│   ├── commands/               # One file per CLI command
+│   │   ├── init.ts             # Project initialization
+│   │   ├── hallucinate.ts      # ToS generation
+│   │   ├── describe.ts         # Fetch existing ToS from URL
+│   │   ├── extract.ts          # Claim extraction
+│   │   ├── verify.ts           # Codebase verification
+│   │   ├── report.ts           # Gap report generation
+│   │   ├── remediate.ts        # Fix task generation
+│   │   └── regenerate.ts       # Iterative regeneration
+│   ├── lib/                    # Core modules
+│   │   ├── anthropic.ts        # Claude SDK wrapper
+│   │   ├── claim-extractor.ts  # Claim parsing logic
+│   │   ├── code-verifier.ts    # Codebase verification engine
+│   │   ├── codebase-indexer.ts # File tree indexing
+│   │   ├── config.ts           # Project configuration
+│   │   ├── prompts.ts          # LLM prompt templates
+│   │   └── ...
+│   └── types.ts                # Type definitions
+├── docs/                       # Documentation
+│   ├── paper.md                # Full research paper
+│   ├── methodology.md          # Methodology guide
+│   └── prior-art.md            # Prior art analysis
+├── applications/               # Real-world Assay applications
+├── arxiv-submission/           # Academic paper (LaTeX + PDF)
+├── chi-submission/             # CHI 2026 workshop submission
+├── index.html                  # Landing page (GitHub Pages)
+└── .assay/                     # Assay's own self-audit
+    └── iterations/
+        └── self-audit/         # Assay audited against itself
+```
+---
+## Publications
+| Venue | Status | Link |
+|-------|--------|------|
+| **Zenodo** (peer-reviewed DOI) | Published | [10.5281/zenodo.18522644](https://doi.org/10.5281/zenodo.18522644) |
+| **arXiv** | Submitted | [arxiv-submission/main.pdf](arxiv-submission/main.pdf) |
+| **CHI 2026 Workshop** | In progress | [chi-submission/](chi-submission/) |
+---
+## Token Economics
+Running a full Assay iteration is inexpensive:
+| Phase | Input Tokens | Output Tokens | Cost (approx.) |
+|-------|-------------|---------------|----------------|
+| Hallucinate | ~2K | ~12K | $0.15 |
+| Extract | ~15K | ~8K | $0.25 |
+| Verify | ~80K | ~20K | $1.50 |
+| Remediate | ~30K | ~15K | $0.60 |
+| Regenerate | ~20K | ~12K | $0.40 |
+| **Full iteration** | | | **~$2.90** |
+A complete 6-iteration cycle that achieves 90%+ compliance costs approximately **$17 in API tokens** -- producing a verified specification with 91 claims, a gap report, and a prioritized remediation plan.
+---
+## Principles
+1. **Hallucination is signal, not noise.** The AI's confabulations reveal what a plausible version of the application looks like.
+2. **Legal language enforces precision.** ToS cannot be vague. The format forces the AI to hallucinate precisely.
+3. **The gap is the backlog.** The difference between what the ToS claims and what the code does is your task list.
+4. **Reality is the only test.** A claim is satisfied when verified against running code, not when code is written.
+5. **The loop is the methodology.** Assay is not one-shot generation. It is iterative convergence between fiction and reality.
+6. **Verification requires external ground truth.** LLMs cannot self-correct without external feedback (Huang et al., ICLR 2024). The codebase is the ground truth.
+---
+## Contributing
+Contributions are welcome. Areas where help is particularly valuable:
+- **Multi-document hallucination** -- Extending beyond ToS to API docs, user manuals, privacy policies, and compliance certifications simultaneously
+- **Formal verification integration** -- Replacing LLM-based verification with property-based testing, model checking, or static analysis for specific claim categories
+- **CI/CD integration** -- Running Assay in continuous integration pipelines for specification-drift detection
+- **Language support** -- The CLI currently targets TypeScript/JavaScript codebases; other languages need codebase indexing adapters
+- **Benchmarking** -- Comparing initial hallucination quality across different LLMs (Claude, GPT-4, Gemini, Llama)
+### Development
+```bash
+git clone https://github.com/gtsbahamas/hallucination-reversing-system.git
+cd hallucination-reversing-system
+npm install
+npm run dev    # Watch mode (TypeScript compilation)
+npm run build  # Production build
+```
+---
+## FAQ
+**Q: Isn't this just "make stuff up and hope for the best"?**
+No. The hallucination is the *input*, not the output. Assay verifies every claim against the actual codebase. Unverified claims are surfaced as gaps. Nothing ships without evidence. The methodology is closer to the scientific method: hypothesize (hallucinate), test (verify), refine (regenerate).
+**Q: Why not just write requirements manually?**
+You can. But no human writes 91 testable requirements spanning functionality, security, data privacy, performance, operations, and legal compliance in 30 seconds. Assay generates comprehensive first-draft specifications at machine speed, then converges them toward reality through verification.
+**Q: Does this actually work in production?**
+Yes. Assay was developed while building production applications. The empirical results (an estimated ~35% compliance at iteration 1, a measured 57% at iteration 3, and 91% at iteration 6) come from a real codebase with roughly 30,000 lines of TypeScript. The remaining gaps were genuine missing functionality, not false positives.
+**Q: How is this different from vibe coding?**
+Vibe coding tolerates hallucination in the *code*. Assay exploits hallucination in the *specification* and then demands rigorous verification of the code against that specification. The verification loop is the critical difference -- vibe coding has no convergence mechanism.
+**Q: What models does Assay support?**
+The CLI currently uses Anthropic's Claude via the official SDK. The architecture is model-agnostic -- any LLM capable of generating structured legal text and performing code analysis can be substituted.
+---
+## Citation
+```bibtex
+@article{wells2026lucid,
+  title={LUCID: Leveraging Unverified Claims Into Deliverables},
+  author={Wells, Ty},
+  year={2026},
+  doi={10.5281/zenodo.18522644},
+  url={https://github.com/gtsbahamas/hallucination-reversing-system}
+}
+```
+---
+## License
+[MIT](LICENSE) -- Use it, fork it, build on it.
+Copyright (c) 2026 Rock Steady Systems LLC.
+---
+<div align="center">
+*"Normal specification is hallucination constrained by reality. Assay is the first development tool that uses this principle: generate freely, then constrain iteratively, just as the brain does."*
+**Built by [Rock Steady Systems LLC](https://tryassay.ai)**
+</div>

package/dist/cli.d.ts ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ #!/usr/bin/env node
2	+ export {};

package/dist/cli.js ADDED Viewed

@@ -0,0 +1,80 @@
+#!/usr/bin/env node
+import { Command } from 'commander';
+import { initCommand } from './commands/init.js';
+import { hallucinateCommand } from './commands/hallucinate.js';
+import { extractCommand } from './commands/extract.js';
+import { describeCommand } from './commands/describe.js';
+import { verifyCommand } from './commands/verify.js';
+import { reportCommand } from './commands/report.js';
+import { regenerateCommand } from './commands/regenerate.js';
+import { remediateCommand } from './commands/remediate.js';
+import { reverseCommand } from './commands/reverse.js';
+import { assessCommand } from './commands/assess.js';
+const program = new Command();
+program
+    .name('assay')
+    .description('Assay — AI code verification using the LUCID methodology')
+    .version('0.1.0');
+program
+    .command('init')
+    .description('Initialize an Assay project in the current directory')
+    .action(initCommand);
+program
+    .command('hallucinate')
+    .description('Generate a hallucinated spec from your project config')
+    .option('-t, --type <type>', 'Document type: tos, api-docs, user-manual', 'tos')
+    .action(hallucinateCommand);
+program
+    .command('describe')
+    .description('Fetch an existing ToS or Privacy Policy from a URL')
+    .option('-u, --url <url...>', 'URL(s) to fetch')
+    .action(describeCommand);
+program
+    .command('extract')
+    .description('Extract testable claims from a hallucinated or described document')
+    .option('-i, --iteration <number>', 'Iteration number (defaults to latest)')
+    .option('-s, --source <filename>', 'Source file from .assay/sources/ instead of iteration')
+    .action(extractCommand);
+program
+    .command('verify')
+    .description('Verify extracted claims against a codebase')
+    .option('-r, --repo <path>', 'Path to the codebase to verify against', '.')
+    .option('-i, --iteration <number>', 'Iteration number (defaults to latest)')
+    .action(verifyCommand);
+program
+    .command('report')
+    .description('Generate a gap report from verification results')
+    .option('-i, --iteration <number>', 'Iteration number (defaults to latest)')
+    .action(reportCommand);
+program
+    .command('regenerate')
+    .description('Regenerate a hallucinated spec from prior verification results (Phase 6)')
+    .option('-i, --iteration <number>', 'Source iteration to regenerate from (defaults to latest)')
+    .action(regenerateCommand);
+program
+    .command('remediate')
+    .description('Generate code-level fix tasks from verification results (converge code toward spec)')
+    .option('-i, --iteration <number>', 'Iteration number (defaults to latest)')
+    .option('-r, --repo <path>', 'Path to the codebase to remediate', '.')
+    .option('-t, --threshold <number>', 'Compliance threshold (default: 95)', '95')
+    .action(remediateCommand);
+program
+    .command('reverse')
+    .description('Reverse Assay — generate code with hallucination prevention')
+    .option('-t, --task <task>', 'Coding task description')
+    .option('-f, --task-file <path>', 'Read task from file')
+    .option('-l, --lang <language>', 'Target language', 'typescript')
+    .option('-o, --output <path>', 'Output file path')
+    .option('-v, --verbose', 'Show detailed progress')
+    .action(reverseCommand);
+program
+    .command('assess')
+    .description('Run autonomous LVR Loop 1 assessment against a codebase')
+    .argument('<target>', 'Path to codebase or GitHub repo URL')
+    .option('--publish', 'Upload results to tryassay.ai')
+    .option('--domain <domains>', 'Comma-separated domains to assess (default: all)')
+    .option('--concurrency <n>', 'Max parallel routes to process', '5')
+    .option('--api-url <url>', 'API URL for publishing', 'https://tryassay.ai')
+    .action(assessCommand);
+program.parse();
+//# sourceMappingURL=cli.js.map

package/dist/cli.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"cli.js","sourceRoot":"","sources":["../src/cli.ts"],"names":[],"mappings":";AAEA,OAAO,EAAE,OAAO,EAAE,MAAM,WAAW,CAAC;AACpC,OAAO,EAAE,WAAW,EAAE,MAAM,oBAAoB,CAAC;AACjD,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;AACvD,OAAO,EAAE,eAAe,EAAE,MAAM,wBAAwB,CAAC;AACzD,OAAO,EAAE,aAAa,EAAE,MAAM,sBAAsB,CAAC;AACrD,OAAO,EAAE,aAAa,EAAE,MAAM,sBAAsB,CAAC;AACrD,OAAO,EAAE,iBAAiB,EAAE,MAAM,0BAA0B,CAAC;AAC7D,OAAO,EAAE,gBAAgB,EAAE,MAAM,yBAAyB,CAAC;AAC3D,OAAO,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;AACvD,OAAO,EAAE,aAAa,EAAE,MAAM,sBAAsB,CAAC;AAErD,MAAM,OAAO,GAAG,IAAI,OAAO,EAAE,CAAC;AAE9B,OAAO;KACJ,IAAI,CAAC,OAAO,CAAC;KACb,WAAW,CAAC,0DAA0D,CAAC;KACvE,OAAO,CAAC,OAAO,CAAC,CAAC;AAEpB,OAAO;KACJ,OAAO,CAAC,MAAM,CAAC;KACf,WAAW,CAAC,sDAAsD,CAAC;KACnE,MAAM,CAAC,WAAW,CAAC,CAAC;AAEvB,OAAO;KACJ,OAAO,CAAC,aAAa,CAAC;KACtB,WAAW,CAAC,uDAAuD,CAAC;KACpE,MAAM,CAAC,mBAAmB,EAAE,2CAA2C,EAAE,KAAK,CAAC;KAC/E,MAAM,CAAC,kBAAkB,CAAC,CAAC;AAE9B,OAAO;KACJ,OAAO,CAAC,UAAU,CAAC;KACnB,WAAW,CAAC,oDAAoD,CAAC;KACjE,MAAM,CAAC,oBAAoB,EAAE,iBAAiB,CAAC;KAC/C,MAAM,CAAC,eAAe,CAAC,CAAC;AAE3B,OAAO;KACJ,OAAO,CAAC,SAAS,CAAC;KAClB,WAAW,CAAC,mEAAmE,CAAC;KAChF,MAAM,CAAC,0BAA0B,EAAE,uCAAuC,CAAC;KAC3E,MAAM,CAAC,yBAAyB,EAAE,uDAAuD,CAAC;KAC1F,MAAM,CAAC,cAAc,CAAC,CAAC;AAE1B,OAAO;KACJ,OAAO,CAAC,QAAQ,CAAC;KACjB,WAAW,CAAC,4CAA4C,CAAC;KACzD,MAAM,CAAC,mBAAmB,EAAE,wCAAwC,EAAE,GAAG,CAAC;KAC1E,MAAM,CAAC,0BAA0B,EAAE,uCAAuC,CAAC;KAC3E,MAAM,CAAC,aAAa,CAAC,CAAC;AAEzB,OAAO;KACJ,OAAO,CAAC,QAAQ,CAAC;KACjB,WAAW,CAAC,iDAAiD,CAAC;KAC9D,MAAM,CAAC,0BAA0B,EAAE,uCAAuC,CAAC;KAC3E,MAAM,CAAC,aAAa,CAAC,CAAC;AAEzB,OAAO;KACJ,OAAO,CAAC,YAAY,CAAC;KACrB,WAAW,CAAC,0EAA0E,CAAC;KACvF,MAAM,CAAC,0BAA0B,EAAE,0DAA0D,CAAC;KAC9F,MAAM,CAAC,iBAAiB,CAAC,CAAC;AAE7B,OAAO;KACJ,OAAO,CAAC,WAAW,CAAC;KACpB,WAAW,CAAC,qFAAqF,CAAC;KAClG,MAAM,CAAC,0BAA0B,EAAE,uCAAuC,CAAC;KAC3E,MAAM,CAAC,mBAAmB,EAAE,mCAAmC,EAAE,GAAG,CAAC;KACrE,MAAM,CAAC,0BAA0B,EAAE,oCAAoC,EAAE,IAAI,CAAC;KAC9E,MAAM,CAAC,gBAAgB,CAAC,CAAC;AAE5B,OAAO;KACJ,OAAO,CAAC,SAAS,CAAC;KAClB,WAA
W,CAAC,6DAA6D,CAAC;KAC1E,MAAM,CAAC,mBAAmB,EAAE,yBAAyB,CAAC;KACtD,MAAM,CAAC,wBAAwB,EAAE,qBAAqB,CAAC;KACvD,MAAM,CAAC,uBAAuB,EAAE,iBAAiB,EAAE,YAAY,CAAC;KAChE,MAAM,CAAC,qBAAqB,EAAE,kBAAkB,CAAC;KACjD,MAAM,CAAC,eAAe,EAAE,wBAAwB,CAAC;KACjD,MAAM,CAAC,cAAc,CAAC,CAAC;AAE1B,OAAO;KACJ,OAAO,CAAC,QAAQ,CAAC;KACjB,WAAW,CAAC,yDAAyD,CAAC;KACtE,QAAQ,CAAC,UAAU,EAAE,qCAAqC,CAAC;KAC3D,MAAM,CAAC,WAAW,EAAE,+BAA+B,CAAC;KACpD,MAAM,CAAC,oBAAoB,EAAE,kDAAkD,CAAC;KAChF,MAAM,CAAC,mBAAmB,EAAE,gCAAgC,EAAE,GAAG,CAAC;KAClE,MAAM,CAAC,iBAAiB,EAAE,wBAAwB,EAAE,qBAAqB,CAAC;KAC1E,MAAM,CAAC,aAAa,CAAC,CAAC;AAEzB,OAAO,CAAC,KAAK,EAAE,CAAC"}

package/dist/commands/assess.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export declare function assessCommand(target: string, options: { // Action handler registered for the CLI's `assess` subcommand; `target` is its positional <target> argument.
+    publish?: boolean; // Presumably set by the `--publish` flag — confirm against the implementation.
+    domain?: string; // Raw `--domain` value; the CLI help describes it as a comma-separated list.
+    concurrency?: string; // Declared as a string, not a number; the CLI registers the default '5'.
+    apiUrl?: string; // Presumably populated from `--api-url`; the CLI registers the default 'https://tryassay.ai'.
+}): Promise<void>; // Asynchronous: the returned promise resolves with no value.