npm - @miller-tech/uap - Versions diffs - 1.40.0 → 1.41.0 - Mend

@miller-tech/uap 1.40.0 → 1.41.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (150) hide show

package/README.md +109 -642
package/dist/.tsbuildinfo +1 -1
package/dist/cli/deliver-defaults.d.ts +23 -0
package/dist/cli/deliver-defaults.d.ts.map +1 -0
package/dist/cli/deliver-defaults.js +121 -0
package/dist/cli/deliver-defaults.js.map +1 -0
package/dist/cli/init.d.ts.map +1 -1
package/dist/cli/init.js +29 -0
package/dist/cli/init.js.map +1 -1
package/dist/cli/setup.d.ts.map +1 -1
package/dist/cli/setup.js +19 -0
package/dist/cli/setup.js.map +1 -1
package/dist/policies/policy-tools.d.ts +7 -0
package/dist/policies/policy-tools.d.ts.map +1 -1
package/dist/policies/policy-tools.js +24 -2
package/dist/policies/policy-tools.js.map +1 -1
package/docs/INDEX.md +48 -286
package/docs/architecture/OVERVIEW.md +328 -0
package/docs/architecture/PROTOCOL.md +204 -0
package/docs/benchmarks/README.md +17 -192
package/docs/getting-started/CONFIGURATION.md +237 -0
package/docs/getting-started/INSTALLATION.md +125 -0
package/docs/getting-started/QUICKSTART.md +115 -0
package/docs/guides/COORDINATION.md +162 -0
package/docs/guides/DELIVER.md +115 -0
package/docs/guides/DEPLOY_BATCHING.md +212 -0
package/docs/guides/DROIDS_AND_SKILLS.md +202 -0
package/docs/guides/LOCAL_MODELS.md +148 -0
package/docs/guides/MCP_ROUTER.md +195 -0
package/docs/guides/MEMORY.md +235 -0
package/docs/guides/MULTI_MODEL.md +223 -0
package/docs/guides/POLICIES.md +190 -0
package/docs/guides/WORKTREE_WORKFLOW.md +185 -0
package/docs/integrations/MCP_ROUTER.md +147 -0
package/docs/integrations/RTK.md +102 -0
package/docs/reference/API.md +485 -0
package/docs/reference/CLI.md +719 -0
package/docs/reference/CONFIGURATION.md +90 -193
package/docs/reference/DATABASE_SCHEMA.md +110 -344
package/docs/reference/FEATURES.md +176 -472
package/docs/reference/PATTERNS.md +102 -0
package/docs/reference/PLATFORMS.md +83 -0
package/package.json +3 -1
package/src/policies/enforcers/7ebbc721-7540-4e9f-879a-770e0213a09b_architecture_review.py +101 -0
package/src/policies/enforcers/__pycache__/_common.cpython-312.pyc +0 -0
package/src/policies/enforcers/_common.py +100 -0
package/src/policies/enforcers/artifact_hygiene.py +52 -0
package/src/policies/enforcers/cluster_routing.py +63 -0
package/src/policies/enforcers/codebase_read_before_plan.py +52 -0
package/src/policies/enforcers/coord_overlap.py +81 -0
package/src/policies/enforcers/delivery_enforcement.py +97 -0
package/src/policies/enforcers/doc_live_over_report.py +50 -0
package/src/policies/enforcers/expert_review_required.py +135 -0
package/src/policies/enforcers/iac_parity.py +53 -0
package/src/policies/enforcers/mcp_router_first.py +37 -0
package/src/policies/enforcers/memory_before_plan.py +61 -0
package/src/policies/enforcers/parallel_reads.py +50 -0
package/src/policies/enforcers/rtk_wrap.py +44 -0
package/src/policies/enforcers/schema_diff_gate.py +80 -0
package/src/policies/enforcers/session_memory_write.py +52 -0
package/src/policies/enforcers/task_required.py +131 -0
package/src/policies/enforcers/test_gate.py +58 -0
package/src/policies/enforcers/validate_plan_before_build.py +75 -0
package/src/policies/enforcers/worktree_required.py +57 -0
package/src/policies/schemas/policies/architecture-review.md +51 -0
package/src/policies/schemas/policies/artifact-hygiene.md +29 -0
package/src/policies/schemas/policies/cluster-routing.md +31 -0
package/src/policies/schemas/policies/codebase-read-before-plan.md +30 -0
package/src/policies/schemas/policies/coord-overlap.md +24 -0
package/src/policies/schemas/policies/delivery-enforcement.md +45 -0
package/src/policies/schemas/policies/doc-live-over-report.md +32 -0
package/src/policies/schemas/policies/expert-review-required.md +60 -0
package/src/policies/schemas/policies/iac-parity.md +31 -0
package/src/policies/schemas/policies/mandatory-testing-deployment.md +147 -0
package/src/policies/schemas/policies/mcp-router-first.md +24 -0
package/src/policies/schemas/policies/memory-before-plan.md +24 -0
package/src/policies/schemas/policies/merge-deploy-monitor-verify.md +145 -0
package/src/policies/schemas/policies/parallel-reads.md +24 -0
package/src/policies/schemas/policies/rtk-wrap.md +26 -0
package/src/policies/schemas/policies/schema-diff-gate.md +30 -0
package/src/policies/schemas/policies/session-memory-write.md +24 -0
package/src/policies/schemas/policies/task-required.md +49 -0
package/src/policies/schemas/policies/test-gate.md +24 -0
package/src/policies/schemas/policies/validate-plan-before-build.md +28 -0
package/src/policies/schemas/policies/worktree-required.md +28 -0
package/templates/hooks/uap-policy-gate.sh +5 -0
package/docs/AGENTS.md +0 -423
package/docs/DOCUMENTATION_AUDIT_REPORT.md +0 -131
package/docs/GETTING_STARTED.md +0 -288
package/docs/PROJECT_ANALYSIS_REPORT.md +0 -510
package/docs/architecture/COMPLETE_ARCHITECTURE.md +0 -748
package/docs/architecture/EXPERT_STACK.md +0 -137
package/docs/architecture/MULTI_MODEL.md +0 -224
package/docs/architecture/PLATFORM_GATING.md +0 -68
package/docs/architecture/SYSTEM_ANALYSIS.md +0 -334
package/docs/architecture/UAP_COMPLIANCE.md +0 -217
package/docs/architecture/UAP_PROTOCOL.md +0 -339
package/docs/architecture/UAP_STRICT_DROIDS.md +0 -172
package/docs/archive/BALLS_MODE_SELF_ANALYSIS.md +0 -260
package/docs/archive/BENCHMARK_GAPS_AND_PLAN.md +0 -146
package/docs/archive/FAILING_TASKS_SOLUTION_PLAN.md +0 -668
package/docs/archive/JINJA2-SYSTEM-MESSAGE-FIX.md +0 -209
package/docs/archive/MODEL_ROUTING_IMPLEMENTATION_SUMMARY.md +0 -281
package/docs/archive/MODEL_ROUTING_OPTIMIZATION_PLAN.md +0 -320
package/docs/archive/NPM-PUBLISH-V0.9.1.md +0 -240
package/docs/archive/OPTIMIZATION_OPTIONS.md +0 -334
package/docs/archive/PARALLELISM_GAPS_AND_OPTIONS.md +0 -422
package/docs/archive/POLICY_GATE_IMPLEMENTATION.md +0 -245
package/docs/archive/SETUP_IMPROVEMENTS.md +0 -213
package/docs/archive/UAP_GENERIC_OPTIMIZATION_PLAN.md +0 -270
package/docs/archive/UAP_OPTIMIZATION_PLAN.md +0 -701
package/docs/archive/UAP_V103_PATTERN_DESIGN.md +0 -315
package/docs/archive/UAP_V104_COMPLIANCE_DESIGN.md +0 -223
package/docs/archive/changelog/2026-03-10_uap-100-compliance.md +0 -77
package/docs/archive/changelog/2026-03-10_uap-full-system-verification.md +0 -109
package/docs/archive/opencode-integration-guide.md +0 -740
package/docs/archive/opencode-integration-quickref.md +0 -180
package/docs/benchmarks/OVERNIGHT_RUNNER.md +0 -341
package/docs/benchmarks/SPECULATIVE_DECODING_JOURNEY_2026-03.md +0 -221
package/docs/benchmarks/VALIDATION_PLAN.md +0 -568
package/docs/blog/SPECULATIVE_DECODING_PRODUCTION_PLAYBOOK.md +0 -139
package/docs/blog/local-coding-agents.md +0 -266
package/docs/blog/x-thread.md +0 -254
package/docs/deployment/DEPLOYMENT.md +0 -895
package/docs/deployment/DEPLOYMENT_STRATEGIES.md +0 -518
package/docs/deployment/DEPLOY_BATCHER_ANALYSIS.md +0 -224
package/docs/deployment/DEPLOY_BATCHING.md +0 -273
package/docs/deployment/DEPLOY_BUCKETING_ANALYSIS.md +0 -420
package/docs/deployment/QWEN35_LLAMA_CPP.md +0 -426
package/docs/deployment/UAP_LLAMA_ANTHROPIC_PROXY_BOOTSTRAP.md +0 -279
package/docs/getting-started/INTEGRATION.md +0 -628
package/docs/getting-started/OVERVIEW.md +0 -324
package/docs/getting-started/SETUP.md +0 -377
package/docs/integrations/MCP_ROUTER_SETUP.md +0 -445
package/docs/integrations/RTK_INTEGRATION.md +0 -468
package/docs/operations/TROUBLESHOOTING.md +0 -660
package/docs/pr/PR_SPECULATIVE_DOCS_TEMPLATE.md +0 -146
package/docs/pr/UPSTREAM_PRS.md +0 -424
package/docs/reference/API_REFERENCE.md +0 -903
package/docs/reference/EXPERT_DROIDS.md +0 -219
package/docs/reference/HARNESS-MATRIX.md +0 -318
package/docs/reference/PATTERN_LIBRARY.md +0 -636
package/docs/reference/UAP_CLI_REFERENCE.md +0 -620
package/docs/research/BEHAVIORAL_PATTERNS.md +0 -228
package/docs/research/DOMAIN_STRATEGIES.md +0 -316
package/docs/research/MEMORY_SYSTEMS_COMPARISON.md +0 -812
package/docs/research/PATTERN_ANALYSIS_2026-01-18.md +0 -436
package/docs/research/PERFORMANCE_ANALYSIS_2026-01-18.md +0 -209
package/docs/research/PERFORMANCE_TEST_PLAN.md +0 -383
package/docs/research/TERMINAL_BENCH_LEARNINGS.md +0 -217

package/src/policies/schemas/policies/mandatory-testing-deployment.md ADDED Viewed

@@ -0,0 +1,147 @@
+# Policy: Mandatory Testing & Deployment Verification
+**ID**: `policy-mandatory-testing-deployment`
+**Name**: Mandatory Testing and Deployment Verification
+**Category**: testing
+**Level**: REQUIRED
+**Enforcement Stage**: review
+**Version**: 1.0
+## Purpose
+This policy enforces that all code changes MUST complete testing, deployment verification, and quality checks before a task can be marked as DONE or closed. This prevents incomplete work from being considered finished.
+## Rules
+```rules
+- title: "Mandatory Test Creation"
+  keywords: ["done", "complete", "finish", "close", "resolve", "merge"]
+  antiPatterns: ["no new tests", "zero tests added", "skip test creation", "tests not written"]
+- title: "Testing Requirement"
+  keywords: ["done", "complete", "finish", "close", "resolve", "merge"]
+  antiPatterns: ["incomplete test", "no test coverage", "untested code", "skip test"]
+- title: "Version Bump Required"
+  keywords: ["done", "complete", "finish", "close", "resolve", "merge", "push"]
+  antiPatterns: ["manual version edit", "no version bump", "skip version", "version not bumped"]
+- title: "Deployment Verification Required"
+  keywords: ["deploy", "production", "release", "push", "merge"]
+  antiPatterns: ["unverified deployment", "no smoke test", "deployment failed"]
+- title: "Quality Gate Enforcement"
+  keywords: ["quality", "lint", "type-check", "coverage", "security"]
+  antiPatterns: ["disable lint", "bypass type check", "low coverage", "security warning"]
+- title: "Documentation Requirement"
+  keywords: ["document", "readme", "api", "changelog", "migration"]
+  antiPatterns: ["no documentation", "missing changelog", "undocumented change"]
+```
+## Enforcement Behavior
+### When Triggered
+This policy is enforced during the **review stage** when:
+- Task status is being changed to DONE, COMPLETE, or CLOSED
+- Pull request is being merged
+- Deployment is being finalized
+- Release is being published
+### Required Actions Before Completion
+1. **Mandatory Test Creation**
+   - At least 2 new test cases MUST be written for every code change
+   - Tests must cover the new or changed behavior (not unrelated code)
+   - Tests must follow existing patterns: `test/<feature>.test.ts` using vitest (`describe`/`it`/`expect`)
+   - Tests must assert correctness (not just "it doesn't throw")
+   - Bug fixes: at least one test must reproduce the bug scenario
+   - New features: tests must cover the happy path and at least one edge case
+2. **Testing Verification**
+   - All unit tests must pass including the new ones
+   - Test coverage maintained or improved (no regression)
+   - Integration tests must pass
+   - E2E tests must pass for critical paths
+   - No new test failures introduced
+3. **Version Bump**
+   - Version must be bumped via `npm run version:patch`, `npm run version:minor`, or `npm run version:major`
+   - Manual edits to `package.json` version field are prohibited
+   - Commit type determines bump level: fix->patch, feat->minor, breaking->major
+   - CHANGELOG.md is updated automatically by the version script
+   - Git tag is created automatically
+4. **Deployment Verification**
+   - Deployment to staging/preview environment successful
+   - Smoke tests passed in target environment
+   - Rollback plan verified (if applicable)
+   - No deployment warnings/errors
+5. **Quality Checks**
+   - Linting passes without errors
+   - Type checking passes (for TypeScript projects)
+   - Security scan shows no critical/high vulnerabilities
+   - Performance benchmarks within acceptable range
+6. **Documentation**
+   - Code comments updated for public APIs
+   - README.md updated if CLI/tools changed
+   - Changelog entry added (automated via version bump script)
+   - Breaking changes documented
+### Verification Checklist
+Before marking work as DONE, verify:
+- [ ] At least 2 new tests written for changed code
+- [ ] New tests assert correctness (not just "doesn't throw")
+- [ ] All tests passing (`npm test`)
+- [ ] Test coverage maintained or improved
+- [ ] Code linting passes (`npm run lint`)
+- [ ] Type checking passes (`tsc --noEmit`)
+- [ ] Version bumped via `npm run version:patch`, `npm run version:minor`, or `npm run version:major`
+- [ ] CHANGELOG.md updated (automated via version script)
+- [ ] Git tag created (automated via version script)
+- [ ] Deployment to staging successful (if applicable)
+- [ ] Smoke tests passed in staging (if applicable)
+- [ ] No new security vulnerabilities
+- [ ] Documentation updated
+- [ ] Reviewers approved
+- [ ] No unresolved TODOs or FIXMEs
+### Anti-Patterns to Avoid
+❌ **DO NOT** mark tasks as DONE when:
+- No new tests were written for code changes
+- Tests are failing or skipped
+- Version was not bumped or was bumped manually
+- Deployment hasn't been verified
+- Code quality gates are bypassed
+- Documentation is missing or outdated
+- Critical bugs remain open
+- Security warnings are ignored
+- Rollback plan doesn't exist for breaking changes
+## Implementation Notes
+This policy should be enforced by:
+1. **CI/CD pipelines** - Block merges if tests fail
+2. **Code review tools** - Require passing quality checks
+3. **Task management systems** - Block status changes without verification
+4. **Policy gate system** - Validate before allowing completion commands
+## Related Policies
+- `policy-code-quality` - General code quality requirements
+- `policy-security-gate` - Security scanning requirements
+- `policy-deployment-safety` - Deployment safety checks
+---
+_Last Updated: 2026-03-18_
+_Author: Miller Tech UAP System_

package/src/policies/schemas/policies/mcp-router-first.md ADDED Viewed

@@ -0,0 +1,24 @@
+# mcp-router-first
+**Category**: custom
+**Level**: RECOMMENDED
+**Enforcement Stage**: pre-exec
+**Tags**: mcp, router, tokens, context
+## Rule
+When the session lists MCP tools as deferred (loaded on demand), agents MUST use `ToolSearch` / `uap mcp-router` to pull individual tool schemas as they are needed rather than eagerly loading full MCP tool catalogs.
+## Why
+The session has 150+ deferred MCP tools (Playwright, Pay2U API, Terraform, Drive, etc.). Loading the full schema set burns ~30k+ tokens. UAP's MCP Router provides 98% token reduction (per CLI docs).
+## Enforcement
+Python enforcer `mcp_router_first.py` blocks bulk-load patterns and requires the specific tool name in the ToolSearch query.
+```rules
+- title: "Load MCP tools on demand"
+  keywords: [mcp, tool-schema, load-tools]
+  antiPatterns: [load-all, bulk-load, eager-schema]
+```

package/src/policies/schemas/policies/memory-before-plan.md ADDED Viewed

@@ -0,0 +1,24 @@
+# memory-before-plan
+**Category**: workflow
+**Level**: REQUIRED
+**Enforcement Stage**: pre-exec
+**Tags**: memory, uap, planning
+## Rule
+Before producing any implementation plan that spans 3+ steps or touches 3+ files, the agent MUST have run `uap memory query <topic>` within the last 5 minutes. The UAP compliance protocol already mandates this; this policy enforces it.
+## Why
+Avoids re-deriving context already captured in prior sessions. Reduces duplicate work and keeps guidance coherent across agent runs.
+## Enforcement
+Python enforcer `memory_before_plan.py` checks `agents/data/memory/short_term.db` for a recent `uap memory query` action tagged with a relevant topic.
+```rules
+- title: "Plans must be preceded by memory query"
+  keywords: [plan, implement, build, design, architect]
+  antiPatterns: [no-memory-check, skip-history]
+```

package/src/policies/schemas/policies/merge-deploy-monitor-verify.md ADDED Viewed

@@ -0,0 +1,145 @@
+# Policy: Merge, Deploy, Monitor, Verify
+**ID**: `policy-merge-deploy-monitor-verify`
+**Name**: Merge, Deploy, Monitor, Verify Before Done
+**Category**: completion
+**Level**: REQUIRED
+**Enforcement Stage**: review
+**Version**: 1.0
+## Purpose
+This policy enforces that a change is NOT DONE until it has been merged, rolled out via the designated pipeline, observed healthy in the target environment for a defined monitoring window, and verified with captured evidence to behave correctly end-to-end. Local "build green + tests pass" is necessary but not sufficient — DONE requires evidence from the deployed system, not just CI.
+## Rules
+```rules
+- title: "Merge Gate"
+  keywords: ["done", "complete", "finish", "close", "resolve", "shipped"]
+  antiPatterns: ["direct push to master", "no pr", "skip review", "force merge", "ci failing", "merged with red ci"]
+- title: "Deploy Gate"
+  keywords: ["done", "complete", "deploy", "release", "ship", "rollout"]
+  antiPatterns: ["manual deploy", "ad-hoc cluster command", "hand-edited resource", "deploy skipped", "deployment failed", "pipeline bypassed", "out-of-band rollout"]
+- title: "Monitor Gate"
+  keywords: ["done", "complete", "monitor", "observe", "verify health"]
+  antiPatterns: ["no monitoring window", "skip observation", "no dashboard checked", "alerts not reviewed", "ignored error rate", "skipped post-deploy check"]
+- title: "Verify Gate"
+  keywords: ["done", "complete", "verify", "confirm", "validate behavior"]
+  antiPatterns: ["unverified", "tests passed so done", "ci is enough", "no end-to-end check", "no evidence captured", "happy path only", "negative case skipped"]
+- title: "Evidence Capture"
+  keywords: ["close task", "mark done", "complete task", "resolve task"]
+  antiPatterns: ["no merge sha", "no deploy url", "no monitoring evidence", "no verification output", "missing screenshot", "missing log excerpt"]
+```
+## Enforcement Behavior
+### When Triggered
+This policy is enforced during the **review stage** when:
+- Task status is being changed to DONE, COMPLETE, CLOSED, or RESOLVED
+- A pull request is being declared "shipped"
+- An incident or change request is being closed
+- Work is being declared finished in any form
+### Required Actions Before Completion
+1. **Merge Gate**
+   - Change merged via reviewed PR from a feature/worktree branch into the integration branch
+   - All CI required checks green on the merge commit (build, tests, lint, type-check)
+   - At least one approving review (or self-review with explicit documented justification for trivial changes)
+   - Merge commit SHA recorded
+2. **Deploy Gate**
+   - Designated automated deployment pipeline executed end-to-end without error
+   - Application changes: artifact published and rollout completed in target environment(s) (staging through production, as scoped)
+   - Infrastructure changes: IaC pipeline succeeded (composes with `definition-of-done-iac`)
+   - Pipeline run URL recorded
+   - Manual deploys, ad-hoc cluster commands, and hand-edited cloud resources are FORBIDDEN as the deploy path
+3. **Monitor Gate**
+   - Minimum post-deploy observation window elapsed:
+     - 15 minutes for low-risk changes
+     - 1 hour for service/infrastructure changes
+     - 24 hours for high-blast-radius changes (auth, payments, data migrations, schema changes, traffic routing)
+   - Health signals reviewed and clean during the window:
+     - Error rate (no new error classes, no rate increase above baseline)
+     - Latency (p50/p95/p99 within SLO)
+     - Saturation (CPU/memory/connections within healthy bounds)
+     - Logs (no new ERROR/FATAL lines tied to the change)
+     - Alerts (no new alerts firing related to the change)
+   - Dashboard/log links recorded
+   - Any degraded signal blocks DONE until rolled back or rolled forward with a fix
+4. **Verify Gate**
+   - The specific behavior introduced/fixed is exercised end-to-end against the deployed environment
+   - Verification method matches change type:
+     - API/backend: live request against deployed endpoint with expected response asserted
+     - UI/frontend: interactive walkthrough of golden path AND the specific edge case
+     - Infrastructure: cluster/cloud CLI query confirming the resource exists and behaves as designed
+     - Data/schema: query confirming migrated data is shaped correctly and reads/writes succeed
+   - At least one negative case explicitly checked (the failure mode the change prevents does not occur)
+   - Evidence captured: response body, screenshot, command output, or log excerpt
+   - CI green is NOT verification — verification requires evidence from the deployed system
+### Verification Checklist
+Before marking work as DONE, verify and attach:
+- [ ] Merge commit SHA and PR URL recorded
+- [ ] Deployment pipeline run URL recorded
+- [ ] Target environment(s) reached and recorded (e.g. staging, production)
+- [ ] Monitoring window start/end timestamps recorded
+- [ ] Dashboard/log links reviewed during the window and attached
+- [ ] Health signals (error rate, latency, saturation, logs, alerts) all clean
+- [ ] Verification evidence captured (command output, response body, screenshot)
+- [ ] Negative case checked and the prevented failure mode confirmed absent
+- [ ] No new alerts fired during or after the observation window
+### Anti-Patterns to Avoid
+DO NOT mark tasks as DONE when:
+- The PR has been merged but the rollout hasn't run yet ("merged != deployed")
+- The rollout succeeded but no one observed the system afterwards ("deployed != working")
+- CI is green but the deployed environment was never exercised ("CI != production")
+- The monitoring window was skipped because "it's a small change"
+- Verification consisted of "the tests cover it" — tests cover code paths, not deployed behavior
+- Only the happy path was verified and the negative case was skipped
+- "No alerts fired" was used as proof of health when no alerts exist for the changed surface area
+- The deploy/monitor/verify gates were deferred to "next sprint" or "ops can check later"
+- Evidence was claimed but not actually captured or attached
+## Implementation Notes
+This policy should be enforced by:
+1. **Task management gate** — block status transitions to DONE/CLOSED until evidence fields are populated
+2. **PR merge bots** — require deployment status checks before allowing merge to be marked "shipped"
+3. **CI/CD pipelines** — emit deployment and verification webhooks that the policy gate consumes
+4. **Policy gate system (`uap-policy check`)** — validate before allowing completion commands
+## Default Status
+**Default: ON**
+**Level: REQUIRED**
+This policy is on by default for all UAP-managed projects. Disable only with explicit project-level override and documented justification (e.g. local-only experiments, scratch projects).
+## Related Policies
+- `policy-completion-gate` — Local completion gates (tests, build, lint, version bump, worktree)
+- `policy-mandatory-testing-deployment` — Test creation and quality requirements
+- `policy-definition-of-done-iac` — IaC-specific deploy + cluster verify requirements
+- `policy-iac-pipeline-enforcement` — Pipeline-only deploy path for infrastructure
+The local completion gate gets a change ready to ship. This policy ensures the change actually shipped, stayed healthy, and demonstrably works in the environment that matters.
+---
+_Last Updated: 2026-05-04_
+_Author: Miller Tech UAP System_

package/src/policies/schemas/policies/parallel-reads.md ADDED Viewed

@@ -0,0 +1,24 @@
+# parallel-reads
+**Category**: custom
+**Level**: RECOMMENDED
+**Enforcement Stage**: pre-exec
+**Tags**: performance, parallelism, exploration
+## Rule
+Two or more independent read-only operations (`Read`, `Grep`, `Glob`, non-mutating `Bash`, `WebFetch`) with no data dependency MUST be dispatched in a single tool-call batch.
+## Why
+Serial fan-out multiplies wall-clock time by N on every exploration. Claude Code supports parallel tool calls in one message. Measured speed-up on codebase surveys: 2–5×.
+## Enforcement
+Python enforcer `parallel_reads.py` (post-exec sampler) detects serial read patterns within a tight time window and warns on the next message.
+```rules
+- title: "Batch independent reads"
+  keywords: [read, grep, glob, webfetch, inspect]
+  antiPatterns: [serial-read, one-by-one, sequential-survey]
+```

package/src/policies/schemas/policies/rtk-wrap.md ADDED Viewed

@@ -0,0 +1,26 @@
+# rtk-wrap
+**Category**: custom
+**Level**: REQUIRED
+**Enforcement Stage**: pre-exec
+**Tags**: rtk, tokens, efficiency
+## Rule
+These commands MUST be invoked via `rtk` wrapper, not directly: `git`, `kubectl`, `docker`, `docker-compose`, `npm`, `pnpm`, `yarn`, `helm`, `terraform`.
+Exception: `rtk` meta-commands (`rtk gain`, `rtk discover`, `rtk proxy`, `rtk --version`).
+## Why
+RTK delivers 60–90% token reduction on dev ops (`~/.claude/RTK.md`). Skipping the wrapper wastes a proportional amount of context.
+## Enforcement
+Python enforcer `rtk_wrap.py` inspects the Bash command string and blocks if a wrapped binary is invoked without the `rtk ` prefix.
+```rules
+- title: "Wrap heavy CLIs with rtk"
+  keywords: [bash, shell, git, kubectl, docker, npm, pnpm, yarn, helm, terraform]
+  antiPatterns: [raw-kubectl, raw-git, raw-docker, raw-npm]
+```

package/src/policies/schemas/policies/schema-diff-gate.md ADDED Viewed

@@ -0,0 +1,30 @@
+# schema-diff-gate
+**Category**: infrastructure
+**Level**: REQUIRED
+**Enforcement Stage**: pre-exec
+**Tags**: postgres, cnpg, pgdog, migrations, schema, spock, redis
+## Rule
+Changes to DB schema, connection pooler config, or replication topology MUST pass `uap schema-diff` before commit:
+- `migrations/**/*.sql`
+- `infra/postgres-spock/**`
+- `infra/helm_charts/**/pgdog*`
+- CNPG `Cluster` spec (pool sizes, instance count, connection limits)
+- Redis Sentinel / Envoy HA-write proxy configs
+## Why
+Branch `fix/zitadel-pgdog-capacity-v2` exists because a prior capacity change escaped review. PgDog connection limits cascade into Zitadel auth outages. Pre-commit gating prevents "v2 hotfix" cycles.
+## Enforcement
+Python enforcer `schema_diff_gate.py` runs `uap schema-diff` (or checks memory for a successful run within the last hour) when the diff touches the listed paths.
+```rules
+- title: "Schema/capacity changes must pass schema-diff"
+  keywords: [migration, schema, pgdog, cnpg, spock, postgres, redis, sentinel, envoy, pool]
+  antiPatterns: [ALTER TABLE, max_connections, pool_size, instances:, replicas:]
+```

package/src/policies/schemas/policies/session-memory-write.md ADDED Viewed

@@ -0,0 +1,24 @@
+# session-memory-write
+**Category**: workflow
+**Level**: REQUIRED
+**Enforcement Stage**: post-exec
+**Tags**: memory, session, uap
+## Rule
+A session that changed code (Edit/Write/MultiEdit occurred) MUST insert at least one `session_memories` row with `type IN ('decision','lesson','pattern')` before terminating.
+## Why
+Session-end logs show most sessions end with no memory write even when code changed. Lessons evaporate. UAP's memory system only works if write-back happens.
+## Enforcement
+Python enforcer `session_memory_write.py` runs on the session-end hook: if `code_changed=true`, it verifies that a matching row exists in `agents/data/memory/short_term.db`.
+```rules
+- title: "Close the learning loop on code sessions"
+  keywords: [session-end, stop, terminate, finish]
+  antiPatterns: [no-memory-write, skip-lesson]
+```

package/src/policies/schemas/policies/task-required.md ADDED Viewed

@@ -0,0 +1,49 @@
+# task-required
+**Category**: workflow
+**Level**: REQUIRED
+**Enforcement Stage**: pre-exec
+**Tags**: uap, task, workflow, enforcement
+## Rule
+A UAP task MUST be `in_progress` before any mutating work. When no row in
+`.uap/tasks/tasks.db` has `status='in_progress'`, the enforcer blocks:
+- `Edit` / `Write` / `MultiEdit` on non-exempt paths
+- Bash ship actions: `git commit`, `git push`, `gh pr create`
+Exempt path prefixes (no task required): `.claude/`, `.cursor/`, `.opencode/`,
+`.codex/`, `.forge/`, `.uap/`, `.policy-tools/`, `src/policies/`, `scripts/`,
+`docs/`.
+To proceed: `uap task create --type <task|bug|feature> --title "<desc>"` then
+`uap task update <id> --status in_progress` (or `uap task claim <id>`).
+## Why
+The UAP compliance protocol's "create a task before work" step has historically
+been delivered as SessionStart text injection — advisory guidance the agent can
+silently skip. Observed in practice: a full multi-PR session completed with zero
+`uap task create` calls because nothing enforced it.
+A `pre-exec` policy enforcer makes the task requirement a hard gate rather than a
+suggestion, so UAP task tracking is guaranteed rather than best-effort. This is
+the task-tracking analogue of `worktree-required`.
+## Enforcement
+Python enforcer `task_required.py` resolves the primary worktree root via
+`git rev-parse --git-common-dir` (so it works from linked worktrees), reads
+`.uap/tasks/tasks.db`, and blocks when `COUNT(*) WHERE status='in_progress'` is
+zero.
+Fail-open: if UAP task tracking is not initialised (no `tasks.db`) or the DB is
+unreadable, the operation is allowed — non-UAP repositories are unaffected.
+Override for one-off meta-work: `UAP_NO_TASK=1`.
+```rules
+- title: "A UAP task must be in_progress before mutating work"
+  keywords: [edit, write, multiedit, bash, git commit, git push, gh pr create]
+  antiPatterns: [no-task, untracked-work, skip-task-create]
+```

package/src/policies/schemas/policies/test-gate.md ADDED Viewed

@@ -0,0 +1,24 @@
+# test-gate
+**Category**: quality
+**Level**: REQUIRED
+**Enforcement Stage**: review
+**Tags**: testing, pr, quality
+## Rule
+At PR-ready time, every changed service under `services/**` or `apps/**` MUST have a corresponding test delta (`tests/**` or `<service>/**/*.test.*`, `*_test.py`, `*.spec.ts`).
+## Why
+Session-end logs show `Tests: false` far more often than `true`. Review-stage gating ensures shipping code without tests is an explicit override, not the default.
+## Enforcement
+Python enforcer `test_gate.py` matches the output of `git diff --name-only origin/main...HEAD` against test-path regexes; it blocks PR signoff if any changed service lacks a test file in the same PR.
+```rules
+- title: "Changed services require test deltas"
+  keywords: [pr, commit, merge, review, signoff]
+  antiPatterns: [no-tests, skip-tests, tests-later]
+```

package/src/policies/schemas/policies/validate-plan-before-build.md ADDED Viewed

@@ -0,0 +1,28 @@
+# validate-plan-before-build
+**Category**: workflow
+**Level**: REQUIRED
+**Enforcement Stage**: pre-exec
+**Tags**: planning, validation, accuracy
+## Rule
+When a plan is marked ready and the agent is about to begin implementation (first mutating tool call after plan emission: `Edit`, `Write`, `MultiEdit`, `Bash` that modifies state), the agent MUST first execute the prompt `validate the plan` and receive an explicit pass before proceeding.
+A plan is "ready" when:
+- User approves with "go", "build", "implement", "proceed", "ship it", "complete all", or similar
+- OR the agent emits ExitPlanMode / transitions out of a Plan phase
+## Why
+User directive: "when a plan is ready to build, execute prompt 'validate the plan'". Prevents shipping on stale/unvalidated plans — catches last-mile gaps before code changes begin.
+## Enforcement
+Python enforcer `validate_plan_before_build.py` tracks plan-ready state in session memory; on first mutating tool call post-ready, blocks and injects the `validate the plan` prompt. Unblocks only after a validation result is recorded.
+```rules
+- title: "Ready plans require explicit validation"
+  keywords: [edit, write, multiedit, implement, build, ship, commit]
+  antiPatterns: [unvalidated-plan, skip-validation, plan-stale]
+```

package/src/policies/schemas/policies/worktree-required.md ADDED Viewed

@@ -0,0 +1,28 @@
+# worktree-required
+**Category**: workflow
+**Level**: REQUIRED
+**Enforcement Stage**: pre-exec
+**Tags**: git, worktree, isolation, uap
+## Rule
+All `Edit`, `Write`, `MultiEdit` calls on tracked files MUST occur inside a UAP worktree at `.worktrees/NNN-<slug>/`. Exemptions:
+- Harness config under `.claude/`, `.cursor/`, `.opencode/`, `.codex/`, `.uap/`
+- New files under `src/policies/`, `scripts/`, `docs/`
+- Explicit override: user says "work directly" or `--no-worktree`
+## Why
+CLAUDE.md v2.3.0 mandates worktrees; the existing hook warns but doesn't block. Formalizing closes the gap — protects in-flight user edits from agent collisions.
+## Enforcement
+Python enforcer `worktree_required.py` checks whether the target file path is under `.worktrees/` and whether the session has an active worktree slug.
+```rules
+- title: "File edits must occur in a worktree"
+  keywords: [edit, write, multiedit, create-file, modify-file]
+  antiPatterns: [primary-checkout, no-worktree, direct-main]
+```

package/templates/hooks/uap-policy-gate.sh CHANGED Viewed

@@ -30,6 +30,11 @@ export UAP_REPO_ROOT="$MAIN_ROOT"
 # actual WORKING TREE, not the (possibly bare) MAIN_ROOT. Expose the current checkout
 # so _common.worktree_root() targets the worktree when an op runs from inside one.
 export UAP_WORKTREE_ROOT="$CHECKOUT_ROOT"
+# Delivery enforcement defaults to BLOCK for UAP-managed projects: substantive
+# source edits must route through `uap deliver` (verified completion against the
+# gates). The `:-` preserves any explicit operator/CI override (advisory|block).
+# Escape hatches still apply: UAP_DELIVER_ACTIVE=1 (inside deliver) / UAP_DELIVER_BYPASS=1.
+export UAP_ENFORCE_DELIVERY="${UAP_ENFORCE_DELIVERY:-block}"
 cd "$MAIN_ROOT"
 TOOL="$(printf '%s' "$PAYLOAD" | python3 -c 'import json,sys; d=json.load(sys.stdin); print(d.get("tool_name") or d.get("tool") or "")' 2>/dev/null || true)"