npm - principles-disciple - Versions diffs - 1.71.0 → 1.73.0 - Mend

principles-disciple 1.71.0 → 1.73.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (309)

package/openclaw.plugin.json +10 -5
package/package.json +17 -19
package/scripts/acceptance-test.mjs +16 -73
package/scripts/sync-plugin.mjs +382 -77
package/src/commands/archive-impl.ts +2 -1
package/src/commands/capabilities.ts +2 -2
package/src/commands/context.ts +2 -2
package/src/commands/disable-impl.ts +2 -1
package/src/commands/evolution-status.ts +16 -16
package/src/commands/export.ts +12 -67
package/src/commands/pain.ts +91 -1
package/src/commands/principle-rollback.ts +2 -1
package/src/commands/promote-impl.ts +7 -43
package/src/commands/rollback-impl.ts +2 -1
package/src/commands/rollback.ts +2 -1
package/src/commands/samples.ts +2 -1
package/src/commands/thinking-os.ts +2 -1
package/src/config/errors.ts +18 -2
package/src/constants/diagnostician.ts +2 -2
package/src/constants/tools.ts +2 -1
package/src/core/__tests__/focus-history.test.ts +210 -0
package/src/core/config.ts +1 -1
package/src/core/confirm-first-gate.ts +255 -0
package/src/core/correction-cue-learner.ts +2 -136
package/src/core/correction-types.ts +16 -88
package/src/core/dictionary.ts +19 -20
package/src/core/empathy-keyword-matcher.ts +17 -289
package/src/core/empathy-types.ts +18 -229
package/src/core/event-log.ts +38 -132
package/src/core/evolution-reducer.ts +21 -2
package/src/core/evolution-types.ts +76 -464
package/src/core/file-store.ts +80 -0
package/src/core/focus-history.ts +228 -955
package/src/core/local-worker-routing.ts +34 -314
package/src/core/merge-gate-audit.ts +0 -195
package/src/core/pain-diagnostic-gate.ts +154 -0
package/src/core/pain-signal.ts +21 -138
package/src/core/pain.ts +15 -88
package/src/core/pd-task-reconciler.ts +26 -115
package/src/core/pd-task-service.ts +9 -9
package/src/core/pd-task-types.ts +23 -127
package/src/core/principle-compiler/__tests__/compiler-replay-gate.test.ts +174 -0
package/src/core/principle-compiler/code-validator.ts +15 -42
package/src/core/principle-compiler/compiler.ts +100 -15
package/src/core/principle-compiler/index.ts +5 -2
package/src/core/principle-compiler/template-generator.ts +4 -104
package/src/core/principle-injection.ts +10 -202
package/src/core/principle-internalization/filesystem-lifecycle-datasource.ts +42 -0
package/src/core/principle-internalization/lifecycle-read-model.ts +39 -242
package/src/core/principle-internalization/principle-lifecycle-service.ts +12 -10
package/src/core/principle-tree-ledger-adapter.ts +145 -0
package/src/core/principle-tree-ledger.ts +8 -6
package/src/core/reflection/reflection-context.ts +14 -109
package/src/core/replay-engine.ts +8 -500
package/src/core/rule-host-helpers.ts +5 -35
package/src/core/rule-host-types.ts +10 -82
package/src/core/rule-host.ts +6 -63
package/src/core/runtime-v2-prompt-activation-reader.ts +231 -0
package/src/core/session-tracker.ts +87 -101
package/src/core/shadow-observation-registry.ts +19 -48
package/src/core/trajectory.ts +3 -1
package/src/core/workflow-funnel-loader.ts +62 -68
package/src/core/workspace-context.ts +46 -0
package/src/core/workspace-dir-service.ts +1 -1
package/src/core/workspace-dir-validation.ts +18 -9
package/src/hooks/AGENTS.md +1 -1
package/src/hooks/gate-block-helper.ts +46 -44
package/src/hooks/gate.ts +207 -7
package/src/hooks/lifecycle.ts +30 -32
package/src/hooks/llm.ts +60 -32
package/src/hooks/pain.ts +297 -103
package/src/hooks/prompt.ts +469 -339
package/src/hooks/subagent.ts +2 -29
package/src/i18n/commands.ts +2 -10
package/src/index.ts +95 -85
package/src/openclaw-sdk.ts +311 -0
package/src/service/central-database.ts +8 -4
package/src/service/evolution-queue-migration.ts +2 -1
package/src/service/evolution-worker.ts +163 -1786
package/src/service/internalization-trigger-adapter.ts +302 -0
package/src/service/keyword-optimization-service.ts +4 -4
package/src/service/monitoring-query-service.ts +1 -215
package/src/service/queue-io.ts +60 -331
package/src/service/runtime-summary-service.ts +115 -18
package/src/service/subagent-workflow/index.ts +0 -41
package/src/service/subagent-workflow/types.ts +9 -120
package/src/service/subagent-workflow/workflow-store.ts +2 -119
package/src/service/workflow-watchdog.ts +0 -43
package/src/types/event-payload.ts +16 -74
package/src/types/event-types.ts +39 -547
package/src/types/hygiene-types.ts +7 -30
package/src/types/principle-tree-schema.ts +20 -222
package/src/types/queue.ts +15 -70
package/src/types/runtime-summary.ts +5 -49
package/src/utils/io.ts +10 -0
package/src/utils/retry.ts +1 -1
package/src/utils/shadow-fingerprint.ts +2 -2
package/src/utils/workspace-resolver.ts +50 -0
package/templates/langs/en/core/AGENTS.md +2 -2
package/templates/langs/en/core/BOOT.md +1 -1
package/templates/langs/en/core/HEARTBEAT.md +2 -2
package/templates/langs/en/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
package/templates/langs/en/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
package/templates/langs/en/skills/ai-sprint-orchestration/runtime/.gitignore +2 -2
package/templates/langs/en/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
package/templates/langs/en/skills/evolve-task/SKILL.md +1 -1
package/templates/langs/en/skills/pd-cli-operator/SKILL.md +67 -0
package/templates/langs/en/skills/pd-diagnostician/SKILL.md +1 -1
package/templates/langs/en/skills/pd-mentor/SKILL.md +1 -1
package/templates/langs/en/skills/pd-pain-signal/SKILL.md +17 -39
package/templates/langs/en/skills/pd-runtime-v2/SKILL.md +61 -0
package/templates/langs/zh/core/AGENTS.md +2 -2
package/templates/langs/zh/core/BOOT.md +1 -1
package/templates/langs/zh/core/HEARTBEAT.md +2 -2
package/templates/langs/zh/skills/ai-sprint-orchestration/references/agent-registry.json +1 -72
package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/bugfix-complex-template.json +6 -6
package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/feature-complex-template.json +6 -6
package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/nocturnal-trinity-quality-enhancement.json +8 -8
package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal-verify.json +2 -12
package/templates/langs/zh/skills/ai-sprint-orchestration/references/specs/workflow-validation-minimal.json +2 -12
package/templates/langs/zh/skills/ai-sprint-orchestration/runtime/.gitignore +2 -2
package/templates/langs/zh/skills/ai-sprint-orchestration/scripts/run.mjs +51 -15
package/templates/langs/zh/skills/ai-sprint-orchestration/test/run.test.mjs +21 -5
package/templates/langs/zh/skills/evolve-task/SKILL.md +2 -2
package/templates/langs/zh/skills/pd-cli-operator/SKILL.md +67 -0
package/templates/langs/zh/skills/pd-diagnostician/SKILL.md +1 -1
package/templates/langs/zh/skills/pd-mentor/SKILL.md +1 -1
package/templates/langs/zh/skills/pd-pain-signal/SKILL.md +17 -38
package/templates/langs/zh/skills/pd-runtime-v2/SKILL.md +61 -0
package/tests/build-artifacts.test.ts +1 -3
package/tests/commands/evolution-status.test.ts +0 -118
package/tests/core/bootstrap-rules.test.ts +1 -1
package/tests/core/config.test.ts +1 -1
package/tests/core/event-log.test.ts +35 -0
package/tests/core/evolution-engine.test.ts +610 -0
package/tests/core/file-store.test.ts +102 -0
package/tests/core/focus-history.test.ts +203 -11
package/tests/core/merge-gate-audit.test.ts +2 -169
package/tests/core/model-deployment-registry.test.ts +7 -1
package/tests/core/model-training-registry.test.ts +19 -0
package/tests/core/observability.test.ts +0 -1
package/tests/core/pain-diagnostic-gate.test.ts +498 -0
package/tests/core/pain.test.ts +0 -1
package/tests/core/principle-internalization/deprecated-readiness.test.ts +2 -2
package/tests/core/principle-internalization/lifecycle-metrics.test.ts +2 -2
package/tests/core/principle-internalization/{internalization-routing-policy.test.ts → lifecycle-routing-policy.test.ts} +6 -6
package/tests/core/principle-internalization/lineage-source-retired.test.ts +56 -0
package/tests/core/principle-internalization/principle-lifecycle-service.test.ts +1 -23
package/tests/core/principle-tree-ledger-adapter.test.ts +253 -0
package/tests/core/reflection-context.test.ts +0 -14
package/tests/core/replay-engine.test.ts +127 -215
package/tests/core/rule-host-helpers.test.ts +2 -2
package/tests/core/rule-implementation-runtime.test.ts +0 -27
package/tests/core/workflow-funnel-loader.test.ts +162 -0
package/tests/core/workspace-dir-validation.test.ts +8 -1
package/tests/core-anti-growth.test.ts +192 -0
package/tests/hook-workspace-nextaction-contract.test.ts +42 -0
package/tests/hooks/confirm-first-gate.test.ts +333 -0
package/tests/hooks/gate-auto-correct-shadow.test.ts +310 -0
package/tests/hooks/gate-auto-correct.test.ts +665 -0
package/tests/hooks/gate-rule-host-pipeline.test.ts +2 -1
package/tests/hooks/pain.test.ts +269 -12
package/tests/hooks/prompt-characterization.test.ts +500 -0
package/tests/hooks/prompt-size-guard.test.ts +329 -0
package/tests/hooks/runtime-v2-prompt-activation.test.ts +869 -0
package/tests/index.test.ts +94 -1
package/tests/integration/auto-entry-gate.test.ts +248 -0
package/tests/integration/internalization-trigger-guard.test.ts +69 -0
package/tests/integration/m8-legacy-paths.test.ts +63 -0
package/tests/integration/runtime-v2-pain-guard.test.ts +125 -0
package/tests/plugin-config-resolution-cutover.test.ts +359 -0
package/tests/runtime-v2-discovery-guard.test.ts +154 -0
package/tests/service/central-database.test.ts +457 -0
package/tests/service/evolution-worker.correction-observer.test.ts +173 -0
package/tests/service/evolution-worker.timeout.test.ts +11 -129
package/tests/service/internalization-trigger-adapter.test.ts +251 -0
package/tests/service/monitoring-query-service.test.ts +1 -47
package/tests/service/queue-io.test.ts +1 -62
package/tests/service/runtime-summary-service.test.ts +184 -3
package/tests/service/workflow-watchdog.test.ts +0 -91
package/tests/utils/file-lock.test.ts +5 -3
package/tests/utils/session-key.test.ts +52 -0
package/tests/utils/subagent-probe.test.ts +48 -1
package/vitest.config.ts +4 -11
package/.planning/codebase/ARCHITECTURE.md +0 -157
package/.planning/codebase/CONCERNS.md +0 -145
package/.planning/codebase/CONVENTIONS.md +0 -148
package/.planning/codebase/INTEGRATIONS.md +0 -81
package/.planning/codebase/STACK.md +0 -87
package/.planning/codebase/STRUCTURE.md +0 -193
package/.planning/codebase/TESTING.md +0 -243
package/.planning/phases/01-basic-visualization/01-GAP-CLOSURE-VERIFICATION.md +0 -113
package/docs/COMMAND_REFERENCE.md +0 -76
package/docs/COMMAND_REFERENCE_EN.md +0 -79
package/scripts/build-web.mjs +0 -46
package/scripts/diagnose-nocturnal.mjs +0 -537
package/scripts/seed-nocturnal-scenarios.mjs +0 -384
package/src/commands/nocturnal-review.ts +0 -322
package/src/commands/nocturnal-rollout.ts +0 -790
package/src/commands/nocturnal-train.ts +0 -986
package/src/commands/pd-reflect.ts +0 -88
package/src/core/adaptive-thresholds.ts +0 -478
package/src/core/diagnostician-task-store.ts +0 -192
package/src/core/nocturnal-arbiter.ts +0 -715
package/src/core/nocturnal-artifact-lineage.ts +0 -116
package/src/core/nocturnal-artificer.ts +0 -257
package/src/core/nocturnal-candidate-scoring.ts +0 -530
package/src/core/nocturnal-compliance.ts +0 -1146
package/src/core/nocturnal-dataset.ts +0 -763
package/src/core/nocturnal-executability.ts +0 -428
package/src/core/nocturnal-export.ts +0 -499
package/src/core/nocturnal-paths.ts +0 -240
package/src/core/nocturnal-reasoning-deriver.ts +0 -343
package/src/core/nocturnal-rule-implementation-validator.ts +0 -246
package/src/core/nocturnal-snapshot-contract.ts +0 -99
package/src/core/nocturnal-trajectory-extractor.ts +0 -512
package/src/core/nocturnal-trinity-types.ts +0 -218
package/src/core/nocturnal-trinity.ts +0 -2680
package/src/core/principle-internalization/deprecated-readiness.ts +0 -93
package/src/core/principle-internalization/internalization-routing-policy.ts +0 -208
package/src/core/principle-internalization/lifecycle-metrics.ts +0 -152
package/src/http/principles-console-route.ts +0 -709
package/src/service/central-health-service.ts +0 -49
package/src/service/central-overview-service.ts +0 -138
package/src/service/control-ui-query-service.ts +0 -900
package/src/service/cooldown-strategy.ts +0 -97
package/src/service/evolution-pain-context.ts +0 -79
package/src/service/evolution-query-service.ts +0 -407
package/src/service/health-query-service.ts +0 -1038
package/src/service/nocturnal-config.ts +0 -214
package/src/service/nocturnal-runtime.ts +0 -734
package/src/service/nocturnal-service.ts +0 -1605
package/src/service/nocturnal-target-selector.ts +0 -545
package/src/service/sleep-cycle.ts +0 -157
package/src/service/startup-reconciler.ts +0 -112
package/src/service/subagent-workflow/correction-observer-types.ts +0 -82
package/src/service/subagent-workflow/correction-observer-workflow-manager.ts +0 -250
package/src/service/subagent-workflow/deep-reflect-workflow-manager.ts +0 -1
package/src/service/subagent-workflow/dynamic-timeout.ts +0 -30
package/src/service/subagent-workflow/empathy-observer-workflow-manager.ts +0 -268
package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +0 -795
package/src/service/subagent-workflow/runtime-direct-driver.ts +0 -268
package/src/service/subagent-workflow/workflow-manager-base.ts +0 -580
package/src/tools/write-pain-flag.ts +0 -215
package/tests/commands/nocturnal-review.test.ts +0 -448
package/tests/commands/nocturnal-train.test.ts +0 -97
package/tests/commands/pd-reflect.test.ts +0 -49
package/tests/core/adaptive-thresholds.test.ts +0 -261
package/tests/core/nocturnal-arbiter.test.ts +0 -559
package/tests/core/nocturnal-artifact-lineage.test.ts +0 -53
package/tests/core/nocturnal-artificer.test.ts +0 -241
package/tests/core/nocturnal-candidate-scoring.test.ts +0 -532
package/tests/core/nocturnal-compliance-p-principles.test.ts +0 -133
package/tests/core/nocturnal-compliance.test.ts +0 -646
package/tests/core/nocturnal-dataset.test.ts +0 -892
package/tests/core/nocturnal-e2e.test.ts +0 -234
package/tests/core/nocturnal-executability.test.ts +0 -357
package/tests/core/nocturnal-export.test.ts +0 -517
package/tests/core/nocturnal-reasoning-deriver.test.ts +0 -372
package/tests/core/nocturnal-reviewed-subset-comparison.test.ts +0 -428
package/tests/core/nocturnal-rule-implementation-validator.test.ts +0 -127
package/tests/core/nocturnal-snapshot-contract.test.ts +0 -121
package/tests/core/nocturnal-trajectory-extractor.test.ts +0 -634
package/tests/core/nocturnal-trinity.test.ts +0 -2053
package/tests/core/pain-auto-repair.test.ts +0 -96
package/tests/core/pain-integration.test.ts +0 -510
package/tests/fixtures/nocturnal-reviewed-subset.json +0 -183
package/tests/http/principles-console-route.test.ts +0 -162
package/tests/integration/chaos-resilience.test.ts +0 -348
package/tests/integration/empathy-workflow-integration.test.ts +0 -626
package/tests/integration/pain-diagnostician-loop.e2e.test.ts +0 -380
package/tests/service/control-ui-query-service.test.ts +0 -121
package/tests/service/cooldown-strategy.test.ts +0 -164
package/tests/service/data-endpoints-regression.test.ts +0 -834
package/tests/service/empathy-observer-workflow-manager.test.ts +0 -175
package/tests/service/evolution-worker.nocturnal.test.ts +0 -601
package/tests/service/nocturnal-runtime-hardening.test.ts +0 -118
package/tests/service/nocturnal-runtime.test.ts +0 -473
package/tests/service/nocturnal-service-code-candidate.test.ts +0 -330
package/tests/service/nocturnal-target-selector.test.ts +0 -615
package/tests/service/startup-reconciler.test.ts +0 -148
package/tests/tools/write-pain-flag.test.ts +0 -358
package/ui/src/App.tsx +0 -45
package/ui/src/api.ts +0 -220
package/ui/src/charts.tsx +0 -955
package/ui/src/components/ErrorState.tsx +0 -6
package/ui/src/components/Loading.tsx +0 -13
package/ui/src/components/ProtectedRoute.tsx +0 -12
package/ui/src/components/Shell.tsx +0 -91
package/ui/src/components/WorkspaceConfig.tsx +0 -178
package/ui/src/components/index.ts +0 -5
package/ui/src/context/auth.tsx +0 -80
package/ui/src/context/theme.tsx +0 -66
package/ui/src/hooks/useAutoRefresh.ts +0 -39
package/ui/src/i18n/ui.ts +0 -473
package/ui/src/main.tsx +0 -16
package/ui/src/pages/EvolutionPage.tsx +0 -333
package/ui/src/pages/FeedbackPage.tsx +0 -138
package/ui/src/pages/GateMonitorPage.tsx +0 -136
package/ui/src/pages/LoginPage.tsx +0 -89
package/ui/src/pages/OverviewPage.tsx +0 -599
package/ui/src/pages/SamplesPage.tsx +0 -174
package/ui/src/pages/ThinkingModelsPage.tsx +0 -702
package/ui/src/styles.css +0 -2020
package/ui/src/types.ts +0 -384
package/ui/src/utils/format.ts +0 -15

package/tests/core/nocturnal-candidate-scoring.test.ts (DELETED)

@@ -1,532 +0,0 @@
-import { describe, it, expect } from 'vitest';
-import {
-  scoreCandidate,
-  checkThresholds,
-  rankCandidates,
-  runTournament,
-  DEFAULT_SCORING_WEIGHTS,
-  validateCandidateDiversity,
-} from '../../src/core/nocturnal-candidate-scoring.js';
-import type { DreamerCandidate, PhilosopherJudgment } from '../../src/core/nocturnal-trinity.js';
-import type { ThresholdValues } from '../../src/core/adaptive-thresholds.js';
-// ---------------------------------------------------------------------------
-// Test Fixtures
-// ---------------------------------------------------------------------------
-function makeCandidate(overrides: Partial<DreamerCandidate> = {}): DreamerCandidate {
-  return {
-    candidateIndex: 0,
-    badDecision: 'Did something wrong without verifying preconditions',
-    betterDecision: 'Read the relevant file to understand its structure before making changes',
-    rationale: 'Verifying preconditions prevents errors and ensures actions are appropriate',
-    confidence: 0.85,
-    ...overrides,
-  };
-}
-function makeJudgment(candidateIndex: number, overrides: Partial<PhilosopherJudgment> = {}): PhilosopherJudgment {
-  return {
-    candidateIndex,
-    critique: 'Strong alignment with the principle',
-    principleAligned: true,
-    score: 0.85,
-    rank: 1,
-    ...overrides,
-  };
-}
-const DEFAULT_THRESHOLDS: ThresholdValues = {
-  schemaCompletenessMin: 0.6,
-  principleAlignmentMin: 0.7,
-  executabilityMin: 0.65,
-  boundednessMin: 0.5,
-  confidenceMin: 0.6,
-  aggregateMin: 0.65,
-};
-// ---------------------------------------------------------------------------
-// Tests: scoreCandidate
-// ---------------------------------------------------------------------------
-describe('scoreCandidate', () => {
-  it('scores a valid candidate correctly', () => {
-    const candidate = makeCandidate();
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.schemaCompleteness).toBeGreaterThan(0);
-    expect(scores.principleAlignment).toBe(1.0); // principleAligned: true
-    expect(scores.executability).toBeGreaterThan(0);
-    expect(scores.boundedness).toBeGreaterThan(0);
-    expect(scores.confidence).toBeGreaterThan(0);
-    expect(scores.aggregate).toBeGreaterThan(0);
-  });
-  it('penalizes non-principle-aligned candidates', () => {
-    const candidate = makeCandidate();
-    const judgment = makeJudgment(0, { principleAligned: false, score: 0.4 });
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.principleAlignment).toBeLessThan(0.5);
-  });
-  it('penalizes missing fields in schema completeness', () => {
-    const candidate = makeCandidate({ betterDecision: '' });
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.schemaCompleteness).toBeLessThan(1.0);
-  });
-  it('penalizes generic betterDecision without actionable verbs', () => {
-    const candidate = makeCandidate({ betterDecision: 'Do something better' });
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.executability).toBeLessThan(1.0);
-  });
-  it('rewards specific betterDecision with file paths', () => {
-    const candidate = makeCandidate({
-      betterDecision: 'Read src/main.ts to understand the structure',
-    });
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.boundedness).toBeGreaterThan(0.5);
-  });
-  it('does not penalize words that merely contain "it" as a substring', () => {
-    const candidate = makeCandidate({
-      betterDecision: 'Verify preconditions in config.json before retrying',
-      confidence: 0.92,
-    });
-    const judgment = makeJudgment(0, { score: 0.92, principleAligned: true });
-    const scores = scoreCandidate(candidate, judgment);
-    // Boundedness should remain 0.7 (0.5 base + 0.2 specific target) because
-    // "preconditions" must not trigger the generic word "it" penalty.
-    expect(scores.boundedness).toBe(0.7);
-  });
-  it('uses custom weights when provided', () => {
-    const candidate = makeCandidate();
-    const judgment = makeJudgment(0);
-    const customWeights = { ...DEFAULT_SCORING_WEIGHTS, principleAlignment: 0.5 };
-    const scores = scoreCandidate(candidate, judgment, customWeights);
-    // With higher weight on principleAlignment, aggregate should be higher for aligned candidates
-    expect(scores.aggregate).toBeGreaterThan(0);
-  });
-  it('does not crash when badDecision is undefined — lowers score instead', () => {
-    const candidate = makeCandidate({ badDecision: undefined as unknown as string });
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.schemaCompleteness).toBeLessThan(1.0);
-    expect(scores.aggregate).toBeGreaterThanOrEqual(0);
-  });
-  it('does not crash when betterDecision is undefined — lowers score instead', () => {
-    const candidate = makeCandidate({ betterDecision: undefined as unknown as string });
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.schemaCompleteness).toBeLessThan(1.0);
-    expect(scores.aggregate).toBeGreaterThanOrEqual(0);
-  });
-  it('does not crash when both badDecision and betterDecision are undefined', () => {
-    const candidate = makeCandidate({
-      badDecision: undefined as unknown as string,
-      betterDecision: undefined as unknown as string,
-    });
-    const judgment = makeJudgment(0);
-    const scores = scoreCandidate(candidate, judgment);
-    expect(scores.schemaCompleteness).toBeLessThan(1.0);
-    expect(scores.aggregate).toBeGreaterThanOrEqual(0);
-  });
-});
-// ---------------------------------------------------------------------------
-// Tests: checkThresholds
-// ---------------------------------------------------------------------------
-describe('checkThresholds', () => {
-  it('passes all thresholds with good scores', () => {
-    const scores = {
-      schemaCompleteness: 0.9,
-      principleAlignment: 0.9,
-      executability: 0.9,
-      boundedness: 0.9,
-      confidence: 0.9,
-      aggregate: 0.9,
-    };
-    const [passed, failed] = checkThresholds(scores, DEFAULT_THRESHOLDS);
-    expect(passed).toBe(true);
-    expect(failed).toHaveLength(0);
-  });
-  it('fails when schema completeness is below threshold', () => {
-    const scores = {
-      schemaCompleteness: 0.3,
-      principleAlignment: 0.9,
-      executability: 0.9,
-      boundedness: 0.9,
-      confidence: 0.9,
-      aggregate: 0.9,
-    };
-    const [passed, failed] = checkThresholds(scores, DEFAULT_THRESHOLDS);
-    expect(passed).toBe(false);
-    // checkThresholds returns formatted strings like "schemaCompleteness (0.3 < 0.6)"
-    expect(failed.some(f => f.includes('schemaCompleteness'))).toBe(true);
-  });
-  it('fails when multiple thresholds are broken', () => {
-    const scores = {
-      schemaCompleteness: 0.3,
-      principleAlignment: 0.3,
-      executability: 0.3,
-      boundedness: 0.3,
-      confidence: 0.3,
-      aggregate: 0.3,
-    };
-    const [passed, failed] = checkThresholds(scores, DEFAULT_THRESHOLDS);
-    expect(passed).toBe(false);
-    expect(failed.length).toBeGreaterThan(1);
-  });
-  it('reports all failed thresholds', () => {
-    const scores = {
-      schemaCompleteness: 0.5,  // < 0.6 → FAIL
-      principleAlignment: 0.7,  // >= 0.7 → PASS (at threshold)
-      executability: 0.5,       // < 0.65 → FAIL
-      boundedness: 0.7,         // >= 0.65 → PASS (above new threshold)
-      confidence: 0.5,          // < 0.6 → FAIL
-      aggregate: 0.5,           // < 0.65 → FAIL
-    };
-    const [passed, failed] = checkThresholds(scores, DEFAULT_THRESHOLDS);
-    expect(passed).toBe(false);
-    // Exactly 4 failures: schemaCompleteness, executability, confidence, aggregate
-    expect(failed.length).toBe(4);
-    expect(failed.some(f => f.includes('schemaCompleteness'))).toBe(true);
-    expect(failed.some(f => f.includes('executability'))).toBe(true);
-    expect(failed.some(f => f.includes('confidence'))).toBe(true);
-    expect(failed.some(f => f.includes('aggregate'))).toBe(true);
-  });
-});
-// ---------------------------------------------------------------------------
-// Tests: rankCandidates
-// ---------------------------------------------------------------------------
-describe('rankCandidates', () => {
-  it('ranks candidates by aggregate score', () => {
-    // Use very different confidence levels to ensure clear ranking
-    // Candidate 0: low confidence (0.5) - lower aggregate
-    // Candidate 1: high confidence (0.9) - higher aggregate
-    const candidates = [
-      makeCandidate({ candidateIndex: 0, confidence: 0.5, betterDecision: 'Read config.json to understand setup' }),
-      makeCandidate({ candidateIndex: 1, confidence: 0.9, betterDecision: 'Read main.ts to understand setup' }),
-    ];
-    const judgments = [
-      makeJudgment(0, { score: 0.5, rank: 1, principleAligned: true }),
-      makeJudgment(1, { score: 0.9, rank: 1, principleAligned: true }),
-    ];
-    const ranked = rankCandidates(candidates, judgments, DEFAULT_THRESHOLDS);
-    // Candidate 1 has higher score and should be ranked first
-    expect(ranked[0].candidateIndex).toBe(1);
-    expect(ranked[0].rank).toBe(1);
-    expect(ranked[1].rank).toBe(2);
-  });
-  it('excludes candidates that fail thresholds', () => {
-    // Candidate 0 has low confidence and fails principle alignment - should fail
-    // Candidate 1 has high confidence and passes - should pass
-    const candidates = [
-      makeCandidate({ candidateIndex: 0, confidence: 0.3, betterDecision: 'Check errors in src/main.ts' }),
-      makeCandidate({ candidateIndex: 1, confidence: 0.9, betterDecision: 'Read error logs in error.json' }),
-    ];
-    const judgments = [
-      makeJudgment(0, { score: 0.5, principleAligned: false }),
-      makeJudgment(1, { score: 0.9, principleAligned: true }),
-    ];
-    const ranked = rankCandidates(candidates, judgments, DEFAULT_THRESHOLDS);
-    // Candidate 1 passes thresholds (high confidence, principle aligned, has file path)
-    expect(ranked[0].thresholdPassed).toBe(true);
-    // Candidate 0 fails thresholds (low confidence, not principle aligned)
-    expect(ranked[1].thresholdPassed).toBe(false);
-  });
-  it('uses candidateIndex as stable tie-break', () => {
-    // Two candidates with same scoring profile but different indices
-    const candidates = [
-      makeCandidate({ candidateIndex: 5, betterDecision: 'Read src/index.ts to understand', confidence: 0.8 }),
-      makeCandidate({ candidateIndex: 1, betterDecision: 'Read src/index.ts to understand', confidence: 0.8 }),
-    ];
-    // Both have identical judgments (same score, both aligned)
-    const judgments = [
-      makeJudgment(1, { score: 0.8, principleAligned: true }),
-      makeJudgment(5, { score: 0.8, principleAligned: true }),
-    ];
-    const ranked = rankCandidates(candidates, judgments, DEFAULT_THRESHOLDS);
-    // Lower candidateIndex wins tie
-    expect(ranked[0].candidateIndex).toBe(1);
-  });
-  it('handles empty input gracefully', () => {
-    const ranked = rankCandidates([], [], DEFAULT_THRESHOLDS);
-    expect(ranked).toHaveLength(0);
-  });
-  it('skips candidates without matching judgments', () => {
-    const candidates = [makeCandidate({ candidateIndex: 0 })];
-    const judgments = [makeJudgment(99)]; // No matching judgment
-    const ranked = rankCandidates(candidates, judgments, DEFAULT_THRESHOLDS);
-    expect(ranked).toHaveLength(0);
-  });
-});
-// ---------------------------------------------------------------------------
-// Tests: runTournament
-// ---------------------------------------------------------------------------
-describe('runTournament', () => {
-  it('selects the highest-scoring threshold-passing candidate', () => {
-    // Use actionable verbs and proper file paths to pass boundedness threshold
-    const candidates = [
-      makeCandidate({ candidateIndex: 0, confidence: 0.7, betterDecision: 'Read config.json to verify settings' }),
-      makeCandidate({ candidateIndex: 1, confidence: 0.9, betterDecision: 'Review error.json logs for errors' }),
-      makeCandidate({ candidateIndex: 2, confidence: 0.5, betterDecision: 'Check main.ts before proceeding' }),
-    ];
-    const judgments = [
-      makeJudgment(0, { score: 0.7, principleAligned: true }),
-      makeJudgment(1, { score: 0.9, principleAligned: true }),
-      makeJudgment(2, { score: 0.5, principleAligned: true }),
-    ];
-    const result = runTournament(candidates, judgments, DEFAULT_THRESHOLDS);
-    expect(result.success).toBe(true);
-    expect(result.winner).not.toBeNull();
-    expect(result.winner!.candidateIndex).toBe(1);
-    expect(result.rankedCandidates).toHaveLength(3);
-  });
-  it('fails when all candidates fail thresholds', () => {
-    // Candidates with poor confidence and not principle-aligned should fail
-    const candidates = [
-      makeCandidate({ candidateIndex: 0, confidence: 0.2, betterDecision: 'Do something in src.ts' }),
-      makeCandidate({ candidateIndex: 1, confidence: 0.1, betterDecision: 'Try again with config.json' }),
-    ];
-    const judgments = [
-      makeJudgment(0, { score: 0.3, principleAligned: false }),
-      makeJudgment(1, { score: 0.2, principleAligned: false }),
-    ];
-    const result = runTournament(candidates, judgments, DEFAULT_THRESHOLDS);
-    expect(result.success).toBe(false);
-    expect(result.winner).toBeNull();
-    expect(result.failureReason).toContain('threshold');
-  });
-  it('provides explainable trace', () => {
-    const candidates = [makeCandidate({ candidateIndex: 0, betterDecision: 'Read error.json to check logs' })];
-    const judgments = [makeJudgment(0, { score: 0.9, principleAligned: true })];
-    const result = runTournament(candidates, judgments, DEFAULT_THRESHOLDS);
-    expect(result.trace).toBeDefined();
-    expect(result.trace.length).toBeGreaterThan(0);
-    expect(result.trace[0].step).toBeDefined();
-    expect(result.trace[0].details).toBeDefined();
-  });
-  it('is deterministic — same inputs yield same winner', () => {
-    const candidates = [
-      makeCandidate({ candidateIndex: 0, confidence: 0.8, betterDecision: 'Read config.json to understand' }),
-      makeCandidate({ candidateIndex: 1, confidence: 0.9, betterDecision: 'Review error.json for issues' }),
-    ];
-    const judgments = [
-      makeJudgment(0, { score: 0.8, principleAligned: true }),
-      makeJudgment(1, { score: 0.9, principleAligned: true }),
-    ];
-    const result1 = runTournament(candidates, judgments, DEFAULT_THRESHOLDS);
-    const result2 = runTournament(candidates, judgments, DEFAULT_THRESHOLDS);
-    expect(result1.winner!.candidateIndex).toBe(result2.winner!.candidateIndex);
-  });
-});
-// ---------------------------------------------------------------------------
-// Tests: DEFAULT_SCORING_WEIGHTS
-// ---------------------------------------------------------------------------
-describe('DEFAULT_SCORING_WEIGHTS', () => {
-  it('has weights that sum to 1.0', () => {
-    const sum = Object.values(DEFAULT_SCORING_WEIGHTS).reduce((a, b) => a + b, 0);
-    expect(sum).toBeCloseTo(1.0, 2);
-  });
-  it('has all required properties', () => {
-    expect(DEFAULT_SCORING_WEIGHTS.schemaCompleteness).toBeDefined();
-    expect(DEFAULT_SCORING_WEIGHTS.principleAlignment).toBeDefined();
-    expect(DEFAULT_SCORING_WEIGHTS.executability).toBeDefined();
-    expect(DEFAULT_SCORING_WEIGHTS.boundedness).toBeDefined();
-    expect(DEFAULT_SCORING_WEIGHTS.confidence).toBeDefined();
-  });
-  it('has values in valid range (0-1)', () => {
-    for (const weight of Object.values(DEFAULT_SCORING_WEIGHTS)) {
-      expect(weight).toBeGreaterThanOrEqual(0);
-      expect(weight).toBeLessThanOrEqual(1);
-    }
-  });
-});
-// ---------------------------------------------------------------------------
-// Tests: validateCandidateDiversity
-// ---------------------------------------------------------------------------
-describe('validateCandidateDiversity', () => {
-  it('passes when candidates have 2+ distinct risk levels and low keyword overlap', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low', betterDecision: 'Read config.json to verify settings' }),
-      makeCandidate({ candidateIndex: 1, riskLevel: 'high', betterDecision: 'Refactor the entire authentication module from scratch' }),
-    ];
-    const result = validateCandidateDiversity(candidates);
-    expect(result.diversityCheckPassed).toBe(true);
-    expect(result.riskLevelDiversity).toBe(true);
-    expect(result.keywordOverlapPassed).toBe(true);
-  });
-  it('fails when all candidates have the same risk level', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low', betterDecision: 'Read file A to check settings' }),
-      makeCandidate({ candidateIndex: 1, riskLevel: 'low', betterDecision: 'Review file completely different approach' }),
-      makeCandidate({ candidateIndex: 2, riskLevel: 'low', betterDecision: 'Inspect another unique diagnostic method' }),
-    ];
-    const result = validateCandidateDiversity(candidates);
-    expect(result.diversityCheckPassed).toBe(false);
-    expect(result.riskLevelDiversity).toBe(false);
-  });
-  it('fails when candidate pair has keyword overlap > 0.8', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low', betterDecision: 'Review the authentication configuration file before making any changes to the system' }),
-      makeCandidate({ candidateIndex: 1, riskLevel: 'high', betterDecision: 'Review the authentication configuration file before making any changes to the system' }),
-    ];
-    const result = validateCandidateDiversity(candidates);
-    expect(result.diversityCheckPassed).toBe(false);
-    expect(result.keywordOverlapPassed).toBe(false);
-    expect(result.maxOverlapScore).toBeGreaterThan(0.8);
-  });
-  it('passes for single candidate', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low' }),
-    ];
-    const result = validateCandidateDiversity(candidates);
-    expect(result.diversityCheckPassed).toBe(true);
-    expect(result.details).toContain('Single candidate');
-  });
-  it('passes for empty array', () => {
-    const result = validateCandidateDiversity([]);
-    expect(result.diversityCheckPassed).toBe(true);
-    expect(result.details).toContain('No candidates');
-  });
-  it('passes when candidates lack riskLevel (graceful degradation)', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, betterDecision: 'Read config.json to verify settings' }),
-      makeCandidate({ candidateIndex: 1, betterDecision: 'Refactor the entire authentication module from scratch' }),
-    ];
-    // No riskLevel on any candidate - should pass (no risk levels to check)
-    const result = validateCandidateDiversity(candidates);
-    expect(result.diversityCheckPassed).toBe(true);
-    expect(result.riskLevelDiversity).toBe(true);
-  });
-  it('fails when some candidates have riskLevel but fewer than 2 distinct values', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'medium', betterDecision: 'Read config.json to verify settings' }),
-      makeCandidate({ candidateIndex: 1, betterDecision: 'Refactor the entire authentication module from scratch' }),
-    ];
-    // Only 1 candidate has riskLevel, so only 1 distinct value → fail
-    const result = validateCandidateDiversity(candidates);
-    expect(result.diversityCheckPassed).toBe(false);
-    expect(result.riskLevelDiversity).toBe(false);
-  });
-  it('uses max(|A|, |B|) as denominator for keyword overlap', () => {
-    // Short text A, long text B - overlap should use max as denominator
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low', betterDecision: 'review authentication configuration' }),
-      makeCandidate({ candidateIndex: 1, riskLevel: 'high', betterDecision: 'review authentication configuration before proceeding with changes to the deployment pipeline infrastructure' }),
-    ];
-    const result = validateCandidateDiversity(candidates);
-    // "review", "authentication", "configuration" overlap in both
-    // Set A = {review, authentication, configuration} = 3
-    // Set B = {review, authentication, configuration, before, proceeding, with, changes, deployment, pipeline, infrastructure} = 10
-    // intersection = 3, max(3, 10) = 10, overlap = 3/10 = 0.3
-    expect(result.maxOverlapScore).toBeLessThanOrEqual(0.4);
-  });
-  it('ignores words <= 3 characters in keyword overlap', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low', betterDecision: 'the and but for' }),
-      makeCandidate({ candidateIndex: 1, riskLevel: 'high', betterDecision: 'the and but for' }),
-    ];
-    // All words are <= 3 chars, so no keywords extracted → overlap = 0
-    const result = validateCandidateDiversity(candidates);
-    expect(result.keywordOverlapPassed).toBe(true);
-    expect(result.maxOverlapScore).toBe(0);
-  });
-  it('never throws on malformed input', () => {
-    // Undefined candidates
-    expect(() => validateCandidateDiversity(undefined as unknown as DreamerCandidate[])).not.toThrow();
-    // Null candidates
-    expect(() => validateCandidateDiversity(null as unknown as DreamerCandidate[])).not.toThrow();
-    // Candidates with undefined fields
-    expect(() => validateCandidateDiversity([
-      { candidateIndex: 0 } as DreamerCandidate,
-    ])).not.toThrow();
-    // Mixed valid and malformed
-    expect(() => validateCandidateDiversity([
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low' }),
-      { candidateIndex: 1 } as DreamerCandidate,
-    ])).not.toThrow();
-  });
-  it('returns correct maxOverlapScore rounded to 2 decimal places', () => {
-    const candidates: DreamerCandidate[] = [
-      makeCandidate({ candidateIndex: 0, riskLevel: 'low', betterDecision: 'Review configuration settings before deployment' }),
-      makeCandidate({ candidateIndex: 1, riskLevel: 'high', betterDecision: 'Review configuration settings before deployment testing' }),
-    ];
-    const result = validateCandidateDiversity(candidates);
-    // Verify the maxOverlapScore is a number with at most 2 decimal places
-    const decimalPart = result.maxOverlapScore.toString().split('.')[1];
-    if (decimalPart) {
-      expect(decimalPart.length).toBeLessThanOrEqual(2);
-    }
-    expect(typeof result.maxOverlapScore).toBe('number');
-  });
-});

package/tests/core/nocturnal-compliance-p-principles.test.ts DELETED Viewed

@@ -1,133 +0,0 @@
-/**
- * Tests for #216: P_* principle violation and opportunity detection
- *
- * Before this fix, detectOpportunity and detectViolation only handled T-01~T-09,
- * causing all P_* principles to return false for both applicable and violated.
- */
-import { describe, expect, it } from 'vitest';
-import { detectOpportunity, detectViolation } from '../../src/core/nocturnal-compliance.js';
-import type { SessionEvents } from '../../src/core/nocturnal-compliance.js';
-function makeSession(overrides: Partial<SessionEvents> = {}): SessionEvents {
-  return {
-    sessionId: 'test-session',
-    toolCalls: overrides.toolCalls ?? [],
-    painSignals: overrides.painSignals ?? [],
-    gateBlocks: overrides.gateBlocks ?? [],
-    userCorrections: overrides.userCorrections ?? [],
-    planApprovals: overrides.planApprovals ?? [],
-  };
-}
-describe('#216: P_* principle detection', () => {
-  describe('detectOpportunity for P_* principles', () => {
-    it('returns applicable=true when session has pain signals', () => {
-      const session = makeSession({
-        painSignals: [{ source: 'tool_failure', score: 80, reason: 'write failed' }],
-      });
-      const result = detectOpportunity('P_001', session);
-      expect(result.applicable).toBe(true);
-      expect(result.reason).toContain('pain signal');
-    });
-    it('returns applicable=true when session has tool failures', () => {
-      const session = makeSession({
-        toolCalls: [{ toolName: 'write', filePath: 'test.txt', outcome: 'failure', errorMessage: 'disk full' }],
-      });
-      const result = detectOpportunity('P_042', session);
-      expect(result.applicable).toBe(true);
-      expect(result.reason).toContain('tool failure');
-    });
-    it('returns applicable=true when session has gate blocks', () => {
-      const session = makeSession({
-        gateBlocks: [{ toolName: 'bash', reason: 'high risk operation' }],
-      });
-      const result = detectOpportunity('P_065', session);
-      expect(result.applicable).toBe(true);
-      expect(result.reason).toContain('gate block');
-    });
-    it('returns applicable=false when session has no negative signals', () => {
-      const session = makeSession({
-        toolCalls: [{ toolName: 'read', filePath: 'test.txt', outcome: 'success' }],
-      });
-      const result = detectOpportunity('P_001', session);
-      expect(result.applicable).toBe(false);
-      expect(result.reason).toContain('no pain/tool-failure/gate-block');
-    });
-  });
-  describe('detectViolation for P_* principles', () => {
-    it('returns violated=true when session has high pain signals (score >= 50)', () => {
-      const session = makeSession({
-        painSignals: [{ source: 'tool_failure', score: 80, reason: 'write failed' }],
-      });
-      const result = detectViolation('P_001', session);
-      expect(result.violated).toBe(true);
-      expect(result.reason).toContain('pain signal');
-    });
-    it('returns violated=false when pain signals are low (score < 50)', () => {
-      const session = makeSession({
-        painSignals: [{ source: 'minor_issue', score: 30, reason: 'cosmetic' }],
-        toolCalls: [{ toolName: 'read', filePath: 'test.txt', outcome: 'success' }],
-      });
-      const result = detectViolation('P_001', session);
-      expect(result.violated).toBe(false);
-      expect(result.reason).toContain('no violation signals');
-    });
-    it('returns violated=true when session has tool failures', () => {
-      const session = makeSession({
-        toolCalls: [
-          { toolName: 'write', filePath: 'test.txt', outcome: 'failure', errorMessage: 'disk full' },
-        ],
-      });
-      const result = detectViolation('P_042', session);
-      expect(result.violated).toBe(true);
-      expect(result.reason).toContain('tool failure');
-    });
-    it('returns violated=true when session has gate blocks', () => {
-      const session = makeSession({
-        gateBlocks: [{ toolName: 'bash', reason: 'high risk operation' }],
-      });
-      const result = detectViolation('P_065', session);
-      expect(result.violated).toBe(true);
-      expect(result.reason).toContain('gate block');
-    });
-    it('returns violated=false for clean session with no negative signals', () => {
-      const session = makeSession({
-        toolCalls: [{ toolName: 'read', filePath: 'test.txt', outcome: 'success' }],
-      });
-      const result = detectViolation('P_001', session);
-      expect(result.violated).toBe(false);
-      expect(result.reason).toContain('no violation signals');
-    });
-  });
-  describe('T-* principles still work (regression check)', () => {
-    it('T-01 opportunity detected for edit operations', () => {
-      const session = makeSession({
-        toolCalls: [{ toolName: 'edit_file', filePath: 'test.ts', outcome: 'success' }],
-      });
-      const result = detectOpportunity('T-01', session);
-      expect(result.applicable).toBe(true);
-    });
-    it('T-01 violation detected when editing without reading first', () => {
-      const session = makeSession({
-        toolCalls: [
-          { toolName: 'edit_file', filePath: 'test.ts', outcome: 'failure', errorMessage: 'merge conflict' },
-        ],
-        painSignals: [{ source: 'test.ts edit failed', score: 70, reason: 'Did not survey structure before editing' }],
-      });
-      const result = detectViolation('T-01', session);
-      // T-01 violation: edit without prior read, with pain signal matching file or pattern
-      expect(result.violated).toBe(true);
-    });
-  });
-});