principles-disciple 1.7.5 → 1.7.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/commands/context.js +5 -15
- package/dist/commands/evolution-status.js +29 -48
- package/dist/commands/export.js +61 -8
- package/dist/commands/nocturnal-review.d.ts +24 -0
- package/dist/commands/nocturnal-review.js +265 -0
- package/dist/commands/nocturnal-rollout.d.ts +27 -0
- package/dist/commands/nocturnal-rollout.js +671 -0
- package/dist/commands/nocturnal-train.d.ts +25 -0
- package/dist/commands/nocturnal-train.js +919 -0
- package/dist/commands/pain.js +8 -21
- package/dist/config/defaults/runtime.d.ts +40 -0
- package/dist/config/defaults/runtime.js +44 -0
- package/dist/config/errors.d.ts +84 -0
- package/dist/config/errors.js +94 -0
- package/dist/config/index.d.ts +7 -0
- package/dist/config/index.js +7 -0
- package/dist/constants/diagnostician.d.ts +0 -4
- package/dist/constants/diagnostician.js +0 -4
- package/dist/constants/tools.d.ts +2 -2
- package/dist/constants/tools.js +1 -1
- package/dist/core/adaptive-thresholds.d.ts +186 -0
- package/dist/core/adaptive-thresholds.js +300 -0
- package/dist/core/config.d.ts +2 -38
- package/dist/core/config.js +6 -61
- package/dist/core/control-ui-db.d.ts +27 -0
- package/dist/core/control-ui-db.js +18 -0
- package/dist/core/event-log.d.ts +1 -2
- package/dist/core/event-log.js +0 -3
- package/dist/core/evolution-engine.js +1 -21
- package/dist/core/evolution-reducer.d.ts +7 -1
- package/dist/core/evolution-reducer.js +56 -4
- package/dist/core/evolution-types.d.ts +61 -9
- package/dist/core/evolution-types.js +31 -9
- package/dist/core/external-training-contract.d.ts +276 -0
- package/dist/core/external-training-contract.js +269 -0
- package/dist/core/local-worker-routing.d.ts +175 -0
- package/dist/core/local-worker-routing.js +525 -0
- package/dist/core/model-deployment-registry.d.ts +218 -0
- package/dist/core/model-deployment-registry.js +503 -0
- package/dist/core/model-training-registry.d.ts +295 -0
- package/dist/core/model-training-registry.js +475 -0
- package/dist/core/nocturnal-arbiter.d.ts +159 -0
- package/dist/core/nocturnal-arbiter.js +534 -0
- package/dist/core/nocturnal-candidate-scoring.d.ts +137 -0
- package/dist/core/nocturnal-candidate-scoring.js +266 -0
- package/dist/core/nocturnal-compliance.d.ts +175 -0
- package/dist/core/nocturnal-compliance.js +824 -0
- package/dist/core/nocturnal-dataset.d.ts +224 -0
- package/dist/core/nocturnal-dataset.js +443 -0
- package/dist/core/nocturnal-executability.d.ts +85 -0
- package/dist/core/nocturnal-executability.js +331 -0
- package/dist/core/nocturnal-export.d.ts +124 -0
- package/dist/core/nocturnal-export.js +275 -0
- package/dist/core/nocturnal-paths.d.ts +124 -0
- package/dist/core/nocturnal-paths.js +214 -0
- package/dist/core/nocturnal-trajectory-extractor.d.ts +242 -0
- package/dist/core/nocturnal-trajectory-extractor.js +307 -0
- package/dist/core/nocturnal-trinity.d.ts +311 -0
- package/dist/core/nocturnal-trinity.js +880 -0
- package/dist/core/path-resolver.js +2 -1
- package/dist/core/paths.d.ts +6 -0
- package/dist/core/paths.js +6 -0
- package/dist/core/principle-training-state.d.ts +121 -0
- package/dist/core/principle-training-state.js +321 -0
- package/dist/core/promotion-gate.d.ts +238 -0
- package/dist/core/promotion-gate.js +529 -0
- package/dist/core/session-tracker.d.ts +10 -0
- package/dist/core/session-tracker.js +14 -0
- package/dist/core/shadow-observation-registry.d.ts +217 -0
- package/dist/core/shadow-observation-registry.js +308 -0
- package/dist/core/training-program.d.ts +233 -0
- package/dist/core/training-program.js +433 -0
- package/dist/core/trajectory.d.ts +155 -1
- package/dist/core/trajectory.js +292 -8
- package/dist/core/workspace-context.d.ts +0 -6
- package/dist/core/workspace-context.js +0 -12
- package/dist/hooks/bash-risk.d.ts +57 -0
- package/dist/hooks/bash-risk.js +137 -0
- package/dist/hooks/edit-verification.d.ts +62 -0
- package/dist/hooks/edit-verification.js +256 -0
- package/dist/hooks/gate-block-helper.d.ts +44 -0
- package/dist/hooks/gate-block-helper.js +119 -0
- package/dist/hooks/gate.d.ts +18 -0
- package/dist/hooks/gate.js +62 -751
- package/dist/hooks/gfi-gate.d.ts +40 -0
- package/dist/hooks/gfi-gate.js +113 -0
- package/dist/hooks/pain.js +6 -9
- package/dist/hooks/progressive-trust-gate.d.ts +51 -0
- package/dist/hooks/progressive-trust-gate.js +89 -0
- package/dist/hooks/prompt.d.ts +11 -11
- package/dist/hooks/prompt.js +167 -77
- package/dist/hooks/subagent.js +43 -6
- package/dist/hooks/thinking-checkpoint.d.ts +37 -0
- package/dist/hooks/thinking-checkpoint.js +51 -0
- package/dist/http/principles-console-route.js +13 -3
- package/dist/i18n/commands.js +8 -8
- package/dist/index.js +129 -28
- package/dist/service/central-database.js +2 -1
- package/dist/service/control-ui-query-service.d.ts +1 -1
- package/dist/service/control-ui-query-service.js +3 -3
- package/dist/service/evolution-query-service.d.ts +1 -1
- package/dist/service/evolution-query-service.js +5 -5
- package/dist/service/evolution-worker.d.ts +52 -4
- package/dist/service/evolution-worker.js +328 -16
- package/dist/service/nocturnal-runtime.d.ts +183 -0
- package/dist/service/nocturnal-runtime.js +352 -0
- package/dist/service/nocturnal-service.d.ts +163 -0
- package/dist/service/nocturnal-service.js +787 -0
- package/dist/service/nocturnal-target-selector.d.ts +145 -0
- package/dist/service/nocturnal-target-selector.js +315 -0
- package/dist/service/phase3-input-filter.d.ts +48 -12
- package/dist/service/phase3-input-filter.js +84 -18
- package/dist/service/runtime-summary-service.d.ts +34 -10
- package/dist/service/runtime-summary-service.js +87 -48
- package/dist/tools/deep-reflect.js +2 -1
- package/dist/types/event-types.d.ts +4 -10
- package/dist/types/runtime-summary.d.ts +47 -0
- package/dist/types/runtime-summary.js +1 -0
- package/dist/types.d.ts +0 -3
- package/dist/types.js +0 -2
- package/openclaw.plugin.json +1 -1
- package/package.json +1 -1
- package/templates/langs/en/skills/pd-mentor/SKILL.md +5 -5
- package/templates/langs/zh/skills/pd-mentor/SKILL.md +5 -5
- package/templates/pain_settings.json +0 -6
- package/dist/commands/trust.d.ts +0 -4
- package/dist/commands/trust.js +0 -78
- package/dist/core/trust-engine.d.ts +0 -96
- package/dist/core/trust-engine.js +0 -286
|
@@ -0,0 +1,145 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Nocturnal Target Selector — Principle + Session Selection for Sleep-Mode Reflection
|
|
3
|
+
* ================================================================================
|
|
4
|
+
*
|
|
5
|
+
* PURPOSE: Select one target principle and one violating session for nocturnal
|
|
6
|
+
* reflection processing. This module is a PURE SELECTOR — it does NOT execute
|
|
7
|
+
* reflection or write any artifacts.
|
|
8
|
+
*
|
|
9
|
+
* SELECTION LOGIC:
|
|
10
|
+
* 1. Filter principles to evaluable candidates (not manual_only, not cooldown)
|
|
11
|
+
* 2. Score candidates by: compliance health, violation trend, sample scarcity
|
|
12
|
+
* 3. Select top principle
|
|
13
|
+
* 4. Find violating sessions for that principle
|
|
14
|
+
* 5. Select best violating session by violation density
|
|
15
|
+
*
|
|
16
|
+
* SKIP CONDITIONS (return no-op cleanly):
|
|
17
|
+
* - no_evaluable_principles: No principles with auto-trainable evaluability
|
|
18
|
+
* - all_targets_in_cooldown: All candidates are in cooldown
|
|
19
|
+
* - no_violating_sessions: No sessions show violation signals for selected principle
|
|
20
|
+
* - workspace_not_idle: Workspace is active, nocturnal run not allowed
|
|
21
|
+
* - quota_exhausted: Max runs per window reached
|
|
22
|
+
* - insufficient_snapshot_data: Sessions exist but lack tool calls
|
|
23
|
+
*
|
|
24
|
+
* DESIGN CONSTRAINTS:
|
|
25
|
+
* - This is a PURE SELECTOR — no reflection execution
|
|
26
|
+
* - No raw text exposure
|
|
27
|
+
* - No artifact writing
|
|
28
|
+
* - No真实 subagent 调用
|
|
29
|
+
* - Deterministic based on inputs (no random selection)
|
|
30
|
+
*
|
|
31
|
+
* OUTPUT: NocturnalSelectionResult with:
|
|
32
|
+
* - decision: 'selected' | 'skip'
|
|
33
|
+
* - selectedPrincipleId?: string
|
|
34
|
+
* - selectedSessionId?: string
|
|
35
|
+
* - skipReason?: SkipReason
|
|
36
|
+
* - diagnostics: scoring and filtering details
|
|
37
|
+
*/
|
|
38
|
+
import { NocturnalTrajectoryExtractor } from '../core/nocturnal-trajectory-extractor.js';
|
|
39
|
+
import { type IdleCheckResult } from './nocturnal-runtime.js';
|
|
40
|
+
export type SkipReason = 'no_evaluable_principles' | 'all_targets_in_cooldown' | 'no_violating_sessions' | 'workspace_not_idle' | 'quota_exhausted' | 'insufficient_snapshot_data' | 'global_cooldown_active';
|
|
41
|
+
export interface SelectionDiagnostics {
|
|
42
|
+
/** Total evaluable principles found */
|
|
43
|
+
totalEvaluablePrinciples: number;
|
|
44
|
+
/** Principles filtered out by cooldown */
|
|
45
|
+
filteredByCooldown: number;
|
|
46
|
+
/** Principles that passed all filters */
|
|
47
|
+
passedPrinciples: string[];
|
|
48
|
+
/** Violating sessions found for selected principle */
|
|
49
|
+
violatingSessionCount: number;
|
|
50
|
+
/** Violation density of selected session (failures / total tool calls) */
|
|
51
|
+
selectedSessionViolationDensity: number | null;
|
|
52
|
+
/** Score of selected principle */
|
|
53
|
+
selectedPrincipleScore: number | null;
|
|
54
|
+
/** Score breakdown */
|
|
55
|
+
scoringBreakdown: Record<string, number>;
|
|
56
|
+
/** Whether workspace idle check passed */
|
|
57
|
+
idleCheckPassed: boolean;
|
|
58
|
+
/** Whether cooldown check passed */
|
|
59
|
+
cooldownCheckPassed: boolean;
|
|
60
|
+
/** Whether quota check passed */
|
|
61
|
+
quotaCheckPassed: boolean;
|
|
62
|
+
/** Recent pain context used for ranking bias (if available) */
|
|
63
|
+
painContext?: {
|
|
64
|
+
recentPainCount: number;
|
|
65
|
+
recentMaxPainScore: number;
|
|
66
|
+
hasRecentPain: boolean;
|
|
67
|
+
painSource?: string;
|
|
68
|
+
};
|
|
69
|
+
}
|
|
70
|
+
export interface NocturnalSelectionResult {
|
|
71
|
+
/** Whether a target was selected */
|
|
72
|
+
decision: 'selected' | 'skip';
|
|
73
|
+
/** Selected principle ID (if decision === 'selected') */
|
|
74
|
+
selectedPrincipleId?: string;
|
|
75
|
+
/** Selected violating session ID (if decision === 'selected') */
|
|
76
|
+
selectedSessionId?: string;
|
|
77
|
+
/** Reason for skip (if decision === 'skip') */
|
|
78
|
+
skipReason?: SkipReason;
|
|
79
|
+
/** Detailed diagnostics for observability */
|
|
80
|
+
diagnostics: SelectionDiagnostics;
|
|
81
|
+
}
|
|
82
|
+
export interface NocturnalTargetSelectorOptions {
|
|
83
|
+
/**
|
|
84
|
+
* Minimum violation density threshold for a session to be considered "violating".
|
|
85
|
+
* Default: 0.1 (at least 10% of tool calls are violation signals)
|
|
86
|
+
*/
|
|
87
|
+
minViolationDensity?: number;
|
|
88
|
+
/**
|
|
89
|
+
* Maximum number of recent sessions to consider for violation matching.
|
|
90
|
+
* Default: 50
|
|
91
|
+
*/
|
|
92
|
+
maxSessionCandidates?: number;
|
|
93
|
+
/**
|
|
94
|
+
* Idle threshold override (ms).
|
|
95
|
+
* Default: from nocturnal-runtime DEFAULT_IDLE_THRESHOLD_MS
|
|
96
|
+
*/
|
|
97
|
+
idleThresholdMs?: number;
|
|
98
|
+
/**
|
|
99
|
+
* Override idle check result (for testing).
|
|
100
|
+
* If provided, this result is used instead of calling checkWorkspaceIdle.
|
|
101
|
+
*/
|
|
102
|
+
idleCheckOverride?: IdleCheckResult;
|
|
103
|
+
/**
|
|
104
|
+
* Recent pain context from evolution worker.
|
|
105
|
+
* When provided, principles related to recent pain signals get ranking bias.
|
|
106
|
+
* This threads recent pain into sleep_reflection targeting without merging task kinds.
|
|
107
|
+
*/
|
|
108
|
+
recentPainContext?: {
|
|
109
|
+
mostRecent: {
|
|
110
|
+
score: number;
|
|
111
|
+
source: string;
|
|
112
|
+
reason: string;
|
|
113
|
+
timestamp: string;
|
|
114
|
+
} | null;
|
|
115
|
+
recentPainCount: number;
|
|
116
|
+
recentMaxPainScore: number;
|
|
117
|
+
};
|
|
118
|
+
}
|
|
119
|
+
/**
|
|
120
|
+
* Nocturnal Target Selector.
|
|
121
|
+
*
|
|
122
|
+
* Selects one target principle and one violating session for nocturnal reflection.
|
|
123
|
+
* This is a PURE FUNCTION — no side effects, no artifact writing.
|
|
124
|
+
*/
|
|
125
|
+
export declare class NocturnalTargetSelector {
|
|
126
|
+
private readonly extractor;
|
|
127
|
+
private readonly stateDir;
|
|
128
|
+
private readonly workspaceDir;
|
|
129
|
+
private readonly opts;
|
|
130
|
+
private readonly idleCheckOverride?;
|
|
131
|
+
private readonly recentPainContext?;
|
|
132
|
+
constructor(workspaceDir: string, stateDir: string, extractor: NocturnalTrajectoryExtractor, options?: NocturnalTargetSelectorOptions);
|
|
133
|
+
/**
|
|
134
|
+
* Select a target principle and violating session.
|
|
135
|
+
*
|
|
136
|
+
* @returns NocturnalSelectionResult with either selected targets or skip reason
|
|
137
|
+
*/
|
|
138
|
+
select(): NocturnalSelectionResult;
|
|
139
|
+
}
|
|
140
|
+
/**
|
|
141
|
+
* Select a nocturnal target (principle + session) with default options.
|
|
142
|
+
*
|
|
143
|
+
* This is a convenience wrapper for the common case.
|
|
144
|
+
*/
|
|
145
|
+
export declare function selectNocturnalTarget(workspaceDir: string, stateDir: string, extractor: NocturnalTrajectoryExtractor, options?: NocturnalTargetSelectorOptions): NocturnalSelectionResult;
|
|
@@ -0,0 +1,315 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Nocturnal Target Selector — Principle + Session Selection for Sleep-Mode Reflection
|
|
3
|
+
* ================================================================================
|
|
4
|
+
*
|
|
5
|
+
* PURPOSE: Select one target principle and one violating session for nocturnal
|
|
6
|
+
* reflection processing. This module is a PURE SELECTOR — it does NOT execute
|
|
7
|
+
* reflection or write any artifacts.
|
|
8
|
+
*
|
|
9
|
+
* SELECTION LOGIC:
|
|
10
|
+
* 1. Filter principles to evaluable candidates (not manual_only, not cooldown)
|
|
11
|
+
* 2. Score candidates by: compliance health, violation trend, sample scarcity
|
|
12
|
+
* 3. Select top principle
|
|
13
|
+
* 4. Find violating sessions for that principle
|
|
14
|
+
* 5. Select best violating session by violation density
|
|
15
|
+
*
|
|
16
|
+
* SKIP CONDITIONS (return no-op cleanly):
|
|
17
|
+
* - no_evaluable_principles: No principles with auto-trainable evaluability
|
|
18
|
+
* - all_targets_in_cooldown: All candidates are in cooldown
|
|
19
|
+
* - no_violating_sessions: No sessions show violation signals for selected principle
|
|
20
|
+
* - workspace_not_idle: Workspace is active, nocturnal run not allowed
|
|
21
|
+
* - quota_exhausted: Max runs per window reached
|
|
22
|
+
* - insufficient_snapshot_data: Sessions exist but lack tool calls
|
|
23
|
+
*
|
|
24
|
+
* DESIGN CONSTRAINTS:
|
|
25
|
+
* - This is a PURE SELECTOR — no reflection execution
|
|
26
|
+
* - No raw text exposure
|
|
27
|
+
* - No artifact writing
|
|
28
|
+
* - No真实 subagent 调用
|
|
29
|
+
* - Deterministic based on inputs (no random selection)
|
|
30
|
+
*
|
|
31
|
+
* OUTPUT: NocturnalSelectionResult with:
|
|
32
|
+
* - decision: 'selected' | 'skip'
|
|
33
|
+
* - selectedPrincipleId?: string
|
|
34
|
+
* - selectedSessionId?: string
|
|
35
|
+
* - skipReason?: SkipReason
|
|
36
|
+
* - diagnostics: scoring and filtering details
|
|
37
|
+
*/
|
|
38
|
+
import { listEvaluablePrinciples, } from '../core/principle-training-state.js';
|
|
39
|
+
import { checkWorkspaceIdle, checkCooldown, DEFAULT_IDLE_THRESHOLD_MS, } from './nocturnal-runtime.js';
|
|
40
|
+
import { detectViolation } from '../core/nocturnal-compliance.js';
|
|
41
|
+
/**
|
|
42
|
+
* Score a principle for nocturnal targeting.
|
|
43
|
+
* Higher score = better candidate for reflection.
|
|
44
|
+
*
|
|
45
|
+
* Scoring dimensions:
|
|
46
|
+
* 1. Compliance health (higher compliance = more worth teaching)
|
|
47
|
+
* 2. Violation trend (worsening trend = higher priority)
|
|
48
|
+
* 3. Sample scarcity (fewer samples = more valuable)
|
|
49
|
+
* 4. Cooldown penalty (in cooldown = lower priority)
|
|
50
|
+
* 5. Pain context bias (recent pain = higher priority for related principles)
|
|
51
|
+
*
|
|
52
|
+
* Score range: 0-100 (normalized)
|
|
53
|
+
*/
|
|
54
|
+
function scorePrinciple(state, cooldownActive, recentPainContext) {
|
|
55
|
+
let score = 50; // Base score
|
|
56
|
+
// Compliance contribution: 0-25 points
|
|
57
|
+
// High compliance = well-understood principle = good teaching target
|
|
58
|
+
// But very low compliance = confused principle = also needs work
|
|
59
|
+
const complianceContribution = Math.round(state.complianceRate * 25);
|
|
60
|
+
score += complianceContribution;
|
|
61
|
+
// Trend contribution: -10 to +10 points
|
|
62
|
+
// worsening trend (+1) = higher priority = +10
|
|
63
|
+
// improving trend (-1) = lower priority = -10
|
|
64
|
+
// stable (0) = neutral = 0
|
|
65
|
+
score += state.violationTrend * 10;
|
|
66
|
+
// Sample scarcity contribution: 0-15 points
|
|
67
|
+
// Fewer samples generated = more valuable new data
|
|
68
|
+
// Max at 0 samples, decreases as samples accumulate
|
|
69
|
+
const scarcityPenalty = Math.min(state.generatedSampleCount / 10, 1) * 15;
|
|
70
|
+
score += Math.round(15 - scarcityPenalty);
|
|
71
|
+
// Cooldown penalty: -30 points
|
|
72
|
+
if (cooldownActive) {
|
|
73
|
+
score -= 30;
|
|
74
|
+
}
|
|
75
|
+
// Pain context bias: up to +25 points
|
|
76
|
+
// Bias toward principles related to recent pain signals
|
|
77
|
+
if (recentPainContext && recentPainContext.recentPainCount > 0) {
|
|
78
|
+
// Most recent pain score contributes up to 15 points (pain scores are 1-10)
|
|
79
|
+
const mostRecentPainScore = recentPainContext.mostRecent?.score ?? 0;
|
|
80
|
+
const painScoreContribution = Math.round((mostRecentPainScore / 10) * 15);
|
|
81
|
+
score += painScoreContribution;
|
|
82
|
+
// Additional pain count adds up to 5 more points
|
|
83
|
+
const additionalPainContribution = Math.min(recentPainContext.recentPainCount - 1, 5) * 1;
|
|
84
|
+
score += additionalPainContribution;
|
|
85
|
+
// High pain scores (> 7) get extra 5-point boost
|
|
86
|
+
if (recentPainContext.recentMaxPainScore > 7) {
|
|
87
|
+
score += 5;
|
|
88
|
+
}
|
|
89
|
+
}
|
|
90
|
+
return Math.max(0, Math.min(100, score));
|
|
91
|
+
}
|
|
92
|
+
/**
|
|
93
|
+
* Compute violation signal density for a session.
|
|
94
|
+
* Returns 0-1 score (higher = more violation evidence).
|
|
95
|
+
*/
|
|
96
|
+
function computeViolationDensity(session) {
|
|
97
|
+
const total = session.toolCallCount;
|
|
98
|
+
if (total === 0)
|
|
99
|
+
return 0;
|
|
100
|
+
// Violation signals: failures, pain events, gate blocks
|
|
101
|
+
const violationSignals = session.failureCount + session.painEventCount * 0.5 + session.gateBlockCount * 0.3;
|
|
102
|
+
return Math.min(violationSignals / total, 1);
|
|
103
|
+
}
|
|
104
|
+
/**
|
|
105
|
+
* Nocturnal Target Selector.
|
|
106
|
+
*
|
|
107
|
+
* Selects one target principle and one violating session for nocturnal reflection.
|
|
108
|
+
* This is a PURE FUNCTION — no side effects, no artifact writing.
|
|
109
|
+
*/
|
|
110
|
+
export class NocturnalTargetSelector {
|
|
111
|
+
extractor;
|
|
112
|
+
stateDir;
|
|
113
|
+
workspaceDir;
|
|
114
|
+
opts;
|
|
115
|
+
idleCheckOverride;
|
|
116
|
+
recentPainContext;
|
|
117
|
+
constructor(workspaceDir, stateDir, extractor, options = {}) {
|
|
118
|
+
this.workspaceDir = workspaceDir;
|
|
119
|
+
this.stateDir = stateDir;
|
|
120
|
+
this.extractor = extractor;
|
|
121
|
+
// Destructure so they are NOT included in opts (stored separately)
|
|
122
|
+
const { idleCheckOverride, recentPainContext, ...restOptions } = options;
|
|
123
|
+
this.idleCheckOverride = idleCheckOverride;
|
|
124
|
+
this.recentPainContext = recentPainContext;
|
|
125
|
+
this.opts = {
|
|
126
|
+
minViolationDensity: restOptions.minViolationDensity ?? 0.1,
|
|
127
|
+
maxSessionCandidates: restOptions.maxSessionCandidates ?? 50,
|
|
128
|
+
idleThresholdMs: restOptions.idleThresholdMs ?? DEFAULT_IDLE_THRESHOLD_MS,
|
|
129
|
+
};
|
|
130
|
+
}
|
|
131
|
+
/**
|
|
132
|
+
* Select a target principle and violating session.
|
|
133
|
+
*
|
|
134
|
+
* @returns NocturnalSelectionResult with either selected targets or skip reason
|
|
135
|
+
*/
|
|
136
|
+
select() {
|
|
137
|
+
const diagnostics = {
|
|
138
|
+
totalEvaluablePrinciples: 0,
|
|
139
|
+
filteredByCooldown: 0,
|
|
140
|
+
passedPrinciples: [],
|
|
141
|
+
violatingSessionCount: 0,
|
|
142
|
+
selectedSessionViolationDensity: null,
|
|
143
|
+
selectedPrincipleScore: null,
|
|
144
|
+
scoringBreakdown: {},
|
|
145
|
+
idleCheckPassed: false,
|
|
146
|
+
cooldownCheckPassed: false,
|
|
147
|
+
quotaCheckPassed: false,
|
|
148
|
+
painContext: this.recentPainContext ? {
|
|
149
|
+
recentPainCount: this.recentPainContext.recentPainCount,
|
|
150
|
+
recentMaxPainScore: this.recentPainContext.recentMaxPainScore,
|
|
151
|
+
hasRecentPain: this.recentPainContext.recentPainCount > 0,
|
|
152
|
+
painSource: this.recentPainContext.mostRecent?.source,
|
|
153
|
+
} : undefined,
|
|
154
|
+
};
|
|
155
|
+
// Step 1: Idle check — if workspace is not idle, skip
|
|
156
|
+
const idleResult = this.idleCheckOverride ?? checkWorkspaceIdle(this.workspaceDir, {
|
|
157
|
+
idleThresholdMs: this.opts.idleThresholdMs,
|
|
158
|
+
});
|
|
159
|
+
diagnostics.idleCheckPassed = idleResult.isIdle;
|
|
160
|
+
if (!idleResult.isIdle) {
|
|
161
|
+
return {
|
|
162
|
+
decision: 'skip',
|
|
163
|
+
skipReason: 'workspace_not_idle',
|
|
164
|
+
diagnostics,
|
|
165
|
+
};
|
|
166
|
+
}
|
|
167
|
+
// Step 2: Cooldown and quota check
|
|
168
|
+
const cooldownResult = checkCooldown(this.stateDir);
|
|
169
|
+
diagnostics.cooldownCheckPassed = !cooldownResult.globalCooldownActive;
|
|
170
|
+
diagnostics.quotaCheckPassed = !cooldownResult.quotaExhausted;
|
|
171
|
+
if (cooldownResult.globalCooldownActive) {
|
|
172
|
+
return {
|
|
173
|
+
decision: 'skip',
|
|
174
|
+
skipReason: 'global_cooldown_active',
|
|
175
|
+
diagnostics,
|
|
176
|
+
};
|
|
177
|
+
}
|
|
178
|
+
if (cooldownResult.quotaExhausted) {
|
|
179
|
+
return {
|
|
180
|
+
decision: 'skip',
|
|
181
|
+
skipReason: 'quota_exhausted',
|
|
182
|
+
diagnostics,
|
|
183
|
+
};
|
|
184
|
+
}
|
|
185
|
+
// Step 3: Get evaluable principles
|
|
186
|
+
const evaluablePrinciples = listEvaluablePrinciples(this.stateDir);
|
|
187
|
+
diagnostics.totalEvaluablePrinciples = evaluablePrinciples.length;
|
|
188
|
+
if (evaluablePrinciples.length === 0) {
|
|
189
|
+
return {
|
|
190
|
+
decision: 'skip',
|
|
191
|
+
skipReason: 'no_evaluable_principles',
|
|
192
|
+
diagnostics,
|
|
193
|
+
};
|
|
194
|
+
}
|
|
195
|
+
// Step 4: Score and filter candidates
|
|
196
|
+
const scoredPrinciples = [];
|
|
197
|
+
for (const state of evaluablePrinciples) {
|
|
198
|
+
const cooldownCheck = checkCooldown(this.stateDir, state.principleId);
|
|
199
|
+
const cooldownActive = cooldownCheck.principleCooldownActive;
|
|
200
|
+
const score = scorePrinciple(state, cooldownActive, this.recentPainContext);
|
|
201
|
+
if (cooldownActive) {
|
|
202
|
+
diagnostics.filteredByCooldown++;
|
|
203
|
+
}
|
|
204
|
+
scoredPrinciples.push({
|
|
205
|
+
principleId: state.principleId,
|
|
206
|
+
state,
|
|
207
|
+
score,
|
|
208
|
+
violationDensity: state.applicableOpportunityCount > 0
|
|
209
|
+
? state.observedViolationCount / state.applicableOpportunityCount
|
|
210
|
+
: 0,
|
|
211
|
+
cooldownActive,
|
|
212
|
+
});
|
|
213
|
+
diagnostics.scoringBreakdown[state.principleId] = score;
|
|
214
|
+
}
|
|
215
|
+
// Filter out principles in cooldown (score already penalized but keep them in diagnostics)
|
|
216
|
+
const activeCandidates = scoredPrinciples.filter((p) => !p.cooldownActive);
|
|
217
|
+
if (activeCandidates.length === 0) {
|
|
218
|
+
diagnostics.passedPrinciples = [];
|
|
219
|
+
return {
|
|
220
|
+
decision: 'skip',
|
|
221
|
+
skipReason: 'all_targets_in_cooldown',
|
|
222
|
+
diagnostics,
|
|
223
|
+
};
|
|
224
|
+
}
|
|
225
|
+
// Sort by score descending
|
|
226
|
+
activeCandidates.sort((a, b) => b.score - a.score);
|
|
227
|
+
diagnostics.passedPrinciples = activeCandidates.map((p) => p.principleId);
|
|
228
|
+
// Select the top candidate
|
|
229
|
+
const selected = activeCandidates[0];
|
|
230
|
+
diagnostics.selectedPrincipleScore = selected.score;
|
|
231
|
+
// Step 5: Find violating sessions for the selected principle
|
|
232
|
+
const recentSessions = this.extractor.listRecentNocturnalCandidateSessions({
|
|
233
|
+
limit: this.opts.maxSessionCandidates,
|
|
234
|
+
minToolCalls: 1,
|
|
235
|
+
});
|
|
236
|
+
if (recentSessions.length === 0) {
|
|
237
|
+
return {
|
|
238
|
+
decision: 'skip',
|
|
239
|
+
skipReason: 'insufficient_snapshot_data',
|
|
240
|
+
diagnostics,
|
|
241
|
+
};
|
|
242
|
+
}
|
|
243
|
+
// Compute violation signals for each session
|
|
244
|
+
const violatingSessions = recentSessions.map((session) => {
|
|
245
|
+
const violationDensity = computeViolationDensity(session);
|
|
246
|
+
const snapshot = this.extractor.getNocturnalSessionSnapshot(session.sessionId);
|
|
247
|
+
// Use nocturnal-compliance to detect violations for the selected principle
|
|
248
|
+
let hasViolation = false;
|
|
249
|
+
if (snapshot) {
|
|
250
|
+
const violationResult = detectViolation(selected.principleId, {
|
|
251
|
+
sessionId: session.sessionId,
|
|
252
|
+
toolCalls: snapshot.toolCalls.map((tc) => ({
|
|
253
|
+
toolName: tc.toolName,
|
|
254
|
+
filePath: tc.filePath ?? undefined,
|
|
255
|
+
outcome: tc.outcome,
|
|
256
|
+
errorMessage: tc.errorMessage ?? undefined,
|
|
257
|
+
})),
|
|
258
|
+
painSignals: snapshot.painEvents.map((pe) => ({
|
|
259
|
+
source: pe.source,
|
|
260
|
+
score: pe.score,
|
|
261
|
+
reason: pe.reason ?? undefined,
|
|
262
|
+
})),
|
|
263
|
+
gateBlocks: snapshot.gateBlocks.map((gb) => ({
|
|
264
|
+
toolName: gb.toolName,
|
|
265
|
+
reason: gb.reason,
|
|
266
|
+
})),
|
|
267
|
+
userCorrections: [],
|
|
268
|
+
planApprovals: [],
|
|
269
|
+
});
|
|
270
|
+
hasViolation = violationResult.violated;
|
|
271
|
+
}
|
|
272
|
+
return {
|
|
273
|
+
sessionId: session.sessionId,
|
|
274
|
+
hasViolation,
|
|
275
|
+
violationSeverity: violationDensity,
|
|
276
|
+
failureCount: session.failureCount,
|
|
277
|
+
painEventCount: session.painEventCount,
|
|
278
|
+
gateBlockCount: session.gateBlockCount,
|
|
279
|
+
toolCallCount: session.toolCallCount,
|
|
280
|
+
};
|
|
281
|
+
});
|
|
282
|
+
// Filter to sessions with violations above threshold
|
|
283
|
+
const violating = violatingSessions.filter((s) => s.hasViolation && s.violationSeverity >= this.opts.minViolationDensity);
|
|
284
|
+
diagnostics.violatingSessionCount = violating.length;
|
|
285
|
+
if (violating.length === 0) {
|
|
286
|
+
return {
|
|
287
|
+
decision: 'skip',
|
|
288
|
+
skipReason: 'no_violating_sessions',
|
|
289
|
+
diagnostics,
|
|
290
|
+
};
|
|
291
|
+
}
|
|
292
|
+
// Sort by violation severity descending (most violating first)
|
|
293
|
+
violating.sort((a, b) => b.violationSeverity - a.violationSeverity);
|
|
294
|
+
const selectedSession = violating[0];
|
|
295
|
+
diagnostics.selectedSessionViolationDensity = selectedSession.violationSeverity;
|
|
296
|
+
return {
|
|
297
|
+
decision: 'selected',
|
|
298
|
+
selectedPrincipleId: selected.principleId,
|
|
299
|
+
selectedSessionId: selectedSession.sessionId,
|
|
300
|
+
diagnostics,
|
|
301
|
+
};
|
|
302
|
+
}
|
|
303
|
+
}
|
|
304
|
+
// ---------------------------------------------------------------------------
|
|
305
|
+
// Convenience function
|
|
306
|
+
// ---------------------------------------------------------------------------
|
|
307
|
+
/**
|
|
308
|
+
* Select a nocturnal target (principle + session) with default options.
|
|
309
|
+
*
|
|
310
|
+
* This is a convenience wrapper for the common case.
|
|
311
|
+
*/
|
|
312
|
+
export function selectNocturnalTarget(workspaceDir, stateDir, extractor, options = {}) {
|
|
313
|
+
const selector = new NocturnalTargetSelector(workspaceDir, stateDir, extractor, options);
|
|
314
|
+
return selector.select();
|
|
315
|
+
}
|
|
@@ -1,13 +1,33 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Phase 3 Input Filter
|
|
3
|
+
*
|
|
4
|
+
* CRITICAL: evaluatePhase3Inputs() does NOT read or use evolution_directive.json
|
|
5
|
+
* Directive is a compatibility-only display artifact, not a truth source.
|
|
6
|
+
*
|
|
7
|
+
* Phase 3 eligibility depends ONLY on:
|
|
8
|
+
* - Queue truth (valid evolution samples from queue)
|
|
9
|
+
*
|
|
10
|
+
* Any directive file is ignored for eligibility decisions.
|
|
11
|
+
*
|
|
12
|
+
* THREE-LANE CLASSIFICATION:
|
|
13
|
+
* - authoritative: Valid inputs that can be used for Phase 3 eligibility decisions
|
|
14
|
+
* - reference_only: Valid evidence that must NOT be used as positive eligibility input
|
|
15
|
+
* (e.g., timeout-only outcomes - they indicate completion but not success)
|
|
16
|
+
* - rejected: Invalid, corrupt, or policy-prohibited input
|
|
17
|
+
*/
|
|
18
|
+
/**
|
|
19
|
+
* Classification for Phase 3 inputs.
|
|
20
|
+
* - authoritative: Can be used for Phase 3 eligibility decisions
|
|
21
|
+
* - reference_only: Valid data but not for eligibility (e.g., timeout outcomes)
|
|
22
|
+
* - rejected: Invalid or corrupt data
|
|
23
|
+
*/
|
|
24
|
+
export type Phase3Classification = 'authoritative' | 'reference_only' | 'rejected';
|
|
1
25
|
export interface Phase3EvolutionInput {
|
|
2
26
|
id?: string | null;
|
|
3
27
|
status?: string | null;
|
|
4
28
|
started_at?: string | null;
|
|
5
29
|
completed_at?: string | null;
|
|
6
|
-
|
|
7
|
-
export interface Phase3TrustInput {
|
|
8
|
-
score?: number | null;
|
|
9
|
-
frozen?: boolean | null;
|
|
10
|
-
lastUpdated?: string | null;
|
|
30
|
+
resolution?: string | null;
|
|
11
31
|
}
|
|
12
32
|
export interface Phase3EvolutionSample {
|
|
13
33
|
taskId: string;
|
|
@@ -15,23 +35,39 @@ export interface Phase3EvolutionSample {
|
|
|
15
35
|
startedAt: string | null;
|
|
16
36
|
completedAt: string | null;
|
|
17
37
|
}
|
|
38
|
+
export interface Phase3ReferenceOnlySample {
|
|
39
|
+
taskId: string;
|
|
40
|
+
status: string;
|
|
41
|
+
classification: 'timeout_only' | 'other_reference';
|
|
42
|
+
reason: string;
|
|
43
|
+
}
|
|
18
44
|
export interface Phase3RejectedEvolutionSample {
|
|
19
45
|
taskId: string | null;
|
|
20
46
|
status: string | null;
|
|
21
47
|
reasons: string[];
|
|
22
48
|
}
|
|
23
|
-
export interface Phase3TrustResult {
|
|
24
|
-
eligible: boolean;
|
|
25
|
-
rejectedReasons: string[];
|
|
26
|
-
}
|
|
27
49
|
export interface Phase3InputFilterResult {
|
|
28
50
|
queueTruthReady: boolean;
|
|
29
|
-
trustInputReady: boolean;
|
|
30
51
|
phase3ShadowEligible: boolean;
|
|
31
52
|
evolution: {
|
|
32
53
|
eligible: Phase3EvolutionSample[];
|
|
54
|
+
referenceOnly: Phase3ReferenceOnlySample[];
|
|
33
55
|
rejected: Phase3RejectedEvolutionSample[];
|
|
34
56
|
};
|
|
35
|
-
trust: Phase3TrustResult;
|
|
36
57
|
}
|
|
37
|
-
|
|
58
|
+
/**
|
|
59
|
+
* Evaluates Phase 3 readiness based on queue inputs.
|
|
60
|
+
*
|
|
61
|
+
* IMPORTANT: Does NOT use evolution_directive.json.
|
|
62
|
+
* Directive is compatibility-only display artifact, not a truth source.
|
|
63
|
+
* Queue is the only authoritative execution truth source for Phase 3.
|
|
64
|
+
*
|
|
65
|
+
* THREE-LANE CLASSIFICATION:
|
|
66
|
+
* - authoritative: Valid inputs for Phase 3 eligibility
|
|
67
|
+
* - reference_only: Valid evidence but not for eligibility (e.g., timeout outcomes)
|
|
68
|
+
* - rejected: Invalid, corrupt, or policy-prohibited input
|
|
69
|
+
*
|
|
70
|
+
* @param queue - Evolution queue items to validate
|
|
71
|
+
* @returns Phase 3 eligibility results
|
|
72
|
+
*/
|
|
73
|
+
export declare function evaluatePhase3Inputs(queue: Phase3EvolutionInput[]): Phase3InputFilterResult;
|