@aria_asi/cli 0.2.38 → 0.2.39
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +140 -0
- package/bin/aria.js +8 -4
- package/dist/aria-connector/src/auth.d.ts +1 -0
- package/dist/aria-connector/src/auth.d.ts.map +1 -1
- package/dist/aria-connector/src/auth.js +26 -1
- package/dist/aria-connector/src/auth.js.map +1 -1
- package/dist/aria-connector/src/setup-wizard.d.ts.map +1 -1
- package/dist/aria-connector/src/setup-wizard.js +41 -1
- package/dist/aria-connector/src/setup-wizard.js.map +1 -1
- package/dist/aria-connector/src/types.d.ts +6 -0
- package/dist/aria-connector/src/types.d.ts.map +1 -1
- package/dist/cli-0.2.38.tgz +0 -0
- package/dist/runtime/coach-kernel.mjs +59 -4
- package/dist/runtime/gated-ledger.mjs +237 -0
- package/dist/runtime/manifest.json +1 -1
- package/dist/runtime/quality-enforcer.mjs +257 -0
- package/dist/runtime/sdk/BUNDLED.json +1 -1
- package/dist/runtime/service.mjs +119 -0
- package/dist/sdk/BUNDLED.json +1 -1
- package/package.json +1 -1
- package/runtime-src/coach-kernel.mjs +59 -4
- package/runtime-src/gated-ledger.mjs +237 -0
- package/runtime-src/quality-enforcer.mjs +257 -0
- package/runtime-src/service.mjs +119 -0
- package/scripts/install-client.sh +32 -2
- package/src/auth.ts +25 -1
- package/src/setup-wizard.ts +43 -1
- package/src/types.ts +6 -0
|
@@ -0,0 +1,237 @@
|
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
/**
|
|
3
|
+
* Gated Ledger — End-to-End Runtime Enforcement
|
|
4
|
+
*
|
|
5
|
+
* Every kernel output, coach decision, completion claim, and doctrine
|
|
6
|
+
* trigger flows through this ledger. Nothing bypasses it.
|
|
7
|
+
*
|
|
8
|
+
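* Gates (design intent; enforceGates in this file currently implements only the Template, Quality, Completion-Claim and Doctrine gates, in that order):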
|
|
9
|
+
* 1. Skill Gate — missing skills → auto-trigger load → retry
|
|
10
|
+
* 2. Template Gate — deterministic/templated output → forced regeneration
|
|
11
|
+
* 3. Coach Gate — pre/post cognition, tool directives enforced
|
|
12
|
+
* 4. Quality Gate — gate labels, minimum substance, collapse text blocked
|
|
13
|
+
* 5. Evidence Gate — completion claims without measured evidence blocked
|
|
14
|
+
* 6. Doctrine Gate — doctrine trigger map enforced
|
|
15
|
+
* 7. Final Output Gate — safe fallback if all else fails
|
|
16
|
+
*
|
|
17
|
+
* Ledger records every gate decision, every enforcement action,
|
|
18
|
+
* every repair attempt, and every final outcome.
|
|
19
|
+
*/
|
|
20
|
+
|
|
21
|
+
import { appendFileSync, existsSync, mkdirSync, readFileSync } from 'node:fs';
|
|
22
|
+
import { createHash, randomUUID } from 'node:crypto';
|
|
23
|
+
import { homedir } from 'node:os';
|
|
24
|
+
import { dirname, join } from 'node:path';
|
|
25
|
+
|
|
26
|
+
// Filesystem locations used by the gated ledger. Everything lives under
// <home>/.aria/runtime/state.
const HOME = homedir();
const STATE_DIR = join(HOME, '.aria', 'runtime', 'state');
// Append-only JSON-lines file; one record per enforceGates() call.
const GATED_LEDGER_PATH = join(STATE_DIR, 'gated-ledger.jsonl');
// Optional JSON file read by checkDoctrineTriggers(); expected to hold a `triggers` array.
const DOCTRINE_TRIGGER_MAP_PATH = join(STATE_DIR, 'doctrine_trigger_map.json');
|
|
30
|
+
|
|
31
|
+
/**
 * Create the runtime state directory (and any missing parents) with
 * owner-only permissions when it does not exist yet.
 */
function ensureDir() {
  if (existsSync(STATE_DIR)) {
    return;
  }
  mkdirSync(STATE_DIR, { recursive: true, mode: 0o700 });
}
|
|
34
|
+
|
|
35
|
+
/**
 * Append one record to the gated ledger as a single JSON line.
 *
 * The write is best-effort: any failure (directory creation, serialization,
 * or the append itself) is reported through the return value, never thrown.
 *
 * @param {object} record - JSON-serializable ledger record.
 * @returns {boolean} true when the line was written, false otherwise.
 */
function appendRecord(record) {
  try {
    // Directory creation sits inside the try so an unwritable home directory
    // degrades to `false` instead of throwing out of enforceGates().
    ensureDir();
    appendFileSync(GATED_LEDGER_PATH, `${JSON.stringify(record)}\n`, { mode: 0o600 });
    return true;
  } catch {
    return false;
  }
}
|
|
42
|
+
|
|
43
|
+
/**
 * Short content fingerprint: the first 16 hex characters of the SHA-256
 * digest of `String(text)`.
 *
 * @param {*} text - value to fingerprint; coerced with String().
 * @returns {string} 16 lowercase hex characters.
 */
function hash(text) {
  const hasher = createHash('sha256');
  hasher.update(String(text));
  const fullHex = hasher.digest('hex');
  return fullHex.substring(0, 16);
}
|
|
46
|
+
|
|
47
|
+
// Internal gate/label identifiers that must not appear in released text.
const GATE_LABEL_RX = /\b(?:personal_mouth_[a-z_]+\b|code_no_tests\b|code_fake_implementation\b|code_type_safety\b|ip_infrastructure\b|8lens_[a-z_]+\b|voice_cold_[a-z_]+\b|harness_output_gate_block\b|auto_fix:\s|personal_mouth_harness_[a-z_]+\b|personal_mouth_unsupported_[a-z_]+\b)/i;

// The placeholder sentence treated as "collapse" text.
const COLLAPSE_RX = /I need to pause and reconsider\.?/i;

// Words/phrases treated as a completion claim by hasUnsupportedClaim().
const COMPLETION_CLAIM_RX = /\b(?:done|complete|completed|ready|verified|fixed|shipped|production-ready|passing|passed|all phases|all done)\b/i;

// Fixed phrases that mark an output as a deterministic kernel template.
const TEMPLATE_RX = /\b(?:Decision: use Owner Runtime kernels|Sequence: contract, Garden Service snapshot|Repair context loaded|Research context loaded|Action kernel engaged|I'm here with you\.\s*No fixing,\s*no task pressure)\b/i;

// Shortest output length (in characters) accepted by the template and quality checks.
const MINIMUM_CHARS = 50;
|
|
52
|
+
|
|
53
|
+
/**
 * Decide whether a kernel output should be treated as templated.
 *
 * Text is flagged when it is falsy, shorter than MINIMUM_CHARS, or matches
 * TEMPLATE_RX.
 *
 * @param {string} text - candidate output.
 * @param {string} kernel - accepted for signature compatibility; not used here.
 * @returns {{isTemplate: boolean, reason: string}} `reason` is '' when not flagged.
 */
function isTemplateOutput(text, kernel) {
  const lacksSubstance = !text || text.length < MINIMUM_CHARS;
  if (lacksSubstance) {
    return { isTemplate: true, reason: 'below_minimum_substance' };
  }

  const matchesTemplate = TEMPLATE_RX.test(text);
  return matchesTemplate
    ? { isTemplate: true, reason: 'deterministic_kernel_template' }
    : { isTemplate: false, reason: '' };
}
|
|
59
|
+
|
|
60
|
+
/**
 * Detect completion claims that are not backed up in the same text.
 *
 * When the text matches COMPLETION_CLAIM_RX, two independent checks run:
 *   - an "evidence" pattern (exit 0, 0 failures, status ... ok, sha256, ...);
 *   - the presence of a <cognition>...</cognition> or <verify>...</verify> block.
 * Each failed check contributes one reason.
 *
 * NOTE(review): "passed" and "verified" appear in both the claim pattern and
 * the evidence pattern, so a text whose claim word is one of those always
 * satisfies the evidence check. Confirm whether that is intended.
 *
 * @param {string} text - candidate output.
 * @returns {{claim: boolean, reasons: string[]}} `claim` is true only when at
 *   least one reason was recorded.
 */
function hasUnsupportedClaim(text) {
  const makesClaim = COMPLETION_CLAIM_RX.test(text);
  if (!makesClaim) {
    return { claim: false, reasons: [] };
  }

  const evidenceRx = /\b(?:exit\s*0|0\s+failures?|passed|status.*ok|200|verified|ledger_record|receiptId|sha256|test.*pass)\b/i;
  const cognitionRx = /<cognition>[\s\S]*?<\/cognition>/i;
  const verifyRx = /<verify>[\s\S]*?<\/verify>/i;

  const reasons = [];

  const hasEvidence = evidenceRx.test(text);
  if (!hasEvidence) {
    reasons.push('completion_claim_without_measured_evidence');
  }

  const hasReasoningBlock = cognitionRx.test(text) || verifyRx.test(text);
  if (!hasReasoningBlock) {
    reasons.push('completion_claim_without_cognition_or_verify');
  }

  return { claim: reasons.length !== 0, reasons };
}
|
|
72
|
+
|
|
73
|
+
/**
 * Run the quality checks on a candidate output.
 *
 * Reasons that can be reported:
 *   - 'empty_output'        text is missing, not a string, or ''
 *   - 'gate_label_leak'     text matches GATE_LABEL_RX
 *   - 'collapse_placeholder' text matches COLLAPSE_RX
 *   - 'below_minimum_chars' trimmed text is shorter than MINIMUM_CHARS
 *
 * @param {string} text - candidate output. Non-string values (including
 *   null/undefined) are evaluated as an empty string instead of throwing.
 * @returns {{passed: boolean, reasons: string[]}}
 */
function checkQuality(text) {
  // Normalize first: the original called text.trim() unconditionally, which
  // threw a TypeError for null/undefined right after flagging them as empty.
  const body = typeof text === 'string' ? text : '';
  const reasons = [];

  if (body.length === 0) reasons.push('empty_output');
  if (GATE_LABEL_RX.test(body)) reasons.push('gate_label_leak');
  if (COLLAPSE_RX.test(body)) reasons.push('collapse_placeholder');
  if (body.trim().length < MINIMUM_CHARS) reasons.push('below_minimum_chars');

  return { passed: reasons.length === 0, reasons };
}
|
|
82
|
+
|
|
83
|
+
// Fixed replacement messages, keyed by kernel name. `default` is used when a
// kernel has no entry of its own.
// NOTE(review): the emotional_presence entry is 44 characters long, which is
// below this module's MINIMUM_CHARS (50), so checkQuality() reports it as
// 'below_minimum_chars'.
const SAFE_FALLBACKS = {
  emotional_presence: "I'm here. Tell me what's with you right now.",
  architect: "I need more context for a proper architecture answer.",
  repair: "Let me trace the root cause. What's the specific error?",
  action: "Action kernel requires confirmation. What would you like to execute?",
  research: "Let me gather relevant information. What should I research?",
  default: "Let me try again — that last response wasn't right.",
};
|
|
91
|
+
|
|
92
|
+
/**
 * Run a kernel output through the ledger gates and record the outcome.
 *
 * Gates, in order:
 *   1. template         - templated/too-short text is replaced by the kernel's safe fallback
 *   2. quality          - text failing checkQuality() is replaced by the safe fallback
 *   3. completion_claim - unsupported claim words are rewritten to "in progress"
 *   4. doctrine         - trigger-map hits are recorded only; the text is not changed
 *
 * One record per call is appended to the gated ledger (best-effort: a failed
 * write does not affect the returned result).
 *
 * @param {string} text - candidate output; non-string values are treated as ''.
 * @param {{kernel?: string, sessionId?: string}} [context] - `kernel` selects
 *   the fallback message (default 'default'); `sessionId` defaults to 'runtime'.
 * @returns {Promise<{finalText: string, enforced: boolean, allPassed: boolean,
 *   gates: object[], doctrineTriggers: object[], record: object}>}
 */
export async function enforceGates(text, context = {}) {
  const kernel = context?.kernel || 'default';
  const sessionId = context?.sessionId || 'runtime';
  const gateLog = [];
  const startedAt = Date.now();

  // Only accept a string entry: an inherited key such as "constructor" would
  // otherwise hand a function to the later string-only gates.
  const kernelFallback = typeof SAFE_FALLBACKS[kernel] === 'string'
    ? SAFE_FALLBACKS[kernel]
    : SAFE_FALLBACKS.default;

  // Curated fallbacks are fixed copy. Judging them by length escalated every
  // short fallback (emotional_presence is 44 chars, the minimum is 50) to the
  // generic pipeline message, so the length reason is ignored for them.
  const judgeQuality = (candidate, isCuratedFallback) => {
    const verdict = checkQuality(candidate);
    if (!isCuratedFallback) return verdict;
    const reasons = verdict.reasons.filter((reason) => reason !== 'below_minimum_chars');
    return { passed: reasons.length === 0, reasons };
  };

  let current = typeof text === 'string' ? text : '';
  let currentIsFallback = false;
  let enforced = false;
  let allPassed = true;

  // ── Gate 1: Template Detection ────────────────────────────────────
  const templateCheck = isTemplateOutput(current, kernel);
  gateLog.push({
    gate: 'template',
    passed: !templateCheck.isTemplate,
    reason: templateCheck.reason,
  });
  if (templateCheck.isTemplate) {
    enforced = true;
    allPassed = false;
    current = kernelFallback;
    currentIsFallback = true;
  }

  // ── Gate 2: Quality ───────────────────────────────────────────────
  const quality = judgeQuality(current, currentIsFallback);
  gateLog.push({
    gate: 'quality',
    passed: quality.passed,
    reasons: quality.reasons,
  });
  if (!quality.passed) {
    enforced = true;
    allPassed = false;
    current = kernelFallback;
    // Last resort if the fallback itself trips a label/collapse pattern.
    if (!judgeQuality(current, true).passed) {
      current = "I'm here. The pipeline needs attention. Let me recover.";
    }
  }

  // ── Gate 3: Completion Claims ─────────────────────────────────────
  const claimCheck = hasUnsupportedClaim(current);
  gateLog.push({
    gate: 'completion_claim',
    passed: !claimCheck.claim,
    reasons: claimCheck.reasons,
  });
  if (claimCheck.claim) {
    enforced = true;
    allPassed = false;
    // Remove the claim language, keep the substance. "production-ready" is
    // listed so it is replaced as a whole; without it, \bready\b matched the
    // tail and produced "production-in progress".
    // NOTE(review): "passing"/"passed" are detected as claims by
    // COMPLETION_CLAIM_RX but are still not rewritten here — confirm intent.
    current = current.replace(
      /\b(?:production-ready|done|complete|completed|ready|verified|fixed|shipped|all phases|all done)\b/gi,
      'in progress',
    );
  }

  // ── Gate 4: Doctrine Trigger ──────────────────────────────────────
  const doctrineHits = checkDoctrineTriggers(current, context);
  gateLog.push({
    gate: 'doctrine',
    passed: doctrineHits.length === 0,
    triggers: doctrineHits,
  });

  // ── Write Ledger Record ───────────────────────────────────────────
  const record = {
    recordId: randomUUID(),
    sessionId,
    kernel,
    inputTextHash: hash(text),
    finalTextHash: hash(current),
    enforced,
    allPassed,
    gates: gateLog,
    doctrineTriggers: doctrineHits,
    durationMs: Date.now() - startedAt,
    at: new Date().toISOString(),
  };
  appendRecord(record);

  return {
    finalText: current,
    enforced,
    allPassed,
    gates: gateLog,
    doctrineTriggers: doctrineHits,
    record,
  };
}
|
|
182
|
+
|
|
183
|
+
/**
 * Load the doctrine trigger map from disk and report which triggers match.
 *
 * The map file is read on every call. A missing, unreadable, or malformed
 * file — or one without a `triggers` array — yields an empty result. Entries
 * that are not objects, have no `pattern`, or whose pattern is not a valid
 * regular expression are skipped.
 *
 * @param {string} text - text to test (patterns are applied case-insensitively).
 * @param {object} context - accepted for signature compatibility; not used here.
 * @returns {Array<{trigger: string, doctrine: string, severity: string, action: string}>}
 */
function checkDoctrineTriggers(text, context) {
  let map = null;
  try {
    if (existsSync(DOCTRINE_TRIGGER_MAP_PATH)) {
      map = JSON.parse(readFileSync(DOCTRINE_TRIGGER_MAP_PATH, 'utf8'));
    }
  } catch {
    // Best-effort: an unreadable or invalid map means "no triggers configured".
  }
  if (!map || !Array.isArray(map.triggers)) return [];

  const hits = [];
  for (const trigger of map.triggers) {
    // Optional chaining guards null/primitive entries; the original read
    // trigger.pattern outside any try, so one bad entry threw out of the gate.
    if (!trigger?.pattern) continue;
    try {
      const rx = new RegExp(trigger.pattern, 'i');
      if (rx.test(text)) {
        hits.push({
          trigger: trigger.name || trigger.pattern,
          doctrine: trigger.doctrine || trigger.name,
          severity: trigger.severity || 'warning',
          action: trigger.action || 'log',
        });
      }
    } catch {
      // Invalid regular expression in the map: skip this entry.
    }
  }
  return hits;
}
|
|
210
|
+
|
|
211
|
+
/**
 * Synchronous, ledger-free guard for text that is about to be shown.
 *
 * Returns the kernel's safe fallback (or the default fallback) when the text
 * is falsy/empty or matches the gate-label, collapse, or template pattern;
 * otherwise returns the text unchanged. Nothing is written to the ledger.
 *
 * @param {string} text - candidate output.
 * @param {string} [kernel='default'] - key into SAFE_FALLBACKS.
 * @returns {string}
 */
export function enforceFast(text, kernel = 'default') {
  const blockers = [GATE_LABEL_RX, COLLAPSE_RX, TEMPLATE_RX];
  const mustReplace = !text
    || text.length === 0
    || blockers.some((rx) => rx.test(text));

  if (mustReplace) {
    return SAFE_FALLBACKS[kernel] || SAFE_FALLBACKS.default;
  }
  return text;
}
|
|
222
|
+
|
|
223
|
+
/**
 * Read the most recent gated-ledger records for monitoring/debugging.
 *
 * Lines that are not valid JSON are skipped. Any filesystem error yields [].
 *
 * @param {number} [limit=50] - maximum number of trailing ledger lines to
 *   parse. Zero, negative, or non-numeric values return an empty array.
 * @returns {object[]} parsed records, oldest first.
 */
export function readGatedLedger(limit = 50) {
  // slice(-0) is slice(0): without this guard a limit of 0 returned the
  // whole ledger, and a negative limit dropped records from the wrong end.
  const count = Number(limit);
  if (!(count > 0)) return [];

  try {
    ensureDir();
    if (!existsSync(GATED_LEDGER_PATH)) return [];
    const lines = readFileSync(GATED_LEDGER_PATH, 'utf8').trim().split('\n').filter(Boolean);
    return lines.slice(-count).map((line) => {
      try { return JSON.parse(line); } catch { return null; }
    }).filter(Boolean);
  } catch {
    return [];
  }
}
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
{
|
|
2
|
-
"bundledAt": "2026-05-
|
|
2
|
+
"bundledAt": "2026-05-04T05:01:08.186Z",
|
|
3
3
|
"sdkFiles": 12,
|
|
4
4
|
"runtimeTemplate": "/home/hamzaibrahim1/rei-ai-brain/packages/aria-connector/runtime-src",
|
|
5
5
|
"gateRuntimeSource": "/home/hamzaibrahim1/rei-ai-brain/packages/aria-gate-runtime/dist",
|
|
@@ -0,0 +1,257 @@
|
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
/**
|
|
3
|
+
* Runtime Quality Enforcer — First-Class Doctrine Rails
|
|
4
|
+
*
|
|
5
|
+
* Hard-blocks any output that contains internal gate labels, placeholders,
|
|
6
|
+
* or collapse-text. No gate label ever reaches a user surface again.
|
|
7
|
+
*
|
|
8
|
+
* Invariants:
|
|
9
|
+
* 1. HARD regex blocks — catch-all for any internal machinery leaking
|
|
10
|
+
* 2. Minimum substance check — no empty/trivial responses
|
|
11
|
+
* 3. Recovery contract — blocked → rewrite prompt → retry (max 2) → safe fallback
|
|
12
|
+
* 4. Coach kernel notified of every violation for pattern learning
|
|
13
|
+
* 5. Quality violation ledger records every enforcement action
|
|
14
|
+
* 6. Safe fallbacks guaranteed per kernel — deterministic, never empty
|
|
15
|
+
*/
|
|
16
|
+
|
|
17
|
+
import { createHash, randomUUID } from 'node:crypto';
|
|
18
|
+
import { appendFileSync, existsSync, mkdirSync, readFileSync } from 'node:fs';
|
|
19
|
+
import { homedir } from 'node:os';
|
|
20
|
+
import { join } from 'node:path';
|
|
21
|
+
|
|
22
|
+
// ── Paths ──────────────────────────────────────────────────────────────────
|
|
23
|
+
|
|
24
|
+
// All quality-enforcer state lives under <home>/.aria/runtime/state.
const HOME = homedir();
const STATE_DIR = join(HOME, '.aria', 'runtime', 'state');
// Append-only JSON-lines file; one entry per enforcement action.
const QUALITY_LEDGER_PATH = join(STATE_DIR, 'quality-violations.jsonl');
// File that notifyCoach() appends violation events to when it already exists.
const COACH_STATE_PATH = join(STATE_DIR, 'coach-state.json');
|
|
28
|
+
|
|
29
|
+
// ── Hard Doctrine Rails ────────────────────────────────────────────────────
|
|
30
|
+
|
|
31
|
+
// Patterns that block an output outright. Each entry pairs a regular
// expression with the label recorded as the violation reason.
const HARD_BLOCK_PATTERNS = [
  { pattern: /\bpersonal_mouth_[a-z_]+\b/i, label: 'gate_label:personal_mouth' },
  { pattern: /\bcode_no_tests\b/i, label: 'gate_label:code_no_tests' },
  { pattern: /\bcode_fake_implementation\b/i, label: 'gate_label:fake_impl' },
  { pattern: /\bcode_type_safety\b/i, label: 'gate_label:type_safety' },
  { pattern: /\bip_infrastructure\b/i, label: 'gate_label:ip_leak' },
  { pattern: /\b8lens_[a-z_]+\b/i, label: 'gate_label:8lens' },
  { pattern: /\bvoice_cold_[a-z_]+\b/i, label: 'gate_label:voice_cold' },
  { pattern: /\bharness_output_gate_block\b/i, label: 'gate_label:output_block' },
  { pattern: /\bauto_fix:\s/i, label: 'gate_label:auto_fix' },
  { pattern: /I need to pause and reconsider\.?/i, label: 'gate_label:collapse_placeholder' },
  { pattern: /\bpersonal_mouth_harness_shallow_[a-z_]+\b/i, label: 'gate_label:shallow' },
  { pattern: /\bpersonal_mouth_unsupported_internal_[a-z_]+\b/i, label: 'gate_label:internal_claim' },
];

// Shortest trimmed output length accepted by checkQuality().
const MINIMUM_CHARS = 40;

// Fixed replacement messages, keyed by kernel name; `default` covers kernels
// without an entry of their own.
const SAFE_FALLBACKS = {
  emotional_presence: "I'm here. Tell me what's with you right now.",
  architect: "I need more context to give a proper architecture answer. What specific system or decision are you working on?",
  repair: "I can see the issue — let me trace the root cause. Can you share the specific error or surface that's broken?",
  action: "Action kernel received — confirmation required before proceeding. What would you like to execute?",
  research: "Let me gather the relevant information. What specific topic or question should I research?",
  default: "Let me try again — that last response wasn't right. What were you asking about?",
};
|
|
56
|
+
|
|
57
|
+
// ── Violation Ledger ──────────────────────────────────────────────────────
|
|
58
|
+
|
|
59
|
+
/**
 * Create the runtime state directory (and any missing parents) with
 * owner-only permissions when it does not exist yet.
 */
function ensureStateDir() {
  const alreadyThere = existsSync(STATE_DIR);
  if (!alreadyThere) {
    mkdirSync(STATE_DIR, { recursive: true, mode: 0o700 });
  }
}
|
|
62
|
+
|
|
63
|
+
/**
 * Append one violation record to the quality ledger as a single JSON line.
 *
 * Best-effort: every failure, including creating the state directory, is
 * reported through the return value rather than thrown.
 *
 * @param {object} violation - JSON-serializable violation record.
 * @returns {boolean} true when the line was written, false otherwise.
 */
function logViolation(violation) {
  try {
    // Inside the try so an unwritable home directory cannot throw out of
    // enforceQualityWithRecovery().
    ensureStateDir();
    // Records carry a preview of the blocked output, so a newly created file
    // is owner-only (0o600), matching the gated ledger.
    appendFileSync(QUALITY_LEDGER_PATH, `${JSON.stringify(violation)}\n`, { encoding: 'utf8', mode: 0o600 });
    return true;
  } catch {
    return false;
  }
}
|
|
72
|
+
|
|
73
|
+
/**
 * Best-effort notification of a quality violation to the coach state file.
 *
 * An event line is appended only when the coach state file already exists;
 * all errors are swallowed so enforcement never fails because of it.
 *
 * NOTE(review): this appends a JSON line to a file named coach-state.json.
 * If any reader parses that file as a single JSON document, the appended
 * line will make it unparseable — confirm against the coach kernel's reader.
 *
 * @param {object} violation - record built by enforceQualityWithRecovery().
 * @returns {void}
 */
function notifyCoach(violation) {
  try {
    // Inside the try: directory creation must not break a best-effort notify.
    ensureStateDir();
    if (!existsSync(COACH_STATE_PATH)) return;

    const event = {
      at: new Date().toISOString(),
      type: 'quality_violation',
      violationId: violation.violationId,
      kernel: violation.kernel,
      // The record's field is `violations` (plural). Reading `.violation`
      // always produced undefined, so the reasons were never emitted.
      violation: violation.violations ?? violation.violation,
      textPreview: violation.textPreview,
      recoveryAttempts: violation.recoveryAttempts,
      finalOutcome: violation.finalOutcome,
    };
    // Append to coach state for offline learning
    appendFileSync(COACH_STATE_PATH, `${JSON.stringify(event)}\n`, { encoding: 'utf8' });
  } catch {
    // Non-fatal — coach learning is best-effort
  }
}
|
|
94
|
+
|
|
95
|
+
/**
 * Short fingerprint of the offending text: the first 16 hex characters of
 * the SHA-256 digest of `String(text)`.
 *
 * @param {*} text - value to fingerprint; coerced with String().
 * @returns {string} 16 lowercase hex characters.
 */
function violationHash(text) {
  const hasher = createHash('sha256');
  hasher.update(String(text));
  const fullHex = hasher.digest('hex');
  return fullHex.substring(0, 16);
}
|
|
98
|
+
|
|
99
|
+
// ── Core Enforcement ──────────────────────────────────────────────────────
|
|
100
|
+
|
|
101
|
+
/**
 * Check a candidate output against the hard-block patterns and the minimum
 * length.
 *
 * @param {*} text - candidate output. Anything that is not a non-empty
 *   string is rejected with the single reason 'empty_output'.
 * @returns {{allowed: boolean, reasons: string[]}} `reasons` holds the label
 *   of every matching HARD_BLOCK_PATTERNS entry (in table order), followed by
 *   'below_minimum_chars' when the trimmed text is shorter than MINIMUM_CHARS.
 */
export function checkQuality(text) {
  const isUsableString = typeof text === 'string' && text.length !== 0;
  if (!isUsableString) {
    return { allowed: false, reasons: ['empty_output'] };
  }

  const reasons = HARD_BLOCK_PATTERNS
    .filter((entry) => entry.pattern.test(text))
    .map((entry) => entry.label);

  const trimmedLength = text.trim().length;
  if (trimmedLength < MINIMUM_CHARS) {
    reasons.push('below_minimum_chars');
  }

  const allowed = reasons.length === 0;
  return { allowed, reasons };
}
|
|
119
|
+
|
|
120
|
+
/**
 * Check an output and, when it is blocked, try to repair it before falling
 * back to a fixed per-kernel message.
 *
 * Flow: checkQuality(text) → if allowed, return it untouched (nothing is
 * logged). Otherwise call `options.rewriteFn(prompt)` up to the attempt limit
 * until a rewrite passes checkQuality(); if none does (or no rewriteFn was
 * given) use SAFE_FALLBACKS. Every blocked output is written to the violation
 * ledger and forwarded to notifyCoach().
 *
 * @param {string} text - candidate output.
 * @param {string} [kernel='default'] - key into SAFE_FALLBACKS.
 * @param {object} [options]
 * @param {string} [options.sessionId='runtime'] - recorded in the ledger entry.
 * @param {(prompt: string) => (string|Promise<string>)} [options.rewriteFn]
 *   - produces a rewritten answer; a throw counts as a failed attempt.
 * @param {number} [options.maxRecoveryAttempts=2] - clamped to 0..2;
 *   0 disables rewriting.
 * @returns {Promise<{finalText: string, enforced: boolean, attempts: number,
 *   violations: string[], logged: boolean}>}
 */
export async function enforceQualityWithRecovery(
  text,
  kernel = 'default',
  options = {},
) {
  // Default parameters do not cover an explicit null.
  const opts = options ?? {};
  const sessionId = opts.sessionId || 'runtime';
  const rewriteFn = typeof opts.rewriteFn === 'function' ? opts.rewriteFn : null;

  // `??` instead of `||`: an explicit 0 must disable retries rather than
  // silently becoming 2. Non-numeric values fall back to the default of 2.
  const requested = Number(opts.maxRecoveryAttempts ?? 2);
  const maxAttempts = Number.isNaN(requested) ? 2 : Math.min(2, Math.max(0, requested));

  const initial = checkQuality(text);
  if (initial.allowed) {
    return {
      finalText: text,
      enforced: false,
      attempts: 0,
      violations: [],
      logged: false,
    };
  }

  const violations = [...initial.reasons];
  let currentText = text;
  let attempts = 0;
  let repaired = false;

  // The prompt never changes between attempts, so build it once. The excerpt
  // is guarded: text.slice() on a non-string threw inside the loop's try and
  // used up every attempt without ever calling rewriteFn.
  const excerpt = typeof text === 'string' ? text.slice(0, 200) : '';
  const repairPrompt =
    `Your previous response was blocked by quality enforcement for these reasons: ${initial.reasons.join(', ')}. ` +
    `Rewrite the answer to remove all internal labels, gate phrases, and placeholder text. ` +
    `Original context: ${excerpt}`;

  // Recovery loop: ask the model to repair its own output
  while (attempts < maxAttempts && rewriteFn && !repaired) {
    attempts += 1;
    try {
      const repairedText = await rewriteFn(repairPrompt);
      const repairCheck = checkQuality(repairedText);
      if (repairCheck.allowed) {
        currentText = repairedText;
        repaired = true;
      } else {
        violations.push(...repairCheck.reasons);
      }
    } catch {
      // Recovery attempt failed — continue to next attempt or fallback
    }
  }

  // Safe fallback if all recovery attempts failed
  const finalText = repaired
    ? currentText
    : (SAFE_FALLBACKS[kernel] || SAFE_FALLBACKS.default);

  // Log the violation
  const violation = {
    violationId: randomUUID(),
    sessionId,
    kernel,
    violations,
    textPreview: String(text).slice(0, 200),
    textHash: violationHash(text),
    recoveryAttempts: attempts,
    finalOutcome: repaired ? 'repaired' : 'safe_fallback',
    at: new Date().toISOString(),
  };

  const logged = logViolation(violation);
  notifyCoach(violation);

  return {
    finalText,
    enforced: true,
    attempts,
    violations,
    logged,
  };
}
|
|
195
|
+
|
|
196
|
+
// ── Safe Mouth Proxy ──────────────────────────────────────────────────────
|
|
197
|
+
|
|
198
|
+
/**
 * Wrap a provider result so that its `text` has passed quality enforcement.
 *
 * Runs enforceQualityWithRecovery() on `providerMeta.text` (no rewrite
 * function is supplied, so a blocked text goes straight to the fallback) and
 * returns a copy of `providerMeta` with `text` replaced and a `quality`
 * summary attached. The input object is not modified.
 *
 * @param {object} providerMeta - provider result; its `text` field is checked.
 * @param {string} kernel - key into the fallback table.
 * @param {string} sessionId - recorded in the violation ledger.
 * @returns {Promise<object>} `{ ...providerMeta, text, quality }`
 */
export async function guardProviderOutput(providerMeta, kernel, sessionId) {
  const candidate = providerMeta.text;
  const {
    finalText,
    enforced,
    attempts,
    violations,
    logged,
  } = await enforceQualityWithRecovery(candidate, kernel, { sessionId });

  const quality = { enforced, attempts, violations, logged };
  return { ...providerMeta, text: finalText, quality };
}
|
|
219
|
+
|
|
220
|
+
// ── Coach Notification Bridge ─────────────────────────────────────────────
|
|
221
|
+
|
|
222
|
+
/**
 * Summarize the quality-violation ledger for the coach kernel.
 *
 * Reads every line of the ledger, skips lines that are not valid JSON, and
 * counts how often each violation reason occurs across all records.
 *
 * @returns {{ok: boolean, violationCount: number,
 *   recentPatterns: Array<{pattern: string, count: number}>,
 *   lastViolation: (object|null)}}
 *   `recentPatterns` holds the ten most frequent reasons, most frequent
 *   first. `ok` is false only when reading the ledger failed.
 */
export function getCoachQualitySummary() {
  try {
    ensureStateDir();
    if (!existsSync(QUALITY_LEDGER_PATH)) {
      return { ok: true, violationCount: 0, recentPatterns: [], lastViolation: null };
    }

    // This file is an ES module, where `require` is not defined; the original
    // require('node:fs') call threw a ReferenceError that the catch below
    // turned into a permanent { ok: false } result.
    const lines = readFileSync(QUALITY_LEDGER_PATH, 'utf8').trim().split('\n').filter(Boolean);
    const violations = lines.map((line) => {
      try { return JSON.parse(line); } catch { return null; }
    }).filter(Boolean);

    // Count by violation type. A Map keeps arbitrary reason strings from
    // colliding with Object.prototype keys.
    const byType = new Map();
    for (const v of violations) {
      for (const reason of (v.violations || [])) {
        byType.set(reason, (byType.get(reason) || 0) + 1);
      }
    }

    return {
      ok: true,
      violationCount: violations.length,
      recentPatterns: [...byType.entries()]
        .sort(([, a], [, b]) => b - a)
        .slice(0, 10)
        .map(([pattern, count]) => ({ pattern, count })),
      lastViolation: violations[violations.length - 1] || null,
    };
  } catch {
    return { ok: false, violationCount: 0, recentPatterns: [], lastViolation: null };
  }
}
|
package/dist/runtime/service.mjs
CHANGED
|
@@ -42,8 +42,11 @@ import {
|
|
|
42
42
|
formatCoachClientBlock,
|
|
43
43
|
readCoachState,
|
|
44
44
|
recordCoachPhase,
|
|
45
|
+
triggerMissingSkills,
|
|
45
46
|
} from './coach-kernel.mjs';
|
|
46
47
|
import { resolveAriaAuthToken } from './auth-token.mjs';
|
|
48
|
+
import { checkQuality as check, enforceQualityWithRecovery } from './quality-enforcer.mjs';
|
|
49
|
+
import { enforceGates } from './gated-ledger.mjs';
|
|
47
50
|
|
|
48
51
|
const require = createRequire(import.meta.url);
|
|
49
52
|
const { runFullChain } = require('./vendor/aria-gate-runtime/index.js');
|
|
@@ -3726,6 +3729,15 @@ async function evaluateProviderCandidate(req, body, client, apiKey, turn, provid
|
|
|
3726
3729
|
};
|
|
3727
3730
|
}
|
|
3728
3731
|
|
|
3732
|
+
/**
 * Pick the kernel name used for quality enforcement on this turn.
 *
 * Candidates are tried in a fixed order — repair, architect, action,
 * research. A candidate wins when `turn.turnClass` equals its name or when
 * its keyword pattern matches the request message (`body.message`, else
 * `body.prompt`, else `body.input`). If none wins, 'emotional_presence' is
 * returned.
 *
 * NOTE(review): the keyword patterns are unanchored substring matches (for
 * example "run" also matches "runtime"), and an earlier candidate's keyword
 * takes precedence over a later candidate's explicit turnClass.
 *
 * @param {{turnClass?: string}} [turn]
 * @param {{message?: string, prompt?: string, input?: string}} [body]
 * @returns {string} kernel name.
 */
function deriveEffectiveKernel(turn, body) {
  const msg = body?.message || body?.prompt || body?.input || '';
  const candidates = [
    ['repair', /repair|fix|debug|broken|bug|error|failing|crash|recover/i],
    ['architect', /architecture|design|system|pipeline|tradeoff|ADR/i],
    ['action', /deploy|execute|run|build|ship|rollout|restart|push/i],
    ['research', /research|search|find|recall|retrieve|look.up|investigate/i],
  ];

  for (const [kernelName, keywords] of candidates) {
    if (turn?.turnClass === kernelName || keywords.test(msg)) {
      return kernelName;
    }
  }
  return 'emotional_presence';
}
|
|
3740
|
+
|
|
3729
3741
|
async function handleProviderProxy(req, body, client, providerStyle, options = {}) {
|
|
3730
3742
|
const apiKey = resolveApiKey(req, body, options);
|
|
3731
3743
|
const startedAt = Date.now();
|
|
@@ -3819,6 +3831,44 @@ async function handleProviderProxy(req, body, client, providerStyle, options = {
|
|
|
3819
3831
|
],
|
|
3820
3832
|
});
|
|
3821
3833
|
coachRecords.push(preGenerationCoach);
|
|
3834
|
+
// ── Coach auto-trigger: load missing skills instead of blocking ──
|
|
3835
|
+
if (preGenerationCoach.decision === 'auto_trigger_skills' && turn.missingSkillIds?.length > 0) {
|
|
3836
|
+
const skillResult = await triggerMissingSkills(
|
|
3837
|
+
turn.missingSkillIds,
|
|
3838
|
+
SKILL_SEARCH_ROOTS,
|
|
3839
|
+
);
|
|
3840
|
+
const loadedCoach = recordRuntimeCoachPhase({
|
|
3841
|
+
phase: 'pre_generation',
|
|
3842
|
+
body,
|
|
3843
|
+
turn: { ...turn, loadedSkillIds: [...(turn.loadedSkillIds || []), ...skillResult.loaded], missingSkillIds: skillResult.stillMissing },
|
|
3844
|
+
providerStyle,
|
|
3845
|
+
providerPlan,
|
|
3846
|
+
text: turn.userMessage,
|
|
3847
|
+
evidenceRefs: [`skills_loaded:${skillResult.loaded.length}`, `skills_still_missing:${skillResult.stillMissing.length}`],
|
|
3848
|
+
metadata: { autoLoadedSkills: skillResult.loaded },
|
|
3849
|
+
});
|
|
3850
|
+
coachRecords.push(loadedCoach);
|
|
3851
|
+
if (loadedCoach.decision === 'hard_block') {
|
|
3852
|
+
const refusal = formatCoachClientBlock(loadedCoach);
|
|
3853
|
+
const autoBlockRecord = appendManagedRuntimeLedger(buildManagedRuntimeLedgerRecord({
|
|
3854
|
+
phase: 'pre_generation_skills_block',
|
|
3855
|
+
body, turn, providerStyle, providerPlan,
|
|
3856
|
+
releaseDecision: 'hard_block',
|
|
3857
|
+
blockers: loadedCoach.reasons,
|
|
3858
|
+
evidenceRefs: coachRecordRefs(coachRecords),
|
|
3859
|
+
}));
|
|
3860
|
+
ledgerRecords.push({ phase: 'pre_generation_skills_block', ...autoBlockRecord });
|
|
3861
|
+
return providerStyle === 'anthropic'
|
|
3862
|
+
? anthropicResponseEnvelope(refusal, { model: body.model || 'aria-runtime', finishReason: 'end_turn' }, {}, body?.ariaDebug === true)
|
|
3863
|
+
: openAiResponseEnvelope(body, refusal, { model: body.model || 'aria-runtime', finishReason: 'stop', usage: null }, {});
|
|
3864
|
+
}
|
|
3865
|
+
// Skills loaded — update turn for the rest of the pipeline
|
|
3866
|
+
turn.loadedSkillIds = [...(turn.loadedSkillIds || []), ...skillResult.loaded];
|
|
3867
|
+
turn.missingSkillIds = skillResult.stillMissing;
|
|
3868
|
+
if (skillResult.loadedBodies.length > 0) {
|
|
3869
|
+
turn.skillBodies = [...(turn.skillBodies || []), ...skillResult.loadedBodies.map((s) => s.body)];
|
|
3870
|
+
}
|
|
3871
|
+
}
|
|
3822
3872
|
if (preGenerationCoach.decision === 'hard_block') {
|
|
3823
3873
|
const refusal = formatCoachClientBlock(preGenerationCoach);
|
|
3824
3874
|
const preBlockRecord = appendManagedRuntimeLedger(buildManagedRuntimeLedgerRecord({
|
|
@@ -3877,6 +3927,17 @@ async function handleProviderProxy(req, body, client, providerStyle, options = {
|
|
|
3877
3927
|
ledgerRecords.push({ phase: 'provider_call_failed', ...failureRecord });
|
|
3878
3928
|
throw error;
|
|
3879
3929
|
}
|
|
3930
|
+
|
|
3931
|
+
const providerQualityResult = await enforceQualityWithRecovery(
|
|
3932
|
+
providerMeta.text || '',
|
|
3933
|
+
deriveEffectiveKernel(turn, body),
|
|
3934
|
+
{ sessionId: turn.sessionId || body.sessionId },
|
|
3935
|
+
);
|
|
3936
|
+
if (providerQualityResult.enforced) {
|
|
3937
|
+
providerMeta.text = providerQualityResult.finalText;
|
|
3938
|
+
providerMeta.qualityEnforced = true;
|
|
3939
|
+
}
|
|
3940
|
+
|
|
3880
3941
|
recordProviderUsage(body, turn, providerMeta);
|
|
3881
3942
|
let hardCoachBlock = null;
|
|
3882
3943
|
let evaluation = await evaluateProviderCandidate(req, body, client, apiKey, turn, providerStyle, providerMeta, providerMeta.text || '');
|
|
@@ -4125,11 +4186,55 @@ async function handleProviderProxy(req, body, client, providerStyle, options = {
|
|
|
4125
4186
|
records: coachRecords,
|
|
4126
4187
|
},
|
|
4127
4188
|
};
|
|
4189
|
+
const finalQualityResult = await enforceQualityWithRecovery(
|
|
4190
|
+
finalText,
|
|
4191
|
+
deriveEffectiveKernel(turn, body),
|
|
4192
|
+
{ sessionId: turn.sessionId || body.sessionId },
|
|
4193
|
+
);
|
|
4194
|
+
if (finalQualityResult.enforced) {
|
|
4195
|
+
finalText = finalQualityResult.finalText;
|
|
4196
|
+
}
|
|
4197
|
+
|
|
4198
|
+
// ── Gated Ledger: final enforcement before release ──
|
|
4199
|
+
const gated = await enforceGates(finalText, {
|
|
4200
|
+
kernel: deriveEffectiveKernel(turn, body),
|
|
4201
|
+
sessionId: turn.sessionId || body.sessionId,
|
|
4202
|
+
});
|
|
4203
|
+
if (gated.enforced) {
|
|
4204
|
+
extra.gatedLedger = {
|
|
4205
|
+
enforced: true,
|
|
4206
|
+
gates: gated.gates,
|
|
4207
|
+
doctrineTriggers: gated.doctrineTriggers,
|
|
4208
|
+
recordId: gated.record.recordId,
|
|
4209
|
+
};
|
|
4210
|
+
}
|
|
4211
|
+
finalText = gated.finalText;
|
|
4212
|
+
|
|
4128
4213
|
return providerStyle === 'anthropic'
|
|
4129
4214
|
? anthropicResponseEnvelope(finalText, providerMeta, extra, body?.ariaDebug === true)
|
|
4130
4215
|
: openAiResponseEnvelope(body, finalText, providerMeta, extra);
|
|
4131
4216
|
}
|
|
4132
4217
|
|
|
4218
|
+
/**
 * Pull the assistant text out of an OpenAI-style response envelope.
 *
 * @param {*} response - expected shape: `{ choices: [{ message: { content } }] }`.
 * @returns {string|null} `choices[0].message.content` when it is a string;
 *   null for any other shape.
 */
function extractProviderResponseText(response) {
  if (response === null || typeof response !== 'object') {
    return null;
  }

  const { choices } = response;
  if (!Array.isArray(choices) || choices.length === 0) {
    return null;
  }

  const text = choices[0]?.message?.content;
  if (typeof text !== 'string') {
    return null;
  }
  return text;
}
|
|
4227
|
+
|
|
4228
|
+
/**
 * Pull the assistant text out of an Anthropic-style response envelope.
 *
 * @param {*} response - expected to carry a `content` field that is either a
 *   string or an array of content parts.
 * @returns {string|null} a string `content` as-is; for an array, the `text`
 *   of every part joined with single spaces (parts without text contribute
 *   an empty string) and trimmed, or null when that result is empty; null
 *   for any other shape.
 */
function extractAnthropicResponseText(response) {
  if (response === null || typeof response !== 'object') {
    return null;
  }

  const { content } = response;
  if (typeof content === 'string') {
    return content;
  }
  if (!Array.isArray(content)) {
    return null;
  }

  const pieces = [];
  for (const part of content) {
    pieces.push(part && part.text ? part.text : '');
  }
  const joined = pieces.join(' ').trim();
  return joined || null;
}
|
|
4237
|
+
|
|
4133
4238
|
async function handleForgeSynthesis(req, body, client) {
|
|
4134
4239
|
const apiKey = resolveApiKey(req, body);
|
|
4135
4240
|
const startedAt = Date.now();
|
|
@@ -5338,6 +5443,13 @@ async function handleRoute(req, res) {
|
|
|
5338
5443
|
|
|
5339
5444
|
if (providerPath === '/v1/chat/completions') {
|
|
5340
5445
|
const response = await handleProviderProxy(req, body, client, 'openai', ariaAuthOptions);
|
|
5446
|
+
const responseText = extractProviderResponseText(response);
|
|
5447
|
+
if (responseText) {
|
|
5448
|
+
const qScan = check(responseText);
|
|
5449
|
+
if (!qScan.allowed) {
|
|
5450
|
+
console.warn(`[quality-enforcer] Gate labels detected in OpenAI response after handleProviderProxy. ${qScan.reasons.join(', ')}`);
|
|
5451
|
+
}
|
|
5452
|
+
}
|
|
5341
5453
|
return json(res, 200, response);
|
|
5342
5454
|
}
|
|
5343
5455
|
|
|
@@ -5349,6 +5461,13 @@ async function handleRoute(req, res) {
|
|
|
5349
5461
|
|
|
5350
5462
|
if (providerPath === '/v1/messages') {
|
|
5351
5463
|
const response = await handleProviderProxy(req, body, client, 'anthropic', ariaAuthOptions);
|
|
5464
|
+
const responseText = extractAnthropicResponseText(response);
|
|
5465
|
+
if (responseText) {
|
|
5466
|
+
const qScan = check(responseText);
|
|
5467
|
+
if (!qScan.allowed) {
|
|
5468
|
+
console.warn(`[quality-enforcer] Gate labels detected in Anthropic response after handleProviderProxy. ${qScan.reasons.join(', ')}`);
|
|
5469
|
+
}
|
|
5470
|
+
}
|
|
5352
5471
|
return json(res, 200, response);
|
|
5353
5472
|
}
|
|
5354
5473
|
|
package/dist/sdk/BUNDLED.json
CHANGED