@gajae-code/coding-agent 0.6.4 → 0.6.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +22 -0
- package/dist/types/cli/migrate-cli.d.ts +20 -0
- package/dist/types/commands/migrate.d.ts +33 -0
- package/dist/types/config/keybindings.d.ts +4 -0
- package/dist/types/gjc-runtime/deep-interview-recorder.d.ts +2 -0
- package/dist/types/gjc-runtime/deep-interview-runtime.d.ts +2 -2
- package/dist/types/gjc-runtime/goal-mode-request.d.ts +1 -1
- package/dist/types/gjc-runtime/session-layout.d.ts +59 -0
- package/dist/types/gjc-runtime/session-resolution.d.ts +47 -0
- package/dist/types/gjc-runtime/state-graph.d.ts +1 -1
- package/dist/types/gjc-runtime/state-runtime.d.ts +5 -4
- package/dist/types/gjc-runtime/state-schema.d.ts +2 -0
- package/dist/types/gjc-runtime/state-writer.d.ts +36 -7
- package/dist/types/gjc-runtime/ultragoal-runtime.d.ts +7 -4
- package/dist/types/gjc-runtime/workflow-command-ref.d.ts +1 -1
- package/dist/types/gjc-runtime/workflow-manifest.d.ts +1 -1
- package/dist/types/harness-control-plane/storage.d.ts +2 -1
- package/dist/types/hooks/skill-state.d.ts +12 -4
- package/dist/types/migrate/action-planner.d.ts +11 -0
- package/dist/types/migrate/adapters/claude-code.d.ts +2 -0
- package/dist/types/migrate/adapters/codex.d.ts +5 -0
- package/dist/types/migrate/adapters/index.d.ts +45 -0
- package/dist/types/migrate/adapters/opencode.d.ts +2 -0
- package/dist/types/migrate/executor.d.ts +2 -0
- package/dist/types/migrate/mcp-mapper.d.ts +20 -0
- package/dist/types/migrate/report.d.ts +18 -0
- package/dist/types/migrate/skill-normalizer.d.ts +27 -0
- package/dist/types/migrate/types.d.ts +126 -0
- package/dist/types/modes/components/custom-editor.d.ts +1 -1
- package/dist/types/modes/shared/agent-wire/unattended-audit.d.ts +1 -1
- package/dist/types/research-plan/index.d.ts +1 -0
- package/dist/types/research-plan/ledger.d.ts +33 -0
- package/dist/types/rlm/artifacts.d.ts +1 -1
- package/dist/types/runtime-mcp/config-writer.d.ts +26 -0
- package/dist/types/skill-state/active-state.d.ts +6 -11
- package/dist/types/skill-state/canonical-skills.d.ts +3 -0
- package/dist/types/skill-state/workflow-hud.d.ts +2 -0
- package/dist/types/task/spawn-gate.d.ts +1 -10
- package/package.json +7 -7
- package/src/cli/migrate-cli.ts +106 -0
- package/src/cli.ts +1 -0
- package/src/commands/deep-interview.ts +2 -2
- package/src/commands/migrate.ts +46 -0
- package/src/commands/state.ts +2 -1
- package/src/commands/team.ts +7 -3
- package/src/coordinator-mcp/policy.ts +10 -2
- package/src/defaults/gjc/extensions/grok-cli-vendor/biome.json +0 -1
- package/src/defaults/gjc/skills/deep-interview/SKILL.md +28 -24
- package/src/defaults/gjc/skills/ralplan/SKILL.md +8 -4
- package/src/defaults/gjc/skills/team/SKILL.md +51 -47
- package/src/defaults/gjc/skills/ultragoal/SKILL.md +17 -13
- package/src/extensibility/custom-commands/loader.ts +0 -7
- package/src/extensibility/gjc-plugins/injection.ts +23 -4
- package/src/extensibility/gjc-plugins/state.ts +16 -1
- package/src/gjc-runtime/deep-interview-recorder.ts +43 -18
- package/src/gjc-runtime/deep-interview-runtime.ts +49 -23
- package/src/gjc-runtime/goal-mode-request.ts +26 -11
- package/src/gjc-runtime/launch-tmux.ts +6 -1
- package/src/gjc-runtime/ralplan-runtime.ts +79 -50
- package/src/gjc-runtime/session-layout.ts +180 -0
- package/src/gjc-runtime/session-resolution.ts +217 -0
- package/src/gjc-runtime/state-graph.ts +1 -2
- package/src/gjc-runtime/state-migrations.ts +1 -0
- package/src/gjc-runtime/state-runtime.ts +230 -121
- package/src/gjc-runtime/state-schema.ts +2 -0
- package/src/gjc-runtime/state-writer.ts +289 -41
- package/src/gjc-runtime/team-runtime.ts +43 -19
- package/src/gjc-runtime/tmux-sessions.ts +7 -1
- package/src/gjc-runtime/ultragoal-guard.ts +45 -2
- package/src/gjc-runtime/ultragoal-runtime.ts +121 -41
- package/src/gjc-runtime/workflow-command-ref.ts +1 -2
- package/src/gjc-runtime/workflow-manifest.ts +1 -2
- package/src/harness-control-plane/storage.ts +14 -4
- package/src/hooks/native-skill-hook.ts +38 -12
- package/src/hooks/skill-state.ts +178 -83
- package/src/internal-urls/docs-index.generated.ts +6 -4
- package/src/migrate/action-planner.ts +318 -0
- package/src/migrate/adapters/claude-code.ts +39 -0
- package/src/migrate/adapters/codex.ts +70 -0
- package/src/migrate/adapters/index.ts +277 -0
- package/src/migrate/adapters/opencode.ts +52 -0
- package/src/migrate/executor.ts +81 -0
- package/src/migrate/mcp-mapper.ts +152 -0
- package/src/migrate/report.ts +104 -0
- package/src/migrate/skill-normalizer.ts +80 -0
- package/src/migrate/types.ts +163 -0
- package/src/modes/bridge/bridge-mode.ts +2 -2
- package/src/modes/components/custom-editor.ts +30 -20
- package/src/modes/rpc/rpc-mode.ts +2 -2
- package/src/modes/shared/agent-wire/unattended-audit.ts +3 -2
- package/src/prompts/agents/init.md +1 -1
- package/src/prompts/system/plan-mode-active.md +1 -1
- package/src/prompts/tools/ast-grep.md +1 -1
- package/src/prompts/tools/search.md +1 -1
- package/src/prompts/tools/task.md +1 -2
- package/src/research-plan/index.ts +1 -0
- package/src/research-plan/ledger.ts +177 -0
- package/src/rlm/artifacts.ts +12 -3
- package/src/rlm/index.ts +7 -0
- package/src/runtime-mcp/config-writer.ts +46 -0
- package/src/session/agent-session.ts +15 -21
- package/src/setup/hermes-setup.ts +1 -1
- package/src/skill-state/active-state.ts +72 -108
- package/src/skill-state/canonical-skills.ts +4 -0
- package/src/skill-state/deep-interview-mutation-guard.ts +28 -109
- package/src/skill-state/workflow-hud.ts +4 -2
- package/src/skill-state/workflow-state-contract.ts +3 -3
- package/src/task/agents.ts +1 -22
- package/src/task/index.ts +1 -41
- package/src/task/spawn-gate.ts +1 -38
- package/src/task/types.ts +1 -1
- package/src/tools/ask.ts +34 -12
- package/src/tools/computer.ts +58 -4
- package/dist/types/extensibility/custom-commands/bundled/review/index.d.ts +0 -10
- package/src/extensibility/custom-commands/bundled/review/index.ts +0 -456
- package/src/prompts/agents/explore.md +0 -58
- package/src/prompts/agents/plan.md +0 -49
- package/src/prompts/agents/reviewer.md +0 -141
- package/src/prompts/agents/task.md +0 -16
- package/src/prompts/review-request.md +0 -70
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
import { Editor, type KeyId, matchesKey, parseKittySequence } from "@gajae-code/tui";
|
|
2
2
|
import { BracketedPasteHandler } from "@gajae-code/tui/bracketed-paste";
|
|
3
|
-
import type
|
|
3
|
+
import { type AppKeybinding, KEYBINDINGS } from "../../config/keybindings";
|
|
4
4
|
|
|
5
5
|
type ConfigurableEditorAction = Extract<
|
|
6
6
|
AppKeybinding,
|
|
@@ -23,25 +23,35 @@ type ConfigurableEditorAction = Extract<
|
|
|
23
23
|
| "app.clipboard.copyPrompt"
|
|
24
24
|
>;
|
|
25
25
|
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
"app.
|
|
31
|
-
"app.
|
|
32
|
-
"app.
|
|
33
|
-
"app.
|
|
34
|
-
"app.
|
|
35
|
-
"app.model.
|
|
36
|
-
"app.
|
|
37
|
-
"app.
|
|
38
|
-
"app.
|
|
39
|
-
"app.
|
|
40
|
-
"app.
|
|
41
|
-
"app.
|
|
42
|
-
"app.
|
|
43
|
-
"app.
|
|
44
|
-
|
|
26
|
+
// Editor-configurable app actions. Defaults are derived from the central
|
|
27
|
+
// KEYBINDINGS registry so there is a single source of truth (e.g. the
|
|
28
|
+
// platform-aware app.clipboard.pasteImage default is not duplicated here).
|
|
29
|
+
const CONFIGURABLE_EDITOR_ACTIONS = [
|
|
30
|
+
"app.interrupt",
|
|
31
|
+
"app.clear",
|
|
32
|
+
"app.exit",
|
|
33
|
+
"app.suspend",
|
|
34
|
+
"app.thinking.cycle",
|
|
35
|
+
"app.model.cycleForward",
|
|
36
|
+
"app.model.cycleBackward",
|
|
37
|
+
"app.model.select",
|
|
38
|
+
"app.model.selectTemporary",
|
|
39
|
+
"app.tools.expand",
|
|
40
|
+
"app.thinking.toggle",
|
|
41
|
+
"app.editor.external",
|
|
42
|
+
"app.history.search",
|
|
43
|
+
"app.message.queue",
|
|
44
|
+
"app.message.dequeue",
|
|
45
|
+
"app.clipboard.pasteImage",
|
|
46
|
+
"app.clipboard.copyPrompt",
|
|
47
|
+
] as const satisfies readonly ConfigurableEditorAction[];
|
|
48
|
+
|
|
49
|
+
const DEFAULT_ACTION_KEYS = Object.fromEntries(
|
|
50
|
+
CONFIGURABLE_EDITOR_ACTIONS.map(action => {
|
|
51
|
+
const defaultKeys = KEYBINDINGS[action].defaultKeys;
|
|
52
|
+
return [action, Array.isArray(defaultKeys) ? [...defaultKeys] : [defaultKeys]];
|
|
53
|
+
}),
|
|
54
|
+
) as Record<ConfigurableEditorAction, KeyId[]>;
|
|
45
55
|
|
|
46
56
|
const PASTE_DECISION_TIMEOUT_MS = 5_000;
|
|
47
57
|
const PENDING_PASTE_INPUT_MAX = 64;
|
|
@@ -11,13 +11,13 @@
|
|
|
11
11
|
* - Extension UI: Extension UI requests are emitted, client responds with extension_ui_response
|
|
12
12
|
*/
|
|
13
13
|
|
|
14
|
-
import * as path from "node:path";
|
|
15
14
|
import { $pickenv, logger, readLines, Snowflake } from "@gajae-code/utils";
|
|
16
15
|
import type {
|
|
17
16
|
ExtensionUIContext,
|
|
18
17
|
ExtensionUIDialogOptions,
|
|
19
18
|
ExtensionWidgetOptions,
|
|
20
19
|
} from "../../extensibility/extensions";
|
|
20
|
+
import { workflowGatePath } from "../../gjc-runtime/session-layout";
|
|
21
21
|
import { type Theme, theme } from "../../modes/theme/theme";
|
|
22
22
|
import type { AgentSession } from "../../session/agent-session";
|
|
23
23
|
import { initializeExtensions } from "../runtime-init";
|
|
@@ -336,7 +336,7 @@ export async function runRpcMode(
|
|
|
336
336
|
// Unattended control plane (#318/#319/#323/G011): routes negotiate_unattended +
|
|
337
337
|
// workflow_gate_response and lets skill runtimes emit gates over RPC.
|
|
338
338
|
const gateStore = new FileGateStore(
|
|
339
|
-
|
|
339
|
+
workflowGatePath(session.sessionManager.getCwd(), session.sessionId, session.sessionId),
|
|
340
340
|
);
|
|
341
341
|
const unattendedControlPlane = new UnattendedSessionControlPlane({
|
|
342
342
|
runId: session.sessionId,
|
|
@@ -12,6 +12,7 @@
|
|
|
12
12
|
*/
|
|
13
13
|
import { closeSync, fsyncSync, mkdirSync, openSync, readFileSync, writeSync } from "node:fs";
|
|
14
14
|
import * as path from "node:path";
|
|
15
|
+
import { sessionAuditDir } from "../../../gjc-runtime/session-layout";
|
|
15
16
|
import type { RpcBudgetExceeded, RpcWorkflowGateKind, RpcWorkflowStage } from "../../rpc/rpc-types";
|
|
16
17
|
import { answerHashOf } from "./workflow-gate-schema";
|
|
17
18
|
|
|
@@ -69,9 +70,9 @@ function defaultId(): string {
|
|
|
69
70
|
return `ae_${Date.now().toString(36)}_${idCounter.toString(36)}`;
|
|
70
71
|
}
|
|
71
72
|
|
|
72
|
-
export function defaultAuditPath(runId: string, root = process.cwd()): string {
|
|
73
|
+
export function defaultAuditPath(runId: string, root = process.cwd(), gjcSessionId = runId): string {
|
|
73
74
|
const safe = runId.replace(/[^a-zA-Z0-9_.-]/g, "_");
|
|
74
|
-
return path.join(root,
|
|
75
|
+
return path.join(sessionAuditDir(root, gjcSessionId), "unattended", `${safe}.jsonl`);
|
|
75
76
|
}
|
|
76
77
|
|
|
77
78
|
/** Append-only audit log writer + reader for one unattended run. */
|
|
@@ -5,7 +5,7 @@ thinking-level: medium
|
|
|
5
5
|
hide: true
|
|
6
6
|
---
|
|
7
7
|
|
|
8
|
-
Generate AGENTS.md by launching multiple
|
|
8
|
+
Generate AGENTS.md by launching multiple canonical role agents in parallel (via `task` tool, usually `planner` or `architect`) scanning different areas (core src, tests, configs/build, scripts/docs), then synthesize findings into a single file.
|
|
9
9
|
|
|
10
10
|
<structure>
|
|
11
11
|
- **Project Overview**: Brief description of project purpose
|
|
@@ -82,7 +82,7 @@ The plan MUST be scannable yet detailed enough to execute.
|
|
|
82
82
|
|
|
83
83
|
<procedure>
|
|
84
84
|
### Phase 1: Understand
|
|
85
|
-
You MUST focus on the request and associated code. You SHOULD launch parallel
|
|
85
|
+
You MUST focus on the request and associated code. You SHOULD launch parallel canonical role agents (`planner` or `architect`) when scope spans multiple areas.
|
|
86
86
|
|
|
87
87
|
### Phase 2: Design
|
|
88
88
|
You MUST draft an approach based on exploration. You MUST consider trade-offs briefly, then choose.
|
|
@@ -38,5 +38,5 @@ Performs structural code search using AST matching via native ast-grep.
|
|
|
38
38
|
<critical>
|
|
39
39
|
- Avoid repo-root scans — narrow `paths` first
|
|
40
40
|
- Parse issues are query failure, not evidence of absence: repair the pattern or tighten `paths` before concluding "no matches"
|
|
41
|
-
- For broad/open-ended
|
|
41
|
+
- For broad/open-ended inspection across subsystems, delegate a bounded fact-finding task to an appropriate canonical role agent (`planner` or `architect`) first
|
|
42
42
|
</critical>
|
|
@@ -21,5 +21,5 @@ Searches files using powerful regex matching.
|
|
|
21
21
|
- You MUST use the built-in `search` tool for any content search. NEVER shell out to `grep`, `rg`, `ripgrep`, `ag`, `ack`, `git grep`, `awk`, `sed`-for-search, or any other CLI search via Bash — even for a single match, even "just to check quickly", even piped through other commands.
|
|
22
22
|
- Bash `grep`/`rg` loses `.gitignore` semantics, bypasses result limits, and wastes tokens. The `search` tool is faster, structured, and already wired into the workspace — there is no scenario where Bash search is preferable.
|
|
23
23
|
- If you catch yourself typing `grep`, `rg`, or `| grep` in a Bash command, stop and re-issue the lookup through the `search` tool instead.
|
|
24
|
-
- If the search is open-ended
|
|
24
|
+
- If the search is open-ended and requires multiple rounds across subsystems, delegate a bounded fact-finding task to an appropriate canonical role agent (`planner` for sequencing/context maps or `architect` for read-only architecture assessment) instead of chaining broad `search` calls yourself.
|
|
25
25
|
</critical>
|
|
@@ -28,13 +28,12 @@ Subagents have no conversation history. Every fact, file path, and direction the
|
|
|
28
28
|
{{/if}}
|
|
29
29
|
{{#if independentMode}}- `.inheritContext`: independent mode cannot inherit parent conversation. Omit it or set `"none"`; any non-`none` value is rejected before scheduling.{{/if}}
|
|
30
30
|
{{#if customSchemaEnabled}}- `schema`: JTD schema for expected structured output (do not put format rules in assignments){{/if}}
|
|
31
|
-
- `spawnPlan` (optional): required before any batch with more than 4 tasks
|
|
31
|
+
- `spawnPlan` (optional): required before any batch with more than 4 tasks; include whyParallel, whyNotLocal, independence, expectedReceiptShape, and maxInlineTokens.
|
|
32
32
|
{{#if isolationEnabled}}- `isolated`: run in isolated env; use when tasks edit overlapping files{{/if}}
|
|
33
33
|
</parameters>
|
|
34
34
|
|
|
35
35
|
<rules>
|
|
36
36
|
- HARD runtime gate: calls with more than 4 tasks are rejected before any child launches unless `spawnPlan` is complete.
|
|
37
|
-
- Reviewer->explore gate: a `reviewer` spawning `explore` is rejected before launch unless `spawnPlan` is complete, even for a single task.
|
|
38
37
|
- NEVER assign tasks to run project-wide build/test/lint. Caller verifies after the batch.
|
|
39
38
|
- **Subagents do not verify, lint, or format.** Every assignment MUST instruct the subagent to skip all gates and formatters. You run them once at the end across the union of changed files — avoids redundant runs and racing formatter passes.
|
|
40
39
|
{{#if ircEnabled}}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
export * from "./ledger";
|
|
@@ -0,0 +1,177 @@
|
|
|
1
|
+
export type ResearchPlanConfidence = "low" | "medium" | "high";
|
|
2
|
+
|
|
3
|
+
export type ResearchEvidenceVerdict = "support" | "contradict" | "uncertain";
|
|
4
|
+
|
|
5
|
+
export interface ResearchPlanItem {
|
|
6
|
+
claim: string;
|
|
7
|
+
confidence: ResearchPlanConfidence;
|
|
8
|
+
unknowns: string[];
|
|
9
|
+
evidenceNeeded: string[];
|
|
10
|
+
counterexampleQueries: string[];
|
|
11
|
+
sourceConflictPolicy: string;
|
|
12
|
+
dropCondition: string;
|
|
13
|
+
verifierChecks: string[];
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
export interface ResearchEvidenceEntry {
|
|
17
|
+
claim: string;
|
|
18
|
+
source: string;
|
|
19
|
+
confidence: ResearchPlanConfidence;
|
|
20
|
+
verdict: ResearchEvidenceVerdict;
|
|
21
|
+
notes?: string;
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
export interface ResearchLedgerVerdict {
|
|
25
|
+
claim: string;
|
|
26
|
+
finalVerdict: "accepted" | "rejected" | "uncertain";
|
|
27
|
+
survivingSources: ResearchEvidenceEntry[];
|
|
28
|
+
rejectReason?: string;
|
|
29
|
+
unresolvedUnknowns: string[];
|
|
30
|
+
}
|
|
31
|
+
|
|
32
|
+
export interface ResearchPlanValidationResult {
|
|
33
|
+
valid: boolean;
|
|
34
|
+
errors: string[];
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
const CONFIDENCE_VALUES = new Set<ResearchPlanConfidence>(["low", "medium", "high"]);
|
|
38
|
+
const EVIDENCE_VERDICTS = new Set<ResearchEvidenceVerdict>(["support", "contradict", "uncertain"]);
|
|
39
|
+
|
|
40
|
+
function isNonEmptyString(value: unknown): value is string {
|
|
41
|
+
return typeof value === "string" && value.trim().length > 0;
|
|
42
|
+
}
|
|
43
|
+
|
|
44
|
+
function validateStringArray(value: unknown, field: string, minLength = 1): string[] {
|
|
45
|
+
if (!Array.isArray(value)) return [`${field} must be an array`];
|
|
46
|
+
if (value.length < minLength) return [`${field} must contain at least ${minLength} item(s)`];
|
|
47
|
+
return value.flatMap((item, index) =>
|
|
48
|
+
isNonEmptyString(item) ? [] : [`${field}[${index}] must be a non-empty string`],
|
|
49
|
+
);
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
export function validateResearchPlanItem(item: Partial<ResearchPlanItem>): ResearchPlanValidationResult {
|
|
53
|
+
const errors: string[] = [];
|
|
54
|
+
if (!isNonEmptyString(item.claim)) errors.push("claim must be a non-empty string");
|
|
55
|
+
if (!item.confidence || !CONFIDENCE_VALUES.has(item.confidence)) {
|
|
56
|
+
errors.push("confidence must be one of: low, medium, high");
|
|
57
|
+
}
|
|
58
|
+
errors.push(...validateStringArray(item.unknowns, "unknowns", 0));
|
|
59
|
+
errors.push(...validateStringArray(item.evidenceNeeded, "evidenceNeeded"));
|
|
60
|
+
errors.push(...validateStringArray(item.counterexampleQueries, "counterexampleQueries"));
|
|
61
|
+
if (!isNonEmptyString(item.sourceConflictPolicy)) errors.push("sourceConflictPolicy must be a non-empty string");
|
|
62
|
+
if (!isNonEmptyString(item.dropCondition)) errors.push("dropCondition must be a non-empty string");
|
|
63
|
+
errors.push(...validateStringArray(item.verifierChecks, "verifierChecks"));
|
|
64
|
+
return { valid: errors.length === 0, errors };
|
|
65
|
+
}
|
|
66
|
+
|
|
67
|
+
export function validateResearchEvidenceEntry(entry: Partial<ResearchEvidenceEntry>): ResearchPlanValidationResult {
|
|
68
|
+
const errors: string[] = [];
|
|
69
|
+
if (!isNonEmptyString(entry.claim)) errors.push("claim must be a non-empty string");
|
|
70
|
+
if (!isNonEmptyString(entry.source)) errors.push("source must be a non-empty string");
|
|
71
|
+
if (!entry.confidence || !CONFIDENCE_VALUES.has(entry.confidence)) {
|
|
72
|
+
errors.push("confidence must be one of: low, medium, high");
|
|
73
|
+
}
|
|
74
|
+
if (!entry.verdict || !EVIDENCE_VERDICTS.has(entry.verdict)) {
|
|
75
|
+
errors.push("verdict must be one of: support, contradict, uncertain");
|
|
76
|
+
}
|
|
77
|
+
return { valid: errors.length === 0, errors };
|
|
78
|
+
}
|
|
79
|
+
|
|
80
|
+
function lower(value: string): string {
|
|
81
|
+
return value.toLowerCase();
|
|
82
|
+
}
|
|
83
|
+
|
|
84
|
+
function matchesDropCondition(item: ResearchPlanItem, evidence: ResearchEvidenceEntry[]): string | undefined {
|
|
85
|
+
const condition = lower(item.dropCondition);
|
|
86
|
+
const contradiction = evidence.find(entry => entry.verdict === "contradict");
|
|
87
|
+
if (contradiction && /(counterexample|contradict|conflict|falsif)/.test(condition)) {
|
|
88
|
+
return `dropCondition matched by contradictory source: ${contradiction.source}`;
|
|
89
|
+
}
|
|
90
|
+
const unresolved = evidence.find(entry => entry.verdict === "uncertain");
|
|
91
|
+
if (unresolved && /(unknown|unresolved|uncertain)/.test(condition)) {
|
|
92
|
+
return `dropCondition matched by unresolved evidence: ${unresolved.source}`;
|
|
93
|
+
}
|
|
94
|
+
return undefined;
|
|
95
|
+
}
|
|
96
|
+
|
|
97
|
+
function sourceConflictReason(item: ResearchPlanItem, evidence: ResearchEvidenceEntry[]): string | undefined {
|
|
98
|
+
const supporting = evidence.filter(entry => entry.verdict === "support");
|
|
99
|
+
const contradicting = evidence.filter(entry => entry.verdict === "contradict");
|
|
100
|
+
if (supporting.length === 0 || contradicting.length === 0) return undefined;
|
|
101
|
+
const policy = lower(item.sourceConflictPolicy);
|
|
102
|
+
if (/(reject|drop|do not accept|prefer contradiction|requires resolution)/.test(policy)) {
|
|
103
|
+
return `sourceConflictPolicy rejected mixed support/contradiction (${supporting.length} support, ${contradicting.length} contradict)`;
|
|
104
|
+
}
|
|
105
|
+
return "source conflict remains unresolved";
|
|
106
|
+
}
|
|
107
|
+
|
|
108
|
+
export function evaluateResearchLedger(
|
|
109
|
+
item: ResearchPlanItem,
|
|
110
|
+
evidence: readonly ResearchEvidenceEntry[],
|
|
111
|
+
): ResearchLedgerVerdict {
|
|
112
|
+
const relevantEvidence = evidence.filter(entry => entry.claim === item.claim);
|
|
113
|
+
const invalidItem = validateResearchPlanItem(item);
|
|
114
|
+
if (!invalidItem.valid) {
|
|
115
|
+
return {
|
|
116
|
+
claim: item.claim,
|
|
117
|
+
finalVerdict: "rejected",
|
|
118
|
+
survivingSources: [],
|
|
119
|
+
rejectReason: `invalid research plan item: ${invalidItem.errors.join("; ")}`,
|
|
120
|
+
unresolvedUnknowns: item.unknowns,
|
|
121
|
+
};
|
|
122
|
+
}
|
|
123
|
+
const invalidEvidence = relevantEvidence.flatMap(entry => validateResearchEvidenceEntry(entry).errors);
|
|
124
|
+
if (invalidEvidence.length > 0) {
|
|
125
|
+
return {
|
|
126
|
+
claim: item.claim,
|
|
127
|
+
finalVerdict: "rejected",
|
|
128
|
+
survivingSources: [],
|
|
129
|
+
rejectReason: `invalid evidence entry: ${invalidEvidence.join("; ")}`,
|
|
130
|
+
unresolvedUnknowns: item.unknowns,
|
|
131
|
+
};
|
|
132
|
+
}
|
|
133
|
+
if (relevantEvidence.length === 0) {
|
|
134
|
+
return {
|
|
135
|
+
claim: item.claim,
|
|
136
|
+
finalVerdict: "uncertain",
|
|
137
|
+
survivingSources: [],
|
|
138
|
+
rejectReason: "no evidence collected for claim",
|
|
139
|
+
unresolvedUnknowns: item.unknowns,
|
|
140
|
+
};
|
|
141
|
+
}
|
|
142
|
+
const supporting = relevantEvidence.filter(entry => entry.verdict === "support");
|
|
143
|
+
const firstContradiction = relevantEvidence.find(entry => entry.verdict === "contradict");
|
|
144
|
+
let dropReason = matchesDropCondition(item, relevantEvidence) ?? sourceConflictReason(item, relevantEvidence);
|
|
145
|
+
// A counterexample with no surviving support falsifies the claim regardless of how the
|
|
146
|
+
// dropCondition / sourceConflictPolicy prose is worded. Without this, a purely contradicted
|
|
147
|
+
// claim would slip through as "uncertain" and reopen the hallucination survival path the
|
|
148
|
+
// evidence ledger exists to close (a contested claim already rejects via sourceConflictReason).
|
|
149
|
+
if (!dropReason && firstContradiction && supporting.length === 0) {
|
|
150
|
+
dropReason = `claim contradicted by counterexample with no supporting evidence: ${firstContradiction.source}`;
|
|
151
|
+
}
|
|
152
|
+
if (dropReason) {
|
|
153
|
+
return {
|
|
154
|
+
claim: item.claim,
|
|
155
|
+
finalVerdict: "rejected",
|
|
156
|
+
survivingSources: supporting,
|
|
157
|
+
rejectReason: dropReason,
|
|
158
|
+
unresolvedUnknowns: item.unknowns,
|
|
159
|
+
};
|
|
160
|
+
}
|
|
161
|
+
const uncertain = relevantEvidence.some(entry => entry.verdict === "uncertain");
|
|
162
|
+
if (uncertain || supporting.length === 0) {
|
|
163
|
+
return {
|
|
164
|
+
claim: item.claim,
|
|
165
|
+
finalVerdict: "uncertain",
|
|
166
|
+
survivingSources: supporting,
|
|
167
|
+
rejectReason: uncertain ? "unresolved uncertainty remains" : "no supporting evidence survived verification",
|
|
168
|
+
unresolvedUnknowns: item.unknowns,
|
|
169
|
+
};
|
|
170
|
+
}
|
|
171
|
+
return {
|
|
172
|
+
claim: item.claim,
|
|
173
|
+
finalVerdict: "accepted",
|
|
174
|
+
survivingSources: supporting,
|
|
175
|
+
unresolvedUnknowns: [],
|
|
176
|
+
};
|
|
177
|
+
}
|
package/src/rlm/artifacts.ts
CHANGED
|
@@ -1,12 +1,17 @@
|
|
|
1
1
|
/**
|
|
2
|
-
* RLM session artifact layout under <cwd>/.gjc/rlm/<
|
|
2
|
+
* RLM session artifact layout under <cwd>/.gjc/_session-{gjcSessionId}/rlm/<rlmSessionId>/.
|
|
3
|
+
*
|
|
4
|
+
* The GJC session id (process boundary) scopes the directory; the RLM session id
|
|
5
|
+
* names the individual research run within it. The two ids are kept distinct.
|
|
3
6
|
*/
|
|
4
7
|
import * as fs from "node:fs/promises";
|
|
5
8
|
import * as path from "node:path";
|
|
6
9
|
import { readNotebookDocument } from "../edit/notebook";
|
|
10
|
+
import { rlmArtifactRoot } from "../gjc-runtime/session-layout";
|
|
11
|
+
import { resolveGjcSessionForWrite } from "../gjc-runtime/session-resolution";
|
|
7
12
|
import type { RlmArtifactPaths } from "./types";
|
|
8
13
|
|
|
9
|
-
export const RLM_DIR_SEGMENT =
|
|
14
|
+
export const RLM_DIR_SEGMENT = "rlm";
|
|
10
15
|
|
|
11
16
|
const SESSION_ID_RE = /^[A-Za-z0-9_-]+$/;
|
|
12
17
|
|
|
@@ -25,7 +30,11 @@ export function resolveRlmArtifactPaths(cwd: string, sessionId: string): RlmArti
|
|
|
25
30
|
if (!isValidRlmSessionId(sessionId)) {
|
|
26
31
|
throw new Error(`Invalid RLM session id: ${JSON.stringify(sessionId)}`);
|
|
27
32
|
}
|
|
28
|
-
const dir =
|
|
33
|
+
const dir = rlmArtifactRoot(
|
|
34
|
+
cwd,
|
|
35
|
+
resolveGjcSessionForWrite(cwd, { envSessionId: process.env.GJC_SESSION_ID }).gjcSessionId,
|
|
36
|
+
sessionId,
|
|
37
|
+
);
|
|
29
38
|
return {
|
|
30
39
|
dir,
|
|
31
40
|
notebookPath: path.join(dir, "notebook.ipynb"),
|
package/src/rlm/index.ts
CHANGED
|
@@ -11,6 +11,7 @@ import { getProjectDir } from "@gajae-code/utils";
|
|
|
11
11
|
import { type Args, parseArgs } from "../cli/args";
|
|
12
12
|
import { disposeKernelSessionsByOwner } from "../eval/py/executor";
|
|
13
13
|
import type { CustomTool } from "../extensibility/custom-tools/types";
|
|
14
|
+
import { resolveSessionIdFromSources, writeSessionActivityMarker } from "../gjc-runtime/session-resolution";
|
|
14
15
|
import { type RlmPreset, runRootCommand } from "../main";
|
|
15
16
|
import rlmReportCommandPrompt from "../prompts/system/rlm-report-command.md" with { type: "text" };
|
|
16
17
|
import type { CreateAgentSessionOptions } from "../sdk";
|
|
@@ -231,6 +232,12 @@ async function writeRlmMetadata(input: {
|
|
|
231
232
|
successfulRuns: input.successfulRuns,
|
|
232
233
|
};
|
|
233
234
|
await Bun.write(input.paths.metadataPath, `${JSON.stringify(metadata, null, 2)}\n`);
|
|
235
|
+
// Best-effort: update the per-session activity marker so latest-session auto-detect
|
|
236
|
+
// accounts for RLM-only generated output (AC2). Never let marker failure break RLM.
|
|
237
|
+
const gjcSessionId = resolveSessionIdFromSources({ envSessionId: process.env.GJC_SESSION_ID })?.gjcSessionId;
|
|
238
|
+
if (gjcSessionId) {
|
|
239
|
+
await writeSessionActivityMarker(input.cwd, gjcSessionId, { writer: "rlm" }).catch(() => {});
|
|
240
|
+
}
|
|
234
241
|
}
|
|
235
242
|
|
|
236
243
|
export async function runRlmCommand(argv: string[]): Promise<void> {
|
|
@@ -149,6 +149,52 @@ export async function updateMCPServer(filePath: string, name: string, config: MC
|
|
|
149
149
|
await writeMCPConfigFile(filePath, updated);
|
|
150
150
|
}
|
|
151
151
|
|
|
152
|
+
/**
|
|
153
|
+
* Result of an {@link upsertMCPServer} call.
|
|
154
|
+
* - `added`: server did not exist and was written.
|
|
155
|
+
* - `updated`: server existed and was overwritten because `force` was set.
|
|
156
|
+
* - `skipped`: server existed and `force` was not set, so nothing was written.
|
|
157
|
+
*/
|
|
158
|
+
export type UpsertMCPServerResult =
|
|
159
|
+
| { status: "added" }
|
|
160
|
+
| { status: "updated" }
|
|
161
|
+
| { status: "skipped"; reason: "exists" };
|
|
162
|
+
|
|
163
|
+
/**
|
|
164
|
+
* Add an MCP server, or overwrite an existing one only when `force` is set.
|
|
165
|
+
*
|
|
166
|
+
* Collision-aware wrapper over {@link addMCPServer} / {@link updateMCPServer} used by
|
|
167
|
+
* `gjc migrate`. Never connects to the server. Reuses the underlying writers so the
|
|
168
|
+
* rest of the config file (including `disabledServers`) is preserved on update.
|
|
169
|
+
*
|
|
170
|
+
* @throws Error if the server name or config is invalid (validated before any write).
|
|
171
|
+
*/
|
|
172
|
+
export async function upsertMCPServer(
|
|
173
|
+
filePath: string,
|
|
174
|
+
name: string,
|
|
175
|
+
config: MCPServerConfig,
|
|
176
|
+
options: { force?: boolean } = {},
|
|
177
|
+
): Promise<UpsertMCPServerResult> {
|
|
178
|
+
// Validate name up front so an invalid name fails regardless of collision state.
|
|
179
|
+
const nameError = validateServerName(name);
|
|
180
|
+
if (nameError) {
|
|
181
|
+
throw new Error(nameError);
|
|
182
|
+
}
|
|
183
|
+
|
|
184
|
+
const existing = await getMCPServer(filePath, name);
|
|
185
|
+
if (existing) {
|
|
186
|
+
if (!options.force) {
|
|
187
|
+
return { status: "skipped", reason: "exists" };
|
|
188
|
+
}
|
|
189
|
+
// updateMCPServer preserves the rest of MCPConfigFile, incl. disabledServers.
|
|
190
|
+
await updateMCPServer(filePath, name, config);
|
|
191
|
+
return { status: "updated" };
|
|
192
|
+
}
|
|
193
|
+
|
|
194
|
+
await addMCPServer(filePath, name, config);
|
|
195
|
+
return { status: "added" };
|
|
196
|
+
}
|
|
197
|
+
|
|
152
198
|
/**
|
|
153
199
|
* Remove an MCP server from a config file.
|
|
154
200
|
*
|
|
@@ -183,6 +183,11 @@ import type { HookCommandContext } from "../extensibility/hooks/types";
|
|
|
183
183
|
import type { Skill, SkillWarning } from "../extensibility/skills";
|
|
184
184
|
import { expandSlashCommand, type FileSlashCommand } from "../extensibility/slash-commands";
|
|
185
185
|
import { buildGjcRuntimeSessionEnv, consumePendingGoalModeRequest } from "../gjc-runtime/goal-mode-request";
|
|
186
|
+
import {
|
|
187
|
+
assertNonEmptyGjcSessionId,
|
|
188
|
+
modeStatePath as sessionModeStatePath,
|
|
189
|
+
sessionStateDir,
|
|
190
|
+
} from "../gjc-runtime/session-layout";
|
|
186
191
|
import { persistCoordinatorRuntimeStateFromEvent } from "../gjc-runtime/session-state-sidecar";
|
|
187
192
|
import { writeArtifact } from "../gjc-runtime/state-writer";
|
|
188
193
|
import { requestGjcWorkerIntegrationAttempt } from "../gjc-runtime/team-runtime";
|
|
@@ -312,13 +317,6 @@ export type AgentSessionEvent =
|
|
|
312
317
|
| { type: "thinking_level_changed"; thinkingLevel: ThinkingLevel | undefined }
|
|
313
318
|
| { type: "goal_updated"; goal: Goal | null; state?: GoalModeState };
|
|
314
319
|
|
|
315
|
-
/**
|
|
316
|
-
* Safe path component pattern used to validate session-id segments before
|
|
317
|
-
* joining them into `.gjc/state` paths. Mirrors the regex used by the
|
|
318
|
-
* `gjc state` runtime selector resolver.
|
|
319
|
-
*/
|
|
320
|
-
const SAFE_PATH_COMPONENT = /^[A-Za-z0-9_-][A-Za-z0-9._-]{0,63}$/;
|
|
321
|
-
|
|
322
320
|
function isUnderProjectGjc(cwd: string, targetPath: string): boolean {
|
|
323
321
|
const relative = path.relative(path.join(path.resolve(cwd), ".gjc"), path.resolve(targetPath));
|
|
324
322
|
return relative === "" || (!relative.startsWith("..") && !path.isAbsolute(relative));
|
|
@@ -1370,21 +1368,17 @@ export class AgentSession {
|
|
|
1370
1368
|
getActiveSkillPhase(): string | undefined {
|
|
1371
1369
|
const active = this.#activeSkillState;
|
|
1372
1370
|
if (!active) return undefined;
|
|
1373
|
-
// Path safety: refuse to read mode-state files when the skill or
|
|
1374
|
-
// session-id are not safe path components. The `skill` tool
|
|
1375
|
-
// interprets undefined as a non-terminal phase, so chaining is
|
|
1376
|
-
// refused — there is no risk of bypassing the guard via a custom
|
|
1377
|
-
// skill name with `..` or a session-id with separators.
|
|
1378
1371
|
if (!isCanonicalGjcWorkflowSkill(active.skill)) return undefined;
|
|
1379
|
-
|
|
1380
|
-
return undefined;
|
|
1381
|
-
}
|
|
1372
|
+
const sessionId = active.sessionId ?? this.sessionManager.getSessionId();
|
|
1382
1373
|
try {
|
|
1383
|
-
|
|
1384
|
-
|
|
1385
|
-
|
|
1386
|
-
|
|
1387
|
-
const filePath = path.join(
|
|
1374
|
+
assertNonEmptyGjcSessionId(sessionId, "AgentSession.getActiveSkillPhase");
|
|
1375
|
+
// Keep the session-state-dir construction explicit here so the chain guard
|
|
1376
|
+
// refuses to fall back to a legacy root `.gjc/state` read.
|
|
1377
|
+
const stateDir = sessionStateDir(this.sessionManager.getCwd(), sessionId);
|
|
1378
|
+
const filePath = path.join(
|
|
1379
|
+
stateDir,
|
|
1380
|
+
path.basename(sessionModeStatePath(this.sessionManager.getCwd(), sessionId, active.skill)),
|
|
1381
|
+
);
|
|
1388
1382
|
const raw = fs.readFileSync(filePath, "utf-8");
|
|
1389
1383
|
const parsed = JSON.parse(raw) as { current_phase?: unknown };
|
|
1390
1384
|
return typeof parsed.current_phase === "string" ? parsed.current_phase : undefined;
|
|
@@ -3763,7 +3757,7 @@ export class AgentSession {
|
|
|
3763
3757
|
* prompts or tool execution can run.
|
|
3764
3758
|
*/
|
|
3765
3759
|
#wrapToolForDeepInterviewMutationGuard<T extends AgentTool>(tool: T): T {
|
|
3766
|
-
if (!["edit", "write", "ast_edit"
|
|
3760
|
+
if (!["edit", "write", "ast_edit"].includes(tool.name)) return tool;
|
|
3767
3761
|
return new Proxy(tool, {
|
|
3768
3762
|
get: (target, prop) => {
|
|
3769
3763
|
if (prop !== "execute") return Reflect.get(target, prop, target);
|
|
@@ -404,7 +404,7 @@ async function installConfig(spec: CoordinatorSetupSpec, force: boolean): Promis
|
|
|
404
404
|
|
|
405
405
|
async function runSmoke(spec: CoordinatorSetupSpec): Promise<HermesSetupResult["smoke"]> {
|
|
406
406
|
const requiredTools = [...COORDINATOR_MCP_TOOL_NAMES];
|
|
407
|
-
const server = createCoordinatorMcpServer({ env:
|
|
407
|
+
const server = createCoordinatorMcpServer({ env: renderHermesServerBlock(spec).env as NodeJS.ProcessEnv });
|
|
408
408
|
const listed = await server.handleJsonRpc({ jsonrpc: "2.0", id: 1, method: "tools/list", params: {} });
|
|
409
409
|
const listedResult = isRecord(listed.result) ? listed.result : {};
|
|
410
410
|
const tools = Array.isArray(listedResult.tools) ? listedResult.tools : [];
|