@gajae-code/coding-agent 0.6.4 → 0.6.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (120) hide show
  1. package/CHANGELOG.md +22 -0
  2. package/dist/types/cli/migrate-cli.d.ts +20 -0
  3. package/dist/types/commands/migrate.d.ts +33 -0
  4. package/dist/types/config/keybindings.d.ts +4 -0
  5. package/dist/types/gjc-runtime/deep-interview-recorder.d.ts +2 -0
  6. package/dist/types/gjc-runtime/deep-interview-runtime.d.ts +2 -2
  7. package/dist/types/gjc-runtime/goal-mode-request.d.ts +1 -1
  8. package/dist/types/gjc-runtime/session-layout.d.ts +59 -0
  9. package/dist/types/gjc-runtime/session-resolution.d.ts +47 -0
  10. package/dist/types/gjc-runtime/state-graph.d.ts +1 -1
  11. package/dist/types/gjc-runtime/state-runtime.d.ts +5 -4
  12. package/dist/types/gjc-runtime/state-schema.d.ts +2 -0
  13. package/dist/types/gjc-runtime/state-writer.d.ts +36 -7
  14. package/dist/types/gjc-runtime/ultragoal-runtime.d.ts +7 -4
  15. package/dist/types/gjc-runtime/workflow-command-ref.d.ts +1 -1
  16. package/dist/types/gjc-runtime/workflow-manifest.d.ts +1 -1
  17. package/dist/types/harness-control-plane/storage.d.ts +2 -1
  18. package/dist/types/hooks/skill-state.d.ts +12 -4
  19. package/dist/types/migrate/action-planner.d.ts +11 -0
  20. package/dist/types/migrate/adapters/claude-code.d.ts +2 -0
  21. package/dist/types/migrate/adapters/codex.d.ts +5 -0
  22. package/dist/types/migrate/adapters/index.d.ts +45 -0
  23. package/dist/types/migrate/adapters/opencode.d.ts +2 -0
  24. package/dist/types/migrate/executor.d.ts +2 -0
  25. package/dist/types/migrate/mcp-mapper.d.ts +20 -0
  26. package/dist/types/migrate/report.d.ts +18 -0
  27. package/dist/types/migrate/skill-normalizer.d.ts +27 -0
  28. package/dist/types/migrate/types.d.ts +126 -0
  29. package/dist/types/modes/components/custom-editor.d.ts +1 -1
  30. package/dist/types/modes/shared/agent-wire/unattended-audit.d.ts +1 -1
  31. package/dist/types/research-plan/index.d.ts +1 -0
  32. package/dist/types/research-plan/ledger.d.ts +33 -0
  33. package/dist/types/rlm/artifacts.d.ts +1 -1
  34. package/dist/types/runtime-mcp/config-writer.d.ts +26 -0
  35. package/dist/types/skill-state/active-state.d.ts +6 -11
  36. package/dist/types/skill-state/canonical-skills.d.ts +3 -0
  37. package/dist/types/skill-state/workflow-hud.d.ts +2 -0
  38. package/dist/types/task/spawn-gate.d.ts +1 -10
  39. package/package.json +7 -7
  40. package/src/cli/migrate-cli.ts +106 -0
  41. package/src/cli.ts +1 -0
  42. package/src/commands/deep-interview.ts +2 -2
  43. package/src/commands/migrate.ts +46 -0
  44. package/src/commands/state.ts +2 -1
  45. package/src/commands/team.ts +7 -3
  46. package/src/coordinator-mcp/policy.ts +10 -2
  47. package/src/defaults/gjc/extensions/grok-cli-vendor/biome.json +0 -1
  48. package/src/defaults/gjc/skills/deep-interview/SKILL.md +28 -24
  49. package/src/defaults/gjc/skills/ralplan/SKILL.md +8 -4
  50. package/src/defaults/gjc/skills/team/SKILL.md +51 -47
  51. package/src/defaults/gjc/skills/ultragoal/SKILL.md +17 -13
  52. package/src/extensibility/custom-commands/loader.ts +0 -7
  53. package/src/extensibility/gjc-plugins/injection.ts +23 -4
  54. package/src/extensibility/gjc-plugins/state.ts +16 -1
  55. package/src/gjc-runtime/deep-interview-recorder.ts +43 -18
  56. package/src/gjc-runtime/deep-interview-runtime.ts +49 -23
  57. package/src/gjc-runtime/goal-mode-request.ts +26 -11
  58. package/src/gjc-runtime/launch-tmux.ts +6 -1
  59. package/src/gjc-runtime/ralplan-runtime.ts +79 -50
  60. package/src/gjc-runtime/session-layout.ts +180 -0
  61. package/src/gjc-runtime/session-resolution.ts +217 -0
  62. package/src/gjc-runtime/state-graph.ts +1 -2
  63. package/src/gjc-runtime/state-migrations.ts +1 -0
  64. package/src/gjc-runtime/state-runtime.ts +230 -121
  65. package/src/gjc-runtime/state-schema.ts +2 -0
  66. package/src/gjc-runtime/state-writer.ts +289 -41
  67. package/src/gjc-runtime/team-runtime.ts +43 -19
  68. package/src/gjc-runtime/tmux-sessions.ts +7 -1
  69. package/src/gjc-runtime/ultragoal-guard.ts +45 -2
  70. package/src/gjc-runtime/ultragoal-runtime.ts +121 -41
  71. package/src/gjc-runtime/workflow-command-ref.ts +1 -2
  72. package/src/gjc-runtime/workflow-manifest.ts +1 -2
  73. package/src/harness-control-plane/storage.ts +14 -4
  74. package/src/hooks/native-skill-hook.ts +38 -12
  75. package/src/hooks/skill-state.ts +178 -83
  76. package/src/internal-urls/docs-index.generated.ts +6 -4
  77. package/src/migrate/action-planner.ts +318 -0
  78. package/src/migrate/adapters/claude-code.ts +39 -0
  79. package/src/migrate/adapters/codex.ts +70 -0
  80. package/src/migrate/adapters/index.ts +277 -0
  81. package/src/migrate/adapters/opencode.ts +52 -0
  82. package/src/migrate/executor.ts +81 -0
  83. package/src/migrate/mcp-mapper.ts +152 -0
  84. package/src/migrate/report.ts +104 -0
  85. package/src/migrate/skill-normalizer.ts +80 -0
  86. package/src/migrate/types.ts +163 -0
  87. package/src/modes/bridge/bridge-mode.ts +2 -2
  88. package/src/modes/components/custom-editor.ts +30 -20
  89. package/src/modes/rpc/rpc-mode.ts +2 -2
  90. package/src/modes/shared/agent-wire/unattended-audit.ts +3 -2
  91. package/src/prompts/agents/init.md +1 -1
  92. package/src/prompts/system/plan-mode-active.md +1 -1
  93. package/src/prompts/tools/ast-grep.md +1 -1
  94. package/src/prompts/tools/search.md +1 -1
  95. package/src/prompts/tools/task.md +1 -2
  96. package/src/research-plan/index.ts +1 -0
  97. package/src/research-plan/ledger.ts +177 -0
  98. package/src/rlm/artifacts.ts +12 -3
  99. package/src/rlm/index.ts +7 -0
  100. package/src/runtime-mcp/config-writer.ts +46 -0
  101. package/src/session/agent-session.ts +15 -21
  102. package/src/setup/hermes-setup.ts +1 -1
  103. package/src/skill-state/active-state.ts +72 -108
  104. package/src/skill-state/canonical-skills.ts +4 -0
  105. package/src/skill-state/deep-interview-mutation-guard.ts +28 -109
  106. package/src/skill-state/workflow-hud.ts +4 -2
  107. package/src/skill-state/workflow-state-contract.ts +3 -3
  108. package/src/task/agents.ts +1 -22
  109. package/src/task/index.ts +1 -41
  110. package/src/task/spawn-gate.ts +1 -38
  111. package/src/task/types.ts +1 -1
  112. package/src/tools/ask.ts +34 -12
  113. package/src/tools/computer.ts +58 -4
  114. package/dist/types/extensibility/custom-commands/bundled/review/index.d.ts +0 -10
  115. package/src/extensibility/custom-commands/bundled/review/index.ts +0 -456
  116. package/src/prompts/agents/explore.md +0 -58
  117. package/src/prompts/agents/plan.md +0 -49
  118. package/src/prompts/agents/reviewer.md +0 -141
  119. package/src/prompts/agents/task.md +0 -16
  120. package/src/prompts/review-request.md +0 -70
@@ -1,6 +1,6 @@
1
1
  import { Editor, type KeyId, matchesKey, parseKittySequence } from "@gajae-code/tui";
2
2
  import { BracketedPasteHandler } from "@gajae-code/tui/bracketed-paste";
3
- import type { AppKeybinding } from "../../config/keybindings";
3
+ import { type AppKeybinding, KEYBINDINGS } from "../../config/keybindings";
4
4
 
5
5
  type ConfigurableEditorAction = Extract<
6
6
  AppKeybinding,
@@ -23,25 +23,35 @@ type ConfigurableEditorAction = Extract<
23
23
  | "app.clipboard.copyPrompt"
24
24
  >;
25
25
 
26
- const DEFAULT_ACTION_KEYS: Record<ConfigurableEditorAction, KeyId[]> = {
27
- "app.interrupt": ["escape"],
28
- "app.clear": ["ctrl+c"],
29
- "app.exit": ["ctrl+d"],
30
- "app.suspend": ["ctrl+z"],
31
- "app.thinking.cycle": ["shift+tab"],
32
- "app.model.cycleForward": ["ctrl+p"],
33
- "app.model.cycleBackward": ["shift+ctrl+p"],
34
- "app.model.select": ["ctrl+l"],
35
- "app.model.selectTemporary": ["alt+p"],
36
- "app.tools.expand": ["ctrl+o"],
37
- "app.thinking.toggle": ["ctrl+t"],
38
- "app.editor.external": ["ctrl+g"],
39
- "app.history.search": ["ctrl+r"],
40
- "app.message.queue": ["alt+enter"],
41
- "app.message.dequeue": ["alt+up"],
42
- "app.clipboard.pasteImage": ["ctrl+v"],
43
- "app.clipboard.copyPrompt": ["alt+shift+c"],
44
- };
26
+ // Editor-configurable app actions. Defaults are derived from the central
27
+ // KEYBINDINGS registry so there is a single source of truth (e.g. the
28
+ // platform-aware app.clipboard.pasteImage default is not duplicated here).
29
+ const CONFIGURABLE_EDITOR_ACTIONS = [
30
+ "app.interrupt",
31
+ "app.clear",
32
+ "app.exit",
33
+ "app.suspend",
34
+ "app.thinking.cycle",
35
+ "app.model.cycleForward",
36
+ "app.model.cycleBackward",
37
+ "app.model.select",
38
+ "app.model.selectTemporary",
39
+ "app.tools.expand",
40
+ "app.thinking.toggle",
41
+ "app.editor.external",
42
+ "app.history.search",
43
+ "app.message.queue",
44
+ "app.message.dequeue",
45
+ "app.clipboard.pasteImage",
46
+ "app.clipboard.copyPrompt",
47
+ ] as const satisfies readonly ConfigurableEditorAction[];
48
+
49
+ const DEFAULT_ACTION_KEYS = Object.fromEntries(
50
+ CONFIGURABLE_EDITOR_ACTIONS.map(action => {
51
+ const defaultKeys = KEYBINDINGS[action].defaultKeys;
52
+ return [action, Array.isArray(defaultKeys) ? [...defaultKeys] : [defaultKeys]];
53
+ }),
54
+ ) as Record<ConfigurableEditorAction, KeyId[]>;
45
55
 
46
56
  const PASTE_DECISION_TIMEOUT_MS = 5_000;
47
57
  const PENDING_PASTE_INPUT_MAX = 64;
@@ -11,13 +11,13 @@
11
11
  * - Extension UI: Extension UI requests are emitted, client responds with extension_ui_response
12
12
  */
13
13
 
14
- import * as path from "node:path";
15
14
  import { $pickenv, logger, readLines, Snowflake } from "@gajae-code/utils";
16
15
  import type {
17
16
  ExtensionUIContext,
18
17
  ExtensionUIDialogOptions,
19
18
  ExtensionWidgetOptions,
20
19
  } from "../../extensibility/extensions";
20
+ import { workflowGatePath } from "../../gjc-runtime/session-layout";
21
21
  import { type Theme, theme } from "../../modes/theme/theme";
22
22
  import type { AgentSession } from "../../session/agent-session";
23
23
  import { initializeExtensions } from "../runtime-init";
@@ -336,7 +336,7 @@ export async function runRpcMode(
336
336
  // Unattended control plane (#318/#319/#323/G011): routes negotiate_unattended +
337
337
  // workflow_gate_response and lets skill runtimes emit gates over RPC.
338
338
  const gateStore = new FileGateStore(
339
- path.join(session.sessionManager.getCwd(), ".gjc", "state", "workflow-gates", `${session.sessionId}.json`),
339
+ workflowGatePath(session.sessionManager.getCwd(), session.sessionId, session.sessionId),
340
340
  );
341
341
  const unattendedControlPlane = new UnattendedSessionControlPlane({
342
342
  runId: session.sessionId,
@@ -12,6 +12,7 @@
12
12
  */
13
13
  import { closeSync, fsyncSync, mkdirSync, openSync, readFileSync, writeSync } from "node:fs";
14
14
  import * as path from "node:path";
15
+ import { sessionAuditDir } from "../../../gjc-runtime/session-layout";
15
16
  import type { RpcBudgetExceeded, RpcWorkflowGateKind, RpcWorkflowStage } from "../../rpc/rpc-types";
16
17
  import { answerHashOf } from "./workflow-gate-schema";
17
18
 
@@ -69,9 +70,9 @@ function defaultId(): string {
69
70
  return `ae_${Date.now().toString(36)}_${idCounter.toString(36)}`;
70
71
  }
71
72
 
72
- export function defaultAuditPath(runId: string, root = process.cwd()): string {
73
+ export function defaultAuditPath(runId: string, root = process.cwd(), gjcSessionId = runId): string {
73
74
  const safe = runId.replace(/[^a-zA-Z0-9_.-]/g, "_");
74
- return path.join(root, ".gjc", "audit", "unattended", `${safe}.jsonl`);
75
+ return path.join(sessionAuditDir(root, gjcSessionId), "unattended", `${safe}.jsonl`);
75
76
  }
76
77
 
77
78
  /** Append-only audit log writer + reader for one unattended run. */
@@ -5,7 +5,7 @@ thinking-level: medium
5
5
  hide: true
6
6
  ---
7
7
 
8
- Generate AGENTS.md by launching multiple `explore` agents in parallel (via `task` tool) scanning different areas (core src, tests, configs/build, scripts/docs), then synthesize findings into a single file.
8
+ Generate AGENTS.md by launching multiple canonical role agents in parallel (via `task` tool, usually `planner` or `architect`) scanning different areas (core src, tests, configs/build, scripts/docs), then synthesize findings into a single file.
9
9
 
10
10
  <structure>
11
11
  - **Project Overview**: Brief description of project purpose
@@ -82,7 +82,7 @@ The plan MUST be scannable yet detailed enough to execute.
82
82
 
83
83
  <procedure>
84
84
  ### Phase 1: Understand
85
- You MUST focus on the request and associated code. You SHOULD launch parallel explore agents when scope spans multiple areas.
85
+ You MUST focus on the request and associated code. You SHOULD launch parallel canonical role agents (`planner` or `architect`) when scope spans multiple areas.
86
86
 
87
87
  ### Phase 2: Design
88
88
  You MUST draft an approach based on exploration. You MUST consider trade-offs briefly, then choose.
@@ -38,5 +38,5 @@ Performs structural code search using AST matching via native ast-grep.
38
38
  <critical>
39
39
  - Avoid repo-root scans — narrow `paths` first
40
40
  - Parse issues are query failure, not evidence of absence: repair the pattern or tighten `paths` before concluding "no matches"
41
- - For broad/open-ended exploration across subsystems, use Task tool with explore subagent first
41
+ - For broad/open-ended inspection across subsystems, delegate a bounded fact-finding task to an appropriate canonical role agent (`planner` or `architect`) first
42
42
  </critical>
@@ -21,5 +21,5 @@ Searches files using powerful regex matching.
21
21
  - You MUST use the built-in `search` tool for any content search. NEVER shell out to `grep`, `rg`, `ripgrep`, `ag`, `ack`, `git grep`, `awk`, `sed`-for-search, or any other CLI search via Bash — even for a single match, even "just to check quickly", even piped through other commands.
22
22
  - Bash `grep`/`rg` loses `.gitignore` semantics, bypasses result limits, and wastes tokens. The `search` tool is faster, structured, and already wired into the workspace — there is no scenario where Bash search is preferable.
23
23
  - If you catch yourself typing `grep`, `rg`, or `| grep` in a Bash command, stop and re-issue the lookup through the `search` tool instead.
24
- - If the search is open-ended, requiring multiple rounds, you MUST use the Task tool with the explore subagent instead of chaining `search` calls yourself.
24
+ - If the search is open-ended and requires multiple rounds across subsystems, delegate a bounded fact-finding task to an appropriate canonical role agent (`planner` for sequencing/context maps or `architect` for read-only architecture assessment) instead of chaining broad `search` calls yourself.
25
25
  </critical>
@@ -28,13 +28,12 @@ Subagents have no conversation history. Every fact, file path, and direction the
28
28
  {{/if}}
29
29
  {{#if independentMode}}- `.inheritContext`: independent mode cannot inherit parent conversation. Omit it or set `"none"`; any non-`none` value is rejected before scheduling.{{/if}}
30
30
  {{#if customSchemaEnabled}}- `schema`: JTD schema for expected structured output (do not put format rules in assignments){{/if}}
31
- - `spawnPlan` (optional): required before any batch with more than 4 tasks, and before a reviewer agent spawns `explore`; include whyParallel, whyNotLocal, independence, expectedReceiptShape, and maxInlineTokens.
31
+ - `spawnPlan` (optional): required before any batch with more than 4 tasks; include whyParallel, whyNotLocal, independence, expectedReceiptShape, and maxInlineTokens.
32
32
  {{#if isolationEnabled}}- `isolated`: run in isolated env; use when tasks edit overlapping files{{/if}}
33
33
  </parameters>
34
34
 
35
35
  <rules>
36
36
  - HARD runtime gate: calls with more than 4 tasks are rejected before any child launches unless `spawnPlan` is complete.
37
- - Reviewer->explore gate: a `reviewer` spawning `explore` is rejected before launch unless `spawnPlan` is complete, even for a single task.
38
37
  - NEVER assign tasks to run project-wide build/test/lint. Caller verifies after the batch.
39
38
  - **Subagents do not verify, lint, or format.** Every assignment MUST instruct the subagent to skip all gates and formatters. You run them once at the end across the union of changed files — avoids redundant runs and racing formatter passes.
40
39
  {{#if ircEnabled}}
@@ -0,0 +1 @@
1
+ export * from "./ledger";
@@ -0,0 +1,177 @@
1
+ export type ResearchPlanConfidence = "low" | "medium" | "high";
2
+
3
+ export type ResearchEvidenceVerdict = "support" | "contradict" | "uncertain";
4
+
5
+ export interface ResearchPlanItem {
6
+ claim: string;
7
+ confidence: ResearchPlanConfidence;
8
+ unknowns: string[];
9
+ evidenceNeeded: string[];
10
+ counterexampleQueries: string[];
11
+ sourceConflictPolicy: string;
12
+ dropCondition: string;
13
+ verifierChecks: string[];
14
+ }
15
+
16
+ export interface ResearchEvidenceEntry {
17
+ claim: string;
18
+ source: string;
19
+ confidence: ResearchPlanConfidence;
20
+ verdict: ResearchEvidenceVerdict;
21
+ notes?: string;
22
+ }
23
+
24
+ export interface ResearchLedgerVerdict {
25
+ claim: string;
26
+ finalVerdict: "accepted" | "rejected" | "uncertain";
27
+ survivingSources: ResearchEvidenceEntry[];
28
+ rejectReason?: string;
29
+ unresolvedUnknowns: string[];
30
+ }
31
+
32
+ export interface ResearchPlanValidationResult {
33
+ valid: boolean;
34
+ errors: string[];
35
+ }
36
+
37
+ const CONFIDENCE_VALUES = new Set<ResearchPlanConfidence>(["low", "medium", "high"]);
38
+ const EVIDENCE_VERDICTS = new Set<ResearchEvidenceVerdict>(["support", "contradict", "uncertain"]);
39
+
40
+ function isNonEmptyString(value: unknown): value is string {
41
+ return typeof value === "string" && value.trim().length > 0;
42
+ }
43
+
44
+ function validateStringArray(value: unknown, field: string, minLength = 1): string[] {
45
+ if (!Array.isArray(value)) return [`${field} must be an array`];
46
+ if (value.length < minLength) return [`${field} must contain at least ${minLength} item(s)`];
47
+ return value.flatMap((item, index) =>
48
+ isNonEmptyString(item) ? [] : [`${field}[${index}] must be a non-empty string`],
49
+ );
50
+ }
51
+
52
+ export function validateResearchPlanItem(item: Partial<ResearchPlanItem>): ResearchPlanValidationResult {
53
+ const errors: string[] = [];
54
+ if (!isNonEmptyString(item.claim)) errors.push("claim must be a non-empty string");
55
+ if (!item.confidence || !CONFIDENCE_VALUES.has(item.confidence)) {
56
+ errors.push("confidence must be one of: low, medium, high");
57
+ }
58
+ errors.push(...validateStringArray(item.unknowns, "unknowns", 0));
59
+ errors.push(...validateStringArray(item.evidenceNeeded, "evidenceNeeded"));
60
+ errors.push(...validateStringArray(item.counterexampleQueries, "counterexampleQueries"));
61
+ if (!isNonEmptyString(item.sourceConflictPolicy)) errors.push("sourceConflictPolicy must be a non-empty string");
62
+ if (!isNonEmptyString(item.dropCondition)) errors.push("dropCondition must be a non-empty string");
63
+ errors.push(...validateStringArray(item.verifierChecks, "verifierChecks"));
64
+ return { valid: errors.length === 0, errors };
65
+ }
66
+
67
+ export function validateResearchEvidenceEntry(entry: Partial<ResearchEvidenceEntry>): ResearchPlanValidationResult {
68
+ const errors: string[] = [];
69
+ if (!isNonEmptyString(entry.claim)) errors.push("claim must be a non-empty string");
70
+ if (!isNonEmptyString(entry.source)) errors.push("source must be a non-empty string");
71
+ if (!entry.confidence || !CONFIDENCE_VALUES.has(entry.confidence)) {
72
+ errors.push("confidence must be one of: low, medium, high");
73
+ }
74
+ if (!entry.verdict || !EVIDENCE_VERDICTS.has(entry.verdict)) {
75
+ errors.push("verdict must be one of: support, contradict, uncertain");
76
+ }
77
+ return { valid: errors.length === 0, errors };
78
+ }
79
+
80
+ function lower(value: string): string {
81
+ return value.toLowerCase();
82
+ }
83
+
84
+ function matchesDropCondition(item: ResearchPlanItem, evidence: ResearchEvidenceEntry[]): string | undefined {
85
+ const condition = lower(item.dropCondition);
86
+ const contradiction = evidence.find(entry => entry.verdict === "contradict");
87
+ if (contradiction && /(counterexample|contradict|conflict|falsif)/.test(condition)) {
88
+ return `dropCondition matched by contradictory source: ${contradiction.source}`;
89
+ }
90
+ const unresolved = evidence.find(entry => entry.verdict === "uncertain");
91
+ if (unresolved && /(unknown|unresolved|uncertain)/.test(condition)) {
92
+ return `dropCondition matched by unresolved evidence: ${unresolved.source}`;
93
+ }
94
+ return undefined;
95
+ }
96
+
97
+ function sourceConflictReason(item: ResearchPlanItem, evidence: ResearchEvidenceEntry[]): string | undefined {
98
+ const supporting = evidence.filter(entry => entry.verdict === "support");
99
+ const contradicting = evidence.filter(entry => entry.verdict === "contradict");
100
+ if (supporting.length === 0 || contradicting.length === 0) return undefined;
101
+ const policy = lower(item.sourceConflictPolicy);
102
+ if (/(reject|drop|do not accept|prefer contradiction|requires resolution)/.test(policy)) {
103
+ return `sourceConflictPolicy rejected mixed support/contradiction (${supporting.length} support, ${contradicting.length} contradict)`;
104
+ }
105
+ return "source conflict remains unresolved";
106
+ }
107
+
108
+ export function evaluateResearchLedger(
109
+ item: ResearchPlanItem,
110
+ evidence: readonly ResearchEvidenceEntry[],
111
+ ): ResearchLedgerVerdict {
112
+ const relevantEvidence = evidence.filter(entry => entry.claim === item.claim);
113
+ const invalidItem = validateResearchPlanItem(item);
114
+ if (!invalidItem.valid) {
115
+ return {
116
+ claim: item.claim,
117
+ finalVerdict: "rejected",
118
+ survivingSources: [],
119
+ rejectReason: `invalid research plan item: ${invalidItem.errors.join("; ")}`,
120
+ unresolvedUnknowns: item.unknowns,
121
+ };
122
+ }
123
+ const invalidEvidence = relevantEvidence.flatMap(entry => validateResearchEvidenceEntry(entry).errors);
124
+ if (invalidEvidence.length > 0) {
125
+ return {
126
+ claim: item.claim,
127
+ finalVerdict: "rejected",
128
+ survivingSources: [],
129
+ rejectReason: `invalid evidence entry: ${invalidEvidence.join("; ")}`,
130
+ unresolvedUnknowns: item.unknowns,
131
+ };
132
+ }
133
+ if (relevantEvidence.length === 0) {
134
+ return {
135
+ claim: item.claim,
136
+ finalVerdict: "uncertain",
137
+ survivingSources: [],
138
+ rejectReason: "no evidence collected for claim",
139
+ unresolvedUnknowns: item.unknowns,
140
+ };
141
+ }
142
+ const supporting = relevantEvidence.filter(entry => entry.verdict === "support");
143
+ const firstContradiction = relevantEvidence.find(entry => entry.verdict === "contradict");
144
+ let dropReason = matchesDropCondition(item, relevantEvidence) ?? sourceConflictReason(item, relevantEvidence);
145
+ // A counterexample with no surviving support falsifies the claim regardless of how the
146
+ // dropCondition / sourceConflictPolicy prose is worded. Without this, a purely contradicted
147
+ // claim would slip through as "uncertain" and reopen the hallucination survival path the
148
+ // evidence ledger exists to close (a contested claim already rejects via sourceConflictReason).
149
+ if (!dropReason && firstContradiction && supporting.length === 0) {
150
+ dropReason = `claim contradicted by counterexample with no supporting evidence: ${firstContradiction.source}`;
151
+ }
152
+ if (dropReason) {
153
+ return {
154
+ claim: item.claim,
155
+ finalVerdict: "rejected",
156
+ survivingSources: supporting,
157
+ rejectReason: dropReason,
158
+ unresolvedUnknowns: item.unknowns,
159
+ };
160
+ }
161
+ const uncertain = relevantEvidence.some(entry => entry.verdict === "uncertain");
162
+ if (uncertain || supporting.length === 0) {
163
+ return {
164
+ claim: item.claim,
165
+ finalVerdict: "uncertain",
166
+ survivingSources: supporting,
167
+ rejectReason: uncertain ? "unresolved uncertainty remains" : "no supporting evidence survived verification",
168
+ unresolvedUnknowns: item.unknowns,
169
+ };
170
+ }
171
+ return {
172
+ claim: item.claim,
173
+ finalVerdict: "accepted",
174
+ survivingSources: supporting,
175
+ unresolvedUnknowns: [],
176
+ };
177
+ }
@@ -1,12 +1,17 @@
1
1
  /**
2
- * RLM session artifact layout under <cwd>/.gjc/rlm/<sessionId>/.
2
+ * RLM session artifact layout under <cwd>/.gjc/_session-{gjcSessionId}/rlm/<rlmSessionId>/.
3
+ *
4
+ * The GJC session id (process boundary) scopes the directory; the RLM session id
5
+ * names the individual research run within it. The two ids are kept distinct.
3
6
  */
4
7
  import * as fs from "node:fs/promises";
5
8
  import * as path from "node:path";
6
9
  import { readNotebookDocument } from "../edit/notebook";
10
+ import { rlmArtifactRoot } from "../gjc-runtime/session-layout";
11
+ import { resolveGjcSessionForWrite } from "../gjc-runtime/session-resolution";
7
12
  import type { RlmArtifactPaths } from "./types";
8
13
 
9
- export const RLM_DIR_SEGMENT = path.join(".gjc", "rlm");
14
+ export const RLM_DIR_SEGMENT = "rlm";
10
15
 
11
16
  const SESSION_ID_RE = /^[A-Za-z0-9_-]+$/;
12
17
 
@@ -25,7 +30,11 @@ export function resolveRlmArtifactPaths(cwd: string, sessionId: string): RlmArti
25
30
  if (!isValidRlmSessionId(sessionId)) {
26
31
  throw new Error(`Invalid RLM session id: ${JSON.stringify(sessionId)}`);
27
32
  }
28
- const dir = path.join(cwd, RLM_DIR_SEGMENT, sessionId);
33
+ const dir = rlmArtifactRoot(
34
+ cwd,
35
+ resolveGjcSessionForWrite(cwd, { envSessionId: process.env.GJC_SESSION_ID }).gjcSessionId,
36
+ sessionId,
37
+ );
29
38
  return {
30
39
  dir,
31
40
  notebookPath: path.join(dir, "notebook.ipynb"),
package/src/rlm/index.ts CHANGED
@@ -11,6 +11,7 @@ import { getProjectDir } from "@gajae-code/utils";
11
11
  import { type Args, parseArgs } from "../cli/args";
12
12
  import { disposeKernelSessionsByOwner } from "../eval/py/executor";
13
13
  import type { CustomTool } from "../extensibility/custom-tools/types";
14
+ import { resolveSessionIdFromSources, writeSessionActivityMarker } from "../gjc-runtime/session-resolution";
14
15
  import { type RlmPreset, runRootCommand } from "../main";
15
16
  import rlmReportCommandPrompt from "../prompts/system/rlm-report-command.md" with { type: "text" };
16
17
  import type { CreateAgentSessionOptions } from "../sdk";
@@ -231,6 +232,12 @@ async function writeRlmMetadata(input: {
231
232
  successfulRuns: input.successfulRuns,
232
233
  };
233
234
  await Bun.write(input.paths.metadataPath, `${JSON.stringify(metadata, null, 2)}\n`);
235
+ // Best-effort: update the per-session activity marker so latest-session auto-detect
236
+ // accounts for RLM-only generated output (AC2). Never let marker failure break RLM.
237
+ const gjcSessionId = resolveSessionIdFromSources({ envSessionId: process.env.GJC_SESSION_ID })?.gjcSessionId;
238
+ if (gjcSessionId) {
239
+ await writeSessionActivityMarker(input.cwd, gjcSessionId, { writer: "rlm" }).catch(() => {});
240
+ }
234
241
  }
235
242
 
236
243
  export async function runRlmCommand(argv: string[]): Promise<void> {
@@ -149,6 +149,52 @@ export async function updateMCPServer(filePath: string, name: string, config: MC
149
149
  await writeMCPConfigFile(filePath, updated);
150
150
  }
151
151
 
152
+ /**
153
+ * Result of an {@link upsertMCPServer} call.
154
+ * - `added`: server did not exist and was written.
155
+ * - `updated`: server existed and was overwritten because `force` was set.
156
+ * - `skipped`: server existed and `force` was not set, so nothing was written.
157
+ */
158
+ export type UpsertMCPServerResult =
159
+ | { status: "added" }
160
+ | { status: "updated" }
161
+ | { status: "skipped"; reason: "exists" };
162
+
163
+ /**
164
+ * Add an MCP server, or overwrite an existing one only when `force` is set.
165
+ *
166
+ * Collision-aware wrapper over {@link addMCPServer} / {@link updateMCPServer} used by
167
+ * `gjc migrate`. Never connects to the server. Reuses the underlying writers so the
168
+ * rest of the config file (including `disabledServers`) is preserved on update.
169
+ *
170
+ * @throws Error if the server name or config is invalid (validated before any write).
171
+ */
172
+ export async function upsertMCPServer(
173
+ filePath: string,
174
+ name: string,
175
+ config: MCPServerConfig,
176
+ options: { force?: boolean } = {},
177
+ ): Promise<UpsertMCPServerResult> {
178
+ // Validate name up front so an invalid name fails regardless of collision state.
179
+ const nameError = validateServerName(name);
180
+ if (nameError) {
181
+ throw new Error(nameError);
182
+ }
183
+
184
+ const existing = await getMCPServer(filePath, name);
185
+ if (existing) {
186
+ if (!options.force) {
187
+ return { status: "skipped", reason: "exists" };
188
+ }
189
+ // updateMCPServer preserves the rest of MCPConfigFile, incl. disabledServers.
190
+ await updateMCPServer(filePath, name, config);
191
+ return { status: "updated" };
192
+ }
193
+
194
+ await addMCPServer(filePath, name, config);
195
+ return { status: "added" };
196
+ }
197
+
152
198
  /**
153
199
  * Remove an MCP server from a config file.
154
200
  *
@@ -183,6 +183,11 @@ import type { HookCommandContext } from "../extensibility/hooks/types";
183
183
  import type { Skill, SkillWarning } from "../extensibility/skills";
184
184
  import { expandSlashCommand, type FileSlashCommand } from "../extensibility/slash-commands";
185
185
  import { buildGjcRuntimeSessionEnv, consumePendingGoalModeRequest } from "../gjc-runtime/goal-mode-request";
186
+ import {
187
+ assertNonEmptyGjcSessionId,
188
+ modeStatePath as sessionModeStatePath,
189
+ sessionStateDir,
190
+ } from "../gjc-runtime/session-layout";
186
191
  import { persistCoordinatorRuntimeStateFromEvent } from "../gjc-runtime/session-state-sidecar";
187
192
  import { writeArtifact } from "../gjc-runtime/state-writer";
188
193
  import { requestGjcWorkerIntegrationAttempt } from "../gjc-runtime/team-runtime";
@@ -312,13 +317,6 @@ export type AgentSessionEvent =
312
317
  | { type: "thinking_level_changed"; thinkingLevel: ThinkingLevel | undefined }
313
318
  | { type: "goal_updated"; goal: Goal | null; state?: GoalModeState };
314
319
 
315
- /**
316
- * Safe path component pattern used to validate session-id segments before
317
- * joining them into `.gjc/state` paths. Mirrors the regex used by the
318
- * `gjc state` runtime selector resolver.
319
- */
320
- const SAFE_PATH_COMPONENT = /^[A-Za-z0-9_-][A-Za-z0-9._-]{0,63}$/;
321
-
322
320
  function isUnderProjectGjc(cwd: string, targetPath: string): boolean {
323
321
  const relative = path.relative(path.join(path.resolve(cwd), ".gjc"), path.resolve(targetPath));
324
322
  return relative === "" || (!relative.startsWith("..") && !path.isAbsolute(relative));
@@ -1370,21 +1368,17 @@ export class AgentSession {
1370
1368
  getActiveSkillPhase(): string | undefined {
1371
1369
  const active = this.#activeSkillState;
1372
1370
  if (!active) return undefined;
1373
- // Path safety: refuse to read mode-state files when the skill or
1374
- // session-id are not safe path components. The `skill` tool
1375
- // interprets undefined as a non-terminal phase, so chaining is
1376
- // refused — there is no risk of bypassing the guard via a custom
1377
- // skill name with `..` or a session-id with separators.
1378
1371
  if (!isCanonicalGjcWorkflowSkill(active.skill)) return undefined;
1379
- if (active.sessionId !== undefined && !SAFE_PATH_COMPONENT.test(active.sessionId)) {
1380
- return undefined;
1381
- }
1372
+ const sessionId = active.sessionId ?? this.sessionManager.getSessionId();
1382
1373
  try {
1383
- const stateDir = path.join(this.sessionManager.getCwd(), ".gjc", "state");
1384
- const segments = active.sessionId
1385
- ? [stateDir, "sessions", encodeURIComponent(active.sessionId).replaceAll(".", "%2E")]
1386
- : [stateDir];
1387
- const filePath = path.join(...segments, `${active.skill}-state.json`);
1374
+ assertNonEmptyGjcSessionId(sessionId, "AgentSession.getActiveSkillPhase");
1375
+ // Keep the session-state-dir construction explicit here so the chain guard
1376
+ // refuses to fall back to a legacy root `.gjc/state` read.
1377
+ const stateDir = sessionStateDir(this.sessionManager.getCwd(), sessionId);
1378
+ const filePath = path.join(
1379
+ stateDir,
1380
+ path.basename(sessionModeStatePath(this.sessionManager.getCwd(), sessionId, active.skill)),
1381
+ );
1388
1382
  const raw = fs.readFileSync(filePath, "utf-8");
1389
1383
  const parsed = JSON.parse(raw) as { current_phase?: unknown };
1390
1384
  return typeof parsed.current_phase === "string" ? parsed.current_phase : undefined;
@@ -3763,7 +3757,7 @@ export class AgentSession {
3763
3757
  * prompts or tool execution can run.
3764
3758
  */
3765
3759
  #wrapToolForDeepInterviewMutationGuard<T extends AgentTool>(tool: T): T {
3766
- if (!["edit", "write", "ast_edit", "bash"].includes(tool.name)) return tool;
3760
+ if (!["edit", "write", "ast_edit"].includes(tool.name)) return tool;
3767
3761
  return new Proxy(tool, {
3768
3762
  get: (target, prop) => {
3769
3763
  if (prop !== "execute") return Reflect.get(target, prop, target);
@@ -404,7 +404,7 @@ async function installConfig(spec: CoordinatorSetupSpec, force: boolean): Promis
404
404
 
405
405
  async function runSmoke(spec: CoordinatorSetupSpec): Promise<HermesSetupResult["smoke"]> {
406
406
  const requiredTools = [...COORDINATOR_MCP_TOOL_NAMES];
407
- const server = createCoordinatorMcpServer({ env: {} });
407
+ const server = createCoordinatorMcpServer({ env: renderHermesServerBlock(spec).env as NodeJS.ProcessEnv });
408
408
  const listed = await server.handleJsonRpc({ jsonrpc: "2.0", id: 1, method: "tools/list", params: {} });
409
409
  const listedResult = isRecord(listed.result) ? listed.result : {};
410
410
  const tools = Array.isArray(listedResult.tools) ? listedResult.tools : [];