npm - muonroi-cli - Versions diffs - 1.4.1 → 1.6.0 - Mend

muonroi-cli 1.4.1 → 1.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (194)

package/LICENSE +21 -21
package/README.md +122 -122
package/dist/packages/agent-harness-core/src/predicate.d.ts +1 -1
package/dist/src/agent-harness/__tests__/mock-model.spec.js +48 -1
package/dist/src/agent-harness/mock-model.d.ts +11 -0
package/dist/src/agent-harness/mock-model.js +21 -0
package/dist/src/cli/cost-forensics.js +12 -12
package/dist/src/council/__tests__/clarification-prompt.test.js +51 -0
package/dist/src/council/__tests__/clarifier-ready-gate.test.js +32 -0
package/dist/src/council/__tests__/decisions-lock.test.js +17 -1
package/dist/src/council/__tests__/oauth-reachable.test.d.ts +1 -0
package/dist/src/council/__tests__/oauth-reachable.test.js +31 -0
package/dist/src/council/__tests__/parse-outcome-fallback.test.js +11 -0
package/dist/src/council/clarifier.js +9 -1
package/dist/src/council/debate.js +5 -1
package/dist/src/council/decisions-lock.js +3 -3
package/dist/src/council/index.js +12 -5
package/dist/src/council/leader.d.ts +0 -17
package/dist/src/council/leader.js +22 -15
package/dist/src/council/planner.js +1 -1
package/dist/src/council/prompts.js +63 -57
package/dist/src/council/types.d.ts +7 -0
package/dist/src/ee/__tests__/ee-onboarding.test.d.ts +1 -0
package/dist/src/ee/__tests__/ee-onboarding.test.js +32 -0
package/dist/src/ee/artifact-cache.d.ts +56 -0
package/dist/src/ee/artifact-cache.js +155 -0
package/dist/src/ee/artifact-cache.test.d.ts +1 -0
package/dist/src/ee/artifact-cache.test.js +69 -0
package/dist/src/ee/auth.d.ts +9 -0
package/dist/src/ee/auth.js +19 -0
package/dist/src/ee/ee-onboarding.d.ts +5 -0
package/dist/src/ee/ee-onboarding.js +76 -0
package/dist/src/ee/search.js +7 -5
package/dist/src/ee/search.test.d.ts +1 -0
package/dist/src/ee/search.test.js +23 -0
package/dist/src/generated/version.d.ts +1 -1
package/dist/src/generated/version.js +1 -1
package/dist/src/headless/output.js +6 -4
package/dist/src/headless/output.test.js +4 -3
package/dist/src/index.js +20 -1
package/dist/src/mcp/__tests__/auto-setup.test.js +74 -0
package/dist/src/mcp/__tests__/client-pool.spec.d.ts +1 -0
package/dist/src/mcp/__tests__/client-pool.spec.js +98 -0
package/dist/src/mcp/__tests__/parallel-build.spec.d.ts +1 -0
package/dist/src/mcp/__tests__/parallel-build.spec.js +67 -0
package/dist/src/mcp/__tests__/smart-filter.test.js +56 -0
package/dist/src/mcp/auto-setup.js +56 -2
package/dist/src/mcp/client-pool.d.ts +46 -0
package/dist/src/mcp/client-pool.js +212 -0
package/dist/src/mcp/oauth-callback.js +2 -2
package/dist/src/mcp/parse-headers.test.js +14 -14
package/dist/src/mcp/runtime.d.ts +28 -0
package/dist/src/mcp/runtime.js +117 -51
package/dist/src/mcp/self-verify-runner.d.ts +14 -0
package/dist/src/mcp/self-verify-runner.js +38 -0
package/dist/src/mcp/setup-guide-text.d.ts +9 -0
package/dist/src/mcp/setup-guide-text.js +84 -0
package/dist/src/mcp/smart-filter.js +49 -0
package/dist/src/mcp/smoke.test.js +43 -43
package/dist/src/mcp/tools-server.d.ts +7 -0
package/dist/src/mcp/tools-server.js +19 -22
package/dist/src/models/catalog.json +349 -349
package/dist/src/ops/__tests__/doctor-ee-health.test.js +21 -0
package/dist/src/ops/doctor.d.ts +3 -2
package/dist/src/ops/doctor.js +47 -11
package/dist/src/ops/doctor.test.js +4 -3
package/dist/src/orchestrator/__tests__/mcp-capability-block.test.d.ts +1 -0
package/dist/src/orchestrator/__tests__/mcp-capability-block.test.js +39 -0
package/dist/src/orchestrator/__tests__/project-stack.test.d.ts +1 -0
package/dist/src/orchestrator/__tests__/project-stack.test.js +65 -0
package/dist/src/orchestrator/batch-turn-runner.js +7 -11
package/dist/src/orchestrator/compaction.d.ts +2 -0
package/dist/src/orchestrator/compaction.js +14 -1
package/dist/src/orchestrator/compaction.test.js +25 -1
package/dist/src/orchestrator/message-processor.js +72 -32
package/dist/src/orchestrator/orchestrator.js +26 -0
package/dist/src/orchestrator/prompts.d.ts +51 -0
package/dist/src/orchestrator/prompts.js +257 -134
package/dist/src/orchestrator/scope-ceiling.js +6 -1
package/dist/src/orchestrator/scope-reminder.d.ts +12 -0
package/dist/src/orchestrator/scope-reminder.js +16 -0
package/dist/src/orchestrator/scope-reminder.test.js +22 -1
package/dist/src/orchestrator/stream-runner.js +23 -15
package/dist/src/orchestrator/subagent-compactor.d.ts +14 -5
package/dist/src/orchestrator/subagent-compactor.js +30 -8
package/dist/src/orchestrator/subagent-compactor.spec.js +18 -0
package/dist/src/orchestrator/text-tool-call-detector.test.js +13 -13
package/dist/src/pil/__tests__/clarity-gate.test.js +24 -215
package/dist/src/pil/__tests__/config.test.js +1 -17
package/dist/src/pil/__tests__/discovery.test.js +144 -11
package/dist/src/pil/__tests__/layer1-intent-trace.test.js +7 -2
package/dist/src/pil/__tests__/layer1-intent.test.js +3 -0
package/dist/src/pil/__tests__/layer16-clarity.test.js +32 -116
package/dist/src/pil/__tests__/layer4-gsd.test.js +37 -0
package/dist/src/pil/__tests__/layer6-output.test.js +158 -18
package/dist/src/pil/__tests__/llm-classify.test.js +49 -2
package/dist/src/pil/__tests__/surface-compaction-artifacts.test.d.ts +1 -0
package/dist/src/pil/__tests__/surface-compaction-artifacts.test.js +112 -0
package/dist/src/pil/agent-operating-contract.d.ts +1 -1
package/dist/src/pil/agent-operating-contract.js +2 -0
package/dist/src/pil/agent-operating-contract.test.js +7 -2
package/dist/src/pil/cheap-model-playbook.js +35 -35
package/dist/src/pil/cheap-model-workbooks.js +16 -13
package/dist/src/pil/clarity-gate.d.ts +21 -19
package/dist/src/pil/clarity-gate.js +26 -153
package/dist/src/pil/config.d.ts +9 -1
package/dist/src/pil/config.js +15 -4
package/dist/src/pil/discovery.js +211 -136
package/dist/src/pil/layer1-intent.d.ts +12 -0
package/dist/src/pil/layer1-intent.js +283 -38
package/dist/src/pil/layer1-intent.test.js +210 -4
package/dist/src/pil/layer16-clarity.d.ts +25 -11
package/dist/src/pil/layer16-clarity.js +19 -306
package/dist/src/pil/layer3-ee-injection.d.ts +19 -0
package/dist/src/pil/layer3-ee-injection.js +96 -4
package/dist/src/pil/layer4-gsd.js +18 -6
package/dist/src/pil/layer6-output.d.ts +2 -0
package/dist/src/pil/layer6-output.js +151 -25
package/dist/src/pil/llm-classify.d.ts +26 -0
package/dist/src/pil/llm-classify.js +34 -5
package/dist/src/pil/native-capabilities-workbook.d.ts +1 -1
package/dist/src/pil/native-capabilities-workbook.js +82 -76
package/dist/src/pil/pipeline.js +15 -9
package/dist/src/pil/schema.d.ts +8 -0
package/dist/src/pil/schema.js +12 -1
package/dist/src/pil/task-tier-map.js +4 -0
package/dist/src/pil/types.d.ts +11 -1
package/dist/src/product-loop/done-gate.js +3 -3
package/dist/src/product-loop/loop-driver.js +18 -18
package/dist/src/product-loop/progress-snapshot.js +4 -4
package/dist/src/providers/auth/gemini-oauth.js +6 -15
package/dist/src/providers/auth/grok-oauth.js +6 -15
package/dist/src/providers/auth/openai-oauth.js +6 -15
package/dist/src/providers/mcp-vision-bridge.js +48 -48
package/dist/src/reporter/index.js +1 -1
package/dist/src/scaffold/bb-ecosystem-apply.js +47 -47
package/dist/src/scaffold/bb-quality-gate.js +5 -5
package/dist/src/scaffold/continuation-prompt.js +60 -60
package/dist/src/scaffold/init-new.js +453 -453
package/dist/src/self-qa/__tests__/scenario-planner.test.js +3 -3
package/dist/src/self-qa/agentic-loop.js +24 -19
package/dist/src/self-qa/spec-emitter.js +26 -23
package/dist/src/storage/__tests__/migrations.test.js +2 -2
package/dist/src/storage/interaction-log.js +5 -5
package/dist/src/storage/migrations.js +122 -122
package/dist/src/storage/sessions.js +42 -42
package/dist/src/storage/transcript.js +91 -84
package/dist/src/storage/usage.js +14 -14
package/dist/src/storage/workspaces.js +12 -12
package/dist/src/tools/__tests__/native-tools.test.d.ts +1 -0
package/dist/src/tools/__tests__/native-tools.test.js +53 -0
package/dist/src/tools/git-safety.d.ts +61 -0
package/dist/src/tools/git-safety.js +141 -0
package/dist/src/tools/git-safety.test.d.ts +1 -0
package/dist/src/tools/git-safety.test.js +111 -0
package/dist/src/tools/native-tools.d.ts +31 -0
package/dist/src/tools/native-tools.js +273 -0
package/dist/src/tools/registry-ee-query.test.js +18 -1
package/dist/src/tools/registry-git-safety.test.d.ts +7 -0
package/dist/src/tools/registry-git-safety.test.js +92 -0
package/dist/src/tools/registry.js +52 -6
package/dist/src/ui/__tests__/markdown-render.test.d.ts +1 -0
package/dist/src/ui/__tests__/markdown-render.test.js +48 -0
package/dist/src/ui/app.js +0 -0
package/dist/src/ui/components/message-view.js +4 -1
package/dist/src/ui/components/structured-response-view.js +7 -3
package/dist/src/ui/components/tool-group.js +7 -1
package/dist/src/ui/markdown-render.d.ts +41 -0
package/dist/src/ui/markdown-render.js +223 -0
package/dist/src/ui/markdown.d.ts +10 -0
package/dist/src/ui/markdown.js +12 -35
package/dist/src/ui/slash/council-inspect.js +4 -4
package/dist/src/ui/slash/export.js +4 -4
package/dist/src/ui/utils/text.d.ts +8 -0
package/dist/src/ui/utils/text.js +16 -0
package/dist/src/ui/utils/text.test.d.ts +1 -0
package/dist/src/ui/utils/text.test.js +23 -0
package/dist/src/usage/ledger.js +48 -15
package/dist/src/utils/__tests__/footprint-gitignore.test.d.ts +1 -0
package/dist/src/utils/__tests__/footprint-gitignore.test.js +50 -0
package/dist/src/utils/clipboard-image.js +23 -23
package/dist/src/utils/open-url.d.ts +56 -0
package/dist/src/utils/open-url.js +58 -0
package/dist/src/utils/open-url.test.d.ts +1 -0
package/dist/src/utils/open-url.test.js +86 -0
package/dist/src/utils/settings.d.ts +12 -0
package/dist/src/utils/settings.js +48 -0
package/dist/src/utils/side-question.js +2 -2
package/dist/src/utils/skills.js +3 -3
package/dist/src/verify/__tests__/coverage-parsers.test.js +30 -30
package/dist/src/verify/environment.js +2 -1
package/package.json +1 -1
package/dist/src/pil/layer16-clarity.test.js +0 -31
/package/dist/src/{pil/layer16-clarity.test.d.ts → council/__tests__/clarification-prompt.test.d.ts} +0 -0

package/dist/src/pil/layer16-clarity.d.ts CHANGED

@@ -1,19 +1,33 @@
+/**
+ * src/pil/layer16-clarity.ts
+ *
+ * Phase 2 (2026-06-16): `detectClarityGaps` and its keyword option-builders
+ * (`buildOutcomeOptions` / `buildScopeOptions` / `pickBest*` / recency ranking)
+ * were removed. The configured chat model now decides every clarification —
+ * its questions, options, recommended default, and reason — in
+ * `proposeModelGaps` (`discovery.ts`). There is no regex gap synthesis.
+ *
+ * What remains here is gap RENDERING + RESOLUTION (consumed by the model path):
+ *   - the "provide my own details" no-answer sentinel,
+ *   - `buildInterviewQuestion` (ClarityGap → askcard),
+ *   - `resolveGapsNonInteractive` (default-answer resolution when headless),
+ *   - `getAutofilledOutcome` / `getDefaultOutcome` (outcome-label polish).
+ */
 import type { CouncilQuestionData } from "../types/index.js";
 import type { ClarifiedIntent, ClarityGap, ProjectContext } from "./discovery-types.js";
 import type { TaskType } from "./types.js";
-export declare function detectClarityGaps(raw: string, taskType: TaskType | null, confidence: number, projectContext: ProjectContext): ClarityGap[];
 /**
- * Pick the "Recommended" default index for the scope askcard.
- *
- * Bug fixed (live obs 2026-06-04, deepseek session): the scope gap hardcoded
- * defaultIndex 0, but buildScopeOptions lists recency-ranked (NOT prompt-matched)
- * bounded contexts first when nothing matched — so the card recommended an
- * arbitrary subdir (e.g. "src/cli") for a repo-wide prompt while "Entire project"
- * was demoted to last. Only recommend a specific bounded context when the prompt
- * literally names it (same word-overlap test buildScopeOptions uses); otherwise
- * recommend "Entire project".
+ * The default "no specific answer" meta-option offered for a model-generated
+ * clarification when the model supplies no concrete recommendations. Selecting
+ * it means "use your judgment / I have nothing specific to add" — it is a
+ * sentinel, NOT a real outcome, so it must never surface verbatim as the
+ * resolved outcome. Centralised here so discovery.ts (which presents the
+ * option) and the outcome-resolution paths agree on the exact strings.
  */
-export declare function pickBestScopeIndex(raw: string, options: string[]): number;
+export declare const PROVIDE_OWN_DETAILS_OPTION_EN = "I will provide my own details / constraints";
+export declare const PROVIDE_OWN_DETAILS_OPTION_VI = "T\u00F4i s\u1EBD tr\u1EA3 l\u1EDDi t\u1EF1 do / cung c\u1EA5p chi ti\u1EBFt c\u1EA7n thi\u1EBFt";
+/** True when an answer is the "I'll provide my own details" meta-option (any locale). */
+export declare function isProvideOwnDetailsSentinel(answer: string | null | undefined): boolean;
 export declare function buildInterviewQuestion(gap: ClarityGap, questionId: string): CouncilQuestionData;
 export declare function resolveGapsNonInteractive(gaps: ClarityGap[], projectContext: ProjectContext, raw: string): ClarifiedIntent;
 export declare function getAutofilledOutcome(taskType: TaskType | null, raw?: string): string | null;

package/dist/src/pil/layer16-clarity.js CHANGED

@@ -1,309 +1,20 @@
-import { canInferOutcome, countFileReferences, hasExplicitScope, hasExternalInfoScope, hasImageScope, hasOperationalScope, hasSelfContainedComputationScope, hasWholeRepoScope, } from "./clarity-gate.js";
-export function detectClarityGaps(raw, taskType, confidence, projectContext) {
-    const gaps = [];
-    // PIL-L6 fix — debug joins the autofill set. For "fix ci fail" the outcome
-    // is trivially "error resolved / pipeline green" and forcing an askcard
-    // there produces noise (the user already said "goal: ci green").
-    const AUTOFILL_OUTCOME_TYPES = new Set(["analyze", "plan", "documentation", "debug"]);
-    if (!canInferOutcome(taskType, raw)) {
-        if (taskType && AUTOFILL_OUTCOME_TYPES.has(taskType)) {
-            // These task types have predictable outcomes — auto-fill without asking
-        }
-        else if (!taskType || taskType === "general") {
-            // B2 intent-swallow fix — a `general` (or unclassified) prompt has no
-            // task-specific outcome options, so `buildOutcomeOptions` falls back to
-            // the tautological ["Task completed", "Issue resolved"]. Asking that
-            // askcard adds zero signal, and its default answer overwrites the intent
-            // → "general: Task completed", discarding the user's original request.
-            // Skip it; the outcome defaults to the raw prompt downstream
-            // (buildClarifiedIntentFromAnswers / getDefaultOutcome), preserving intent.
-        }
-        else {
-            const outcomeOptions = buildOutcomeOptions(taskType, projectContext);
-            gaps.push({
-                dimension: "outcome",
-                description: "Cannot infer the expected outcome from the prompt",
-                suggestedQuestion: `What's the expected outcome? ${taskType === "debug" ? "(e.g., error gone, test passes, behavior fixed)" : "(e.g., feature works, file updated, test passes)"}`,
-                options: outcomeOptions,
-                defaultIndex: pickBestOutcomeIndex(taskType, outcomeOptions, raw),
-            });
-        }
-    }
-    // PIL-L6 fix — operational scope (CI / build / deploy / lint) is enough
-    // even without a file path. The task's target is the pipeline itself.
-    //
-    // B2-symmetric scope guard — the scope detector assumes EVERY prompt is a
-    // codebase task: any prompt lacking a file/module/operational reference gets
-    // asked "Which part of the codebase should this target?". For a general or
-    // unclassified prompt that has no codebase dimension at all (e.g. a pure
-    // chat / generation request like "Reply with one word: PONG", live session
-    // 8a87aa060c6a) this question is nonsensical, and because it is the only gap
-    // it also drags in a downstream acceptance card. Skip it for general/null —
-    // the same population the B2 outcome guard above protects. Scope then falls
-    // back to project-root in resolveGapsNonInteractive. Classified code tasks
-    // (debug/generate/refactor/…) still get the scope-narrowing askcard.
-    // Image-scope guard — an image-analysis task (e.g. "analyze diagram.png",
-    // "take a screenshot and describe it") is scoped to the IMAGE, not the
-    // codebase, so the "Which part of the codebase?" askcard is nonsensical for
-    // it. Symmetric to hasOperationalScope (pipeline-scoped). hasImageScope is
-    // deliberately narrow so it never swallows a real codebase task.
-    const scopeAppliesToCodebase = !!taskType && taskType !== "general";
-    if (scopeAppliesToCodebase &&
-        countFileReferences(raw) === 0 &&
-        !hasExplicitScope(raw) &&
-        !hasOperationalScope(raw) &&
-        !hasImageScope(raw) &&
-        !hasExternalInfoScope(raw) &&
-        // Whole-repo / eval prompts ("đánh giá repo", "review the entire codebase")
-        // are already scoped to everything — asking "which part?" (and recommending
-        // a narrow subdir as default) is nonsensical. See hasWholeRepoScope.
-        !hasWholeRepoScope(raw) &&
-        // Self-contained computation ("Compute f([3,1,2]) …") supplies its operand
-        // data inline — there is no codebase to scope. See hasSelfContainedComputationScope.
-        !hasSelfContainedComputationScope(raw)) {
-        const scopeOptions = buildScopeOptions(raw, projectContext);
-        gaps.push({
-            dimension: "scope",
-            description: "No specific file or module referenced",
-            suggestedQuestion: "Which part of the codebase should this target?",
-            options: scopeOptions,
-            defaultIndex: pickBestScopeIndex(raw, scopeOptions),
-        });
-    }
-    const hasConstraint = /\b(\d+\s*ms|\d+\s*%|faster|slower|before|deadline|limit|max|min)\b/i.test(raw);
-    const isPerformanceTask = /\b(optimi[zs]e|performance|speed|fast|slow|latency|throughput)\b/i.test(raw);
-    if (isPerformanceTask && !hasConstraint) {
-        gaps.push({
-            dimension: "constraint",
-            description: "Performance target not specified",
-            suggestedQuestion: "Any specific performance target? (e.g., <200ms response, 50% faster)",
-            options: ["General improvement", "Specific latency target", "Reduce bundle size"],
-            defaultIndex: 0,
-        });
-    }
-    return gaps;
-}
+import { hasOperationalScope } from "./clarity-gate.js";
 /**
- * Phase 5 F8 — context-aware default option for outcome askcards.
- *
- * The askcard's "Recommended" badge previously pinned to options[0]
- * regardless of prompt content. For prompts like "improve test coverage"
- * (generate options: Feature implemented / File created / Tests added),
- * defaulting to "Feature implemented" was wrong — the user explicitly
- * mentioned tests. This picks a more relevant option based on prompt
- * keywords, with a fallback to 0 when nothing matches.
- *
- * Keep this list short — overengineering breaks predictability. We only
- * encode the keyword→index pairs we've actually seen mismatch in the
- * 5-baseline + sanity sessions.
+ * The default "no specific answer" meta-option offered for a model-generated
+ * clarification when the model supplies no concrete recommendations. Selecting
+ * it means "use your judgment / I have nothing specific to add" — it is a
+ * sentinel, NOT a real outcome, so it must never surface verbatim as the
+ * resolved outcome. Centralised here so discovery.ts (which presents the
+ * option) and the outcome-resolution paths agree on the exact strings.
  */
-function pickBestOutcomeIndex(taskType, options, raw) {
-    if (options.length <= 1)
-        return 0;
-    const lower = raw.toLowerCase();
-    const has = (re) => re.test(lower);
-    const find = (substring) => options.findIndex((o) => o.toLowerCase().includes(substring));
-    switch (taskType) {
-        case "generate": {
-            // "improve coverage", "add tests", "viết test" → "Tests added"
-            if (has(/\b(coverage|unit test|viết test|viet test|spec|jest|vitest|pytest)\b/) || has(/\btest(?:s|ing)?\b/)) {
-                const idx = find("test");
-                if (idx >= 0)
-                    return idx;
-            }
-            // "scaffold", "boilerplate", "tạo file mới" → "File created with boilerplate"
-            if (has(/\b(scaffold|boilerplate|template|skeleton)\b/) || has(/\btạo file\b|\btao file\b/)) {
-                const idx = find("file created");
-                if (idx >= 0)
-                    return idx;
-            }
-            return 0; // "Feature implemented and working"
-        }
-        case "refactor": {
-            // "performance", "speed", "faster" → "Better performance"
-            if (has(/\b(performance|speed|fast(er)?|slow|latency|throughput|optimi[zs]e)\b/)) {
-                const idx = find("performance");
-                if (idx >= 0)
-                    return idx;
-            }
-            // "test", "testable" → "Easier to test"
-            if (has(/\b(testable|easier to test|unit test)\b/)) {
-                const idx = find("test");
-                if (idx >= 0)
-                    return idx;
-            }
-            return 0; // "Code cleaner, same behavior"
-        }
-        case "debug": {
-            // "test fail", "test pass" → "Test passes"
-            if (has(/\btest(?:s|ing)? (?:fail|pass)/) || has(/\bspec fail/)) {
-                const idx = find("test passes");
-                if (idx >= 0)
-                    return idx;
-            }
-            return 0; // "Error disappears"
-        }
-        case "documentation": {
-            if (has(/\b(readme)\b/)) {
-                const idx = find("readme");
-                if (idx >= 0)
-                    return idx;
-            }
-            if (has(/\b(api docs|api documentation|openapi|swagger)\b/)) {
-                const idx = find("api docs");
-                if (idx >= 0)
-                    return idx;
-            }
-            return 0;
-        }
-        case "plan": {
-            if (has(/\b(trade-?offs?|alternative|compare)\b/)) {
-                const idx = find("trade");
-                if (idx >= 0)
-                    return idx;
-            }
-            if (has(/\b(step.?by.?step|phase|roadmap)\b/)) {
-                const idx = find("step-by-step");
-                if (idx >= 0)
-                    return idx;
-            }
-            return 0;
-        }
-        case "analyze": {
-            if (has(/\b(root cause|why|tại sao|tai sao|crash|stack trace)\b/)) {
-                const idx = find("root cause");
-                if (idx >= 0)
-                    return idx;
-            }
-            if (has(/\b(recommend|suggest|đề xuất|de xuat)\b/)) {
-                const idx = find("recommendations");
-                if (idx >= 0)
-                    return idx;
-            }
-            return 0;
-        }
-        default:
-            return 0;
-    }
-}
-function buildOutcomeOptions(taskType, ctx) {
-    switch (taskType) {
-        case "debug":
-            return ["Error disappears", "Test passes", "Feature works correctly"];
-        case "refactor":
-            return ["Code cleaner, same behavior", "Better performance", "Easier to test"];
-        case "generate":
-            return ["Feature implemented and working", "File created with boilerplate", "Tests added"];
-        case "documentation":
-            return ["Docs updated", "README reflects current state", "API docs generated"];
-        case "plan":
-            return ["Architecture decided", "Step-by-step plan", "Trade-offs documented"];
-        case "analyze":
-            return ["Root cause identified", "Report generated", "Recommendations listed"];
-        default:
-            return ["Task completed", "Issue resolved"];
-    }
-}
-/**
- * Pick the "Recommended" default index for the scope askcard.
- *
- * Bug fixed (live obs 2026-06-04, deepseek session): the scope gap hardcoded
- * defaultIndex 0, but buildScopeOptions lists recency-ranked (NOT prompt-matched)
- * bounded contexts first when nothing matched — so the card recommended an
- * arbitrary subdir (e.g. "src/cli") for a repo-wide prompt while "Entire project"
- * was demoted to last. Only recommend a specific bounded context when the prompt
- * literally names it (same word-overlap test buildScopeOptions uses); otherwise
- * recommend "Entire project".
- */
-export function pickBestScopeIndex(raw, options) {
-    const entireIdx = options.findIndex((o) => /entire project/i.test(o));
-    const fallback = entireIdx >= 0 ? entireIdx : Math.max(0, options.length - 1);
-    const words = raw
-        .toLowerCase()
-        .split(/\s+/)
-        .filter((w) => w.length > 2);
-    for (let i = 0; i < options.length; i++) {
-        const opt = options[i] ?? "";
-        if (/entire project/i.test(opt))
-            continue;
-        const nameMatch = opt.match(/\(([^)]+)\)\s*$/);
-        const name = (nameMatch?.[1] ?? opt).toLowerCase();
-        if (words.some((w) => name.includes(w) || w.includes(name)))
-            return i;
-    }
-    return fallback;
-}
-function buildScopeOptions(raw, ctx) {
-    const words = raw
-        .toLowerCase()
-        .split(/\s+/)
-        .filter((w) => w.length > 2);
-    const matching = ctx.boundedContexts.filter((bc) => {
-        const name = bc.name.toLowerCase();
-        return words.some((w) => name.includes(w) || w.includes(name));
-    });
-    const options = matching.map((bc) => `${bc.path} (${bc.name})`);
-    if (options.length === 0 && ctx.boundedContexts.length > 0) {
-        // Phase 5 F4 — when no keyword matches a module name, the previous
-        // fallback returned the first 3 alphabetically (which on muonroi-cli
-        // surfaced `agent-harness`, `billing`, `chat` — three OLD scaffolding
-        // folders that almost never match a fresh prompt). Rank by recency
-        // signal instead: most recently modified module dir comes first.
-        const ranked = rankModulesByRecency(ctx.boundedContexts, ctx.cwd);
-        options.push(...ranked.slice(0, 3).map((bc) => `${bc.path} (${bc.name})`));
-    }
-    options.push("Entire project");
-    return options.slice(0, 4);
-}
-/**
- * F4 — rank bounded contexts by recency-of-modification of any tracked file
- * inside. Falls back to alphabetical order when stat() throws for the dir.
- * The 4-level depth cap + 50-entry-per-level cap keeps the walk under 200ms
- * even on huge monorepos.
- */
-function rankModulesByRecency(contexts, cwd) {
-    const fs = require("node:fs");
-    const path = require("node:path");
-    const scored = contexts.map((bc) => {
-        const dirPath = path.join(cwd, bc.path);
-        let maxMtime = 0;
-        try {
-            // walk up to 4 levels deep, cap entries per level
-            const walk = (dir, depth) => {
-                if (depth > 4)
-                    return;
-                let entries = [];
-                try {
-                    entries = fs.readdirSync(dir).slice(0, 50);
-                }
-                catch {
-                    return;
-                }
-                for (const e of entries) {
-                    if (e.startsWith(".") || e === "node_modules" || e === "dist")
-                        continue;
-                    try {
-                        const full = path.join(dir, e);
-                        const st = fs.statSync(full);
-                        if (st.mtimeMs > maxMtime)
-                            maxMtime = st.mtimeMs;
-                        if (st.isDirectory())
-                            walk(full, depth + 1);
-                    }
-                    catch {
-                        /* skip unreadable entries */
-                    }
-                }
-            };
-            walk(dirPath, 0);
-        }
-        catch {
-            /* fall back to mtime=0 — keeps the entry at the bottom of the ranked list */
-        }
-        return { bc, mtime: maxMtime };
-    });
-    scored.sort((a, b) => b.mtime - a.mtime);
-    return scored.map((s) => s.bc);
+export const PROVIDE_OWN_DETAILS_OPTION_EN = "I will provide my own details / constraints";
+export const PROVIDE_OWN_DETAILS_OPTION_VI = "Tôi sẽ trả lời tự do / cung cấp chi tiết cần thiết";
+/** True when an answer is the "I'll provide my own details" meta-option (any locale). */
+export function isProvideOwnDetailsSentinel(answer) {
+    if (!answer)
+        return false;
+    const norm = answer.trim().toLowerCase();
+    return norm === PROVIDE_OWN_DETAILS_OPTION_EN.toLowerCase() || norm === PROVIDE_OWN_DETAILS_OPTION_VI.toLowerCase();
 }
 export function buildInterviewQuestion(gap, questionId) {
     const options = gap.options.map((label) => ({
@@ -335,7 +46,9 @@ export function resolveGapsNonInteractive(gaps, projectContext, raw) {
         const defaultAnswer = gap.options[gap.defaultIndex] ?? gap.options[0] ?? "";
         switch (gap.dimension) {
             case "outcome":
-                outcome = defaultAnswer;
+                // The "provide my own details" meta-option is a no-answer sentinel —
+                // leave outcome empty so the inferred/default outcome is used downstream.
+                outcome = isProvideOwnDetailsSentinel(defaultAnswer) ? "" : defaultAnswer;
                 break;
             case "scope": {
                 const relevant = projectContext.relevantModules.map((m) => m.path);
@@ -377,7 +90,7 @@ export function getAutofilledOutcome(taskType, raw) {
         // Prevents generic "Local path...", "In prompts/ directory...", "Complete the task..." in [Discovery]
         return "Native self-assessment of the CLI with specific, actionable code fixes proposed and verified";
     }
-    // PIL-L6 fix — operational debug tasks have a stronger default outcome
+    // Operational debug tasks (CI/build/deploy) have a stronger default outcome.
     if (taskType === "debug" && hasOperationalScope(raw)) {
         return "Pipeline green, all checks passing";
     }

package/dist/src/pil/layer3-ee-injection.d.ts CHANGED

@@ -16,3 +16,22 @@
  */
 import type { PipelineContext } from "./types.js";
 export declare function layer3EeInjection(ctx: PipelineContext): Promise<PipelineContext>;
+/**
+ * Issue #4 — meta-turn TARGETED complement to Layer 3's checkpoint arm.
+ *
+ * Since issue #2, Layer 3 now runs on the meta-analysis path too, so its
+ * checkpoint arm already surfaces recent checkpoints/artifacts for the agent.
+ * That arm uses a FIXED recency query, though — it isn't biased toward the
+ * current meta question. This arm fills that gap: it searches by `ctx.raw` so a
+ * self-evaluating agent sees the elided tool-artifacts RELEVANT to what it's
+ * analyzing, rendered via the same `formatTaskCheckpoints` so the `[artifact]
+ * … id=X` refs appear automatically instead of waiting on a manual `ee_query`.
+ *
+ * Defers to Layer 3: if a checkpoint block was already injected this turn (any
+ * `ee-checkpoint-injected` marker present) it skips entirely — no duplicate
+ * block and no second EE round-trip. Gated on `sessionId` (no session ⇒ no prior
+ * compaction to rehydrate). Strictly additive and fail-open: any error /
+ * no-session / no-match / already-surfaced returns ctx with the original
+ * `enriched` plus an `ee-meta-artifacts` layer marker for forensics.
+ */
+export declare function surfaceCompactionArtifacts(ctx: PipelineContext): Promise<PipelineContext>;

package/dist/src/pil/layer3-ee-injection.js CHANGED

@@ -119,7 +119,7 @@ async function queryEeBridge(raw) {
         const [principleRaw, behavioralRaw, checkpointRaw] = await Promise.all([
             searchByText(raw, ["experience-principles"], 3, signal),
             searchByText(raw, ["experience-behavioral"], 4, signal),
-            searchByText("Context checkpoint summary OR \"compaction checkpoint\" recent Progress DONE elided OR tool-artifact OR \"tool result id=\"", ["experience-behavioral"], 3, signal).catch(() => []),
+            searchByText('Context checkpoint summary OR "compaction checkpoint" recent Progress DONE elided OR tool-artifact OR "tool result id="', ["experience-behavioral"], 3, signal).catch(() => []),
         ]);
         const principlePoints = principleRaw.filter((p) => (p.score ?? 0) >= PIL_PRINCIPLES_FLOOR);
         const behavioralPoints = behavioralRaw.filter((p) => (p.score ?? 0) >= PIL_SCORE_FLOOR);
@@ -161,14 +161,16 @@ function formatExperienceHints(points) {
 function formatTaskCheckpoints(points) {
     if (points.length === 0)
         return "";
-    const lines = points.map((p) => {
+    const lines = points
+        .map((p) => {
         const t = extractPointText(p);
         // Idea 4: surface tool-artifact refs so agent sees "elided high-value, query for full"
         if (/tool-artifact|tool result id=|elided.*id=/.test(t.toLowerCase())) {
             return `- [artifact] ${t.slice(0, 160)} [id:${p.id}]`;
         }
         return `- ${t.slice(0, 180)} [id:${p.id}]`;
-    }).filter((l) => l !== "- ");
+    })
+        .filter((l) => l !== "- ");
     if (lines.length === 0)
         return "";
     return `[task checkpoints — prior compactions: use to answer "task finished?", "compacted yet?". Artifacts: use ee.query tool with "tool-artifact id=XXX" for full elided tool output.] \n${lines.join("\n")}`;
@@ -282,7 +284,7 @@ export async function layer3EeInjection(ctx) {
             const text = extractPointText(p);
             return text.length === 0 || !checkpointMarkerShas.has(payloadSha16(text));
         })
-        : (result.checkpointPoints || []);
+        : result.checkpointPoints || [];
     const allPoints = [...deduplicatedPrinciples, ...deduplicatedBehavioral, ...deduplicatedCheckpoints];
     // STALE-01: Register injected point IDs for prompt-stale reconciliation.
     updateLastSurfacedState(allPoints.map((p) => String(p.id)));
@@ -359,4 +361,94 @@ export async function layer3EeInjection(ctx) {
         ],
     };
 }
+/**
+ * Records whose text actually reads like a compaction checkpoint or an elided
+ * tool-artifact. Used to keep generic behavioral hits from being mislabelled as
+ * `[artifact]`/checkpoint lines when we search by the meta question (ctx.raw)
+ * rather than the fixed checkpoint-arm query.
+ *
+ * Case-insensitive. A text passes when it contains any ONE of:
+ * "context checkpoint summary", "compaction checkpoint", "tool-artifact",
+ * "tool result id=", "elided", "progress" followed by zero or more non-letter
+ * characters and then "done", or a "✔" check mark.
+ *
+ * NOTE(review): the bare `elided` and `✔` alternatives match on their own, so
+ * any record containing either one passes this filter — confirm that breadth
+ * is intended for a guard meant to exclude generic behavioral hits.
+ */
+const CHECKPOINT_LIKE_RE = /context checkpoint summary|compaction checkpoint|tool-artifact|tool result id=|elided|progress[^a-z]*done|✔/i;
+/**
+ * Issue #4 — meta-turn TARGETED complement to Layer 3's checkpoint arm.
+ *
+ * Since issue #2, Layer 3 now runs on the meta-analysis path too, so its
+ * checkpoint arm already surfaces recent checkpoints/artifacts for the agent.
+ * That arm uses a FIXED recency query, though — it isn't biased toward the
+ * current meta question. This arm fills that gap: it searches by `ctx.raw` so a
+ * self-evaluating agent sees the elided tool-artifacts RELEVANT to what it's
+ * analyzing, rendered via the same `formatTaskCheckpoints` so the `[artifact]
+ * … id=X` refs appear automatically instead of waiting on a manual `ee_query`.
+ *
+ * Defers to Layer 3: if a checkpoint block was already injected this turn (any
+ * `ee-checkpoint-injected` marker present) it skips entirely — no duplicate
+ * block and no second EE round-trip. Gated on `sessionId` (no session ⇒ no prior
+ * compaction to rehydrate). Strictly additive and fail-open: any error /
+ * no-session / no-match / already-surfaced returns ctx with the original
+ * `enriched` plus an `ee-meta-artifacts` layer marker for forensics.
+ *
+ * Flow, as implemented below:
+ *   1. No `ctx.sessionId` → return with marker delta "no-session".
+ *   2. `extractCheckpointMarkerShas(ctx.enriched)` is non-empty → return with
+ *      delta "already-surfaced".
+ *   3. One `searchByText` call against "experience-behavioral" (limit 5) under
+ *      `AbortSignal.timeout(PIL_SEARCH_TIMEOUT_MS)`. Hits are kept only when
+ *      their score is at least 70% of `PIL_SCORE_FLOOR` AND their text matches
+ *      `CHECKPOINT_LIKE_RE`. A throw is reported through `logEeFailure` and
+ *      returns with delta `error=<stringified error>`.
+ *   4. No hits left, or `formatTaskCheckpoints` yields an empty string → return
+ *      with delta "no-artifacts".
+ *   5. Otherwise the formatted text is truncated to 12% of `ctx.tokenBudget`,
+ *      an `<!-- ee-checkpoint-injected:<sha> -->` marker is appended, the
+ *      injection is audit-logged via `logInteraction`, and the block is added
+ *      to `ctx.enriched` on a new line.
+ *
+ * @param ctx Pipeline context; this function reads `sessionId`, `enriched`,
+ *   `raw`, `tokenBudget` and `layers`, and never assigns to `ctx` itself.
+ * @returns A new context object with one extra `ee-meta-artifacts` entry in
+ *   `layers`; `applied` is true only when a block was appended to `enriched`.
+ */
+export async function surfaceCompactionArtifacts(ctx) {
+    const markLayer = (applied, delta) => ({
+        ...ctx,
+        layers: [...ctx.layers, { name: "ee-meta-artifacts", applied, delta }],
+    });
+    if (!ctx.sessionId)
+        return markLayer(false, "no-session");
+    // Defer to Layer 3: a checkpoint/artifact block is already present this turn,
+    // so don't duplicate it or pay a second EE round-trip. This arm only fills the
+    // gap when Layer 3's fixed-query checkpoint arm surfaced nothing.
+    if (extractCheckpointMarkerShas(ctx.enriched).size > 0)
+        return markLayer(false, "already-surfaced");
+    let points = [];
+    try {
+        const signal = AbortSignal.timeout(PIL_SEARCH_TIMEOUT_MS);
+        // Bias toward records relevant to THIS meta question (ctx.raw) while pulling
+        // in checkpoint/artifact vocabulary so the single cheap arm lands on the
+        // compaction records rather than generic behavioral patterns.
+        const query = `${ctx.raw}\nContext checkpoint summary tool-artifact "tool result id=" elided Progress DONE`;
+        const raw = await searchByText(query, ["experience-behavioral"], 5, signal);
+        points = raw
+            .filter((p) => (p.score ?? 0) >= PIL_SCORE_FLOOR * 0.7) // a missing score counts as 0
+            .filter((p) => CHECKPOINT_LIKE_RE.test(extractPointText(p)));
+    }
+    catch (err) {
+        logEeFailure("pil.meta.surfaceCompactionArtifacts", classifyEeError(err), err, { budgetMs: PIL_SEARCH_TIMEOUT_MS });
+        return markLayer(false, `error=${String(err)}`);
+    }
+    if (points.length === 0)
+        return markLayer(false, "no-artifacts");
+    const cpText = formatTaskCheckpoints(points);
+    if (!cpText)
+        return markLayer(false, "no-artifacts");
+    // Append the marker AFTER truncation so it always survives into `enriched`
+    // — that marker is what makes the defer-check above fire on any later pass.
+    const blockSha = payloadSha16(cpText); // hashed BEFORE truncation: the sha identifies the full formatted text
+    const body = truncateToBudget(cpText, Math.floor(ctx.tokenBudget * 0.12));
+    const block = `${body}\n<!-- ee-checkpoint-injected:${blockSha} -->`;
+    try {
+        if (ctx.sessionId) { // NOTE(review): always truthy here — the no-session guard at the top already returned
+            logInteraction(ctx.sessionId, "ee_injection", {
+                eventSubtype: "injected",
+                data: {
+                    phase: "pil_meta_artifacts",
+                    role: "knowledge_retriever",
+                    checkpointCount: points.length,
+                    pointIds: points.map((p) => String(p.id)),
+                    injectedChars: block.length,
+                },
+            });
+        }
+    }
+    catch (err) {
+        // No silent catch: surfacing succeeded; only the audit write failed.
+        console.error(`[pil.meta.surfaceCompactionArtifacts] interaction log failed: ${err?.message}`); // NOTE(review): prints "undefined" when a non-Error value is thrown
+    }
+    return {
+        ...ctx,
+        enriched: `${ctx.enriched}\n${block}`,
+        layers: [
+            ...ctx.layers,
+            { name: "ee-meta-artifacts", applied: true, delta: `artifacts=${points.length} chars=${block.length}` },
+        ],
+    };
+}
 //# sourceMappingURL=layer3-ee-injection.js.map

package/dist/src/pil/layer4-gsd.js CHANGED Viewed

@@ -23,7 +23,7 @@ import { detectGrayAreas } from "../gsd/gray-areas.js";
 import { detectGsdPhase } from "../gsd/types.js";
 import { classifyEeError, logEeFailure } from "../utils/ee-logger.js";
 import { truncateToBudget } from "./budget.js";
-import { isMetaAnalysisPrompt } from "./layer6-output.js";
+import { isImplementationIntent, isMetaAnalysisPrompt, isQuestionLike } from "./layer6-output.js";
 function mapRouteToPhase(route) {
     switch (route) {
         case "qc-flow":
@@ -79,11 +79,23 @@ export async function layer4Gsd(ctx) {
     }
     const complexity = scoreComplexity(ctx.raw);
     const grayAreas = complexity.tier === "heavy" ? detectGrayAreas(ctx.raw).questions : [];
-    // Informational/meta prompts (a question or a self/meta CLI analysis) ask for
-    // an ANSWER, not a code change. The implement/verify directive leaks into the
-    // human-facing reply as a "2-3 line plan" + process narration (session
-    // 829a83888dd2). Route them to the human-facing question directive instead.
-    const informational = isMetaAnalysisPrompt(ctx.raw) || ctx.taskType === "general";
+    // Informational prompts (a question / explanation / self-eval) ask for an
+    // ANSWER, not a code change. The implement/verify directive otherwise leaks
+    // into the human-facing reply as a "2-3 line plan" + process narration
+    // (session 829a83888dd2). Route them to the human-facing question directive.
+    //
+    // Phase 2b: when the model classified the deliverable, CONSUME it — an
+    // "answer" deliverable IS informational. Only when the model didn't emit one
+    // (deliverableKind null → legacy cascade, or the model omitted the word) do
+    // we fall back to the legacy regex predicates:
+    //   1. isMetaAnalysisPrompt — self/CLI evaluation, prior-turn reflection.
+    //   2. taskType "general" classified as a real task by L1.
+    //   3. question-shaped prompt that is NOT an implementation request.
+    const informational = ctx.deliverableKind
+        ? ctx.deliverableKind === "answer"
+        : isMetaAnalysisPrompt(ctx.raw) ||
+            (ctx.taskType === "general" && ctx.intentKind === "task") ||
+            (isQuestionLike(ctx.raw) && !isImplementationIntent(ctx.raw));
     const directive = buildDirective({ complexity, phase, grayAreas, informational });
     const budgetChars = Math.floor(ctx.tokenBudget * DIRECTIVE_BUDGET_FRACTION);
     const trimmed = truncateToBudget(directive.text, budgetChars);

package/dist/src/pil/layer6-output.d.ts CHANGED Viewed

@@ -18,5 +18,7 @@ import type { PipelineContext } from "./types.js";
 export declare function isMetaAnalysisPrompt(raw: string): boolean;
 export declare function applyPilSuffix(systemPrompt: string, ctx: PipelineContext, responseToolsActive?: boolean): string;
 export declare function isImplementationIntent(raw: string): boolean;
+export declare function isQuestionLike(raw: string): boolean;
+export declare function prefersStructuredReport(raw: string): boolean;
 export declare function getResponseToolSet(ctx: PipelineContext, providerId?: ProviderId): ToolSet;
 export declare function layer6Output(ctx: PipelineContext): Promise<PipelineContext>;