npm - muonroi-cli - Versions diffs - 1.4.1 → 1.5.0 - Mend

muonroi-cli 1.4.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (172)

package/LICENSE +21 -21
package/README.md +122 -122
package/dist/packages/agent-harness-core/src/predicate.d.ts +1 -1
package/dist/src/agent-harness/__tests__/mock-model.spec.js +48 -1
package/dist/src/agent-harness/mock-model.d.ts +11 -0
package/dist/src/agent-harness/mock-model.js +21 -0
package/dist/src/cli/cost-forensics.js +12 -12
package/dist/src/council/__tests__/clarification-prompt.test.js +51 -0
package/dist/src/council/__tests__/clarifier-ready-gate.test.js +32 -0
package/dist/src/council/__tests__/decisions-lock.test.js +17 -1
package/dist/src/council/__tests__/oauth-reachable.test.d.ts +1 -0
package/dist/src/council/__tests__/oauth-reachable.test.js +31 -0
package/dist/src/council/__tests__/parse-outcome-fallback.test.js +11 -0
package/dist/src/council/clarifier.js +9 -1
package/dist/src/council/debate.js +5 -1
package/dist/src/council/decisions-lock.js +3 -3
package/dist/src/council/index.js +12 -5
package/dist/src/council/leader.d.ts +0 -17
package/dist/src/council/leader.js +22 -15
package/dist/src/council/planner.js +1 -1
package/dist/src/council/prompts.js +63 -57
package/dist/src/council/types.d.ts +7 -0
package/dist/src/ee/__tests__/ee-onboarding.test.d.ts +1 -0
package/dist/src/ee/__tests__/ee-onboarding.test.js +32 -0
package/dist/src/ee/auth.d.ts +9 -0
package/dist/src/ee/auth.js +19 -0
package/dist/src/ee/ee-onboarding.d.ts +5 -0
package/dist/src/ee/ee-onboarding.js +76 -0
package/dist/src/generated/version.d.ts +1 -1
package/dist/src/generated/version.js +1 -1
package/dist/src/headless/output.js +6 -4
package/dist/src/headless/output.test.js +4 -3
package/dist/src/index.js +20 -1
package/dist/src/mcp/__tests__/auto-setup.test.js +74 -0
package/dist/src/mcp/__tests__/client-pool.spec.d.ts +1 -0
package/dist/src/mcp/__tests__/client-pool.spec.js +98 -0
package/dist/src/mcp/__tests__/parallel-build.spec.d.ts +1 -0
package/dist/src/mcp/__tests__/parallel-build.spec.js +67 -0
package/dist/src/mcp/__tests__/smart-filter.test.js +56 -0
package/dist/src/mcp/auto-setup.js +56 -2
package/dist/src/mcp/client-pool.d.ts +46 -0
package/dist/src/mcp/client-pool.js +212 -0
package/dist/src/mcp/oauth-callback.js +2 -2
package/dist/src/mcp/parse-headers.test.js +14 -14
package/dist/src/mcp/runtime.d.ts +28 -0
package/dist/src/mcp/runtime.js +117 -51
package/dist/src/mcp/self-verify-runner.d.ts +14 -0
package/dist/src/mcp/self-verify-runner.js +38 -0
package/dist/src/mcp/setup-guide-text.d.ts +9 -0
package/dist/src/mcp/setup-guide-text.js +84 -0
package/dist/src/mcp/smart-filter.js +49 -0
package/dist/src/mcp/smoke.test.js +43 -43
package/dist/src/mcp/tools-server.d.ts +7 -0
package/dist/src/mcp/tools-server.js +19 -22
package/dist/src/models/catalog.json +349 -349
package/dist/src/ops/__tests__/doctor-ee-health.test.js +21 -0
package/dist/src/ops/doctor.d.ts +3 -2
package/dist/src/ops/doctor.js +47 -11
package/dist/src/ops/doctor.test.js +4 -3
package/dist/src/orchestrator/__tests__/mcp-capability-block.test.d.ts +1 -0
package/dist/src/orchestrator/__tests__/mcp-capability-block.test.js +39 -0
package/dist/src/orchestrator/__tests__/project-stack.test.d.ts +1 -0
package/dist/src/orchestrator/__tests__/project-stack.test.js +65 -0
package/dist/src/orchestrator/batch-turn-runner.js +7 -11
package/dist/src/orchestrator/message-processor.js +57 -27
package/dist/src/orchestrator/orchestrator.js +26 -0
package/dist/src/orchestrator/prompts.d.ts +51 -0
package/dist/src/orchestrator/prompts.js +257 -134
package/dist/src/orchestrator/scope-ceiling.js +6 -1
package/dist/src/orchestrator/stream-runner.js +20 -15
package/dist/src/orchestrator/text-tool-call-detector.test.js +13 -13
package/dist/src/pil/__tests__/clarity-gate.test.js +24 -215
package/dist/src/pil/__tests__/config.test.js +1 -17
package/dist/src/pil/__tests__/discovery.test.js +144 -11
package/dist/src/pil/__tests__/layer1-intent-trace.test.js +7 -2
package/dist/src/pil/__tests__/layer1-intent.test.js +3 -0
package/dist/src/pil/__tests__/layer16-clarity.test.js +32 -116
package/dist/src/pil/__tests__/layer4-gsd.test.js +37 -0
package/dist/src/pil/__tests__/layer6-output.test.js +137 -18
package/dist/src/pil/__tests__/llm-classify.test.js +49 -2
package/dist/src/pil/agent-operating-contract.d.ts +1 -1
package/dist/src/pil/agent-operating-contract.js +2 -0
package/dist/src/pil/agent-operating-contract.test.js +7 -2
package/dist/src/pil/cheap-model-playbook.js +35 -35
package/dist/src/pil/cheap-model-workbooks.js +16 -13
package/dist/src/pil/clarity-gate.d.ts +21 -19
package/dist/src/pil/clarity-gate.js +26 -153
package/dist/src/pil/config.d.ts +9 -1
package/dist/src/pil/config.js +15 -4
package/dist/src/pil/discovery.js +211 -136
package/dist/src/pil/layer1-intent.d.ts +12 -0
package/dist/src/pil/layer1-intent.js +283 -38
package/dist/src/pil/layer1-intent.test.js +210 -4
package/dist/src/pil/layer16-clarity.d.ts +25 -11
package/dist/src/pil/layer16-clarity.js +19 -306
package/dist/src/pil/layer4-gsd.js +18 -6
package/dist/src/pil/layer6-output.d.ts +2 -0
package/dist/src/pil/layer6-output.js +137 -22
package/dist/src/pil/llm-classify.d.ts +26 -0
package/dist/src/pil/llm-classify.js +34 -5
package/dist/src/pil/native-capabilities-workbook.d.ts +1 -1
package/dist/src/pil/native-capabilities-workbook.js +82 -76
package/dist/src/pil/schema.d.ts +8 -0
package/dist/src/pil/schema.js +12 -1
package/dist/src/pil/task-tier-map.js +4 -0
package/dist/src/pil/types.d.ts +11 -1
package/dist/src/product-loop/done-gate.js +3 -3
package/dist/src/product-loop/loop-driver.js +18 -18
package/dist/src/product-loop/progress-snapshot.js +4 -4
package/dist/src/providers/auth/gemini-oauth.js +6 -15
package/dist/src/providers/auth/grok-oauth.js +6 -15
package/dist/src/providers/auth/openai-oauth.js +6 -15
package/dist/src/providers/mcp-vision-bridge.js +48 -48
package/dist/src/reporter/index.js +1 -1
package/dist/src/scaffold/bb-ecosystem-apply.js +47 -47
package/dist/src/scaffold/bb-quality-gate.js +5 -5
package/dist/src/scaffold/continuation-prompt.js +60 -60
package/dist/src/scaffold/init-new.js +453 -453
package/dist/src/self-qa/__tests__/scenario-planner.test.js +3 -3
package/dist/src/self-qa/agentic-loop.js +24 -19
package/dist/src/self-qa/spec-emitter.js +26 -23
package/dist/src/storage/__tests__/migrations.test.js +2 -2
package/dist/src/storage/interaction-log.js +5 -5
package/dist/src/storage/migrations.js +122 -122
package/dist/src/storage/sessions.js +42 -42
package/dist/src/storage/transcript.js +91 -84
package/dist/src/storage/usage.js +14 -14
package/dist/src/storage/workspaces.js +12 -12
package/dist/src/tools/__tests__/native-tools.test.d.ts +1 -0
package/dist/src/tools/__tests__/native-tools.test.js +53 -0
package/dist/src/tools/git-safety.d.ts +61 -0
package/dist/src/tools/git-safety.js +141 -0
package/dist/src/tools/git-safety.test.d.ts +1 -0
package/dist/src/tools/git-safety.test.js +111 -0
package/dist/src/tools/native-tools.d.ts +31 -0
package/dist/src/tools/native-tools.js +273 -0
package/dist/src/tools/registry-git-safety.test.d.ts +7 -0
package/dist/src/tools/registry-git-safety.test.js +92 -0
package/dist/src/tools/registry.js +39 -4
package/dist/src/ui/__tests__/markdown-render.test.d.ts +1 -0
package/dist/src/ui/__tests__/markdown-render.test.js +48 -0
package/dist/src/ui/app.js +0 -0
package/dist/src/ui/components/message-view.js +4 -1
package/dist/src/ui/components/structured-response-view.js +7 -3
package/dist/src/ui/components/tool-group.js +7 -1
package/dist/src/ui/markdown-render.d.ts +41 -0
package/dist/src/ui/markdown-render.js +223 -0
package/dist/src/ui/markdown.d.ts +10 -0
package/dist/src/ui/markdown.js +12 -35
package/dist/src/ui/slash/council-inspect.js +4 -4
package/dist/src/ui/slash/export.js +4 -4
package/dist/src/ui/utils/text.d.ts +8 -0
package/dist/src/ui/utils/text.js +16 -0
package/dist/src/ui/utils/text.test.d.ts +1 -0
package/dist/src/ui/utils/text.test.js +23 -0
package/dist/src/usage/ledger.js +48 -15
package/dist/src/utils/__tests__/footprint-gitignore.test.d.ts +1 -0
package/dist/src/utils/__tests__/footprint-gitignore.test.js +50 -0
package/dist/src/utils/clipboard-image.js +23 -23
package/dist/src/utils/open-url.d.ts +56 -0
package/dist/src/utils/open-url.js +58 -0
package/dist/src/utils/open-url.test.d.ts +1 -0
package/dist/src/utils/open-url.test.js +86 -0
package/dist/src/utils/settings.d.ts +12 -0
package/dist/src/utils/settings.js +48 -0
package/dist/src/utils/side-question.js +2 -2
package/dist/src/utils/skills.js +3 -3
package/dist/src/verify/__tests__/coverage-parsers.test.js +30 -30
package/dist/src/verify/environment.js +2 -1
package/package.json +1 -1
package/dist/src/pil/layer16-clarity.test.js +0 -31
/package/dist/src/{pil/layer16-clarity.test.d.ts → council/__tests__/clarification-prompt.test.d.ts} +0 -0

package/dist/src/pil/cheap-model-workbooks.js CHANGED

@@ -23,19 +23,19 @@
  * Universal anti-ramble convergence block — applies to every task type.
  * Kept tight; the per-task addendum below specialises it.
  */
-export const CHEAP_MODEL_CONVERGENCE = `[CONVERGENCE — minimise tool calls; the system prompt + tools are re-sent every call, so each extra step is expensive]
-- Plan the FEWEST reads you need, then read the specific file/section directly.
-  Do NOT broad-grep, re-read a file you already read, or explore "just in case".
-- The moment you have enough to act, STOP investigating and make the change.
-- Make the SMALLEST correct change for the request; do not widen scope.
-- Finish the action before you answer — never stop mid-step (e.g. "I'm verifying…").
-  When done, state completion in ONE line (what changed + that it's verified);
-  no recap, no next-steps padding.
-- GROUND every claim in what you actually read or ran THIS turn: cite real
-  file:line, and never invent counts, line numbers, names, or bugs. If a number
-  (test/file count) is not verified by a command you ran, run the check or mark
-  it "unverified" — do NOT guess a value or assert a finding you did not observe.
+export const CHEAP_MODEL_CONVERGENCE = `[CONVERGENCE — minimise tool calls; the system prompt + tools are re-sent every call, so each extra step is expensive]
+- Plan the FEWEST reads you need, then read the specific file/section directly.
+  Do NOT broad-grep, re-read a file you already read, or explore "just in case".
+- The moment you have enough to act, STOP investigating and make the change.
+- Make the SMALLEST correct change for the request; do not widen scope.
+- Finish the action before you answer — never stop mid-step (e.g. "I'm verifying…").
+  When done, state completion in ONE line (what changed + that it's verified);
+  no recap, no next-steps padding.
+- GROUND every claim in what you actually read or ran THIS turn: cite real
+  file:line, and never invent counts, line numbers, names, or bugs. If a number
+  (test/file count) is not verified by a command you ran, run the check or mark
+  it "unverified" — do NOT guess a value or assert a finding you did not observe.
 - ANTI-MÙ: After compaction note or pre-warn, emit PRESERVE_FULL_CONTEXT (full) or KEEP_TOOL_IDS: id1,id2 to protect high-value (auto for read_file/grep on src/PLAN/error). Use the ee_query tool with "tool-artifact id=XXX" for on-demand full re-hydrate. Recall checkpoints. `;
 /**
  * Per-task-type addenda. Each is 1–2 tight lines targeting that type's most
@@ -47,6 +47,9 @@ const TASK_WORKBOOKS = {
         "Never mask a failure to make it pass (no continue-on-error, swallowed catch, skipped test, `|| true`).",
     generate: "GENERATE: confirm the target file + the surrounding pattern, write the new code to match it, then stop. " +
         "Do not scaffold extras or restructure unrelated code.",
+    build: "BUILD: scaffold the MINIMUM runnable project/feature that satisfies the request, matching the chosen stack's " +
+        "conventions. Wire it end-to-end and verify it builds/runs before stopping. Do NOT add speculative features, " +
+        "extra files, or config the request did not ask for.",
     refactor: "REFACTOR: change only what was named (rename/extract/move). Preserve behaviour; add nothing new.",
     analyze: "ANALYZE: answer from what you have already read — do not read the whole codebase. Bullet findings, no narrative. " +
         "For a repo/code review, base findings on the ACTUAL code you inspect (file sizes, structure, key modules), not just AGENTS.md/CLAUDE.md docs.",

package/dist/src/pil/clarity-gate.d.ts CHANGED

@@ -1,22 +1,24 @@
-import type { TaskType } from "./types.js";
-export interface L1Signal {
-    confidence: number;
-    taskType: TaskType | null;
-    complexity: "low" | "medium" | "high";
-}
-export declare function isDirectImperative(raw: string): boolean;
-export declare function canInferOutcome(taskType: TaskType | null, raw: string): boolean;
 /**
- * PIL-L6 fix — operational-domain scope (CI, deploy, build, lint) implies
- * scope is the project's pipeline/infra, not a specific file. "fix ci fail"
- * doesn't have a file path but the scope is unambiguous: it's the .github/
- * workflows + whatever those workflows run. Treat as scoped for auto-pass.
+ * src/pil/clarity-gate.ts
+ *
+ * Phase 2 (2026-06-16): the regex/keyword ASK gate (`shouldAutoPass`,
+ * `canInferOutcome`, and the per-modality scope detectors) was removed. The
+ * configured chat model is now the sole decider of whether a turn needs
+ * clarification — see `proposeModelGaps` in `discovery.ts`. Keyword heuristics
+ * deciding what/whether to ask were "bad bad bad UX" (miss billions of cases)
+ * per the user directive; there is no regex fallback by design.
+ *
+ * Two helpers survive because they are NOT ask-gating:
+ *   - `detectNoClarifySignal` — honours an explicit USER instruction ("don't
+ *     ask" / "đừng hỏi"). That is user consent, not classification.
+ *   - `hasOperationalScope` — used only by `getAutofilledOutcome` to pick a
+ *     better outcome LABEL for CI/build/deploy debug turns (output polish, not
+ *     a decision about whether to interview).
+ */
+/**
+ * Operational-domain detector (CI / deploy / build / lint). Used by
+ * `getAutofilledOutcome` to refine the resolved outcome label for pipeline
+ * debug turns; it no longer gates any askcard.
  */
 export declare function hasOperationalScope(raw: string): boolean;
-export declare function countFileReferences(raw: string): number;
-export declare function hasExplicitScope(raw: string): boolean;
-export declare function hasImageScope(raw: string): boolean;
-export declare function hasExternalInfoScope(raw: string): boolean;
-export declare function hasWholeRepoScope(raw: string): boolean;
-export declare function hasSelfContainedComputationScope(raw: string): boolean;
-export declare function shouldAutoPass(l1: L1Signal, raw: string): boolean;
+export declare function detectNoClarifySignal(raw: string): boolean;

package/dist/src/pil/clarity-gate.js CHANGED

@@ -1,162 +1,35 @@
-import { getAutoPassThreshold } from "./config.js";
 /**
- * A direct imperative command — "run the tests", "echo ok", "show the config",
- * "list the ports" — has a self-evident outcome (the command executes / the
- * thing is shown), so it should NOT trigger an outcome-clarification askcard.
- * Requires an executable verb at the very start followed by a concrete object
- * (a bare "run" with no object stays ambiguous → false).
- */
-const DIRECT_IMPERATIVE_RE = /^\s*(run|execute|show|list|print|echo)\b\s+\S/i;
-export function isDirectImperative(raw) {
-    return DIRECT_IMPERATIVE_RE.test(raw);
-}
-export function canInferOutcome(taskType, raw) {
-    if (!taskType)
-        return false;
-    // PIL clarity over-trigger fix: a "general" prompt normally can't infer its
-    // outcome, but a direct imperative command is the exception — its outcome is
-    // obvious, so asking "what's the expected outcome?" is pure noise.
-    if (taskType === "general")
-        return isDirectImperative(raw);
-    const hasErrorRef = /error|exception|stack|TypeError|Cannot|failed|crash|fail(?:s|ed|ing)?|broken|red/i.test(raw);
-    const hasFileLineRef = /\.\w+:\d+/.test(raw);
-    const hasTargetState = /should|must|expect|return|produce|output|become/i.test(raw);
-    const hasAddPattern = /\b(add|create|implement|write|generate)\b.*\b(to|in|for|into)\b/i.test(raw);
-    // PIL-L6 fix — explicit goal phrase in the prompt is itself an outcome
-    // ("goal sẽ là ci green", "want: tests passing", "expect: 0 errors").
-    // Without this, debug prompts that name the desired end-state still
-    // tripped the interview because none of the verb-noun patterns matched.
-    const hasExplicitGoal = /\b(goal|target|expect|want|mong muốn|mong muon|kết quả|ket qua)\b[:\s]/i.test(raw);
-    return hasErrorRef || hasFileLineRef || hasTargetState || hasAddPattern || hasExplicitGoal;
-}
-/**
- * PIL-L6 fix — operational-domain scope (CI, deploy, build, lint) implies
- * scope is the project's pipeline/infra, not a specific file. "fix ci fail"
- * doesn't have a file path but the scope is unambiguous: it's the .github/
- * workflows + whatever those workflows run. Treat as scoped for auto-pass.
- */
-export function hasOperationalScope(raw) {
-    return /\b(ci|cd|build|deploy(?:ment)?|action(?:s)?|workflow|pipeline|lint|tests?|coverage|gh\s+(check|run|workflow))\b/i.test(raw);
-}
-export function countFileReferences(raw) {
-    return (raw.match(/[\w-]+\.\w{1,5}/g) ?? []).filter((m) => /\.(ts|tsx|js|jsx|py|rs|go|java|cs|rb|vue|svelte|css|scss|json|yaml|yml|toml|md)$/i.test(m)).length;
-}
-export function hasExplicitScope(raw) {
-    return /\b(src\/|lib\/|app\/|pages\/|components\/|modules\/|packages\/)\S+/.test(raw);
-}
-/**
- * An image-analysis prompt is scoped to the IMAGE, not the codebase. "analyze
- * diagram.png", "take a screenshot and describe it" name their target directly,
- * so the "Which part of the codebase should this target?" askcard is
- * nonsensical for them — exactly like operational (CI/build) prompts are scoped
- * to the pipeline (see hasOperationalScope). Detect a concrete image signal: an
- * image file extension, a data:image URI, or an unambiguous image noun.
+ * src/pil/clarity-gate.ts
  *
- * Deliberately NARROW: a false positive here SUPPRESSES a legitimate clarifying
- * question (quality risk), so overloaded words are excluded —
- *   - "logo" / "icon" / "diagram" / "chart" / "mockup" appear in real codebase
- *     tasks ("add a logo to the header"),
- *   - bare "image" collides with container/Docker usage ("rebuild the image"),
- *   - "picture" collides with the "bigger picture" idiom,
- *   - Vietnamese substrings (ảnh/hình) collide with frequent non-image words
- *     ("ảnh hưởng", "màn hình", "hình thức").
- * Only a file extension, data:image URI, "screenshot", or "photo" qualify.
- */
-const IMAGE_SCOPE_RE = /\.(png|jpe?g|gif|webp|svg|bmp|tiff?|heic|avif|ico)\b|data:image\/|\bscreen-?shots?\b|\bphotos?\b/i;
-export function hasImageScope(raw) {
-    return IMAGE_SCOPE_RE.test(raw);
-}
-/**
- * A web-search / external-information prompt ("search the web for X", "google
- * the error", a bare URL, "latest news on Y") is scoped to the WEB, not the
- * codebase, so the "Which part of the codebase should this target?" askcard is
- * nonsensical for it — symmetric to hasOperationalScope / hasImageScope. (Live:
- * "search the web for the latest vitest release notes" → taskType=analyze fired
- * the scope askcard and recorded a wrong scope of "src/mcp".)
+ * Phase 2 (2026-06-16): the regex/keyword ASK gate (`shouldAutoPass`,
+ * `canInferOutcome`, and the per-modality scope detectors) was removed. The
+ * configured chat model is now the sole decider of whether a turn needs
+ * clarification — see `proposeModelGaps` in `discovery.ts`. Keyword heuristics
+ * deciding what/whether to ask were "bad bad bad UX" (miss billions of cases)
+ * per the user directive; there is no regex fallback by design.
  *
- * Deliberately NARROW — only UNAMBIGUOUSLY-external intent. It must not reuse
- * the broad hasDocsSignal vocabulary (library/api/install/package), because
- * those words routinely describe real codebase tasks ("add the zod library to
- * the auth module") that genuinely need the scope askcard. In particular a bare
- * "search" is excluded so "search the codebase" / "implement the search
- * feature" still get scoped.
+ * Two helpers survive because they are NOT ask-gating:
+ *   - `detectNoClarifySignal` — honours an explicit USER instruction ("don't
+ *     ask" / "đừng hỏi"). That is user consent, not classification.
+ *   - `hasOperationalScope` — used only by `getAutofilledOutcome` to pick a
+ *     better outcome LABEL for CI/build/deploy debug turns (output polish, not
+ *     a decision about whether to interview).
  */
-const EXTERNAL_INFO_SCOPE_RE = /https?:\/\/\S+|\bsearch\s+(the\s+)?(web|internet|online)\b|\bweb\s*search\b|\bon\s+the\s+(web|internet)\b|\bgoogle\b|\b(news|weather|headlines)\b/i;
-export function hasExternalInfoScope(raw) {
-    return EXTERNAL_INFO_SCOPE_RE.test(raw);
-}
 /**
- * A whole-repo / whole-project prompt ("đánh giá repo này", "review the entire
- * codebase", "audit the whole project") is ALREADY scoped — to everything — so
- * the "Which part of the codebase should this target?" askcard is nonsensical
- * (and worse, it recommends a single bounded context like "src/cli" as the
- * default, which is wrong for a repo-wide eval). Symmetric to the other scope
- * predicates. Live: gemini-2.5-flash classified "đánh giá repo …" as analyze and
- * got the scope askcard whose recommended option was a narrow subdir.
- *
- * Deliberately NARROW — it must NOT fire on a narrow task that merely mentions a
- * repo/project ("add X to this repo", "fix the bug in the project"), or those
- * would wrongly skip a legitimate scope question. So it requires EITHER an
- * explicit wholeness qualifier (whole/entire/all/toàn bộ/cả) on a repo/project/
- * codebase noun, OR an evaluation/overview verb (review/audit/evaluate/assess/
- * analyze/overview · đánh giá/phân tích/tổng quan/kiểm tra) applied to that noun.
+ * Operational-domain detector (CI / deploy / build / lint). Used by
+ * `getAutofilledOutcome` to refine the resolved outcome label for pipeline
+ * debug turns; it no longer gates any askcard.
  */
-const WHOLE_REPO_SCOPE_RE =
-// NOTE: leading anchors on Vietnamese-initial alternatives use (?:^|\s) not
-// \b — JS \b is ASCII-only and never matches before a non-ASCII letter like
-// "đ", so "\bđánh" would silently fail to match "đánh giá repo".
-/\b(whole|entire|overall|all\s+of\s+the|across\s+the)\s+(repo(?:sitory)?|code-?base|project)\b|(?:^|\s)(toàn\s*bộ|toan\s*bo|cả|ca)\s+(repo|dự\s*án|du\s*an|m[ãa]\s*ngu[ồo]n|code-?base|project)\b|\b(review|audit|evaluate|assess|analy[sz]e|summari[sz]e|overview\s+of|summary\s+of)\s+(?:\S+\s+){0,2}?(repo(?:sitory)?|code-?base|project)\b|(?:^|\s)(đánh\s*giá|danh\s*gia|phân\s*tích|phan\s*tich|tổng\s*quan|tong\s*quan|kiểm\s*tra|kiem\s*tra|tóm\s*tắt|tom\s*tat)\s+(?:\S+\s+){0,2}?(toàn|toan|repo|dự\s*án|du\s*an|m[ãa]\s*ngu[ồo]n|code-?base|project)\b/i;
-export function hasWholeRepoScope(raw) {
-    return WHOLE_REPO_SCOPE_RE.test(raw);
-}
-/**
- * A self-contained computation / reasoning prompt supplies its operand data
- * INLINE ("Compute f([3,1,2]) …", "what is the median of [10, 4, 7]?") — the
- * task's target is the data in the prompt, not the codebase, so the "Which part
- * of the codebase should this target?" askcard is nonsensical for it. Symmetric
- * to hasOperationalScope / hasImageScope / hasExternalInfoScope / hasWholeRepoScope.
- *
- * Live: "Compute f([3,1,2]) where f sorts the list ascending then returns the
- * sum of the first two elements." classified taskType=analyze — the regex
- * classifier matched the bare word "list" (regex:read, conf 0.80, which also
- * skips the brain) — and fired BOTH the pil-interview scope askcard (auto
- * "Entire project") and the pil-acceptance card on a pure math problem.
- *
- * Deliberately NARROW — a false positive here SUPPRESSES a legitimate scope
- * question (quality risk), so it requires BOTH:
- *   1. an inline DATA literal — a bracketed comma-list of >=2 numeric or quoted
- *      string values (`[3, 1, 2]`, `["a", "b"]`). A bracketed list of bare
- *      identifiers (`[auth.ts, session.ts]`) is NOT data — those are file/symbol
- *      references and stay codebase-scoped; the regex only accepts numbers and
- *      quoted strings, so it never matches them. Single-element `[0]` (array
- *      indexing) is excluded by the >=2-element requirement.
- *   2. computation framing — a compute/evaluate/sort/sum/statistic verb or a
- *      "what is …" / "given the array …" question frame.
- * The AND keeps real codebase tasks that merely embed a literal (e.g. "set the
- * default retry delays to [100, 200, 400] in the config") correctly scoped.
- */
-const INLINE_DATA_LITERAL_RE = /\[\s*(?:-?\d+(?:\.\d+)?|"[^"]*"|'[^']*')(?:\s*,\s*(?:-?\d+(?:\.\d+)?|"[^"]*"|'[^']*'))+\s*\]/;
-const COMPUTE_FRAMING_RE = /\b(comput(?:e|ing)|calculat(?:e|ing|ion)|evaluat(?:e|ing)|solve|sort(?:s|ed|ing)?|sum|median|mean|average|max(?:imum)?|min(?:imum)?|largest|smallest|reverse[ds]?|result\s+of|what(?:'?s|\s+is|\s+are)|given\s+(?:the\s+)?(?:array|list|sequence|set|matrix|string|numbers?))\b/i;
-export function hasSelfContainedComputationScope(raw) {
-    return INLINE_DATA_LITERAL_RE.test(raw) && COMPUTE_FRAMING_RE.test(raw);
+export function hasOperationalScope(raw) {
+    return /\b(ci|cd|build|deploy(?:ment)?|action(?:s)?|workflow|pipeline|lint|tests?|coverage|gh\s+(check|run|workflow))\b/i.test(raw);
 }
-export function shouldAutoPass(l1, raw) {
-    if (l1.confidence < getAutoPassThreshold())
-        return false;
-    if (!canInferOutcome(l1.taskType, raw))
-        return false;
-    // PIL-L6 fix — debug prompts about CI/build/deploy don't need a file path
-    // because their scope is the pipeline itself. Operational scope counts.
-    if (countFileReferences(raw) === 0 &&
-        !hasExplicitScope(raw) &&
-        !hasOperationalScope(raw) &&
-        !hasImageScope(raw) &&
-        !hasExternalInfoScope(raw) &&
-        !hasWholeRepoScope(raw) &&
-        !hasSelfContainedComputationScope(raw))
-        return false;
-    if (l1.complexity === "high")
-        return false;
-    return true;
+// The user explicitly told the agent NOT to clarify ("don't ask", "trả lời
+// thẳng"). When present, discovery skips ALL interview + acceptance cards. Narrow
+// on purpose: the idiom "don't ask me why" (seeking an explanation, not a
+// directive to skip questions) is excluded via a negative lookahead. EN + VI
+// (with diacritics + bare-ASCII transliterations).
+const NO_CLARIFY_RE = /\b(?:don'?t|do not)\s+ask(?!\s+me\s+(?:why|how|what))\b|\bno\s+(?:questions?|clarif(?:ication|ying)|interview)\b|\bwithout\s+asking\b|\bjust\s+answer\b|\banswer\s+(?:me\s+)?directly\b|\bstop\s+asking\b|đừng\s+hỏi|không\s+(?:cần\s+)?hỏi|khỏi\s+hỏi|trả\s+lời\s+(?:thẳng|luôn|liền|ngay|trực\s*tiếp)|\bdung\s+hoi\b|\bkhong\s+(?:can\s+)?hoi\b|\btra\s+loi\s+(?:thang|luon|lien|ngay)\b/i;
+export function detectNoClarifySignal(raw) {
+    return !!raw && NO_CLARIFY_RE.test(raw);
 }
 //# sourceMappingURL=clarity-gate.js.map

package/dist/src/pil/config.d.ts CHANGED

@@ -5,6 +5,14 @@
  *   Default OFF during rollout; flip to ON after dual-run validation.
  */
 export declare function isUnifiedPilEnabled(): boolean;
+/**
+ * MUONROI_LLM_FIRST_CLASSIFY: model-first Layer-1 classification. When enabled
+ * (default), the configured model classifies taskType/intentKind/style at the
+ * top of the turn and the brittle keyword-regex cascade becomes the OFFLINE
+ * fallback (used only when the model call fails / is not wired). Set to "0" to
+ * revert to the regex-first cascade. Requires opts.llmFallback to be wired
+ * (the orchestrator does this on the main path); without it, the cascade runs.
+ */
+export declare function isLlmFirstClassifyEnabled(): boolean;
 export declare function isDiscoveryEnabled(): boolean;
-export declare function getAutoPassThreshold(): number;
 export declare function getMaxInterviewQuestions(): number;

package/dist/src/pil/config.js CHANGED

@@ -11,13 +11,24 @@ export function isUnifiedPilEnabled() {
         return true;
     return false;
 }
+/**
+ * MUONROI_LLM_FIRST_CLASSIFY: model-first Layer-1 classification. When enabled
+ * (default), the configured model classifies taskType/intentKind/style at the
+ * top of the turn and the brittle keyword-regex cascade becomes the OFFLINE
+ * fallback (used only when the model call fails / is not wired). Set to "0" to
+ * revert to the regex-first cascade. Requires opts.llmFallback to be wired
+ * (the orchestrator does this on the main path); without it, the cascade runs.
+ */
+export function isLlmFirstClassifyEnabled() {
+    return process.env.MUONROI_LLM_FIRST_CLASSIFY !== "0";
+}
 export function isDiscoveryEnabled() {
     return process.env.MUONROI_PIL_DISCOVERY !== "0";
 }
-export function getAutoPassThreshold() {
-    const v = Number(process.env.MUONROI_PIL_AUTOPASS_THRESHOLD);
-    return Number.isFinite(v) && v >= 0.5 && v <= 1.0 ? v : 0.85;
-}
+// Phase 2 (2026-06-16): getAutoPassThreshold() was removed with the regex
+// auto-pass gate (shouldAutoPass). The model now decides whether a turn needs
+// clarification, so there is no confidence threshold to tune. The
+// MUONROI_PIL_AUTOPASS_THRESHOLD env var is therefore inert.
 export function getMaxInterviewQuestions() {
     const v = Number(process.env.MUONROI_PIL_MAX_QUESTIONS);
     return Number.isFinite(v) && v >= 1 && v <= 5 ? v : 3;