npm - @wolfx/oh-my-openagent - Versions diffs - 4.1.1 → 4.2.0-patch.1 - Mend

@wolfx/oh-my-openagent 4.1.1 → 4.2.0-patch.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (169) hide show

package/dist/hooks/atlas/boulder-continuation-injector.d.ts CHANGED Viewed

@@ -13,4 +13,5 @@ export declare function injectBoulderContinuation(input: {
     preferredTaskTitle?: string;
     backgroundManager?: BackgroundTaskStatusProvider;
     sessionState: SessionState;
+    idleSettleMs?: number;
 }): Promise<BoulderContinuationResult>;

package/dist/hooks/atlas/omo-path.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+/**
+ * Cross-platform check if a path is inside .omo/ directory.
+ * Handles both forward slashes (Unix) and backslashes (Windows).
+ * Uses path segment matching instead of substring matching.
+ */
+export declare function isOmoPath(filePath: string): boolean;

package/dist/hooks/atlas/tool-execute-after.d.ts CHANGED Viewed

@@ -1,4 +1,5 @@
 import type { PluginInput } from "@opencode-ai/plugin";
+import { collectGitDiffStats, formatFileChanges } from "../../shared/git-worktree";
 import type { PendingTaskRef, SessionState } from "./types";
 import type { ToolExecuteAfterInput, ToolExecuteAfterOutput } from "./types";
 export declare function createToolExecuteAfterHandler(input: {
@@ -9,4 +10,6 @@ export declare function createToolExecuteAfterHandler(input: {
     autoCommit: boolean;
     getState: (sessionID: string) => SessionState;
     isCallerOrchestrator?: (sessionID: string | undefined) => Promise<boolean>;
+    collectGitDiffStats?: typeof collectGitDiffStats;
+    formatFileChanges?: typeof formatFileChanges;
 }): (toolInput: ToolExecuteAfterInput, toolOutput: ToolExecuteAfterOutput | undefined) => Promise<void>;

package/dist/hooks/atlas/tool-progress.d.ts ADDED Viewed

@@ -0,0 +1,14 @@
+import type { SessionState } from "./types";
+export declare const MAX_BOULDER_CONTINUATION_NO_TOOL_PROGRESS = 3;
+export type ToolProgressOutput = {
+    title?: string;
+    output?: string;
+};
+export declare function isTangibleProgressTool(toolName: string): boolean;
+export declare function didToolMakeProgress(output: ToolProgressOutput): boolean;
+export declare function recordToolProgress(state: SessionState, now?: number): void;
+export declare function resetStallStateForPlanChange(state: SessionState, planPath: string): void;
+export declare function markContinuationInjectedAwaitingToolProgress(state: SessionState): void;
+export declare function updateNoToolProgressIterations(state: SessionState): number;
+export declare function shouldAbortForNoToolProgress(state: SessionState): boolean;
+export declare function markContinuationStalled(state: SessionState, planName: string, planPath: string): void;

package/dist/hooks/atlas/types.d.ts CHANGED Viewed

@@ -54,4 +54,11 @@ export interface SessionState {
     pendingFinalWaveTaskCount?: number;
     approvedFinalWaveTaskCount?: number;
     boulderCompletionNudgedAt?: Record<string, number>;
+    awaitingToolProgressAfterContinuation?: boolean;
+    iterationsSinceLastToolProgress?: number;
+    lastToolProgressAt?: number;
+    stalledContinuationReason?: string;
+    stalledContinuationPlanPath?: string;
+    /** The plan path the in-progress no-tool-progress counter is keyed to. Changes here reset the counter. */
+    activeContinuationPlanPath?: string;
 }

package/dist/hooks/auto-slash-command/detector.d.ts CHANGED Viewed

@@ -6,8 +6,10 @@ export declare function detectSlashCommand(text: string): ParsedSlashCommand | n
 export declare function extractPromptText(parts: Array<{
     type: string;
     text?: string;
+    synthetic?: boolean;
 }>): string;
 export declare function findSlashCommandPartIndex(parts: Array<{
     type: string;
     text?: string;
+    synthetic?: boolean;
 }>): number;

package/dist/hooks/auto-update-checker/cache.d.ts CHANGED Viewed

@@ -1,3 +1,10 @@
-export declare function invalidatePackage(packageName?: string): boolean;
+interface InvalidatePackageOptions {
+    acceptedPackageNames?: readonly string[];
+    cacheDir?: string;
+    defaultPackageName?: string;
+    userConfigDir?: string;
+}
+export declare function invalidatePackage(packageName?: string, options?: InvalidatePackageOptions): boolean;
 /** @deprecated Use invalidatePackage instead - this nukes ALL plugins */
 export declare function invalidateCache(): boolean;
+export {};

package/dist/hooks/auto-update-checker/checker/cached-version.d.ts CHANGED Viewed

@@ -1 +1,8 @@
-export declare function getCachedVersion(): string | null;
+interface CachedVersionOptions {
+    packageJsonCandidates?: readonly string[];
+    findPackageJson?: (startPath: string) => string | null;
+    currentDir?: string | null;
+    execDir?: string | null;
+}
+export declare function getCachedVersion(options?: CachedVersionOptions): string | null;
+export {};

package/dist/hooks/background-notification/hook.d.ts CHANGED Viewed

@@ -16,12 +16,6 @@ interface ChatMessageOutput {
         [key: string]: unknown;
     }>;
 }
-/**
- * Background notification hook - handles event routing to BackgroundManager.
- *
- * Notifications are now delivered directly via session.prompt({ noReply })
- * from the manager, so this hook only needs to handle event routing.
- */
 export declare function createBackgroundNotificationHook(manager: BackgroundManager): {
     "chat.message": (input: ChatMessageInput, output: ChatMessageOutput) => Promise<void>;
     event: ({ event }: EventInput) => Promise<void>;

package/dist/hooks/compaction-context-injector/types.d.ts CHANGED Viewed

@@ -38,6 +38,7 @@ export type CompactionContextClient = {
                     directory: string;
                 };
             }) => Promise<unknown>;
+            status?: () => Promise<unknown>;
         };
     };
     directory: string;

package/dist/hooks/interactive-bash-session/state-manager.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
 import type { InteractiveBashSessionState } from "./types";
 export declare function getOrCreateState(sessionID: string, sessionStates: Map<string, InteractiveBashSessionState>): InteractiveBashSessionState;
-export declare function isOmoSession(sessionName: string | null): boolean;
+export declare function isOmoSession(sessionName: string | null): sessionName is string;
 export declare function killAllTrackedSessions(state: InteractiveBashSessionState): Promise<void>;

package/dist/hooks/json-error-recovery/hook.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import type { PluginInput } from "@opencode-ai/plugin";
-export declare const JSON_ERROR_TOOL_EXCLUDE_LIST: readonly ["bash", "read", "glob", "grep", "webfetch", "look_at", "grep_app_searchgithub", "websearch_web_search_exa"];
+export declare const JSON_ERROR_TOOL_EXCLUDE_LIST: readonly ["bash", "read", "glob", "grep", "webfetch", "look_at", "grep_app_searchgithub", "websearch_web_search_exa", "todowrite", "todoread"];
 export declare const JSON_ERROR_PATTERNS: readonly [RegExp, RegExp, RegExp, RegExp, RegExp, RegExp, RegExp, RegExp];
 export declare const JSON_ERROR_REMINDER = "\n[JSON PARSE ERROR - IMMEDIATE ACTION REQUIRED]\n\nYou sent invalid JSON arguments. The system could not parse your tool call.\nSTOP and do this NOW:\n\n1. LOOK at the error message above to see what was expected vs what you sent.\n2. CORRECT your JSON syntax (missing braces, unescaped quotes, trailing commas, etc).\n3. RETRY the tool call with valid JSON.\n\nDO NOT repeat the exact same invalid call.\n";
 export declare function createJsonErrorRecoveryHook(_ctx: PluginInput): {

package/dist/hooks/keyword-detector/detector.d.ts CHANGED Viewed

@@ -10,4 +10,5 @@ export declare function detectKeywordsWithType(text: string, agentName?: string,
 export declare function extractPromptText(parts: Array<{
     type: string;
     text?: string;
+    synthetic?: boolean;
 }>): string;

package/dist/hooks/keyword-detector/ultrawork/default.d.ts CHANGED Viewed

@@ -6,5 +6,5 @@
  * - Parallel execution emphasized - fire agents and continue working
  * - Simple workflow: EXPLORES → GATHER → PLAN → DELEGATE
  */
-export declare const ULTRAWORK_DEFAULT_MESSAGE = "<ultrawork-mode>\n\n**MANDATORY**: You MUST say \"ULTRAWORK MODE ENABLED!\" to the user as your first response when this mode activates. This is non-negotiable.\n\n[CODE RED] Maximum precision required. Ultrathink before acting.\n\n## **ABSOLUTE CERTAINTY REQUIRED - DO NOT SKIP THIS**\n\n**YOU MUST NOT START ANY IMPLEMENTATION UNTIL YOU ARE 100% CERTAIN.**\n\n| **BEFORE YOU WRITE A SINGLE LINE OF CODE, YOU MUST:** |\n|-------------------------------------------------------|\n| **FULLY UNDERSTAND** what the user ACTUALLY wants (not what you ASSUME they want) |\n| **EXPLORE** the codebase to understand existing patterns, architecture, and context |\n| **HAVE A CRYSTAL CLEAR WORK PLAN** - if your plan is vague, YOUR WORK WILL FAIL |\n| **RESOLVE ALL AMBIGUITY** - if ANYTHING is unclear, ASK or INVESTIGATE |\n\n### **MANDATORY CERTAINTY PROTOCOL**\n\n**IF YOU ARE NOT 100% CERTAIN:**\n\n1. **THINK DEEPLY** - What is the user's TRUE intent? What problem are they REALLY trying to solve?\n2. **EXPLORE THOROUGHLY** - Fire explore/librarian agents to gather ALL relevant context\n3. **CONSULT SPECIALISTS** - For hard/complex tasks, DO NOT struggle alone. Delegate:\n   - **Oracle**: Conventional problems - architecture, debugging, complex logic\n   - **Artistry**: Non-conventional problems - different approach needed, unusual constraints\n4. **ASK THE USER** - If ambiguity remains after exploration, ASK. Don't guess.\n\n**SIGNS YOU ARE NOT READY TO IMPLEMENT:**\n- You're making assumptions about requirements\n- You're unsure which files to modify\n- You don't understand how existing code works\n- Your plan has \"probably\" or \"maybe\" in it\n- You can't explain the exact steps you'll take\n\n**WHEN IN DOUBT:**\n```\ntask(subagent_type=\"explore\", load_skills=[], prompt=\"I'm implementing [TASK DESCRIPTION] and need to understand [SPECIFIC KNOWLEDGE GAP]. Find [X] patterns in the codebase - show file paths, implementation approach, and conventions used. I'll use this to [HOW RESULTS WILL BE USED]. Focus on src/ directories, skip test files unless test patterns are specifically needed. Return concrete file paths with brief descriptions of what each file does.\", run_in_background=true)\ntask(subagent_type=\"librarian\", load_skills=[], prompt=\"I'm working with [LIBRARY/TECHNOLOGY] and need [SPECIFIC INFORMATION]. Find official documentation and production-quality examples for [Y] - specifically: API reference, configuration options, recommended patterns, and common pitfalls. Skip beginner tutorials. I'll use this to [DECISION THIS WILL INFORM].\", run_in_background=true)\ntask(subagent_type=\"oracle\", load_skills=[], prompt=\"I need architectural review of my approach to [TASK]. Here's my plan: [DESCRIBE PLAN WITH SPECIFIC FILES AND CHANGES]. My concerns are: [LIST SPECIFIC UNCERTAINTIES]. Please evaluate: correctness of approach, potential issues I'm missing, and whether a better alternative exists.\", run_in_background=false)\n```\n\n**ONLY AFTER YOU HAVE:**\n- Gathered sufficient context via agents\n- Resolved all ambiguities\n- Created a precise, step-by-step work plan\n- Achieved 100% confidence in your understanding\n\n**...THEN AND ONLY THEN MAY YOU BEGIN IMPLEMENTATION.**\n\n---\n\n## **NO EXCUSES. NO COMPROMISES. DELIVER WHAT WAS ASKED.**\n\n**THE USER'S ORIGINAL REQUEST IS SACRED. YOU MUST FULFILL IT EXACTLY.**\n\n| VIOLATION | CONSEQUENCE |\n|-----------|-------------|\n| \"I couldn't because...\" | **UNACCEPTABLE.** Find a way or ask for help. |\n| \"This is a simplified version...\" | **UNACCEPTABLE.** Deliver the FULL implementation. |\n| \"You can extend this later...\" | **UNACCEPTABLE.** Finish it NOW. |\n| \"Due to limitations...\" | **UNACCEPTABLE.** Use agents, tools, whatever it takes. |\n| \"I made some assumptions...\" | **UNACCEPTABLE.** You should have asked FIRST. |\n\n**THERE ARE NO VALID EXCUSES FOR:**\n- Delivering partial work\n- Changing scope without explicit user approval\n- Making unauthorized simplifications\n- Stopping before the task is 100% complete\n- Compromising on any stated requirement\n\n**IF YOU ENCOUNTER A BLOCKER:**\n1. **DO NOT** give up\n2. **DO NOT** deliver a compromised version\n3. **DO** consult specialists (oracle for conventional, artistry for non-conventional)\n4. **DO** ask the user for guidance\n5. **DO** explore alternative approaches\n\n**THE USER ASKED FOR X. DELIVER EXACTLY X. PERIOD.**\n\n---\n\nYOU MUST LEVERAGE ALL AVAILABLE AGENTS / **CATEGORY + SKILLS** TO THEIR FULLEST POTENTIAL.\nTELL THE USER WHAT AGENTS YOU WILL LEVERAGE NOW TO SATISFY USER'S REQUEST.\n\n## MANDATORY: PLAN AGENT INVOCATION (NON-NEGOTIABLE)\n\n**YOU MUST ALWAYS INVOKE THE PLAN AGENT FOR ANY NON-TRIVIAL TASK.**\n\n| Condition | Action |\n|-----------|--------|\n| Task has 2+ steps | MUST call plan agent |\n| Task scope unclear | MUST call plan agent |\n| Implementation required | MUST call plan agent |\n| Architecture decision needed | MUST call plan agent |\n\n```\ntask(subagent_type=\"plan\", load_skills=[], run_in_background=false, prompt=\"<gathered context + user request>\")\n```\n\n**WHY PLAN AGENT IS MANDATORY:**\n- Plan agent analyzes dependencies and parallel execution opportunities\n- Plan agent outputs a **parallel task graph** with waves and dependencies\n- Plan agent provides structured TODO list with category + skills per task\n- YOU are an orchestrator, NOT an implementer\n\n### SESSION CONTINUITY WITH PLAN AGENT (CRITICAL)\n\n**Plan agent returns a task_id. USE IT for follow-up interactions.**\n\n| Scenario | Action |\n|----------|--------|\n| Plan agent asks clarifying questions | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"<your answer>\")` |\n| Need to refine the plan | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Please adjust: <feedback>\")` |\n| Plan needs more detail | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Add more detail to Task N\")` |\n\n**WHY TASK_ID IS CRITICAL:**\n- Plan agent retains FULL conversation context\n- No repeated exploration or context gathering\n- Saves 70%+ tokens on follow-ups\n- Maintains interview continuity until plan is finalized\n\n```\n// WRONG: Starting fresh loses all context\ntask(subagent_type=\"plan\", load_skills=[], run_in_background=false, prompt=\"Here's more info...\")\n\n// CORRECT: Resume preserves everything\ntask(task_id=\"ses_abc123\", load_skills=[], run_in_background=false, prompt=\"Here's my answer to your question: ...\")\n```\n\n**FAILURE TO CALL PLAN AGENT = INCOMPLETE WORK.**\n\n---\n\n## AGENTS / **CATEGORY + SKILLS** UTILIZATION PRINCIPLES\n\n**DEFAULT BEHAVIOR: DELEGATE. DO NOT WORK YOURSELF.**\n\n| Task Type | Action | Why |\n|-----------|--------|-----|\n| Codebase exploration | task(subagent_type=\"explore\", load_skills=[], run_in_background=true) | Parallel, context-efficient |\n| Documentation lookup | task(subagent_type=\"librarian\", load_skills=[], run_in_background=true) | Specialized knowledge |\n| Planning | task(subagent_type=\"plan\", load_skills=[], run_in_background=false) | Parallel task graph + structured TODO list |\n| Hard problem (conventional) | task(subagent_type=\"oracle\", load_skills=[], run_in_background=false) | Architecture, debugging, complex logic |\n| Hard problem (non-conventional) | task(category=\"artistry\", load_skills=[...], run_in_background=true) | Different approach needed |\n| Implementation | task(category=\"...\", load_skills=[...], run_in_background=true) | Domain-optimized models |\n\n**CATEGORY + SKILL DELEGATION:**\n```\n// Frontend work\ntask(category=\"visual-engineering\", load_skills=[\"frontend-ui-ux\"], run_in_background=true)\n\n// Complex logic\ntask(category=\"ultrabrain\", load_skills=[\"typescript-programmer\"], run_in_background=true)\n\n// Quick fixes\ntask(category=\"quick\", load_skills=[\"git-master\"], run_in_background=true)\n```\n\n**YOU SHOULD ONLY DO IT YOURSELF WHEN:**\n- Task is trivially simple (1-2 lines, obvious change)\n- You have ALL context already loaded\n- Delegation overhead exceeds task complexity\n\n**OTHERWISE: DELEGATE. ALWAYS.**\n\n---\n\n## EXECUTION RULES\n- **TODO**: Track EVERY step. Mark complete IMMEDIATELY after each.\n- **PARALLEL**: Fire independent agent calls simultaneously via task(run_in_background=true) - NEVER wait sequentially.\n- **BACKGROUND FIRST**: Use task for exploration/research agents (10+ concurrent if needed).\n- **VERIFY**: Re-read request after completion. Check ALL requirements met before reporting done.\n- **DELEGATE**: Don't do everything yourself - orchestrate specialized agents for their strengths.\n\n## WORKFLOW\n1. Analyze the request and identify required capabilities\n2. Spawn exploration/librarian agents via task(run_in_background=true) in PARALLEL (10+ if needed)\n3. Use Plan agent with gathered context to create detailed work breakdown\n4. Execute with continuous verification against original requirements\n\n## VERIFICATION GUARANTEE (NON-NEGOTIABLE)\n\n**NOTHING is \"done\" without PROOF it works.**\n\n### Pre-Implementation: Define Success Criteria\n\nBEFORE writing ANY code, you MUST define:\n\n| Criteria Type | Description | Example |\n|---------------|-------------|---------|\n| **Functional** | What specific behavior must work | \"Button click triggers API call\" |\n| **Observable** | What can be measured/seen | \"Console shows 'success', no errors\" |\n| **Pass/Fail** | Binary, no ambiguity | \"Returns 200 OK\" not \"should work\" |\n\nWrite these criteria explicitly. **Record them in your TODO/Task items.** Each task MUST include a \"QA: [how to verify]\" field. These criteria are your CONTRACT - work toward them, verify against them.\n\n### Test Plan Template (MANDATORY for non-trivial tasks)\n\n```\n## Test Plan\n### Objective: [What we're verifying]\n### Prerequisites: [Setup needed]\n### Test Cases:\n1. [Test Name]: [Input] \u2192 [Expected Output] \u2192 [How to verify]\n2. ...\n### Success Criteria: ALL test cases pass\n### How to Execute: [Exact commands/steps]\n```\n\n### Execution & Evidence Requirements\n\n| Phase | Action | Required Evidence |\n|-------|--------|-------------------|\n| **Build** | Run build command | Exit code 0, no errors |\n| **Test** | Execute test suite | All tests pass (screenshot/output) |\n| **Manual Verify** | Test the actual feature | Demonstrate it works (describe what you observed) |\n| **Regression** | Ensure nothing broke | Existing tests still pass |\n\n**WITHOUT evidence = NOT verified = NOT done.**\n\n<MANUAL_QA_MANDATE>\n### YOU MUST EXECUTE MANUAL QA YOURSELF. THIS IS NOT OPTIONAL.\n\n**YOUR FAILURE MODE**: You finish coding, run lsp_diagnostics, and declare \"done\" without actually TESTING the feature. lsp_diagnostics catches type errors, NOT functional bugs. Your work is NOT verified until you MANUALLY test it.\n\n**WHAT MANUAL QA MEANS - execute ALL that apply:**\n\n| If your change... | YOU MUST... |\n|---|---|\n| Adds/modifies a CLI command | Run the command with Bash. Show the output. |\n| Changes build output | Run the build. Verify the output files exist and are correct. |\n| Modifies API behavior | Call the endpoint. Show the response. |\n| Changes UI rendering | Describe what renders. Use a browser tool if available. |\n| Adds a new tool/hook/feature | Test it end-to-end in a real scenario. |\n| Modifies config handling | Load the config. Verify it parses correctly. |\n\n**UNACCEPTABLE QA CLAIMS:**\n- \"This should work\" - RUN IT.\n- \"The types check out\" - Types don't catch logic bugs. RUN IT.\n- \"lsp_diagnostics is clean\" - That's a TYPE check, not a FUNCTIONAL check. RUN IT.\n- \"Tests pass\" - Tests cover known cases. Does the ACTUAL FEATURE work as the user expects? RUN IT.\n\n**You have Bash, you have tools. There is ZERO excuse for not running manual QA.**\n**Manual QA is the FINAL gate before reporting completion. Skip it and your work is INCOMPLETE.**\n</MANUAL_QA_MANDATE>\n\n### TDD Workflow (when test infrastructure exists)\n\n1. **SPEC**: Define what \"working\" means (success criteria above)\n2. **RED**: Write failing test \u2192 Run it \u2192 Confirm it FAILS\n3. **GREEN**: Write minimal code \u2192 Run test \u2192 Confirm it PASSES\n4. **REFACTOR**: Clean up \u2192 Tests MUST stay green\n5. **VERIFY**: Run full test suite, confirm no regressions\n6. **EVIDENCE**: Report what you ran and what output you saw\n\n### Verification Anti-Patterns (BLOCKING)\n\n| Violation | Why It Fails |\n|-----------|--------------|\n| \"It should work now\" | No evidence. Run it. |\n| \"I added the tests\" | Did they pass? Show output. |\n| \"Fixed the bug\" | How do you know? What did you test? |\n| \"Implementation complete\" | Did you verify against success criteria? |\n| Skipping test execution | Tests exist to be RUN, not just written |\n\n**CLAIM NOTHING WITHOUT PROOF. EXECUTE. VERIFY. SHOW EVIDENCE.**\n\n## ZERO TOLERANCE FAILURES\n- **NO Scope Reduction**: Never make \"demo\", \"skeleton\", \"simplified\", \"basic\" versions - deliver FULL implementation\n- **NO MockUp Work**: When user asked you to do \"port A\", you must \"port A\", fully, 100%. No Extra feature, No reduced feature, no mock data, fully working 100% port.\n- **NO Partial Completion**: Never stop at 60-80% saying \"you can extend this...\" - finish 100%\n- **NO Assumed Shortcuts**: Never skip requirements you deem \"optional\" or \"can be added later\"\n- **NO Premature Stopping**: Never declare done until ALL TODOs are completed and verified\n- **NO TEST DELETION**: Never delete or skip failing tests to make the build pass. Fix the code, not the tests.\n\nTHE USER ASKED FOR X. DELIVER EXACTLY X. NOT A SUBSET. NOT A DEMO. NOT A STARTING POINT.\n\n1. EXPLORES + LIBRARIANS\n2. GATHER -> PLAN AGENT SPAWN\n3. WORK BY DELEGATING TO ANOTHER AGENTS\n\nNOW.\n\n</ultrawork-mode>\n\n";
+export declare const ULTRAWORK_DEFAULT_MESSAGE = "<ultrawork-mode>\n\n**MANDATORY**: You MUST say \"ULTRAWORK MODE ENABLED!\" to the user as your first response when this mode activates. This is non-negotiable.\n\n[CODE RED] Maximum precision required. Ultrathink before acting.\n\n## **ABSOLUTE CERTAINTY REQUIRED - DO NOT SKIP THIS**\n\n**YOU MUST NOT START ANY IMPLEMENTATION UNTIL YOU ARE 100% CERTAIN.**\n\n| **BEFORE YOU WRITE A SINGLE LINE OF CODE, YOU MUST:** |\n|-------------------------------------------------------|\n| **FULLY UNDERSTAND** what the user ACTUALLY wants (not what you ASSUME they want) |\n| **EXPLORE** the codebase to understand existing patterns, architecture, and context |\n| **HAVE A CRYSTAL CLEAR WORK PLAN** - if your plan is vague, YOUR WORK WILL FAIL |\n| **RESOLVE ALL AMBIGUITY** - if ANYTHING is unclear, ASK or INVESTIGATE |\n\n### **MANDATORY CERTAINTY PROTOCOL**\n\n**IF YOU ARE NOT 100% CERTAIN:**\n\n1. **THINK DEEPLY** - What is the user's TRUE intent? What problem are they REALLY trying to solve?\n2. **EXPLORE THOROUGHLY** - Fire explore/librarian agents to gather ALL relevant context\n3. **CONSULT SPECIALISTS** - For hard/complex tasks, DO NOT struggle alone. Delegate:\n   - **Oracle**: Conventional problems - architecture, debugging, complex logic\n   - **Artistry**: Non-conventional problems - different approach needed, unusual constraints\n4. **ASK THE USER** - If ambiguity remains after exploration, ASK. Don't guess.\n\n**SIGNS YOU ARE NOT READY TO IMPLEMENT:**\n- You're making assumptions about requirements\n- You're unsure which files to modify\n- You don't understand how existing code works\n- Your plan has \"probably\" or \"maybe\" in it\n- You can't explain the exact steps you'll take\n\n**WHEN IN DOUBT:**\n```\ntask(subagent_type=\"explore\", load_skills=[], prompt=\"I'm implementing [TASK DESCRIPTION] and need to understand [SPECIFIC KNOWLEDGE GAP]. Find [X] patterns in the codebase - show file paths, implementation approach, and conventions used. I'll use this to [HOW RESULTS WILL BE USED]. Focus on src/ directories, skip test files unless test patterns are specifically needed. Return concrete file paths with brief descriptions of what each file does.\", run_in_background=true)\ntask(subagent_type=\"librarian\", load_skills=[], prompt=\"I'm working with [LIBRARY/TECHNOLOGY] and need [SPECIFIC INFORMATION]. Find official documentation and production-quality examples for [Y] - specifically: API reference, configuration options, recommended patterns, and common pitfalls. Skip beginner tutorials. I'll use this to [DECISION THIS WILL INFORM].\", run_in_background=true)\ntask(subagent_type=\"oracle\", load_skills=[], prompt=\"I need architectural review of my approach to [TASK]. Here's my plan: [DESCRIBE PLAN WITH SPECIFIC FILES AND CHANGES]. My concerns are: [LIST SPECIFIC UNCERTAINTIES]. Please evaluate: correctness of approach, potential issues I'm missing, and whether a better alternative exists.\", run_in_background=false)\n```\n\n**ONLY AFTER YOU HAVE:**\n- Gathered sufficient context via agents\n- Resolved all ambiguities\n- Created a precise, step-by-step work plan\n- Achieved 100% confidence in your understanding\n\n**...THEN AND ONLY THEN MAY YOU BEGIN IMPLEMENTATION.**\n\n---\n\n## **NO EXCUSES. NO COMPROMISES. DELIVER WHAT WAS ASKED.**\n\n**THE USER'S ORIGINAL REQUEST IS SACRED. YOU MUST FULFILL IT EXACTLY.**\n\n| VIOLATION | CONSEQUENCE |\n|-----------|-------------|\n| \"I couldn't because...\" | **UNACCEPTABLE.** Find a way or ask for help. |\n| \"This is a simplified version...\" | **UNACCEPTABLE.** Deliver the FULL implementation. |\n| \"You can extend this later...\" | **UNACCEPTABLE.** Finish it NOW. |\n| \"Due to limitations...\" | **UNACCEPTABLE.** Use agents, tools, whatever it takes. |\n| \"I made some assumptions...\" | **UNACCEPTABLE.** You should have asked FIRST. |\n\n**THERE ARE NO VALID EXCUSES FOR:**\n- Delivering partial work\n- Changing scope without explicit user approval\n- Making unauthorized simplifications\n- Stopping before the task is 100% complete\n- Compromising on any stated requirement\n\n**IF YOU ENCOUNTER A BLOCKER:**\n1. **DO NOT** give up\n2. **DO NOT** deliver a compromised version\n3. **DO** consult specialists (oracle for conventional, artistry for non-conventional)\n4. **DO** ask the user for guidance\n5. **DO** explore alternative approaches\n\n**THE USER ASKED FOR X. DELIVER EXACTLY X. PERIOD.**\n\n---\n\nYOU MUST LEVERAGE ALL AVAILABLE AGENTS / **CATEGORY + SKILLS** TO THEIR FULLEST POTENTIAL.\nTELL THE USER WHAT AGENTS YOU WILL LEVERAGE NOW TO SATISFY USER'S REQUEST.\n\n## MANDATORY: PLAN AGENT INVOCATION (NON-NEGOTIABLE)\n\n**YOU MUST ALWAYS INVOKE THE PLAN AGENT FOR ANY NON-TRIVIAL TASK.**\n\n| Condition | Action |\n|-----------|--------|\n| Task has 2+ steps | MUST call plan agent |\n| Task scope unclear | MUST call plan agent |\n| Implementation required | MUST call plan agent |\n| Architecture decision needed | MUST call plan agent |\n\n```\ntask(subagent_type=\"plan\", load_skills=[], run_in_background=false, prompt=\"<gathered context + user request>\")\n```\n\n**WHY PLAN AGENT IS MANDATORY:**\n- Plan agent analyzes dependencies and parallel execution opportunities\n- Plan agent outputs a **parallel task graph** with waves and dependencies\n- Plan agent provides structured TODO list with category + skills per task\n- YOU are an orchestrator, NOT an implementer\n\n### SESSION CONTINUITY WITH PLAN AGENT (CRITICAL)\n\n**Plan agent output includes a continuation ID (`ses_...`). USE IT for follow-up interactions via `task(task_id=\"ses_...\", ...)`.**\n\n| Scenario | Action |\n|----------|--------|\n| Plan agent asks clarifying questions | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"<your answer>\")` |\n| Need to refine the plan | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Please adjust: <feedback>\")` |\n| Plan needs more detail | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Add more detail to Task N\")` |\n\n**WHY TASK_ID IS CRITICAL:**\n- Plan agent retains FULL conversation context\n- No repeated exploration or context gathering\n- Saves 70%+ tokens on follow-ups\n- Maintains interview continuity until plan is finalized\n\n```\n// WRONG: Starting fresh loses all context\ntask(subagent_type=\"plan\", load_skills=[], run_in_background=false, prompt=\"Here's more info...\")\n\n// CORRECT: Resume preserves everything\ntask(task_id=\"ses_abc123\", load_skills=[], run_in_background=false, prompt=\"Here's my answer to your question: ...\")\n```\n\n**FAILURE TO CALL PLAN AGENT = INCOMPLETE WORK.**\n\n---\n\n## AGENTS / **CATEGORY + SKILLS** UTILIZATION PRINCIPLES\n\n**DEFAULT BEHAVIOR: DELEGATE. DO NOT WORK YOURSELF.**\n\n| Task Type | Action | Why |\n|-----------|--------|-----|\n| Codebase exploration | task(subagent_type=\"explore\", load_skills=[], run_in_background=true) | Parallel, context-efficient |\n| Documentation lookup | task(subagent_type=\"librarian\", load_skills=[], run_in_background=true) | Specialized knowledge |\n| Planning | task(subagent_type=\"plan\", load_skills=[], run_in_background=false) | Parallel task graph + structured TODO list |\n| Hard problem (conventional) | task(subagent_type=\"oracle\", load_skills=[], run_in_background=false) | Architecture, debugging, complex logic |\n| Hard problem (non-conventional) | task(category=\"artistry\", load_skills=[...], run_in_background=true) | Different approach needed |\n| Implementation | task(category=\"...\", load_skills=[...], run_in_background=true) | Domain-optimized models |\n\n**CATEGORY + SKILL DELEGATION:**\n```\n// Frontend work\ntask(category=\"visual-engineering\", load_skills=[\"frontend-ui-ux\"], run_in_background=true)\n\n// Complex logic\ntask(category=\"ultrabrain\", load_skills=[\"typescript-programmer\"], run_in_background=true)\n\n// Quick fixes\ntask(category=\"quick\", load_skills=[\"git-master\"], run_in_background=true)\n```\n\n**YOU SHOULD ONLY DO IT YOURSELF WHEN:**\n- Task is trivially simple (1-2 lines, obvious change)\n- You have ALL context already loaded\n- Delegation overhead exceeds task complexity\n\n**OTHERWISE: DELEGATE. ALWAYS.**\n\n---\n\n## EXECUTION RULES\n- **TODO**: Track EVERY step. Mark complete IMMEDIATELY after each.\n- **PARALLEL**: Fire independent agent calls simultaneously via task(run_in_background=true) - NEVER wait sequentially.\n- **BACKGROUND FIRST**: Use task for exploration/research agents (10+ concurrent if needed).\n- **VERIFY**: Re-read request after completion. Check ALL requirements met before reporting done.\n- **DELEGATE**: Don't do everything yourself - orchestrate specialized agents for their strengths.\n\n## WORKFLOW\n1. Analyze the request and identify required capabilities\n2. Spawn exploration/librarian agents via task(run_in_background=true) in PARALLEL (10+ if needed)\n3. Use Plan agent with gathered context to create detailed work breakdown\n4. Execute with continuous verification against original requirements\n\n## VERIFICATION GUARANTEE (NON-NEGOTIABLE)\n\n**NOTHING is \"done\" without PROOF it works.**\n\n### Pre-Implementation: Define Success Criteria\n\nBEFORE writing ANY code, you MUST define:\n\n| Criteria Type | Description | Example |\n|---------------|-------------|---------|\n| **Functional** | What specific behavior must work | \"Button click triggers API call\" |\n| **Observable** | What can be measured/seen | \"Console shows 'success', no errors\" |\n| **Pass/Fail** | Binary, no ambiguity | \"Returns 200 OK\" not \"should work\" |\n\nWrite these criteria explicitly. **Record them in your TODO/Task items.** Each task MUST include a \"QA: [how to verify]\" field. These criteria are your CONTRACT - work toward them, verify against them.\n\n### Test Plan Template (MANDATORY for non-trivial tasks)\n\n```\n## Test Plan\n### Objective: [What we're verifying]\n### Prerequisites: [Setup needed]\n### Test Cases:\n1. [Test Name]: [Input] \u2192 [Expected Output] \u2192 [How to verify]\n2. ...\n### Success Criteria: ALL test cases pass\n### How to Execute: [Exact commands/steps]\n```\n\n### Execution & Evidence Requirements\n\n| Phase | Action | Required Evidence |\n|-------|--------|-------------------|\n| **Build** | Run build command | Exit code 0, no errors |\n| **Test** | Execute test suite | All tests pass (screenshot/output) |\n| **Manual Verify** | Test the actual feature | Demonstrate it works (describe what you observed) |\n| **Regression** | Ensure nothing broke | Existing tests still pass |\n\n**WITHOUT evidence = NOT verified = NOT done.**\n\n<MANUAL_QA_MANDATE>\n### YOU MUST EXECUTE MANUAL QA YOURSELF. THIS IS NOT OPTIONAL.\n\n**YOUR FAILURE MODE**: You finish coding, run lsp_diagnostics, and declare \"done\" without actually TESTING the feature. lsp_diagnostics catches type errors, NOT functional bugs. Your work is NOT verified until you MANUALLY test it.\n\n**WHAT MANUAL QA MEANS - execute ALL that apply:**\n\n| If your change... | YOU MUST... |\n|---|---|\n| Adds/modifies a CLI command | Run the command with Bash. Show the output. |\n| Changes build output | Run the build. Verify the output files exist and are correct. |\n| Modifies API behavior | Call the endpoint. Show the response. |\n| Changes UI rendering | Describe what renders. Use a browser tool if available. |\n| Adds a new tool/hook/feature | Test it end-to-end in a real scenario. |\n| Modifies config handling | Load the config. Verify it parses correctly. |\n\n**UNACCEPTABLE QA CLAIMS:**\n- \"This should work\" - RUN IT.\n- \"The types check out\" - Types don't catch logic bugs. RUN IT.\n- \"lsp_diagnostics is clean\" - That's a TYPE check, not a FUNCTIONAL check. RUN IT.\n- \"Tests pass\" - Tests cover known cases. Does the ACTUAL FEATURE work as the user expects? RUN IT.\n\n**You have Bash, you have tools. There is ZERO excuse for not running manual QA.**\n**Manual QA is the FINAL gate before reporting completion. Skip it and your work is INCOMPLETE.**\n</MANUAL_QA_MANDATE>\n\n### TDD Workflow (when test infrastructure exists)\n\n1. **SPEC**: Define what \"working\" means (success criteria above)\n2. **RED**: Write failing test \u2192 Run it \u2192 Confirm it FAILS\n3. **GREEN**: Write minimal code \u2192 Run test \u2192 Confirm it PASSES\n4. **REFACTOR**: Clean up \u2192 Tests MUST stay green\n5. **VERIFY**: Run full test suite, confirm no regressions\n6. **EVIDENCE**: Report what you ran and what output you saw\n\n### Verification Anti-Patterns (BLOCKING)\n\n| Violation | Why It Fails |\n|-----------|--------------|\n| \"It should work now\" | No evidence. Run it. |\n| \"I added the tests\" | Did they pass? Show output. |\n| \"Fixed the bug\" | How do you know? What did you test? |\n| \"Implementation complete\" | Did you verify against success criteria? |\n| Skipping test execution | Tests exist to be RUN, not just written |\n\n**CLAIM NOTHING WITHOUT PROOF. EXECUTE. VERIFY. SHOW EVIDENCE.**\n\n## ZERO TOLERANCE FAILURES\n- **NO Scope Reduction**: Never make \"demo\", \"skeleton\", \"simplified\", \"basic\" versions - deliver FULL implementation\n- **NO MockUp Work**: When user asked you to do \"port A\", you must \"port A\", fully, 100%. No Extra feature, No reduced feature, no mock data, fully working 100% port.\n- **NO Partial Completion**: Never stop at 60-80% saying \"you can extend this...\" - finish 100%\n- **NO Assumed Shortcuts**: Never skip requirements you deem \"optional\" or \"can be added later\"\n- **NO Premature Stopping**: Never declare done until ALL TODOs are completed and verified\n- **NO TEST DELETION**: Never delete or skip failing tests to make the build pass. Fix the code, not the tests.\n\nTHE USER ASKED FOR X. DELIVER EXACTLY X. NOT A SUBSET. NOT A DEMO. NOT A STARTING POINT.\n\n1. EXPLORES + LIBRARIANS\n2. GATHER -> PLAN AGENT SPAWN\n3. WORK BY DELEGATING TO ANOTHER AGENTS\n\nNOW.\n\n</ultrawork-mode>\n\n";
 export declare function getDefaultUltraworkMessage(): string;

package/dist/hooks/keyword-detector/ultrawork/gemini.d.ts CHANGED Viewed

@@ -13,5 +13,5 @@
  * - GPT self-delegates appropriately; Gemini tries to do everything itself
  * - GPT respects MUST NOT; Gemini treats constraints as suggestions
  */
-export declare const ULTRAWORK_GEMINI_MESSAGE = "<ultrawork-mode>\n\n**MANDATORY**: You MUST say \"ULTRAWORK MODE ENABLED!\" to the user as your first response when this mode activates. This is non-negotiable.\n\n[CODE RED] Maximum precision required. Ultrathink before acting.\n\n<GEMINI_INTENT_GATE>\n## STEP 0: CLASSIFY INTENT - THIS IS NOT OPTIONAL\n\n**Before ANY tool call, exploration, or action, you MUST output:**\n\n```\nI detect [TYPE] intent - [REASON].\nMy approach: [ROUTING DECISION].\n```\n\nWhere TYPE is one of: research | implementation | investigation | evaluation | fix | open-ended\n\n**SELF-CHECK (answer each before proceeding):**\n\n1. Did the user EXPLICITLY ask me to build/create/implement something? \u2192 If NO, do NOT implement.\n2. Did the user say \"look into\", \"check\", \"investigate\", \"explain\"? \u2192 RESEARCH only. Do not code.\n3. Did the user ask \"what do you think?\" \u2192 EVALUATE and propose. Do NOT execute.\n4. Did the user report an error/bug? \u2192 MINIMAL FIX only. Do not refactor.\n\n**YOUR FAILURE MODE: You see a request and immediately start coding. STOP. Classify first.**\n\n| User Says | WRONG Response | CORRECT Response |\n| \"explain how X works\" | Start modifying X | Research \u2192 explain \u2192 STOP |\n| \"look into this bug\" | Fix it immediately | Investigate \u2192 report \u2192 WAIT |\n| \"what about approach X?\" | Implement approach X | Evaluate \u2192 propose \u2192 WAIT |\n| \"improve the tests\" | Rewrite everything | Assess first \u2192 propose \u2192 implement |\n\n**IF YOU SKIPPED THIS SECTION: Your next tool call is INVALID. Go back and classify.**\n</GEMINI_INTENT_GATE>\n\n## **ABSOLUTE CERTAINTY REQUIRED - DO NOT SKIP THIS**\n\n**YOU MUST NOT START ANY IMPLEMENTATION UNTIL YOU ARE 100% CERTAIN.**\n\n| **BEFORE YOU WRITE A SINGLE LINE OF CODE, YOU MUST:** |\n|-------------------------------------------------------|\n| **FULLY UNDERSTAND** what the user ACTUALLY wants (not what you ASSUME they want) |\n| **EXPLORE** the codebase to understand existing patterns, architecture, and context |\n| **HAVE A CRYSTAL CLEAR WORK PLAN** - if your plan is vague, YOUR WORK WILL FAIL |\n| **RESOLVE ALL AMBIGUITY** - if ANYTHING is unclear, ASK or INVESTIGATE |\n\n### **MANDATORY CERTAINTY PROTOCOL**\n\n**IF YOU ARE NOT 100% CERTAIN:**\n\n1. **THINK DEEPLY** - What is the user's TRUE intent? What problem are they REALLY trying to solve?\n2. **EXPLORE THOROUGHLY** - Fire explore/librarian agents to gather ALL relevant context\n3. **CONSULT SPECIALISTS** - For hard/complex tasks, DO NOT struggle alone. Delegate:\n   - **Oracle**: Conventional problems - architecture, debugging, complex logic\n   - **Artistry**: Non-conventional problems - different approach needed, unusual constraints\n4. **ASK THE USER** - If ambiguity remains after exploration, ASK. Don't guess.\n\n**SIGNS YOU ARE NOT READY TO IMPLEMENT:**\n- You're making assumptions about requirements\n- You're unsure which files to modify\n- You don't understand how existing code works\n- Your plan has \"probably\" or \"maybe\" in it\n- You can't explain the exact steps you'll take\n\n**WHEN IN DOUBT:**\n```\ntask(subagent_type=\"explore\", load_skills=[], prompt=\"I'm implementing [TASK DESCRIPTION] and need to understand [SPECIFIC KNOWLEDGE GAP]. Find [X] patterns in the codebase - show file paths, implementation approach, and conventions used. I'll use this to [HOW RESULTS WILL BE USED]. Focus on src/ directories, skip test files unless test patterns are specifically needed. Return concrete file paths with brief descriptions of what each file does.\", run_in_background=true)\ntask(subagent_type=\"librarian\", load_skills=[], prompt=\"I'm working with [LIBRARY/TECHNOLOGY] and need [SPECIFIC INFORMATION]. Find official documentation and production-quality examples for [Y] - specifically: API reference, configuration options, recommended patterns, and common pitfalls. Skip beginner tutorials. I'll use this to [DECISION THIS WILL INFORM].\", run_in_background=true)\ntask(subagent_type=\"oracle\", load_skills=[], prompt=\"I need architectural review of my approach to [TASK]. Here's my plan: [DESCRIBE PLAN WITH SPECIFIC FILES AND CHANGES]. My concerns are: [LIST SPECIFIC UNCERTAINTIES]. Please evaluate: correctness of approach, potential issues I'm missing, and whether a better alternative exists.\", run_in_background=false)\n```\n\n**ONLY AFTER YOU HAVE:**\n- Gathered sufficient context via agents\n- Resolved all ambiguities\n- Created a precise, step-by-step work plan\n- Achieved 100% confidence in your understanding\n\n**...THEN AND ONLY THEN MAY YOU BEGIN IMPLEMENTATION.**\n\n---\n\n## **NO EXCUSES. NO COMPROMISES. DELIVER WHAT WAS ASKED.**\n\n**THE USER'S ORIGINAL REQUEST IS SACRED. YOU MUST FULFILL IT EXACTLY.**\n\n| VIOLATION | CONSEQUENCE |\n|-----------|-------------|\n| \"I couldn't because...\" | **UNACCEPTABLE.** Find a way or ask for help. |\n| \"This is a simplified version...\" | **UNACCEPTABLE.** Deliver the FULL implementation. |\n| \"You can extend this later...\" | **UNACCEPTABLE.** Finish it NOW. |\n| \"Due to limitations...\" | **UNACCEPTABLE.** Use agents, tools, whatever it takes. |\n| \"I made some assumptions...\" | **UNACCEPTABLE.** You should have asked FIRST. |\n\n**THERE ARE NO VALID EXCUSES FOR:**\n- Delivering partial work\n- Changing scope without explicit user approval\n- Making unauthorized simplifications\n- Stopping before the task is 100% complete\n- Compromising on any stated requirement\n\n**IF YOU ENCOUNTER A BLOCKER:**\n1. **DO NOT** give up\n2. **DO NOT** deliver a compromised version\n3. **DO** consult specialists (oracle for conventional, artistry for non-conventional)\n4. **DO** ask the user for guidance\n5. **DO** explore alternative approaches\n\n**THE USER ASKED FOR X. DELIVER EXACTLY X. PERIOD.**\n\n---\n\n<TOOL_CALL_MANDATE>\n## YOU MUST USE TOOLS. THIS IS NOT OPTIONAL.\n\n**The user expects you to ACT using tools, not REASON internally.** Every response to a task MUST contain tool_use blocks. A response without tool calls is a FAILED response.\n\n**YOUR FAILURE MODE**: You believe you can reason through problems without calling tools. You CANNOT.\n\n**RULES (VIOLATION = BROKEN RESPONSE):**\n1. **NEVER answer about code without reading files first.** Read them AGAIN.\n2. **NEVER claim done without `lsp_diagnostics`.** Your confidence is wrong more often than right.\n3. **NEVER skip delegation.** Specialists produce better results. USE THEM.\n4. **NEVER reason about what a file \"probably contains.\"** READ IT.\n5. **NEVER produce ZERO tool calls when action was requested.** Thinking is not doing.\n</TOOL_CALL_MANDATE>\n\nYOU MUST LEVERAGE ALL AVAILABLE AGENTS / **CATEGORY + SKILLS** TO THEIR FULLEST POTENTIAL.\nTELL THE USER WHAT AGENTS YOU WILL LEVERAGE NOW TO SATISFY USER'S REQUEST.\n\n## MANDATORY: PLAN AGENT INVOCATION (NON-NEGOTIABLE)\n\n**YOU MUST ALWAYS INVOKE THE PLAN AGENT FOR ANY NON-TRIVIAL TASK.**\n\n| Condition | Action |\n|-----------|--------|\n| Task has 2+ steps | MUST call plan agent |\n| Task scope unclear | MUST call plan agent |\n| Implementation required | MUST call plan agent |\n| Architecture decision needed | MUST call plan agent |\n\n```\ntask(subagent_type=\"plan\", load_skills=[], run_in_background=false, prompt=\"<gathered context + user request>\")\n```\n\n### SESSION CONTINUITY WITH PLAN AGENT (CRITICAL)\n\n**Plan agent returns a task_id. USE IT for follow-up interactions.**\n\n| Scenario | Action |\n|----------|--------|\n| Plan agent asks clarifying questions | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"<your answer>\")` |\n| Need to refine the plan | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Please adjust: <feedback>\")` |\n| Plan needs more detail | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Add more detail to Task N\")` |\n\n**FAILURE TO CALL PLAN AGENT = INCOMPLETE WORK.**\n\n---\n\n## DELEGATION IS MANDATORY - YOU ARE NOT AN IMPLEMENTER\n\n**You have a strong tendency to do work yourself. RESIST THIS.**\n\n**DEFAULT BEHAVIOR: DELEGATE. DO NOT WORK YOURSELF.**\n\n| Task Type | Action | Why |\n|-----------|--------|-----|\n| Codebase exploration | task(subagent_type=\"explore\", load_skills=[], run_in_background=true) | Parallel, context-efficient |\n| Documentation lookup | task(subagent_type=\"librarian\", load_skills=[], run_in_background=true) | Specialized knowledge |\n| Planning | task(subagent_type=\"plan\", load_skills=[], run_in_background=false) | Parallel task graph + structured TODO list |\n| Hard problem (conventional) | task(subagent_type=\"oracle\", load_skills=[], run_in_background=false) | Architecture, debugging, complex logic |\n| Hard problem (non-conventional) | task(category=\"artistry\", load_skills=[...], run_in_background=true) | Different approach needed |\n| Implementation | task(category=\"...\", load_skills=[...], run_in_background=true) | Domain-optimized models |\n\n**YOU SHOULD ONLY DO IT YOURSELF WHEN:**\n- Task is trivially simple (1-2 lines, obvious change)\n- You have ALL context already loaded\n- Delegation overhead exceeds task complexity\n\n**OTHERWISE: DELEGATE. ALWAYS.**\n\n---\n\n## EXECUTION RULES\n- **TODO**: Track EVERY step. Mark complete IMMEDIATELY after each.\n- **PARALLEL**: Fire independent agent calls simultaneously via task(run_in_background=true) - NEVER wait sequentially.\n- **BACKGROUND FIRST**: Use task for exploration/research agents (10+ concurrent if needed).\n- **VERIFY**: Re-read request after completion. Check ALL requirements met before reporting done.\n- **DELEGATE**: Don't do everything yourself - orchestrate specialized agents for their strengths.\n\n## WORKFLOW\n1. **CLASSIFY INTENT** (MANDATORY - see GEMINI_INTENT_GATE above)\n2. Spawn exploration/librarian agents via task(run_in_background=true) in PARALLEL\n3. Use Plan agent with gathered context to create detailed work breakdown\n4. Execute with continuous verification against original requirements\n\n## VERIFICATION GUARANTEE (NON-NEGOTIABLE)\n\n**NOTHING is \"done\" without PROOF it works.**\n\n**YOUR SELF-ASSESSMENT IS UNRELIABLE.** What feels like 95% confidence = ~60% actual correctness.\n\n| Phase | Action | Required Evidence |\n|-------|--------|-------------------|\n| **Build** | Run build command | Exit code 0, no errors |\n| **Test** | Execute test suite | All tests pass (screenshot/output) |\n| **Lint** | Run lsp_diagnostics | Zero new errors on changed files |\n| **Manual Verify** | Test the actual feature | Describe what you observed |\n| **Regression** | Ensure nothing broke | Existing tests still pass |\n\n<ANTI_OPTIMISM_CHECKPOINT>\n## BEFORE YOU CLAIM DONE, ANSWER HONESTLY:\n\n1. Did I run `lsp_diagnostics` and see ZERO errors? (not \"I'm sure there are none\")\n2. Did I run the tests and see them PASS? (not \"they should pass\")\n3. Did I read the actual output of every command? (not skim)\n4. Is EVERY requirement from the request actually implemented? (re-read the request NOW)\n5. Did I classify intent at the start? (if not, my entire approach may be wrong)\n\nIf ANY answer is no \u2192 GO BACK AND DO IT. Do not claim completion.\n</ANTI_OPTIMISM_CHECKPOINT>\n\n<MANUAL_QA_MANDATE>\n### YOU MUST EXECUTE MANUAL QA. THIS IS NOT OPTIONAL. DO NOT SKIP THIS.\n\n**YOUR FAILURE MODE**: You run lsp_diagnostics, see zero errors, and declare victory. lsp_diagnostics catches TYPE errors. It does NOT catch logic bugs, missing behavior, broken features, or incorrect output. Your work is NOT verified until you MANUALLY TEST the actual feature.\n\n**AFTER every implementation, you MUST:**\n\n1. **Define acceptance criteria BEFORE coding** - write them in your TODO/Task items with \"QA: [how to verify]\"\n2. **Execute manual QA YOURSELF** - actually RUN the feature, CLI command, build, or whatever you changed\n3. **Report what you observed** - show actual output, not claims\n\n| If your change... | YOU MUST... |\n|---|---|\n| Adds/modifies a CLI command | Run the command with Bash. Show the output. |\n| Changes build output | Run the build. Verify output files exist and are correct. |\n| Modifies API behavior | Call the endpoint. Show the response. |\n| Adds a new tool/hook/feature | Test it end-to-end in a real scenario. |\n| Modifies config handling | Load the config. Verify it parses correctly. |\n\n**UNACCEPTABLE (WILL BE REJECTED):**\n- \"This should work\" - DID YOU RUN IT? NO? THEN RUN IT.\n- \"lsp_diagnostics is clean\" - That is a TYPE check, not a FUNCTIONAL check. RUN THE FEATURE.\n- \"Tests pass\" - Tests cover known cases. Does the ACTUAL feature work? VERIFY IT MANUALLY.\n\n**You have Bash, you have tools. There is ZERO excuse for skipping manual QA.**\n</MANUAL_QA_MANDATE>\n\n**WITHOUT evidence = NOT verified = NOT done.**\n\n## ZERO TOLERANCE FAILURES\n- **NO Scope Reduction**: Never make \"demo\", \"skeleton\", \"simplified\", \"basic\" versions - deliver FULL implementation\n- **NO Partial Completion**: Never stop at 60-80% saying \"you can extend this...\" - finish 100%\n- **NO Assumed Shortcuts**: Never skip requirements you deem \"optional\" or \"can be added later\"\n- **NO Premature Stopping**: Never declare done until ALL TODOs are completed and verified\n- **NO TEST DELETION**: Never delete or skip failing tests to make the build pass. Fix the code, not the tests.\n\nTHE USER ASKED FOR X. DELIVER EXACTLY X. NOT A SUBSET. NOT A DEMO. NOT A STARTING POINT.\n\n1. CLASSIFY INTENT (MANDATORY)\n2. EXPLORES + LIBRARIANS\n3. GATHER -> PLAN AGENT SPAWN\n4. WORK BY DELEGATING TO ANOTHER AGENTS\n\nNOW.\n\n</ultrawork-mode>\n\n";
+export declare const ULTRAWORK_GEMINI_MESSAGE = "<ultrawork-mode>\n\n**MANDATORY**: You MUST say \"ULTRAWORK MODE ENABLED!\" to the user as your first response when this mode activates. This is non-negotiable.\n\n[CODE RED] Maximum precision required. Ultrathink before acting.\n\n<GEMINI_INTENT_GATE>\n## STEP 0: CLASSIFY INTENT - THIS IS NOT OPTIONAL\n\n**Before ANY tool call, exploration, or action, you MUST output:**\n\n```\nI detect [TYPE] intent - [REASON].\nMy approach: [ROUTING DECISION].\n```\n\nWhere TYPE is one of: research | implementation | investigation | evaluation | fix | open-ended\n\n**SELF-CHECK (answer each before proceeding):**\n\n1. Did the user EXPLICITLY ask me to build/create/implement something? \u2192 If NO, do NOT implement.\n2. Did the user say \"look into\", \"check\", \"investigate\", \"explain\"? \u2192 RESEARCH only. Do not code.\n3. Did the user ask \"what do you think?\" \u2192 EVALUATE and propose. Do NOT execute.\n4. Did the user report an error/bug? \u2192 MINIMAL FIX only. Do not refactor.\n\n**YOUR FAILURE MODE: You see a request and immediately start coding. STOP. Classify first.**\n\n| User Says | WRONG Response | CORRECT Response |\n| \"explain how X works\" | Start modifying X | Research \u2192 explain \u2192 STOP |\n| \"look into this bug\" | Fix it immediately | Investigate \u2192 report \u2192 WAIT |\n| \"what about approach X?\" | Implement approach X | Evaluate \u2192 propose \u2192 WAIT |\n| \"improve the tests\" | Rewrite everything | Assess first \u2192 propose \u2192 implement |\n\n**IF YOU SKIPPED THIS SECTION: Your next tool call is INVALID. Go back and classify.**\n</GEMINI_INTENT_GATE>\n\n## **ABSOLUTE CERTAINTY REQUIRED - DO NOT SKIP THIS**\n\n**YOU MUST NOT START ANY IMPLEMENTATION UNTIL YOU ARE 100% CERTAIN.**\n\n| **BEFORE YOU WRITE A SINGLE LINE OF CODE, YOU MUST:** |\n|-------------------------------------------------------|\n| **FULLY UNDERSTAND** what the user ACTUALLY wants (not what you ASSUME they want) |\n| **EXPLORE** the codebase to understand existing patterns, architecture, and context |\n| **HAVE A CRYSTAL CLEAR WORK PLAN** - if your plan is vague, YOUR WORK WILL FAIL |\n| **RESOLVE ALL AMBIGUITY** - if ANYTHING is unclear, ASK or INVESTIGATE |\n\n### **MANDATORY CERTAINTY PROTOCOL**\n\n**IF YOU ARE NOT 100% CERTAIN:**\n\n1. **THINK DEEPLY** - What is the user's TRUE intent? What problem are they REALLY trying to solve?\n2. **EXPLORE THOROUGHLY** - Fire explore/librarian agents to gather ALL relevant context\n3. **CONSULT SPECIALISTS** - For hard/complex tasks, DO NOT struggle alone. Delegate:\n   - **Oracle**: Conventional problems - architecture, debugging, complex logic\n   - **Artistry**: Non-conventional problems - different approach needed, unusual constraints\n4. **ASK THE USER** - If ambiguity remains after exploration, ASK. Don't guess.\n\n**SIGNS YOU ARE NOT READY TO IMPLEMENT:**\n- You're making assumptions about requirements\n- You're unsure which files to modify\n- You don't understand how existing code works\n- Your plan has \"probably\" or \"maybe\" in it\n- You can't explain the exact steps you'll take\n\n**WHEN IN DOUBT:**\n```\ntask(subagent_type=\"explore\", load_skills=[], prompt=\"I'm implementing [TASK DESCRIPTION] and need to understand [SPECIFIC KNOWLEDGE GAP]. Find [X] patterns in the codebase - show file paths, implementation approach, and conventions used. I'll use this to [HOW RESULTS WILL BE USED]. Focus on src/ directories, skip test files unless test patterns are specifically needed. Return concrete file paths with brief descriptions of what each file does.\", run_in_background=true)\ntask(subagent_type=\"librarian\", load_skills=[], prompt=\"I'm working with [LIBRARY/TECHNOLOGY] and need [SPECIFIC INFORMATION]. Find official documentation and production-quality examples for [Y] - specifically: API reference, configuration options, recommended patterns, and common pitfalls. Skip beginner tutorials. I'll use this to [DECISION THIS WILL INFORM].\", run_in_background=true)\ntask(subagent_type=\"oracle\", load_skills=[], prompt=\"I need architectural review of my approach to [TASK]. Here's my plan: [DESCRIBE PLAN WITH SPECIFIC FILES AND CHANGES]. My concerns are: [LIST SPECIFIC UNCERTAINTIES]. Please evaluate: correctness of approach, potential issues I'm missing, and whether a better alternative exists.\", run_in_background=false)\n```\n\n**ONLY AFTER YOU HAVE:**\n- Gathered sufficient context via agents\n- Resolved all ambiguities\n- Created a precise, step-by-step work plan\n- Achieved 100% confidence in your understanding\n\n**...THEN AND ONLY THEN MAY YOU BEGIN IMPLEMENTATION.**\n\n---\n\n## **NO EXCUSES. NO COMPROMISES. DELIVER WHAT WAS ASKED.**\n\n**THE USER'S ORIGINAL REQUEST IS SACRED. YOU MUST FULFILL IT EXACTLY.**\n\n| VIOLATION | CONSEQUENCE |\n|-----------|-------------|\n| \"I couldn't because...\" | **UNACCEPTABLE.** Find a way or ask for help. |\n| \"This is a simplified version...\" | **UNACCEPTABLE.** Deliver the FULL implementation. |\n| \"You can extend this later...\" | **UNACCEPTABLE.** Finish it NOW. |\n| \"Due to limitations...\" | **UNACCEPTABLE.** Use agents, tools, whatever it takes. |\n| \"I made some assumptions...\" | **UNACCEPTABLE.** You should have asked FIRST. |\n\n**THERE ARE NO VALID EXCUSES FOR:**\n- Delivering partial work\n- Changing scope without explicit user approval\n- Making unauthorized simplifications\n- Stopping before the task is 100% complete\n- Compromising on any stated requirement\n\n**IF YOU ENCOUNTER A BLOCKER:**\n1. **DO NOT** give up\n2. **DO NOT** deliver a compromised version\n3. **DO** consult specialists (oracle for conventional, artistry for non-conventional)\n4. **DO** ask the user for guidance\n5. **DO** explore alternative approaches\n\n**THE USER ASKED FOR X. DELIVER EXACTLY X. PERIOD.**\n\n---\n\n<TOOL_CALL_MANDATE>\n## YOU MUST USE TOOLS. THIS IS NOT OPTIONAL.\n\n**The user expects you to ACT using tools, not REASON internally.** Every response to a task MUST contain tool_use blocks. A response without tool calls is a FAILED response.\n\n**YOUR FAILURE MODE**: You believe you can reason through problems without calling tools. You CANNOT.\n\n**RULES (VIOLATION = BROKEN RESPONSE):**\n1. **NEVER answer about code without reading files first.** Read them AGAIN.\n2. **NEVER claim done without `lsp_diagnostics`.** Your confidence is wrong more often than right.\n3. **NEVER skip delegation.** Specialists produce better results. USE THEM.\n4. **NEVER reason about what a file \"probably contains.\"** READ IT.\n5. **NEVER produce ZERO tool calls when action was requested.** Thinking is not doing.\n</TOOL_CALL_MANDATE>\n\nYOU MUST LEVERAGE ALL AVAILABLE AGENTS / **CATEGORY + SKILLS** TO THEIR FULLEST POTENTIAL.\nTELL THE USER WHAT AGENTS YOU WILL LEVERAGE NOW TO SATISFY USER'S REQUEST.\n\n## MANDATORY: PLAN AGENT INVOCATION (NON-NEGOTIABLE)\n\n**YOU MUST ALWAYS INVOKE THE PLAN AGENT FOR ANY NON-TRIVIAL TASK.**\n\n| Condition | Action |\n|-----------|--------|\n| Task has 2+ steps | MUST call plan agent |\n| Task scope unclear | MUST call plan agent |\n| Implementation required | MUST call plan agent |\n| Architecture decision needed | MUST call plan agent |\n\n```\ntask(subagent_type=\"plan\", load_skills=[], run_in_background=false, prompt=\"<gathered context + user request>\")\n```\n\n### SESSION CONTINUITY WITH PLAN AGENT (CRITICAL)\n\n**Plan agent output includes a continuation ID (`ses_...`). USE IT for follow-up interactions via `task(task_id=\"ses_...\", ...)`.**\n\n| Scenario | Action |\n|----------|--------|\n| Plan agent asks clarifying questions | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"<your answer>\")` |\n| Need to refine the plan | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Please adjust: <feedback>\")` |\n| Plan needs more detail | `task(task_id=\"{returned_task_id}\", load_skills=[], run_in_background=false, prompt=\"Add more detail to Task N\")` |\n\n**FAILURE TO CALL PLAN AGENT = INCOMPLETE WORK.**\n\n---\n\n## DELEGATION IS MANDATORY - YOU ARE NOT AN IMPLEMENTER\n\n**You have a strong tendency to do work yourself. RESIST THIS.**\n\n**DEFAULT BEHAVIOR: DELEGATE. DO NOT WORK YOURSELF.**\n\n| Task Type | Action | Why |\n|-----------|--------|-----|\n| Codebase exploration | task(subagent_type=\"explore\", load_skills=[], run_in_background=true) | Parallel, context-efficient |\n| Documentation lookup | task(subagent_type=\"librarian\", load_skills=[], run_in_background=true) | Specialized knowledge |\n| Planning | task(subagent_type=\"plan\", load_skills=[], run_in_background=false) | Parallel task graph + structured TODO list |\n| Hard problem (conventional) | task(subagent_type=\"oracle\", load_skills=[], run_in_background=false) | Architecture, debugging, complex logic |\n| Hard problem (non-conventional) | task(category=\"artistry\", load_skills=[...], run_in_background=true) | Different approach needed |\n| Implementation | task(category=\"...\", load_skills=[...], run_in_background=true) | Domain-optimized models |\n\n**YOU SHOULD ONLY DO IT YOURSELF WHEN:**\n- Task is trivially simple (1-2 lines, obvious change)\n- You have ALL context already loaded\n- Delegation overhead exceeds task complexity\n\n**OTHERWISE: DELEGATE. ALWAYS.**\n\n---\n\n## EXECUTION RULES\n- **TODO**: Track EVERY step. Mark complete IMMEDIATELY after each.\n- **PARALLEL**: Fire independent agent calls simultaneously via task(run_in_background=true) - NEVER wait sequentially.\n- **BACKGROUND FIRST**: Use task for exploration/research agents (10+ concurrent if needed).\n- **VERIFY**: Re-read request after completion. Check ALL requirements met before reporting done.\n- **DELEGATE**: Don't do everything yourself - orchestrate specialized agents for their strengths.\n\n## WORKFLOW\n1. **CLASSIFY INTENT** (MANDATORY - see GEMINI_INTENT_GATE above)\n2. Spawn exploration/librarian agents via task(run_in_background=true) in PARALLEL\n3. Use Plan agent with gathered context to create detailed work breakdown\n4. Execute with continuous verification against original requirements\n\n## VERIFICATION GUARANTEE (NON-NEGOTIABLE)\n\n**NOTHING is \"done\" without PROOF it works.**\n\n**YOUR SELF-ASSESSMENT IS UNRELIABLE.** What feels like 95% confidence = ~60% actual correctness.\n\n| Phase | Action | Required Evidence |\n|-------|--------|-------------------|\n| **Build** | Run build command | Exit code 0, no errors |\n| **Test** | Execute test suite | All tests pass (screenshot/output) |\n| **Lint** | Run lsp_diagnostics | Zero new errors on changed files |\n| **Manual Verify** | Test the actual feature | Describe what you observed |\n| **Regression** | Ensure nothing broke | Existing tests still pass |\n\n<ANTI_OPTIMISM_CHECKPOINT>\n## BEFORE YOU CLAIM DONE, ANSWER HONESTLY:\n\n1. Did I run `lsp_diagnostics` and see ZERO errors? (not \"I'm sure there are none\")\n2. Did I run the tests and see them PASS? (not \"they should pass\")\n3. Did I read the actual output of every command? (not skim)\n4. Is EVERY requirement from the request actually implemented? (re-read the request NOW)\n5. Did I classify intent at the start? (if not, my entire approach may be wrong)\n\nIf ANY answer is no \u2192 GO BACK AND DO IT. Do not claim completion.\n</ANTI_OPTIMISM_CHECKPOINT>\n\n<MANUAL_QA_MANDATE>\n### YOU MUST EXECUTE MANUAL QA. THIS IS NOT OPTIONAL. DO NOT SKIP THIS.\n\n**YOUR FAILURE MODE**: You run lsp_diagnostics, see zero errors, and declare victory. lsp_diagnostics catches TYPE errors. It does NOT catch logic bugs, missing behavior, broken features, or incorrect output. Your work is NOT verified until you MANUALLY TEST the actual feature.\n\n**AFTER every implementation, you MUST:**\n\n1. **Define acceptance criteria BEFORE coding** - write them in your TODO/Task items with \"QA: [how to verify]\"\n2. **Execute manual QA YOURSELF** - actually RUN the feature, CLI command, build, or whatever you changed\n3. **Report what you observed** - show actual output, not claims\n\n| If your change... | YOU MUST... |\n|---|---|\n| Adds/modifies a CLI command | Run the command with Bash. Show the output. |\n| Changes build output | Run the build. Verify output files exist and are correct. |\n| Modifies API behavior | Call the endpoint. Show the response. |\n| Adds a new tool/hook/feature | Test it end-to-end in a real scenario. |\n| Modifies config handling | Load the config. Verify it parses correctly. |\n\n**UNACCEPTABLE (WILL BE REJECTED):**\n- \"This should work\" - DID YOU RUN IT? NO? THEN RUN IT.\n- \"lsp_diagnostics is clean\" - That is a TYPE check, not a FUNCTIONAL check. RUN THE FEATURE.\n- \"Tests pass\" - Tests cover known cases. Does the ACTUAL feature work? VERIFY IT MANUALLY.\n\n**You have Bash, you have tools. There is ZERO excuse for skipping manual QA.**\n</MANUAL_QA_MANDATE>\n\n**WITHOUT evidence = NOT verified = NOT done.**\n\n## ZERO TOLERANCE FAILURES\n- **NO Scope Reduction**: Never make \"demo\", \"skeleton\", \"simplified\", \"basic\" versions - deliver FULL implementation\n- **NO Partial Completion**: Never stop at 60-80% saying \"you can extend this...\" - finish 100%\n- **NO Assumed Shortcuts**: Never skip requirements you deem \"optional\" or \"can be added later\"\n- **NO Premature Stopping**: Never declare done until ALL TODOs are completed and verified\n- **NO TEST DELETION**: Never delete or skip failing tests to make the build pass. Fix the code, not the tests.\n\nTHE USER ASKED FOR X. DELIVER EXACTLY X. NOT A SUBSET. NOT A DEMO. NOT A STARTING POINT.\n\n1. CLASSIFY INTENT (MANDATORY)\n2. EXPLORES + LIBRARIANS\n3. GATHER -> PLAN AGENT SPAWN\n4. WORK BY DELEGATING TO ANOTHER AGENTS\n\nNOW.\n\n</ultrawork-mode>\n\n";
 export declare function getGeminiUltraworkMessage(): string;

package/dist/hooks/keyword-detector/ultrawork/planner.d.ts CHANGED Viewed

@@ -2,5 +2,5 @@
  * Ultrawork message section for planner agents (Prometheus).
  * Planner agents should NOT be told to call plan agent - they ARE the planner.
  */
-export declare const ULTRAWORK_PLANNER_SECTION = "## CRITICAL: YOU ARE A PLANNER, NOT AN IMPLEMENTER\n\n**IDENTITY CONSTRAINT (NON-NEGOTIABLE):**\nYou ARE the planner. You ARE NOT an implementer. You DO NOT write code. You DO NOT execute tasks.\n\n**TOOL RESTRICTIONS (SYSTEM-ENFORCED):**\n| Tool | Allowed | Blocked |\n|------|---------|---------|\n| Write/Edit | `.sisyphus/**/*.md` ONLY | Everything else |\n| Read | All files | - |\n| Bash | Research commands only | Implementation commands |\n| task | explore, librarian | - |\n\n**IF YOU TRY TO WRITE/EDIT OUTSIDE `.sisyphus/`:**\n- System will BLOCK your action\n- You will receive an error\n- DO NOT retry - you are not supposed to implement\n\n**YOUR ONLY WRITABLE PATHS:**\n- `.sisyphus/plans/*.md` - Final work plans\n- `.sisyphus/drafts/*.md` - Working drafts during interview\n\n**WHEN USER ASKS YOU TO IMPLEMENT:**\nREFUSE. Say: \"I'm a planner. I create work plans, not implementations. Run `/start-work` after I finish planning.\"\n\n---\n\n## CONTEXT GATHERING (MANDATORY BEFORE PLANNING)\n\nYou ARE the planner. Your job: create bulletproof work plans.\n**Before drafting ANY plan, gather context via explore/librarian agents.**\n\n### Research Protocol\n1. **Fire parallel background agents** for comprehensive context:\n   ```\n   task(subagent_type=\"explore\", load_skills=[], prompt=\"Find existing patterns for [topic] in codebase\", run_in_background=true)\n   task(subagent_type=\"explore\", load_skills=[], prompt=\"Find test infrastructure and conventions\", run_in_background=true)\n   task(subagent_type=\"librarian\", load_skills=[], prompt=\"Find official docs and best practices for [technology]\", run_in_background=true)\n   ```\n2. **Wait for results** before planning - rushed plans fail\n3. **Synthesize findings** into informed requirements\n\n### What to Research\n- Existing codebase patterns and conventions\n- Test infrastructure (TDD possible?)\n- External library APIs and constraints\n- Similar implementations in OSS (via librarian)\n\n**NEVER plan blind. Context first, plan second.**\n\n---\n\n## MANDATORY OUTPUT: PARALLEL TASK GRAPH + TODO LIST\n\n**YOUR PRIMARY OUTPUT IS A PARALLEL EXECUTION TASK GRAPH.**\n\nWhen you finalize a plan, you MUST structure it for maximum parallel execution:\n\n### 1. Parallel Execution Waves (REQUIRED)\n\nAnalyze task dependencies and group independent tasks into parallel waves:\n\n```\nWave 1 (Start Immediately - No Dependencies):\n\u251C\u2500\u2500 Task 1: [description] \u2192 category: X, skills: [a, b]\n\u2514\u2500\u2500 Task 4: [description] \u2192 category: Y, skills: [c]\n\nWave 2 (After Wave 1 Completes):\n\u251C\u2500\u2500 Task 2: [depends: 1] \u2192 category: X, skills: [a]\n\u251C\u2500\u2500 Task 3: [depends: 1] \u2192 category: Z, skills: [d]\n\u2514\u2500\u2500 Task 5: [depends: 4] \u2192 category: Y, skills: [c]\n\nWave 3 (After Wave 2 Completes):\n\u2514\u2500\u2500 Task 6: [depends: 2, 3] \u2192 category: X, skills: [a, b]\n\nCritical Path: Task 1 \u2192 Task 2 \u2192 Task 6\nEstimated Parallel Speedup: ~40% faster than sequential\n```\n\n### 2. Dependency Matrix (REQUIRED)\n\n| Task | Depends On | Blocks | Can Parallelize With |\n|------|------------|--------|---------------------|\n| 1 | None | 2, 3 | 4 |\n| 2 | 1 | 6 | 3, 5 |\n| 3 | 1 | 6 | 2, 5 |\n| 4 | None | 5 | 1 |\n| 5 | 4 | None | 2, 3 |\n| 6 | 2, 3 | None | None (final) |\n\n### 3. TODO List Structure (REQUIRED)\n\nEach TODO item MUST include:\n\n```markdown\n- [ ] N. [Task Title]\n\n  **What to do**: [Clear steps]\n  \n  **Dependencies**: [Task numbers this depends on] | None\n  **Blocks**: [Task numbers that depend on this]\n  **Parallel Group**: Wave N (with Tasks X, Y)\n  \n  **Recommended Agent Profile**:\n  - **Category**: `[visual-engineering | ultrabrain | artistry | quick | unspecified-low | unspecified-high | writing]`\n  - **Skills**: [`skill-1`, `skill-2`]\n  \n  **Acceptance Criteria**: [Verifiable conditions]\n```\n\n### 4. Agent Dispatch Summary (REQUIRED)\n\n| Wave | Tasks | Dispatch Command |\n|------|-------|------------------|\n| 1 | 1, 4 | `task(category=\"...\", load_skills=[...], run_in_background=true)` \u00D7 2 |\n| 2 | 2, 3, 5 | `task(...)` \u00D7 3 after Wave 1 completes |\n| 3 | 6 | `task(...)` final integration |\n\n**WHY PARALLEL TASK GRAPH IS MANDATORY:**\n- Orchestrator (Sisyphus) executes tasks in parallel waves\n- Independent tasks run simultaneously via background agents\n- Proper dependency tracking prevents race conditions\n- Category + skills ensure optimal model routing per task";
+export declare const ULTRAWORK_PLANNER_SECTION = "## CRITICAL: YOU ARE A PLANNER, NOT AN IMPLEMENTER\n\n**IDENTITY CONSTRAINT (NON-NEGOTIABLE):**\nYou ARE the planner. You ARE NOT an implementer. You DO NOT write code. You DO NOT execute tasks.\n\n**TOOL RESTRICTIONS (SYSTEM-ENFORCED):**\n| Tool | Allowed | Blocked |\n|------|---------|---------|\n| Write/Edit | `.omo/**/*.md` ONLY | Everything else |\n| Read | All files | - |\n| Bash | Research commands only | Implementation commands |\n| task | explore, librarian | - |\n\n**IF YOU TRY TO WRITE/EDIT OUTSIDE `.omo/`:**\n- System will BLOCK your action\n- You will receive an error\n- DO NOT retry - you are not supposed to implement\n\n**YOUR ONLY WRITABLE PATHS:**\n- `.omo/plans/*.md` - Final work plans\n- `.omo/drafts/*.md` - Working drafts during interview\n\n**WHEN USER ASKS YOU TO IMPLEMENT:**\nREFUSE. Say: \"I'm a planner. I create work plans, not implementations. Run `/start-work` after I finish planning.\"\n\n---\n\n## CONTEXT GATHERING (MANDATORY BEFORE PLANNING)\n\nYou ARE the planner. Your job: create bulletproof work plans.\n**Before drafting ANY plan, gather context via explore/librarian agents.**\n\n### Research Protocol\n1. **Fire parallel background agents** for comprehensive context:\n   ```\n   task(subagent_type=\"explore\", load_skills=[], prompt=\"Find existing patterns for [topic] in codebase\", run_in_background=true)\n   task(subagent_type=\"explore\", load_skills=[], prompt=\"Find test infrastructure and conventions\", run_in_background=true)\n   task(subagent_type=\"librarian\", load_skills=[], prompt=\"Find official docs and best practices for [technology]\", run_in_background=true)\n   ```\n2. **Wait for results** before planning - rushed plans fail\n3. **Synthesize findings** into informed requirements\n\n### What to Research\n- Existing codebase patterns and conventions\n- Test infrastructure (TDD possible?)\n- External library APIs and constraints\n- Similar implementations in OSS (via librarian)\n\n**NEVER plan blind. Context first, plan second.**\n\n---\n\n## MANDATORY OUTPUT: PARALLEL TASK GRAPH + TODO LIST\n\n**YOUR PRIMARY OUTPUT IS A PARALLEL EXECUTION TASK GRAPH.**\n\nWhen you finalize a plan, you MUST structure it for maximum parallel execution:\n\n### 1. Parallel Execution Waves (REQUIRED)\n\nAnalyze task dependencies and group independent tasks into parallel waves:\n\n```\nWave 1 (Start Immediately - No Dependencies):\n\u251C\u2500\u2500 Task 1: [description] \u2192 category: X, skills: [a, b]\n\u2514\u2500\u2500 Task 4: [description] \u2192 category: Y, skills: [c]\n\nWave 2 (After Wave 1 Completes):\n\u251C\u2500\u2500 Task 2: [depends: 1] \u2192 category: X, skills: [a]\n\u251C\u2500\u2500 Task 3: [depends: 1] \u2192 category: Z, skills: [d]\n\u2514\u2500\u2500 Task 5: [depends: 4] \u2192 category: Y, skills: [c]\n\nWave 3 (After Wave 2 Completes):\n\u2514\u2500\u2500 Task 6: [depends: 2, 3] \u2192 category: X, skills: [a, b]\n\nCritical Path: Task 1 \u2192 Task 2 \u2192 Task 6\nEstimated Parallel Speedup: ~40% faster than sequential\n```\n\n### 2. Dependency Matrix (REQUIRED)\n\n| Task | Depends On | Blocks | Can Parallelize With |\n|------|------------|--------|---------------------|\n| 1 | None | 2, 3 | 4 |\n| 2 | 1 | 6 | 3, 5 |\n| 3 | 1 | 6 | 2, 5 |\n| 4 | None | 5 | 1 |\n| 5 | 4 | None | 2, 3 |\n| 6 | 2, 3 | None | None (final) |\n\n### 3. TODO List Structure (REQUIRED)\n\nEach TODO item MUST include:\n\n```markdown\n- [ ] N. [Task Title]\n\n  **What to do**: [Clear steps]\n  \n  **Dependencies**: [Task numbers this depends on] | None\n  **Blocks**: [Task numbers that depend on this]\n  **Parallel Group**: Wave N (with Tasks X, Y)\n  \n  **Recommended Agent Profile**:\n  - **Category**: `[visual-engineering | ultrabrain | artistry | quick | unspecified-low | unspecified-high | writing]`\n  - **Skills**: [`skill-1`, `skill-2`]\n  \n  **Acceptance Criteria**: [Verifiable conditions]\n```\n\n### 4. Agent Dispatch Summary (REQUIRED)\n\n| Wave | Tasks | Dispatch Command |\n|------|-------|------------------|\n| 1 | 1, 4 | `task(category=\"...\", load_skills=[...], run_in_background=true)` \u00D7 2 |\n| 2 | 2, 3, 5 | `task(...)` \u00D7 3 after Wave 1 completes |\n| 3 | 6 | `task(...)` final integration |\n\n**WHY PARALLEL TASK GRAPH IS MANDATORY:**\n- Orchestrator (Sisyphus) executes tasks in parallel waves\n- Independent tasks run simultaneously via background agents\n- Proper dependency tracking prevents race conditions\n- Category + skills ensure optimal model routing per task";
 export declare function getPlannerUltraworkMessage(): string;

package/dist/hooks/prometheus-md-only/constants.d.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 export declare const HOOK_NAME = "prometheus-md-only";
 export declare const PROMETHEUS_AGENT = "prometheus";
 export declare const ALLOWED_EXTENSIONS: string[];
-export declare const ALLOWED_PATH_PREFIX = ".sisyphus";
+export declare const ALLOWED_PATH_PREFIX = ".omo";
 export declare const BLOCKED_TOOLS: string[];
 export declare const PLANNING_CONSULT_WARNING: string;
 export declare const PROMETHEUS_WORKFLOW_REMINDER: string;

package/dist/hooks/prometheus-md-only/path-policy.d.ts CHANGED Viewed

@@ -1,10 +1,10 @@
 /**
  * Cross-platform path validator for Prometheus file writes.
  * Uses path.resolve/relative instead of string matching to handle:
- * - Windows backslashes (e.g., .sisyphus\\plans\\x.md)
- * - Mixed separators (e.g., .sisyphus\\plans/x.md)
+ * - Windows backslashes (e.g., .omo\\plans\\x.md)
+ * - Mixed separators (e.g., .omo\\plans/x.md)
  * - Case-insensitive directory/extension matching
  * - Workspace confinement (blocks paths outside root or via traversal)
- * - Nested project paths (e.g., parent/.sisyphus/... when ctx.directory is parent)
+ * - Nested project paths (e.g., parent/.omo/... when ctx.directory is parent)
  */
 export declare function isAllowedFile(filePath: string, workspaceRoot: string): boolean;

package/dist/hooks/ralph-loop/completion-promise-detector-test-input.d.ts ADDED Viewed

@@ -0,0 +1,11 @@
+import type { PluginInput } from "@opencode-ai/plugin";
+export type SessionMessage = {
+    info?: {
+        role?: string;
+    };
+    parts?: Array<{
+        type: string;
+        text?: string;
+    }>;
+};
+export declare function createPluginInput(messages: SessionMessage[]): PluginInput;

package/dist/hooks/ralph-loop/constants.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 export declare const HOOK_NAME = "ralph-loop";
-export declare const DEFAULT_STATE_FILE = ".sisyphus/ralph-loop.local.md";
+export declare const DEFAULT_STATE_FILE = ".omo/ralph-loop.local.md";
 export declare const COMPLETION_TAG_PATTERN: RegExp;
 export declare const DEFAULT_MAX_ITERATIONS = 100;
 export declare const ULTRAWORK_MAX_ITERATIONS = 500;

package/dist/hooks/ralph-loop/continuation-prompt-injector.d.ts CHANGED Viewed

@@ -1,6 +1,9 @@
 import type { PluginInput } from "@opencode-ai/plugin";
 export type ContinuationPromptResult = {
     status: "dispatched";
+} | {
+    status: "deferred";
+    reason: "active" | "reserved";
 } | {
     status: "rejected";
     error: Error;
@@ -11,4 +14,5 @@ export declare function injectContinuationPrompt(ctx: PluginInput, options: {
     directory: string;
     apiTimeoutMs: number;
     inheritFromSessionID?: string;
+    idleSettleMs?: number;
 }): Promise<ContinuationPromptResult>;

package/dist/hooks/ralph-loop/iteration-continuation.d.ts CHANGED Viewed

@@ -3,6 +3,7 @@ import type { RalphLoopState } from "./types";
 type ContinuationOptions = {
     directory: string;
     apiTimeoutMs: number;
+    idleSettleMs: number;
     previousSessionID: string;
     loopState: {
         setSessionID: (sessionID: string) => RalphLoopState | null;
@@ -10,6 +11,10 @@ type ContinuationOptions = {
 };
 export type ContinuationResult = {
     status: "dispatched";
+    sessionID: string;
+} | {
+    status: "dispatch_deferred";
+    reason: "active" | "reserved";
 } | {
     status: "session_creation_rejected";
 } | {

package/dist/hooks/ralph-loop/loop-state-controller.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import type { RalphLoopOptions, RalphLoopState } from "./types";
+import type { IterationCommitExpectation, RalphLoopOptions, RalphLoopState } from "./types";
 export declare function createLoopStateController(options: {
     directory: string;
     stateDir: string | undefined;
@@ -14,9 +14,9 @@ export declare function createLoopStateController(options: {
     cancelLoop(sessionID: string): boolean;
     getState(): RalphLoopState | null;
     clear(): boolean;
-    incrementIteration(): RalphLoopState | null;
+    incrementIteration(expected?: IterationCommitExpectation): RalphLoopState | null;
     setSessionID(sessionID: string): RalphLoopState | null;
-    setMessageCountAtStart(sessionID: string, messageCountAtStart: number): RalphLoopState | null;
+    setMessageCountAtStart(sessionID: string, messageCountAtStart: number, expectedStartedAt?: string): RalphLoopState | null;
     markVerificationPending(sessionID: string): RalphLoopState | null;
     setVerificationSessionID(sessionID: string, verificationSessionID: string): RalphLoopState | null;
     restartAfterFailedVerification(sessionID: string, messageCountAtStart?: number): RalphLoopState | null;

package/dist/hooks/ralph-loop/pending-verification-handler.d.ts CHANGED Viewed

@@ -1,9 +1,10 @@
 import type { PluginInput } from "@opencode-ai/plugin";
 import type { RalphLoopState } from "./types";
+import type { IterationCommitExpectation } from "./types";
 type LoopStateController = {
     restartAfterFailedVerification: (sessionID: string, messageCountAtStart?: number) => RalphLoopState | null;
     clearVerificationState: (sessionID: string, messageCountAtStart?: number) => RalphLoopState | null;
-    incrementIteration: () => RalphLoopState | null;
+    incrementIteration: (expected?: IterationCommitExpectation) => RalphLoopState | null;
     clear: () => boolean;
     setVerificationSessionID: (sessionID: string, verificationSessionID: string) => RalphLoopState | null;
 };

package/dist/hooks/ralph-loop/ralph-loop-event-handler.d.ts CHANGED Viewed

@@ -1,9 +1,9 @@
 import type { PluginInput } from "@opencode-ai/plugin";
-import type { RalphLoopOptions, RalphLoopState } from "./types";
+import type { IterationCommitExpectation, RalphLoopOptions, RalphLoopState } from "./types";
 type LoopStateController = {
     getState: () => RalphLoopState | null;
     clear: () => boolean;
-    incrementIteration: () => RalphLoopState | null;
+    incrementIteration: (expected?: IterationCommitExpectation) => RalphLoopState | null;
     setSessionID: (sessionID: string) => RalphLoopState | null;
     markVerificationPending: (sessionID: string) => RalphLoopState | null;
     setVerificationSessionID: (sessionID: string, verificationSessionID: string) => RalphLoopState | null;

package/dist/hooks/ralph-loop/storage.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
-import type { RalphLoopState } from "./types";
+import type { IterationCommitExpectation, RalphLoopState } from "./types";
 export declare function getStateFilePath(directory: string, customPath?: string): string;
 export declare function readState(directory: string, customPath?: string): RalphLoopState | null;
 export declare function writeState(directory: string, state: RalphLoopState, customPath?: string): boolean;
 export declare function clearState(directory: string, customPath?: string): boolean;
-export declare function incrementIteration(directory: string, customPath?: string): RalphLoopState | null;
+export declare function incrementIteration(directory: string, customPath?: string, expected?: IterationCommitExpectation): RalphLoopState | null;

package/dist/hooks/ralph-loop/types.d.ts CHANGED Viewed

@@ -15,6 +15,10 @@ export interface RalphLoopState {
     verification_pending?: boolean;
     strategy?: "reset" | "continue";
 }
+export interface IterationCommitExpectation {
+    iteration: number;
+    sessionID: string;
+}
 export interface RalphLoopOptions {
     config?: RalphLoopConfig;
     getTranscriptPath?: (sessionId: string) => string;

package/dist/hooks/ralph-loop/verification-failure-handler.d.ts CHANGED Viewed

@@ -1,8 +1,8 @@
 import type { PluginInput } from "@opencode-ai/plugin";
-import type { RalphLoopState } from "./types";
+import type { IterationCommitExpectation, RalphLoopState } from "./types";
 type LoopStateController = {
     clearVerificationState: (sessionID: string, messageCountAtStart?: number) => RalphLoopState | null;
-    incrementIteration: () => RalphLoopState | null;
+    incrementIteration: (expected?: IterationCommitExpectation) => RalphLoopState | null;
     clear: () => boolean;
 };
 export declare function handleFailedVerification(ctx: PluginInput, input: {

package/dist/hooks/rules-injector/injector.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { readFileSync, statSync } from "node:fs";
+import { statSync } from "node:fs";
 import { homedir } from "node:os";
 import type { FindRuleFilesOptions } from "./rule-file-finder";
 import { createContentHash, isDuplicateByContentHash, isDuplicateByRealPath, shouldApplyRule } from "./matcher";
@@ -16,13 +16,20 @@ type DynamicTruncator = {
         truncated: boolean;
     }>;
 };
+type RuleFileReader = (path: string, encoding: "utf-8") => string;
+export interface ParsedRuleCacheStats {
+    entries: number;
+    bodyBytes: number;
+}
+export declare function clearParsedRuleCache(): void;
+export declare function getParsedRuleCacheStats(): ParsedRuleCacheStats;
 export declare function createRuleInjectionProcessor(deps: {
     workspaceDirectory: string;
     truncator: DynamicTruncator;
     getSessionCache: (sessionID: string) => SessionInjectedRulesCache;
     getSessionRuleScanCache?: (sessionID: string) => RuleScanCache;
     ruleFinderOptions?: FindRuleFilesOptions;
-    readFileSync?: typeof readFileSync;
+    readFileSync?: RuleFileReader;
     statSync?: typeof statSync;
     homedir?: typeof homedir;
     shouldApplyRule?: typeof shouldApplyRule;

package/dist/hooks/rules-injector/matcher.d.ts CHANGED Viewed

@@ -3,6 +3,11 @@ export interface MatchResult {
     applies: boolean;
     reason?: string;
 }
+export interface MatcherCacheStats {
+    entries: number;
+}
+export declare function resetMatcherCache(): void;
+export declare function getMatcherCacheStats(): MatcherCacheStats;
 /**
  * Check if a rule should apply to the current file based on metadata
  */

package/dist/hooks/rules-injector/project-root-finder.d.ts CHANGED Viewed

@@ -3,6 +3,10 @@ export declare function clearProjectRootCache(): void;
  * Find project root by walking up from startPath.
  * Checks for PROJECT_MARKERS (.git, pyproject.toml, package.json, etc.)
  *
+ * Memoizes every directory visited during the walk so subsequent lookups for
+ * any descendant path resolve in O(1) without re-running marker existsSync
+ * probes.
+ *
  * @param startPath - Starting path to search from (file or directory)
  * @returns Project root path or null if not found
  */

package/dist/hooks/rules-injector/rule-scan-cache.d.ts CHANGED Viewed

@@ -1,6 +1,13 @@
+import type { RuleFileCandidate } from "./types";
+export type DirectoryScanEntry = {
+    path: string;
+    realPath: string;
+};
 export type RuleScanCache = {
-    get: (key: string) => string[] | undefined;
-    set: (key: string, value: string[]) => void;
+    get: (key: string) => RuleFileCandidate[] | undefined;
+    set: (key: string, value: RuleFileCandidate[]) => void;
+    getDirScan: (dir: string) => DirectoryScanEntry[] | undefined;
+    setDirScan: (dir: string, entries: DirectoryScanEntry[]) => void;
     clear: () => void;
 };
 export declare function createRuleScanCache(): RuleScanCache;

package/dist/hooks/runtime-fallback/constants.d.ts CHANGED Viewed

@@ -17,3 +17,13 @@ export declare const RETRYABLE_ERROR_PATTERNS: RegExp[];
  * Hook name for identification and logging
  */
 export declare const HOOK_NAME = "runtime-fallback";
+/**
+ * First-prompt watchdog: how long to wait for the first sign of progress
+ * (assistant text/reasoning/finish) from a subagent session before assuming
+ * the provider is silently stuck and dispatching the configured fallback.
+ *
+ * Tuned to be longer than typical first-token latency (well under 30s in
+ * practice) yet much shorter than the 30-minute outer poll timeout that
+ * would otherwise be the only safety net.
+ */
+export declare const DEFAULT_FIRST_PROMPT_WATCHDOG_MS = 90000;

package/dist/hooks/runtime-fallback/first-prompt-watchdog.d.ts ADDED Viewed

@@ -0,0 +1,25 @@
+import type { HookDeps } from "./types";
+import type { AutoRetryHelpers } from "./auto-retry";
+export interface FirstPromptWatchdog {
+    onUserMessage(sessionID: string, model?: string, agent?: string): void;
+    onAssistantProgress(sessionID: string): void;
+    onSessionTerminal(sessionID: string): void;
+    dispose(): void;
+}
+/**
+ * Translate an OpenCode session event into the appropriate watchdog signal.
+ *
+ * Progress semantics for cancelling the watchdog:
+ *   - assistant `info.error` set: the existing message-update-handler will
+ *     deal with the error path; the watchdog has done its job.
+ *   - assistant `info.finish` set: the response completed.
+ *   - any assistant part with a known type (`text`, `reasoning`, `tool`,
+ *     `tool_use`, `tool_result`, `tool-call`, `step-start`, `file`, ...):
+ *     the model has started responding. A subagent that immediately runs
+ *     tools is *working*, not silent — so any part presence cancels.
+ */
+export declare function observeEventForWatchdog(event: {
+    type: string;
+    properties?: unknown;
+}, watchdog: FirstPromptWatchdog): void;
+export declare function createFirstPromptWatchdog(deps: HookDeps, helpers: AutoRetryHelpers, watchdogMs?: number): FirstPromptWatchdog;

package/dist/hooks/runtime-fallback/hook.d.ts CHANGED Viewed

@@ -1,2 +1,15 @@
+import { createAutoRetryHelpers } from "./auto-retry";
+import { createChatMessageHandler } from "./chat-message-handler";
+import { createEventHandler } from "./event-handler";
+import { createFirstPromptWatchdog } from "./first-prompt-watchdog";
+import { createMessageUpdateHandler } from "./message-update-handler";
 import type { RuntimeFallbackHook, RuntimeFallbackOptions, RuntimeFallbackPluginInput } from "./types";
-export declare function createRuntimeFallbackHook(ctx: RuntimeFallbackPluginInput, options?: RuntimeFallbackOptions): RuntimeFallbackHook;
+type RuntimeFallbackHookFactories = {
+    createAutoRetryHelpers: typeof createAutoRetryHelpers;
+    createEventHandler: typeof createEventHandler;
+    createMessageUpdateHandler: typeof createMessageUpdateHandler;
+    createChatMessageHandler: typeof createChatMessageHandler;
+    createFirstPromptWatchdog: typeof createFirstPromptWatchdog;
+};
+export declare function createRuntimeFallbackHook(ctx: RuntimeFallbackPluginInput, options?: RuntimeFallbackOptions, factoryOverrides?: Partial<RuntimeFallbackHookFactories>): RuntimeFallbackHook;
+export {};