npm - oh-my-codex - Versions diffs - 0.14.0 → 0.14.2 - Mend

oh-my-codex 0.14.0 → 0.14.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (185)

package/Cargo.lock +5 -5
package/Cargo.toml +1 -1
package/README.md +14 -8
package/crates/omx-explore/src/main.rs +94 -1
package/crates/omx-sparkshell/src/codex_bridge.rs +59 -12
package/crates/omx-sparkshell/tests/execution.rs +48 -0
package/dist/cli/__tests__/explore.test.js +33 -1
package/dist/cli/__tests__/explore.test.js.map +1 -1
package/dist/cli/__tests__/index.test.js +11 -2
package/dist/cli/__tests__/index.test.js.map +1 -1
package/dist/cli/__tests__/package-bin-contract.test.js +5 -0
package/dist/cli/__tests__/package-bin-contract.test.js.map +1 -1
package/dist/cli/__tests__/question.test.js +139 -25
package/dist/cli/__tests__/question.test.js.map +1 -1
package/dist/cli/__tests__/session-scoped-runtime.test.js +30 -0
package/dist/cli/__tests__/session-scoped-runtime.test.js.map +1 -1
package/dist/cli/__tests__/setup-agents-overwrite.test.js +32 -7
package/dist/cli/__tests__/setup-agents-overwrite.test.js.map +1 -1
package/dist/cli/__tests__/setup-refresh.test.js +8 -6
package/dist/cli/__tests__/setup-refresh.test.js.map +1 -1
package/dist/cli/__tests__/sparkshell-cli.test.js +23 -0
package/dist/cli/__tests__/sparkshell-cli.test.js.map +1 -1
package/dist/cli/__tests__/uninstall.test.js +65 -5
package/dist/cli/__tests__/uninstall.test.js.map +1 -1
package/dist/cli/__tests__/update.test.js +360 -26
package/dist/cli/__tests__/update.test.js.map +1 -1
package/dist/cli/explore.d.ts.map +1 -1
package/dist/cli/explore.js +18 -3
package/dist/cli/explore.js.map +1 -1
package/dist/cli/index.d.ts +2 -1
package/dist/cli/index.d.ts.map +1 -1
package/dist/cli/index.js +7 -2
package/dist/cli/index.js.map +1 -1
package/dist/cli/setup.d.ts.map +1 -1
package/dist/cli/setup.js +25 -3
package/dist/cli/setup.js.map +1 -1
package/dist/cli/sparkshell.d.ts.map +1 -1
package/dist/cli/sparkshell.js +11 -1
package/dist/cli/sparkshell.js.map +1 -1
package/dist/cli/team.d.ts.map +1 -1
package/dist/cli/team.js +159 -394
package/dist/cli/team.js.map +1 -1
package/dist/cli/uninstall.d.ts.map +1 -1
package/dist/cli/uninstall.js +3 -1
package/dist/cli/uninstall.js.map +1 -1
package/dist/cli/update.d.ts +37 -9
package/dist/cli/update.d.ts.map +1 -1
package/dist/cli/update.js +204 -26
package/dist/cli/update.js.map +1 -1
package/dist/config/__tests__/generator-idempotent.test.js +51 -14
package/dist/config/__tests__/generator-idempotent.test.js.map +1 -1
package/dist/config/__tests__/generator-notify.test.js +35 -10
package/dist/config/__tests__/generator-notify.test.js.map +1 -1
package/dist/config/generator.d.ts +1 -0
package/dist/config/generator.d.ts.map +1 -1
package/dist/config/generator.js +61 -7
package/dist/config/generator.js.map +1 -1
package/dist/hooks/__tests__/code-review-skill-contract.test.d.ts +2 -0
package/dist/hooks/__tests__/code-review-skill-contract.test.d.ts.map +1 -0
package/dist/hooks/__tests__/code-review-skill-contract.test.js +56 -0
package/dist/hooks/__tests__/code-review-skill-contract.test.js.map +1 -0
package/dist/hooks/__tests__/deep-interview-contract.test.js +31 -0
package/dist/hooks/__tests__/deep-interview-contract.test.js.map +1 -1
package/dist/hooks/__tests__/explicit-terminal-stop-docs-contract.test.d.ts +2 -0
package/dist/hooks/__tests__/explicit-terminal-stop-docs-contract.test.d.ts.map +1 -0
package/dist/hooks/__tests__/explicit-terminal-stop-docs-contract.test.js +43 -0
package/dist/hooks/__tests__/explicit-terminal-stop-docs-contract.test.js.map +1 -0
package/dist/hooks/__tests__/explicit-terminal-stop-model-docs-contract.test.d.ts +2 -0
package/dist/hooks/__tests__/explicit-terminal-stop-model-docs-contract.test.d.ts.map +1 -0
package/dist/hooks/__tests__/explicit-terminal-stop-model-docs-contract.test.js +38 -0
package/dist/hooks/__tests__/explicit-terminal-stop-model-docs-contract.test.js.map +1 -0
package/dist/hooks/__tests__/keyword-detector.test.js +108 -0
package/dist/hooks/__tests__/keyword-detector.test.js.map +1 -1
package/dist/hooks/__tests__/prompt-guidance-test-helpers.d.ts.map +1 -1
package/dist/hooks/__tests__/prompt-guidance-test-helpers.js +16 -1
package/dist/hooks/__tests__/prompt-guidance-test-helpers.js.map +1 -1
package/dist/hooks/keyword-detector.d.ts.map +1 -1
package/dist/hooks/keyword-detector.js +34 -8
package/dist/hooks/keyword-detector.js.map +1 -1
package/dist/mcp/__tests__/bootstrap.test.js +7 -25
package/dist/mcp/__tests__/bootstrap.test.js.map +1 -1
package/dist/mcp/__tests__/server-lifecycle.test.js +60 -0
package/dist/mcp/__tests__/server-lifecycle.test.js.map +1 -1
package/dist/mcp/__tests__/state-server.test.js +177 -0
package/dist/mcp/__tests__/state-server.test.js.map +1 -1
package/dist/mcp/bootstrap.d.ts.map +1 -1
package/dist/mcp/bootstrap.js +36 -18
package/dist/mcp/bootstrap.js.map +1 -1
package/dist/mcp/state-server.d.ts +17 -0
package/dist/mcp/state-server.d.ts.map +1 -1
package/dist/mcp/state-server.js +55 -1
package/dist/mcp/state-server.js.map +1 -1
package/dist/notifications/__tests__/index.test.js +0 -3
package/dist/notifications/__tests__/index.test.js.map +1 -1
package/dist/notifications/__tests__/session-status.test.js +90 -0
package/dist/notifications/__tests__/session-status.test.js.map +1 -1
package/dist/notifications/session-status.d.ts +2 -0
package/dist/notifications/session-status.d.ts.map +1 -1
package/dist/notifications/session-status.js +19 -4
package/dist/notifications/session-status.js.map +1 -1
package/dist/question/__tests__/deep-interview.test.js +44 -0
package/dist/question/__tests__/deep-interview.test.js.map +1 -1
package/dist/question/__tests__/renderer.test.js +192 -12
package/dist/question/__tests__/renderer.test.js.map +1 -1
package/dist/question/__tests__/state.test.js +21 -1
package/dist/question/__tests__/state.test.js.map +1 -1
package/dist/question/deep-interview.d.ts +3 -0
package/dist/question/deep-interview.d.ts.map +1 -1
package/dist/question/deep-interview.js +18 -1
package/dist/question/deep-interview.js.map +1 -1
package/dist/question/renderer.d.ts +4 -2
package/dist/question/renderer.d.ts.map +1 -1
package/dist/question/renderer.js +87 -18
package/dist/question/renderer.js.map +1 -1
package/dist/runtime/__tests__/run-outcome.test.js +38 -0
package/dist/runtime/__tests__/run-outcome.test.js.map +1 -1
package/dist/runtime/__tests__/run-state.test.d.ts +2 -0
package/dist/runtime/__tests__/run-state.test.d.ts.map +1 -0
package/dist/runtime/__tests__/run-state.test.js +37 -0
package/dist/runtime/__tests__/run-state.test.js.map +1 -0
package/dist/runtime/run-loop.d.ts +5 -1
package/dist/runtime/run-loop.d.ts.map +1 -1
package/dist/runtime/run-loop.js +8 -3
package/dist/runtime/run-loop.js.map +1 -1
package/dist/runtime/run-outcome.d.ts +18 -0
package/dist/runtime/run-outcome.d.ts.map +1 -1
package/dist/runtime/run-outcome.js +156 -7
package/dist/runtime/run-outcome.js.map +1 -1
package/dist/runtime/run-state.d.ts +5 -1
package/dist/runtime/run-state.d.ts.map +1 -1
package/dist/runtime/run-state.js +13 -3
package/dist/runtime/run-state.js.map +1 -1
package/dist/runtime/terminal-lifecycle.d.ts +11 -0
package/dist/runtime/terminal-lifecycle.d.ts.map +1 -0
package/dist/runtime/terminal-lifecycle.js +52 -0
package/dist/runtime/terminal-lifecycle.js.map +1 -0
package/dist/scripts/__tests__/codex-native-hook.test.js +370 -56
package/dist/scripts/__tests__/codex-native-hook.test.js.map +1 -1
package/dist/scripts/__tests__/postinstall.test.d.ts +2 -0
package/dist/scripts/__tests__/postinstall.test.d.ts.map +1 -0
package/dist/scripts/__tests__/postinstall.test.js +178 -0
package/dist/scripts/__tests__/postinstall.test.js.map +1 -0
package/dist/scripts/codex-native-hook.d.ts +1 -0
package/dist/scripts/codex-native-hook.d.ts.map +1 -1
package/dist/scripts/codex-native-hook.js +115 -56
package/dist/scripts/codex-native-hook.js.map +1 -1
package/dist/scripts/postinstall.d.ts +22 -0
package/dist/scripts/postinstall.d.ts.map +1 -0
package/dist/scripts/postinstall.js +105 -0
package/dist/scripts/postinstall.js.map +1 -0
package/dist/state/__tests__/operations.test.js +60 -0
package/dist/state/__tests__/operations.test.js.map +1 -1
package/dist/state/operations.d.ts.map +1 -1
package/dist/state/operations.js +18 -1
package/dist/state/operations.js.map +1 -1
package/dist/team/__tests__/role-router.test.js +6 -0
package/dist/team/__tests__/role-router.test.js.map +1 -1
package/dist/team/__tests__/runtime.test.js +108 -2
package/dist/team/__tests__/runtime.test.js.map +1 -1
package/dist/team/runtime.d.ts.map +1 -1
package/dist/team/runtime.js +18 -4
package/dist/team/runtime.js.map +1 -1
package/dist/utils/__tests__/dep-versions.test.js +25 -8
package/dist/utils/__tests__/dep-versions.test.js.map +1 -1
package/dist/utils/__tests__/paths.test.js +45 -0
package/dist/utils/__tests__/paths.test.js.map +1 -1
package/dist/utils/paths.d.ts +2 -0
package/dist/utils/paths.d.ts.map +1 -1
package/dist/utils/paths.js +22 -7
package/dist/utils/paths.js.map +1 -1
package/dist/verification/__tests__/ci-rust-gates.test.js +1 -1
package/dist/verification/__tests__/ci-rust-gates.test.js.map +1 -1
package/package.json +3 -2
package/prompts/architect.md +4 -0
package/prompts/code-reviewer.md +3 -0
package/skills/code-review/SKILL.md +94 -28
package/skills/deep-interview/SKILL.md +91 -0
package/src/scripts/__tests__/codex-native-hook.test.ts +468 -64
package/src/scripts/__tests__/postinstall.test.ts +210 -0
package/src/scripts/codex-native-hook.ts +136 -53
package/src/scripts/postinstall-bootstrap.js +23 -0
package/src/scripts/postinstall.ts +161 -0
package/templates/AGENTS.md +1 -1
package/templates/model-instructions/explore-lightweight-AGENTS.md +11 -0
package/templates/model-instructions/sparkshell-lightweight-AGENTS.md +10 -0

package/skills/code-review/SKILL.md CHANGED Viewed

@@ -15,8 +15,6 @@ This skill activates when:
 - After implementing a major feature
 - User wants quality assessment
-## What It Does
 ## GPT-5.4 Guidance Alignment
 - Default to concise, evidence-dense progress and completion reporting unless the user or risk level requires more detail.
@@ -24,30 +22,49 @@ This skill activates when:
 - If correctness depends on additional inspection, retrieval, execution, or verification, keep using the relevant tools until the review is grounded.
 - Continue through clear, low-risk, reversible next steps automatically; ask only when the next step is materially branching, destructive, or preference-dependent.
-Delegates to the `code-reviewer` agent (THOROUGH tier) for deep analysis:
+Delegates to the `code-reviewer` and `architect` agents in parallel for a two-lane review:
 1. **Identify Changes**
    - Run `git diff` to find changed files
    - Determine scope of review (specific files or entire PR)
-2. **Review Categories**
+2. **Launch Parallel Review Lanes**
+   - **`code-reviewer` lane** - owns spec compliance, security, code quality, performance, and maintainability findings
+   - **`architect` lane** - owns the devil's-advocate / design-tradeoff perspective
+   - Both lanes run in parallel and produce distinct outputs before final synthesis
+3. **Review Categories**
    - **Security** - Hardcoded secrets, injection risks, XSS, CSRF
    - **Code Quality** - Function size, complexity, nesting depth
    - **Performance** - Algorithm efficiency, N+1 queries, caching
    - **Best Practices** - Naming, documentation, error handling
    - **Maintainability** - Duplication, coupling, testability
-3. **Severity Rating**
+4. **Severity Rating**
    - **CRITICAL** - Security vulnerability (must fix before merge)
    - **HIGH** - Bug or major code smell (should fix before merge)
    - **MEDIUM** - Minor issue (fix when possible)
    - **LOW** - Style/suggestion (consider fixing)
-4. **Specific Recommendations**
+5. **Architectural Status Contract**
+   - **CLEAR** - No unresolved architectural blocker was found
+   - **WATCH** - Non-blocking design/tradeoff concern that must appear in the final synthesis
+   - **BLOCK** - Unresolved design concern that prevents a merge-ready verdict
+6. **Specific Recommendations**
    - File:line locations for each issue
    - Concrete fix suggestions
    - Code examples where applicable
+7. **Final Synthesis**
+   - Combine the `code-reviewer` recommendation and the architect status into one final verdict
+   - Deterministic merge gating rules:
+     - If architect status is **BLOCK**, final recommendation is **REQUEST CHANGES**
+     - Else if `code-reviewer` recommendation is **REQUEST CHANGES**, final recommendation is **REQUEST CHANGES**
+     - Else if architect status is **WATCH**, final recommendation is **COMMENT**
+     - Else final recommendation follows the `code-reviewer` lane
+   - The final report must make architect blockers impossible to miss
 ## Agent Delegation
 ```
@@ -58,6 +75,8 @@ delegate(
 Review code changes for quality, security, and maintainability.
+This is the code/spec/security lane. Do not absorb architectural ownership.
 Scope: [git diff or specific files]
 Review Checklist:
@@ -74,6 +93,29 @@ Output: Code review report with:
 - Fix recommendations
 - Approval recommendation (APPROVE / REQUEST CHANGES / COMMENT)"
 )
+delegate(
+  role="architect",
+  tier="THOROUGH",
+  prompt="ARCHITECTURE / DEVIL'S-ADVOCATE REVIEW TASK
+Review the same code changes from the architecture/tradeoff perspective.
+Scope: [git diff or specific files]
+Focus:
+- System boundaries and interfaces
+- Hidden coupling or long-term maintainability risks
+- Tradeoff tension the main reviewer might miss
+- Strongest counterargument against approving as-is
+Output:
+- Architectural Status: CLEAR / WATCH / BLOCK
+- File:line evidence for each concern
+- Concrete tradeoff or design recommendation"
+)
+Run both lanes in parallel, then synthesize them with the deterministic rules above.
 ```
 ## External Model Consultation (Preferred)
@@ -112,45 +154,59 @@ CODE REVIEW REPORT
 ==================
 Files Reviewed: 8
-Total Issues: 15
+Total Issues: 12
+Architectural Status: WATCH
 CRITICAL (0)
 -----------
 (none)
-HIGH (3)
+HIGH (0)
 --------
+(none)
+MEDIUM (7)
+----------
 1. src/api/auth.ts:42
-   Issue: User input not sanitized before SQL query
-   Risk: SQL injection vulnerability
-   Fix: Use parameterized queries or ORM
+   Issue: Email normalization logic is duplicated instead of reusing the shared helper
+   Risk: Validation rules can drift between authentication paths
+   Fix: Route both paths through the shared normalization helper
 2. src/components/UserProfile.tsx:89
-   Issue: Password displayed in plain text in logs
-   Risk: Credential exposure
-   Fix: Remove password from log statements
+   Issue: Derived permissions are recalculated on every render
+   Risk: Avoidable work during profile refreshes
+   Fix: Memoize the derived permissions list or compute it upstream
 3. src/utils/validation.ts:15
-   Issue: Email regex allows invalid formats
-   Risk: Accepts malformed emails
-   Fix: Use proven email validation library
-MEDIUM (7)
-----------
-...
+   Issue: Form-layer and server-layer validation messages are defined separately
+   Risk: User-facing validation guidance can become inconsistent
+   Fix: Share one validation message helper across both call sites
 LOW (5)
 -------
 ...
-RECOMMENDATION: REQUEST CHANGES
+ARCHITECTURE WATCHLIST
+----------------------
+- src/review/orchestrator.ts:88
+  Concern: Review result synthesis relies on implicit ordering rather than an explicit blocker contract
+  Status: WATCH
+  Recommendation: Define deterministic merge gating before expanding reviewers
+SYNTHESIS
+---------
+- code-reviewer recommendation: COMMENT
+- architect status: WATCH
+- final recommendation: COMMENT
+RECOMMENDATION: COMMENT
-Critical security issues must be addressed before merge.
+Address any WATCH concerns before treating the change as merge-ready.
 ```
 ## Review Checklist
-The code-reviewer agent checks:
+The `code-reviewer` lane checks:
 ### Security
 - [ ] No hardcoded secrets (API keys, passwords, tokens)
@@ -180,11 +236,21 @@ The code-reviewer agent checks:
 - [ ] Tests for critical paths
 - [ ] No commented-out code
+## Architect Lane Checklist
+The `architect` lane checks:
+- [ ] Boundary or interface changes are explicit
+- [ ] New coupling/tradeoff risks are surfaced
+- [ ] Long-horizon maintainability concerns are evidence-backed
+- [ ] Architectural status is one of `CLEAR`, `WATCH`, or `BLOCK`
+- [ ] Any `BLOCK` concern cites the reason merge-ready status should be withheld
 ## Approval Criteria
-**APPROVE** - No CRITICAL or HIGH issues, minor improvements only
-**REQUEST CHANGES** - CRITICAL or HIGH issues present
-**COMMENT** - Only LOW/MEDIUM issues, no blocking concerns
+**APPROVE** - `code-reviewer` returns APPROVE and architect status is `CLEAR`
+**REQUEST CHANGES** - `code-reviewer` returns REQUEST CHANGES or architect status is `BLOCK`
+**COMMENT** - No REQUEST CHANGES condition applies, and either `code-reviewer` returns COMMENT with architect status `CLEAR`, architect status is `WATCH`, or only LOW/MEDIUM improvements remain
 ## Scenario Examples
@@ -207,7 +273,7 @@ Includes coordinated review execution across specialized agents.
 ```
 /ralph code-review then fix all issues
 ```
-Review code, get feedback, fix until approved.
+On the explicit Ralph path, review findings should flow into an automatic fix follow-up without another permission prompt. Plain `code-review` itself remains read-only and does **not** promise auto-fix.
 **With Ultrawork:**
 ```

package/skills/deep-interview/SKILL.md CHANGED Viewed

@@ -52,6 +52,7 @@ If no flag is provided, use **Standard**.
 - Reduce user effort: ask only the highest-leverage unresolved question, and never ask the user for codebase facts that can be discovered directly
 - For brownfield work, prefer evidence-backed confirmation questions such as "I found X in Y. Should this change follow that pattern?"
 - In Codex CLI, deep-interview uses `omx question` as the required OMX-owned structured questioning path for every interview round
+- If you launch `omx question` in a background terminal, immediately wait for that background terminal to finish and read its JSON answer before scoring ambiguity, asking another round, or handing off
 - If `omx question` is unavailable in the current runtime, treat that as a blocker/error for deep-interview rather than falling back to `request_user_input` or plain-text questioning
 - Re-score ambiguity after each answer and show progress transparently
 - Do not hand off to execution while ambiguity remains above threshold unless user explicitly opts to proceed with warning
@@ -154,6 +155,96 @@ Round {n} | Target: {weakest_dimension} | Ambiguity: {score}%
 {question}
 ```
+`omx question` payload guidance for interview rounds:
+- Use canonical `type` values instead of authoring raw `multi_select` flags by hand. `type: "single-answerable"` is the default for one-path decisions; `type: "multi-answerable"` is the canonical shape for bounded multi-select rounds. The runtime will keep `multi_select` aligned with `type`.
+- Use `single-answerable` when exactly one answer should drive the next branch, the options are mutually exclusive, or selecting more than one answer would blur the decision boundary. Typical cases: handoff lane selection, choosing the primary failure mode, or confirming which of several competing interpretations is correct.
+- Use `multi-answerable` when multiple options may all be true at once and you need to capture a bounded set of coexisting constraints, non-goals, risks, or acceptance checks in one round. Typical cases: selecting all out-of-scope items, all success metrics that must hold, or all deployment constraints that apply together.
+- If one selected option would immediately require a follow-up question to disambiguate the others, prefer a `single-answerable` round now and ask the follow-up next. Do not hide a branching interview tree inside one overloaded multi-select prompt.
+- Keep interview options bounded and concrete. If the valid answers are already known, set `allow_other: false`; only leave `allow_other: true` when the interview genuinely needs one user-supplied option that cannot be enumerated in advance.
+- Read answers structurally. For `single-answerable`, expect one decisive selection in `answer.value` plus `answer.selected_values`. For `multi-answerable`, treat `answer.selected_values` as the source of truth for all chosen constraints/non-goals and preserve the full set in the transcript/spec.
+Canonical bounded single-choice payload:
+```json
+{
+  "question": "Which execution lane should own this once the interview is complete?",
+  "type": "single-answerable",
+  "options": [
+    {
+      "label": "Plan first",
+      "value": "ralplan",
+      "description": "Need architecture and test-shape review before execution"
+    },
+    {
+      "label": "Execute directly",
+      "value": "autopilot",
+      "description": "Requirements are already explicit enough for planning plus execution"
+    },
+    {
+      "label": "Refine further",
+      "value": "refine",
+      "description": "Clarification is still needed before any handoff"
+    }
+  ],
+  "allow_other": false,
+  "other_label": "Other",
+  "source": "deep-interview"
+}
+```
+Canonical bounded multi-select payload:
+```json
+{
+  "question": "Which non-goals must stay out of scope for the first pass?",
+  "type": "multi-answerable",
+  "options": [
+    {
+      "label": "No UI redesign",
+      "value": "no-ui-redesign",
+      "description": "Keep layout and styling unchanged"
+    },
+    {
+      "label": "No new dependencies",
+      "value": "no-new-dependencies",
+      "description": "Work within the existing toolchain"
+    },
+    {
+      "label": "No API contract changes",
+      "value": "no-api-contract-changes",
+      "description": "Preserve external request and response shapes"
+    }
+  ],
+  "allow_other": false,
+  "other_label": "Other",
+  "source": "deep-interview"
+}
+```
+Canonical answer-shape reminders:
+```json
+{
+  "answer": {
+    "kind": "option",
+    "value": "ralplan",
+    "selected_labels": ["Plan first"],
+    "selected_values": ["ralplan"]
+  }
+}
+```
+```json
+{
+  "answer": {
+    "kind": "multi",
+    "value": ["no-new-dependencies", "no-api-contract-changes"],
+    "selected_labels": ["No new dependencies", "No API contract changes"],
+    "selected_values": ["no-new-dependencies", "no-api-contract-changes"]
+  }
+}
+```
 ### 2c) Score ambiguity
 Score each weighted dimension in `[0.0, 1.0]` with justification + gap.