npm - okstra - Versions diffs - 0.18.2 → 0.18.3 - Mend

okstra 0.18.2 → 0.18.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

package/package.json +1 -1
package/runtime/BUILD.json +2 -2
package/runtime/python/okstra_token_usage/collect.py +104 -28
package/runtime/skills/okstra-report-writer/SKILL.md +1 -1
package/runtime/templates/reports/final-report.template.md +22 -8

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "okstra",
-  "version": "0.18.2",
+  "version": "0.18.3",
   "description": "Multi-agent cross-verification orchestrator runtime + Claude Code skills.",
   "license": "MIT",
   "author": "devonshin",

package/runtime/BUILD.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "package": "0.18.2",
-  "builtAt": "2026-05-13T13:51:20.597Z",
+  "package": "0.18.3",
+  "builtAt": "2026-05-13T13:59:58.844Z",
   "repoRoot": "/home/runner/work/okstra/okstra"
 }

package/runtime/python/okstra_token_usage/collect.py CHANGED Viewed

@@ -2,6 +2,7 @@
 from __future__ import annotations
 import json
+from datetime import datetime
 from pathlib import Path
 from .blocks import na_block, usage_block
 from .claude import claude_session_totals, find_claude_team_sessions
@@ -11,6 +12,76 @@ from .paths import claude_project_dir, utc_now
 from .pricing import codex_cost_usd, gemini_cost_usd
+def match_prefixes(worker_id: str) -> list[str]:
+    """Return the agentName prefixes that should be attributed to ``worker_id``.
+    The Agent harness records the `name` arg on every dispatch as `agentName`
+    in the subagent jsonl. Lead frequently appends suffixes (`-002`,
+    `-reverify-r1`, `-impl`, `-2`) when it dispatches the same role multiple
+    times or in different sub-flows. Every `agentName` matching one of these
+    prefixes, either exactly or as `<prefix>-<suffix>`, is treated as
+    belonging to this worker so its tokens get aggregated. For implementation
+    runs the executor variant `<provider>-executor` is also attributed back
+    to the matching provider worker.
+    Returns:
+        ``[]`` for a falsy ``worker_id``; ``["report-writer"]`` for the
+        report-writer; otherwise ``[worker_id]``, extended with
+        ``"<worker_id>-worker"`` and ``"<worker_id>-executor"`` when
+        ``worker_id`` does not already end in ``-worker``.
+    NOTE(review): under the `<prefix>-<suffix>` rule in ``agent_matches`` the
+    bare ``worker_id`` prefix already covers the `-worker` / `-executor`
+    variants, so the extra entries look redundant (harmless) - confirm intent.
+    """
+    # No id means nothing can be attributed to this worker.
+    if not worker_id:
+        return []
+    # report-writer never gets the `-worker` / `-executor` variants.
+    if worker_id == "report-writer":
+        return ["report-writer"]
+    prefixes = [worker_id]
+    # Ids already ending in `-worker` are used as-is; bare provider ids also
+    # get their `-worker` and `-executor` spellings.
+    if not worker_id.endswith("-worker"):
+        prefixes.append(f"{worker_id}-worker")
+        prefixes.append(f"{worker_id}-executor")
+    return prefixes
+def agent_matches(agent_name: str, prefixes: list[str]) -> bool:
+    """Return True when ``agent_name`` belongs to one of ``prefixes``.
+    A name matches a prefix when it equals the prefix or starts with the
+    prefix followed by a hyphen (``<prefix>-...``). A falsy ``agent_name`` or
+    an empty ``prefixes`` list never matches.
+    """
+    if not agent_name:
+        return False
+    for prefix in prefixes:
+        # The trailing hyphen keeps e.g. prefix `codex` from matching `codexx`.
+        if agent_name == prefix or agent_name.startswith(f"{prefix}-"):
+            return True
+    return False
+def _aggregate_totals(items: list[dict]) -> dict:
+    """Sum token + tool counters across multiple session totals dicts.
+    `startedAt` / `endedAt` collapse to the union window (smallest start,
+    largest end); `durationMs` is recomputed from that window so re-tries and
+    convergence rounds count against a single contiguous span. `model` and
+    `agentName` keep the first non-empty value seen in ``items`` order.
+    Returns:
+        A new dict with the summed counters, the first non-empty
+        `agentName` / `model`, the union `startedAt` / `endedAt`, and
+        `durationMs` (left at 0 when either bound is missing or the
+        timestamps fail to parse with ``ValueError``).
+    """
+    aggregate: dict = {
+        "totalTokens": 0, "inputTokens": 0, "outputTokens": 0,
+        "cacheCreationTokens": 0, "cacheReadTokens": 0,
+        "toolUses": 0, "durationMs": 0,
+        "agentName": None, "model": None,
+        "startedAt": None, "endedAt": None,
+    }
+    for t in items:
+        # Missing or None counters contribute 0 to the sum.
+        for k in ("totalTokens", "inputTokens", "outputTokens",
+                  "cacheCreationTokens", "cacheReadTokens", "toolUses"):
+            aggregate[k] += t.get(k, 0) or 0
+        if aggregate["agentName"] is None and t.get("agentName"):
+            aggregate["agentName"] = t["agentName"]
+        if aggregate["model"] is None and t.get("model"):
+            aggregate["model"] = t["model"]
+        # Widen the window using raw `<` / `>` on the stored values.
+        # NOTE(review): presumably uniformly formatted ISO-8601 strings, for
+        # which lexicographic order equals chronological order - confirm.
+        s, e = t.get("startedAt"), t.get("endedAt")
+        if s and (aggregate["startedAt"] is None or s < aggregate["startedAt"]):
+            aggregate["startedAt"] = s
+        if e and (aggregate["endedAt"] is None or e > aggregate["endedAt"]):
+            aggregate["endedAt"] = e
+    if aggregate["startedAt"] and aggregate["endedAt"]:
+        try:
+            # A trailing "Z" is rewritten to "+00:00" before parsing.
+            a = datetime.fromisoformat(aggregate["startedAt"].replace("Z", "+00:00"))
+            b = datetime.fromisoformat(aggregate["endedAt"].replace("Z", "+00:00"))
+            # Clamp to 0 so an inverted window never yields a negative span.
+            aggregate["durationMs"] = max(0, int((b - a).total_seconds() * 1000))
+        except ValueError:
+            # Unparseable timestamps leave durationMs at its initial 0.
+            # NOTE(review): only ValueError is handled; a naive/aware mix
+            # raises TypeError on `b - a`, and a non-string timestamp raises
+            # AttributeError on `.replace` - confirm inputs rule these out.
+            pass
+    return aggregate
 def collect(team_state_path: Path, project_root: Path | None = None) -> dict:
     state = json.loads(team_state_path.read_text())
     cwd = project_root or _infer_project_root(team_state_path, state)
@@ -26,19 +97,20 @@ def collect(team_state_path: Path, project_root: Path | None = None) -> dict:
         team_name = f"okstra-{task_id}" if task_id else ""
     lead_sid = (state.get("lead") or {}).get("sessionId")
-    # 1) Claude sessions (lead + claude-side workers).
+    # 1) Claude sessions (lead + claude-side workers). Cache totals at scan
+    # time so we don't re-read the jsonl when a worker matches multiple
+    # sessions.
     claude_sessions = find_claude_team_sessions(cwd, team_name, lead_sid)
-    by_agent: dict[str, tuple[str, Path]] = {}
+    by_agent: dict[str, list[tuple[str, Path, dict]]] = {}
     lead_path: Path | None = None
     for sid, path in claude_sessions.items():
         if sid == lead_sid:
             lead_path = path
             continue
-        # Read agentName lazily.
         totals = claude_session_totals(path)
         agent = totals.get("agentName")
         if agent:
-            by_agent[agent] = (sid, path)
+            by_agent.setdefault(agent, []).append((sid, path, totals))
     # Lead.
     if lead_path is not None:
@@ -50,35 +122,39 @@ def collect(team_state_path: Path, project_root: Path | None = None) -> dict:
             f"lead session jsonl not found under {claude_project_dir(cwd)} (sessionId={lead_sid})"
         )
-    # Workers.
+    # Workers — match by prefix and aggregate every session that belongs to
+    # the same role (re-dispatches with `-002`, convergence `-reverify-r1`,
+    # implementation `-executor`, report-writer `-impl` / `-2`, etc.).
     for worker in state.get("workers", []):
         worker_id = worker.get("workerId")
         agent = worker.get("agent")
-        # Subagent agentName convention: workerId itself is "claude" but agentName is "claude-worker"; report-writer == "report-writer".
-        agent_name_candidates = []
-        if worker_id:
-            agent_name_candidates.append(worker_id)
-            if not worker_id.endswith("-worker") and worker_id != "report-writer":
-                agent_name_candidates.append(f"{worker_id}-worker")
-        # Claude wrapper jsonl (also for codex/gemini-worker, since these are Claude subagents).
-        wrapper = None
-        for cand in agent_name_candidates:
-            if cand in by_agent:
-                wrapper = by_agent[cand]
-                break
-        if wrapper is None:
-            worker["usage"] = na_block(f"no Claude subagent jsonl found with agentName matching {agent_name_candidates}")
+        prefixes = match_prefixes(worker_id) if worker_id else []
+        matched: list[tuple[str, Path, dict]] = []
+        for agent_name, entries in by_agent.items():
+            if agent_matches(agent_name, prefixes):
+                matched.extend(entries)
+        if not matched:
+            worker["usage"] = na_block(
+                f"no Claude subagent jsonl found with agentName matching prefixes {prefixes}"
+            )
             continue
-        sid, path = wrapper
-        totals = claude_session_totals(path)
-        block = usage_block(totals, source="claude-jsonl")
-        block["sessionId"] = sid
-        # For codex/gemini workers, also try to find the underlying CLI session
-        # within the wrapper subagent's time window.
-        wrapper_start = totals.get("startedAt") or ""
-        wrapper_end = totals.get("endedAt") or ""
+        # Stable order by startedAt so the "primary" session is the first one.
+        matched.sort(key=lambda x: x[2].get("startedAt") or "")
+        primary_sid, _primary_path, _primary_totals = matched[0]
+        aggregate = _aggregate_totals([t for _, _, t in matched])
+        block = usage_block(aggregate, source="claude-jsonl")
+        block["sessionId"] = primary_sid
+        if len(matched) > 1:
+            block["additionalSessionIds"] = [sid for sid, _, _ in matched[1:]]
+            block["matchedAgentNames"] = sorted({t.get("agentName") for _, _, t in matched if t.get("agentName")})
+        # For codex/gemini workers, find every CLI session that fell inside the
+        # aggregated wrapper window.
+        wrapper_start = aggregate.get("startedAt") or ""
+        wrapper_end = aggregate.get("endedAt") or ""
         if agent in ("codex", "gemini"):
             if agent == "codex":
                 cli = find_codex_session(cwd, wrapper_start, wrapper_end)

package/runtime/skills/okstra-report-writer/SKILL.md CHANGED Viewed

@@ -90,7 +90,7 @@ Behaviour contract:
 After the spawner completes, the report-writer worker MUST update Section 6 ("Recommended Next Steps") to list every newly created task-key together with its entry command, so the user can pick the follow-up up immediately:
 ```
-- Follow-up: `<task-group>/<new-task-id>` — `okstra --task-key <task-group>/<new-task-id> --task-type <suggested>`
+- Follow-up: `<task-group>/<new-task-id>` — Claude Code 세션 안 `/okstra-run task-key=<task-group>/<new-task-id> task-type=<suggested>` / 별도 터미널 `scripts/okstra.sh --task-key <task-group>/<new-task-id> --task-type <suggested>`
 ```
 ## Phase 7 token-usage collector (BLOCKING)

package/runtime/templates/reports/final-report.template.md CHANGED Viewed

@@ -13,8 +13,12 @@
 > 다음 `implementation` run은 아래 체크박스가 `[x]`로 표시되어 있을 때에만 진입할 수 있습니다 (`okstra_ctl.run._validate_approved_plan` 가 이 마커를 line-anchored 정규식으로 검사하여 통과/거부합니다). 본문(`Sections 1`–`4.5`)을 끝까지 읽고, `4.5.9 Open Questions`가 비어 있거나 모두 해소된 뒤 승인해 주세요.
 - 승인 여부 (사용자가 직접 편집): `- [ ] Approved` ← 승인하려면 `[ ]` 를 `[x]` 로 변경하여 저장하세요.
-- 승인 후 다음 단계 명령어 (방법 A — 수동 편집): `okstra --task-key {{TASK_KEY}} --task-type implementation --approved-plan <이 보고서 경로>`
-- 승인 + 실행 한 번에 (방법 B — CLI 자체를 승인 의사로): `okstra --task-key {{TASK_KEY}} --task-type implementation --approved-plan <이 보고서 경로> --approve`
+- 승인 후 다음 단계 명령어 (방법 A — 수동 편집):
+  - Claude Code 세션 안: `/okstra-run task-key={{TASK_KEY}} task-type=implementation approved-plan=<이 보고서 경로>`
+  - 별도 터미널: `scripts/okstra.sh --task-key {{TASK_KEY}} --task-type implementation --approved-plan <이 보고서 경로>`
+- 승인 + 실행 한 번에 (방법 B — 진입 명령 자체를 승인 의사로):
+  - Claude Code 세션 안: `/okstra-run task-key={{TASK_KEY}} task-type=implementation approved-plan=<이 보고서 경로> approve`
+  - 별도 터미널: `scripts/okstra.sh --task-key {{TASK_KEY}} --task-type implementation --approved-plan <이 보고서 경로> --approve`
   - 방법 B 는 `--approve` 입력 행위 자체를 승인 의사로 모델링합니다. 런타임이 본 블록의 체크박스를 자동으로 `[x]` 로 바꾸고, 본 섹션 하단에 `승인 일시 (CLI ack): <ISO8601>` audit 라인을 한 줄 덧붙입니다.
 - 승인을 보류하거나 거부하려면 체크박스는 `[ ]` 로 두고 `--approve` 도 사용하지 마세요. 필요한 변경 사항은 `4.5.9 Open Questions` 또는 `Section 5 Clarification Requests` 에 기록한 뒤 같은 phase 를 재실행해 주세요.
@@ -270,7 +274,11 @@ H1 이 `skip` 이거나 H3 가 `cancel` 인 경우, 본 섹션 다음의 4.6.4 ~
   - `resolved`: 다음 run에서 lead가 답변을 받아 검증을 마쳤습니다.
   - `obsolete`: 이후 분석 결과로 더 이상 필요 없어진 항목입니다.
-이 보고서에 답을 채우신 뒤에는 `okstra --resume-clarification --task-key {{TASK_KEY}}` 한 줄로 같은 phase를 다시 실행하실 수 있습니다(자동으로 `$EDITOR`가 이 파일을 열고, 저장하면 같은 phase가 `--clarification-response`로 carry-in 되어 재실행됩니다). 스크립트로 자동화하실 때는 기존 형식 `okstra --task-key {{TASK_KEY}} --task-type {{TASK_TYPE}} --clarification-response <이 파일 경로>`도 그대로 사용하실 수 있습니다.
+이 보고서에 답을 채우신 뒤에는 한 줄로 같은 phase를 다시 실행하실 수 있습니다(자동으로 `$EDITOR`가 이 파일을 열고, 저장하면 같은 phase가 `--clarification-response`로 carry-in 되어 재실행됩니다).
+- Claude Code 세션 안: `/okstra-run resume-clarification task-key={{TASK_KEY}}`
+- 별도 터미널: `scripts/okstra.sh --resume-clarification --task-key {{TASK_KEY}}`
+스크립트로 자동화하실 때는 셸 형식 `scripts/okstra.sh --task-key {{TASK_KEY}} --task-type {{TASK_TYPE}} --clarification-response <이 파일 경로>`도 그대로 사용하실 수 있습니다. Node `okstra` admin CLI 는 `--task-key`/`--task-type`/`--resume-clarification` 을 받지 않으므로 위 두 진입점 중 하나를 사용하세요.
 ### 5.1 추가 자료 요청 (Additional Materials Requested)
@@ -298,16 +306,22 @@ H1 이 `skip` 이거나 H3 가 `cancel` 인 경우, 본 섹션 다음의 4.6.4 ~
 This section is **always present** in every final report — never omit the heading. If there are no concrete actions to take, write the single line `- No further action required. Final verdict in section 2 stands.` under the heading and stop.
-When concrete actions exist, list them as a numbered list using the rules below. Each item must include the exact command(s) the user can copy-paste. Prefer the `--task-key` shorthand for follow-up runs and `--resume-clarification` for clarification answer turn-arounds; show the equivalent full-args form only when useful.
+When concrete actions exist, list them as a numbered list using the rules below. Each item must include the exact command(s) the user can copy-paste. Show **both** the Claude Code in-session form (`/okstra-run …`) and the external-terminal shell form (`scripts/okstra.sh …`) — the Node `okstra` admin CLI does NOT accept `--task-key` / `--task-type` / `--resume-clarification`. Prefer the `task-key` shorthand for follow-up runs and `resume-clarification` for clarification answer turn-arounds; show the equivalent full-args form only when useful.
 1. **Highest-priority next action.** State what to do and why in one sentence, then the command. Example shortcut forms:
-   - Same phase rerun: `okstra --task-key {{TASK_KEY}} --task-type {{TASK_TYPE}}`
-   - Next phase: `okstra --task-key {{TASK_KEY}} --task-type <next-phase>` (omit `--task-type` to use the manifest's `workflow.nextRecommendedPhase` automatically when it is a concrete phase, not `pending-routing-decision` / `done-or-follow-up`).
+   - Same phase rerun:
+     - Claude Code 세션 안: `/okstra-run task-key={{TASK_KEY}} task-type={{TASK_TYPE}}`
+     - 별도 터미널: `scripts/okstra.sh --task-key {{TASK_KEY}} --task-type {{TASK_TYPE}}`
+   - Next phase (omit `task-type` to use the manifest's `workflow.nextRecommendedPhase` automatically when it is a concrete phase, not `pending-routing-decision` / `done-or-follow-up`):
+     - Claude Code 세션 안: `/okstra-run task-key={{TASK_KEY}} task-type=<next-phase>`
+     - 별도 터미널: `scripts/okstra.sh --task-key {{TASK_KEY}} --task-type <next-phase>`
 2. **Additional verification needed before implementation or release.** List read-only checks (test commands, log queries, dashboard URLs) that the user should run before moving to the next phase. No state-mutating commands here.
 3. **Follow-up tasks or related tasks if needed.** Reference them by `task-key` when they already exist; otherwise describe the new brief to draft.
 4. **If section 5 has any `open` rows**, the highest-priority next step MUST be the clarification turn-around. Show both forms:
-   - Preferred (interactive): `okstra --resume-clarification --task-key {{TASK_KEY}}` — opens this file in `$EDITOR`, then auto-reruns the same phase with `--clarification-response` carry-in.
-   - Scripted: `okstra --task-key {{TASK_KEY}} --task-type {{TASK_TYPE}} --clarification-response <path-to-this-file-after-editing>`.
+   - Preferred (interactive) — opens this file in `$EDITOR`, then auto-reruns the same phase with `--clarification-response` carry-in:
+     - Claude Code 세션 안: `/okstra-run resume-clarification task-key={{TASK_KEY}}`
+     - 별도 터미널: `scripts/okstra.sh --resume-clarification --task-key {{TASK_KEY}}`
+   - Scripted: `scripts/okstra.sh --task-key {{TASK_KEY}} --task-type {{TASK_TYPE}} --clarification-response <path-to-this-file-after-editing>`.
 Empty-state placeholder, copy verbatim when nothing else applies: