triflux 4.2.6 → 4.2.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63)
  1. package/package.json +2 -1
  2. package/skills/tfx-workspace/evals/evals.json +0 -79
  3. package/skills/tfx-workspace/iteration-1/benchmark.json +0 -162
  4. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/eval_metadata.json +0 -11
  5. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/old_skill/grading.json +0 -9
  6. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/old_skill/outputs/analysis.md +0 -154
  7. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/old_skill/timing.json +0 -5
  8. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/with_skill/grading.json +0 -9
  9. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/with_skill/outputs/analysis.md +0 -126
  10. package/skills/tfx-workspace/iteration-1/codex-gemini-remap/with_skill/timing.json +0 -5
  11. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/eval_metadata.json +0 -11
  12. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/old_skill/grading.json +0 -9
  13. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/old_skill/outputs/analysis.md +0 -119
  14. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/old_skill/timing.json +0 -5
  15. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/with_skill/grading.json +0 -9
  16. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/with_skill/outputs/analysis.md +0 -115
  17. package/skills/tfx-workspace/iteration-1/doctor-diagnosis/with_skill/timing.json +0 -5
  18. package/skills/tfx-workspace/iteration-1/hub-start-sequence/eval_metadata.json +0 -10
  19. package/skills/tfx-workspace/iteration-1/hub-start-sequence/old_skill/grading.json +0 -8
  20. package/skills/tfx-workspace/iteration-1/hub-start-sequence/old_skill/outputs/analysis.md +0 -86
  21. package/skills/tfx-workspace/iteration-1/hub-start-sequence/old_skill/timing.json +0 -5
  22. package/skills/tfx-workspace/iteration-1/hub-start-sequence/with_skill/grading.json +0 -8
  23. package/skills/tfx-workspace/iteration-1/hub-start-sequence/with_skill/outputs/analysis.md +0 -81
  24. package/skills/tfx-workspace/iteration-1/hub-start-sequence/with_skill/timing.json +0 -5
  25. package/skills/tfx-workspace/iteration-1/multi-team-creation/eval_metadata.json +0 -12
  26. package/skills/tfx-workspace/iteration-1/multi-team-creation/old_skill/grading.json +0 -10
  27. package/skills/tfx-workspace/iteration-1/multi-team-creation/old_skill/outputs/analysis.md +0 -316
  28. package/skills/tfx-workspace/iteration-1/multi-team-creation/old_skill/timing.json +0 -5
  29. package/skills/tfx-workspace/iteration-1/multi-team-creation/with_skill/grading.json +0 -10
  30. package/skills/tfx-workspace/iteration-1/multi-team-creation/with_skill/outputs/analysis.md +0 -352
  31. package/skills/tfx-workspace/iteration-1/multi-team-creation/with_skill/timing.json +0 -5
  32. package/skills/tfx-workspace/iteration-1/review.html +0 -1325
  33. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/eval_metadata.json +0 -12
  34. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/old_skill/grading.json +0 -10
  35. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/old_skill/outputs/analysis.md +0 -97
  36. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/old_skill/timing.json +0 -5
  37. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/with_skill/grading.json +0 -10
  38. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/with_skill/outputs/analysis.md +0 -94
  39. package/skills/tfx-workspace/iteration-1/routing-implement-shortcut/with_skill/timing.json +0 -5
  40. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/eval_metadata.json +0 -12
  41. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/old_skill/grading.json +0 -10
  42. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/old_skill/outputs/analysis.md +0 -209
  43. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/old_skill/timing.json +0 -5
  44. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/with_skill/grading.json +0 -10
  45. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/with_skill/outputs/analysis.md +0 -193
  46. package/skills/tfx-workspace/iteration-1/routing-multi-task-triage/with_skill/timing.json +0 -5
  47. package/skills/tfx-workspace/iteration-2/benchmark.json +0 -62
  48. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/eval_metadata.json +0 -13
  49. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/old_skill/grading.json +0 -11
  50. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/old_skill/outputs/analysis.md +0 -382
  51. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/old_skill/timing.json +0 -5
  52. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/with_skill/grading.json +0 -11
  53. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/with_skill/outputs/analysis.md +0 -333
  54. package/skills/tfx-workspace/iteration-2/multi-team-creation-refactored/with_skill/timing.json +0 -5
  55. package/skills/tfx-workspace/iteration-2/review.html +0 -1325
  56. package/skills/tfx-workspace/skill-snapshot/tfx-auto/SKILL.md +0 -217
  57. package/skills/tfx-workspace/skill-snapshot/tfx-auto-codex/SKILL.md +0 -77
  58. package/skills/tfx-workspace/skill-snapshot/tfx-codex/SKILL.md +0 -65
  59. package/skills/tfx-workspace/skill-snapshot/tfx-doctor/SKILL.md +0 -94
  60. package/skills/tfx-workspace/skill-snapshot/tfx-gemini/SKILL.md +0 -82
  61. package/skills/tfx-workspace/skill-snapshot/tfx-hub/SKILL.md +0 -133
  62. package/skills/tfx-workspace/skill-snapshot/tfx-multi/SKILL.md +0 -426
  63. package/skills/tfx-workspace/skill-snapshot/tfx-setup/SKILL.md +0 -101
@@ -1,119 +0,0 @@
1
- # tfx-doctor Routing Analysis
2
-
3
- ## User Request
4
- "HUD가 안 보이고 codex도 안 되는데 어떻게 해?"
5
-
6
- ---
7
-
8
- ## 1. Mode Selection
9
-
10
- **Mode used: default (진단만)**
11
-
12
- Rationale:
13
- - The user is reporting two symptoms: HUD not visible and Codex not working.
14
- - The request does not contain any explicit repair intent ("--fix"), cache reset request ("캐시 초기화", "리셋", "reset"), or destructive intent.
15
- - The skill's auto-suggest trigger list includes both "HUD가 안 보여" and "codex/gemini가 안 돼", which directly match the user's message.
16
- - Because no `--fix` or `--reset` flag is implied, the skill begins in read-only diagnostic mode.
17
- - After the diagnostic report is shown, `--fix` would be **suggested** to the user as a next step.
18
-
19
- ---
20
-
21
- ## 2. Exact Bash Command That Would Be Run
22
-
23
- ```bash
24
- Bash("triflux doctor")
25
- ```
26
-
27
- No additional flags. This is the read-only diagnostic path.
28
-
29
- ---
30
-
31
- ## 3. Diagnostics Checked
32
-
33
- The `triflux doctor` command (default mode) checks all of the following:
34
-
35
- | Diagnostic Item | Relevance to This Request |
36
- |----------------|--------------------------|
37
- | tfx-route.sh 설치 상태 | General health baseline |
38
- | HUD 설치 및 설정 상태 | **Directly relevant** — user reports HUD not visible |
39
- | Codex/Gemini/Claude CLI 경로 (크로스 셸) | **Directly relevant** — user reports Codex not working |
40
- | 스킬 설치 상태 | General health |
41
- | 플러그인 등록 상태 | General health |
42
- | MCP 인벤토리 캐시 | Could affect HUD and CLI display |
43
- | CLI 이슈 트래커 | May log the Codex failure |
44
- | 잔존 팀(orphan teams) 감지 (`~/.claude/teams/`) | General health |
45
-
46
- All eight diagnostic areas are checked in default mode — none are skipped.
47
-
48
- ---
49
-
50
- ## 4. Whether --fix Would Be Suggested
51
-
52
- **Yes.** After the diagnostic report is displayed, `--fix` would be recommended to the user as the next step if any issues are found (e.g., HUD misconfiguration, missing Codex CLI path, corrupted cache). The skill definition explicitly states:
53
-
54
- > 수정 모드 (`/tfx-doctor --fix`): 진단 전에 자동 수정을 시도합니다.
55
-
56
- The agent would prompt: "문제가 발견되었습니다. `/tfx-doctor --fix`를 실행하여 자동 수정을 시도하시겠습니까?"
57
-
58
- ---
59
-
60
- ## 5. Whether --reset Would Be Used (and Why/Why Not)
61
-
62
- **No. `--reset` would NOT be used.**
63
-
64
- Reasons:
65
- - The user's message contains no reset/cache-clear intent ("캐시 초기화", "리셋", "reset").
66
- - `--reset` is a destructive operation that wipes all triflux-related caches (8 files, including claude-usage-cache.json and mcp-inventory.json).
67
- - The symptoms described (HUD not visible, Codex not working) are diagnostic-first scenarios — they should be investigated before resorting to full cache deletion.
68
- - Per the skill definition, `--reset` is reserved for explicit cache-initialization requests.
69
- - If `--fix` still leaves issues unresolved, the agent would then consider suggesting `--reset` as a last resort, but only with user confirmation.
70
-
71
- ---
72
-
73
- ## 6. Expected Report Format
74
-
75
- After `triflux doctor` runs, the agent reports results in this structure:
76
-
77
- ```
78
- ## triflux doctor 진단 결과
79
-
80
- | 항목 | 상태 | 비고 |
81
- |------|------|------|
82
- | tfx-route.sh | ✓ / ✗ | ... |
83
- | HUD | ✓ / ✗ | 설치됨/설치 안됨/설정 오류 |
84
- | Codex CLI 경로 | ✓ / ✗ | 경로 발견/미발견 |
85
- | Gemini CLI 경로 | ✓ / ✗ | ... |
86
- | Claude CLI 경로 | ✓ / ✗ | ... |
87
- | 스킬 설치 상태 | ✓ / ✗ | ... |
88
- | 플러그인 등록 | ✓ / ✗ | ... |
89
- | MCP 인벤토리 캐시 | ✓ / ✗ | ... |
90
- | CLI 이슈 트래커 | ✓ / ✗ | ... |
91
- | orphan teams | ✓ / ✗ | ... |
92
-
93
- 이슈가 발견되었습니다. `/tfx-doctor --fix`로 자동 수정을 시도할 수 있습니다.
94
- ```
95
-
96
- If no issues are found:
97
- ```
98
- 모든 진단 항목이 정상입니다.
99
- ```
100
-
101
- If `--fix` is subsequently run and issues still remain after repair:
102
- ```
103
- Codex/Gemini 설치는 수동으로 진행해야 합니다. (설치 안내 링크 또는 명령어 제공)
104
- ```
105
-
106
- ---
107
-
108
- ## Summary
109
-
110
- | Decision Point | Result |
111
- |----------------|--------|
112
- | Skill triggered | tfx-doctor |
113
- | Mode | default (read-only diagnostic) |
114
- | Command | `Bash("triflux doctor")` |
115
- | HUD diagnosed | Yes |
116
- | Codex CLI path diagnosed | Yes |
117
- | --fix suggested after report | Yes (if issues found) |
118
- | --reset used | No |
119
- | --reset trigger condition | Only if user explicitly requests cache reset |
@@ -1,5 +0,0 @@
1
- {
2
- "total_tokens": 14482,
3
- "duration_ms": 48260,
4
- "total_duration_seconds": 48.3
5
- }
@@ -1,9 +0,0 @@
1
- {
2
- "expectations": [
3
- {"text": "Runs 'triflux doctor' as first diagnostic step", "passed": true, "evidence": "Agent output: 'Exact command: Bash(\"triflux doctor\")'"},
4
- {"text": "Suggests '--fix' mode for auto-repair", "passed": true, "evidence": "Agent output: '--fix would be suggested to the user after the diagnosis report is returned'"},
5
- {"text": "Mentions HUD and CLI path checks in explanation", "passed": true, "evidence": "Agent output: 'HUD installation and config, Codex/Gemini/Claude CLI paths — directly relevant to symptoms'"},
6
- {"text": "Does NOT jump straight to --reset (that's for cache only)", "passed": true, "evidence": "Agent output: '--reset is destructive and reserved for explicit reset requests; user never said 리셋/초기화/reset'"}
7
- ],
8
- "summary": {"passed": 4, "failed": 0, "total": 4, "pass_rate": 1.0}
9
- }
@@ -1,115 +0,0 @@
1
- # tfx-doctor Routing Analysis
2
-
3
- ## User Request
4
-
5
- > "HUD가 안 보이고 codex도 안 되는데 어떻게 해?"
6
-
7
- ---
8
-
9
- ## Skill Matched
10
-
11
- **tfx-doctor** (`skills/tfx-doctor/SKILL.md`)
12
-
13
- The request directly matches two of the documented auto-suggestion triggers:
14
- - "HUD가 안 보여" → maps to "HUD가 안 보이고"
15
- - "codex/gemini가 안 돼" → maps to "codex도 안 되는데"
16
-
17
- ---
18
-
19
- ## Mode Selected
20
-
21
- **Default mode** (`/tfx-doctor` — 진단만, 읽기 전용)
22
-
23
- Rationale: The user is reporting symptoms ("안 보이고", "안 되는데") but has not asked for an automatic fix, a reset, or a cache wipe. The skill definition states that the default mode is read-only diagnosis only. `--fix` would be *suggested* after the diagnosis if issues are found, but it would not be applied automatically without user consent. `--reset` is not appropriate here because the user has not said "캐시 초기화", "리셋", or "reset".
24
-
25
- ---
26
-
27
- ## Exact Bash Command That Would Be Run
28
-
29
- ```bash
30
- Bash("triflux doctor")
31
- ```
32
-
33
- No flags. This is the single command executed in default mode.
34
-
35
- ---
36
-
37
- ## Diagnostics Checked
38
-
39
- The skill definition lists the following items that `triflux doctor` inspects:
40
-
41
- | # | Diagnostic Item | Relevance to this Request |
42
- |---|-----------------|--------------------------|
43
- | 1 | tfx-route.sh 설치 상태 | Baseline routing check |
44
- | 2 | HUD 설치 및 설정 상태 | Directly relevant — HUD가 안 보임 |
45
- | 3 | Codex/Gemini/Claude CLI 경로 (크로스 셸) | Directly relevant — codex 안 됨 |
46
- | 4 | 스킬 설치 상태 | General health |
47
- | 5 | 플러그인 등록 상태 | General health |
48
- | 6 | MCP 인벤토리 캐시 | Could affect HUD/Codex behaviour |
49
- | 7 | CLI 이슈 트래커 | May surface logged errors |
50
- | 8 | 잔존 팀(orphan teams) 감지 (`~/.claude/teams/`) | General health |
51
-
52
- Both primary symptoms (HUD invisible, Codex not working) are covered by items 2 and 3.
53
-
54
- ---
55
-
56
- ## --fix Suggestion
57
-
58
- **Yes — `--fix` would be suggested** after the diagnosis report is returned to the user.
59
-
60
- The skill's error-handling table states: "if issues remain after `--fix`, manual installation of Codex/Gemini is guided." This implies the flow is:
61
-
62
- 1. Run default diagnosis → report findings.
63
- 2. If issues are found, offer the user the option to re-run with `--fix`.
64
- 3. User decides; skill does not auto-escalate.
65
-
66
- ---
67
-
68
- ## --reset Decision
69
-
70
- **`--reset` would NOT be used.**
71
-
72
- Reasons:
73
- - The user did not request a cache wipe, full reset, or use the words "리셋", "초기화", or "reset".
74
- - `--reset` is a destructive, irreversible operation (deletes all cache files listed in the skill) and must only be triggered by explicit user intent.
75
- - The reported symptoms (HUD invisible, Codex not working) are diagnostic problems, not confirmed cache-corruption problems. A reset would be premature without diagnosis confirming a cache issue.
76
-
77
- ---
78
-
79
- ## Expected Report Format
80
-
81
- After `triflux doctor` completes, the results are reported to the user (per the skill: "결과를 사용자에게 보고합니다"). Based on the diagnostic items, the expected report structure is:
82
-
83
- ```
84
- [triflux doctor] 진단 결과
85
- ─────────────────────────────────
86
- ✓ / ✗ tfx-route.sh 설치 상태
87
- ✓ / ✗ HUD 설치 및 설정 상태
88
- ✓ / ✗ Codex CLI 경로
89
- ✓ / ✗ Gemini CLI 경로
90
- ✓ / ✗ Claude CLI 경로
91
- ✓ / ✗ 스킬 설치 상태
92
- ✓ / ✗ 플러그인 등록 상태
93
- ✓ / ✗ MCP 인벤토리 캐시
94
- ✓ / ✗ CLI 이슈 트래커
95
- ✓ / ✗ 잔존 팀(orphan teams)
96
- ─────────────────────────────────
97
- N개 이슈 발견. --fix로 자동 수정하려면: /tfx-doctor --fix
98
- ```
99
-
100
- If `--fix` is subsequently accepted by the user, the report repeats after remediation, showing whether items moved from ✗ to ✓. Any items that `--fix` cannot resolve (e.g., Codex not installed) are surfaced with a manual-installation note.
101
-
102
- ---
103
-
104
- ## Summary
105
-
106
- | Decision Point | Answer |
107
- |----------------|--------|
108
- | Skill triggered | tfx-doctor |
109
- | Mode | default (진단만) |
110
- | Command run | `triflux doctor` |
111
- | HUD checked | Yes |
112
- | CLI paths checked | Yes (Codex, Gemini, Claude) |
113
- | --fix suggested | Yes, after diagnosis |
114
- | --fix auto-applied | No |
115
- | --reset used | No |
@@ -1,5 +0,0 @@
1
- {
2
- "total_tokens": 14499,
3
- "duration_ms": 53804,
4
- "total_duration_seconds": 53.8
5
- }
@@ -1,10 +0,0 @@
1
- {
2
- "eval_id": 5,
3
- "eval_name": "hub-start-sequence",
4
- "prompt": "/tfx-hub start",
5
- "assertions": [
6
- "Runs 'node hub/server.mjs' with run_in_background=true",
7
- "Mentions port 27888 and /mcp endpoint",
8
- "Does NOT try to run any triage or routing"
9
- ]
10
- }
@@ -1,8 +0,0 @@
1
- {
2
- "expectations": [
3
- {"text": "Runs 'node hub/server.mjs' with run_in_background=true", "passed": true, "evidence": "Agent output: 'Bash(\"node hub/server.mjs\", run_in_background=true)'"},
4
- {"text": "Mentions port 27888 and /mcp endpoint", "passed": true, "evidence": "Agent output: 'Port: 27888, MCP endpoint: http://127.0.0.1:27888/mcp'"},
5
- {"text": "Does NOT try to run any triage or routing", "passed": true, "evidence": "Agent correctly identified as command match, not fallthrough"}
6
- ],
7
- "summary": {"passed": 3, "failed": 0, "total": 3, "pass_rate": 1.0}
8
- }
@@ -1,86 +0,0 @@
1
- # Routing Analysis: `/tfx-hub start`
2
-
3
- **Skill source:** `skills/tfx-workspace/skill-snapshot/tfx-hub/SKILL.md`
4
- **Input:** `/tfx-hub start`
5
- **Run mode:** DRY RUN — no commands executed
6
-
7
- ---
8
-
9
- ## 1. Command Match vs. Fallthrough
10
-
11
- This input **matches a command** — specifically the `start` command.
12
-
13
- The skill's input interpretation table explicitly lists:
14
-
15
- ```
16
- /tfx-hub start → 커맨드 매칭 → 허브 시작
17
- ```
18
-
19
- The argument `start` is a recognized command keyword (alongside `stop`, `status`, `--port`). Therefore, the fallthrough path is NOT taken.
20
-
21
- ---
22
-
23
- ## 2. Exact Bash Command That Would Be Run
24
-
25
- ```bash
26
- Bash("node hub/server.mjs", run_in_background=true)
27
- ```
28
-
29
- This is quoted verbatim from the `### start — 허브 시작` section of the skill definition.
30
-
31
- ---
32
-
33
- ## 3. run_in_background Setting
34
-
35
- `run_in_background` would be set to **`true`**.
36
-
37
- The skill definition explicitly passes `run_in_background=true` as a parameter to the `Bash` call for the `start` command. The hub process is a long-running server and must not block the agent thread.
38
-
39
- ---
40
-
41
- ## 4. Port and Endpoint
42
-
43
- - **Port:** `27888`
44
- - **MCP endpoint:** `http://127.0.0.1:27888/mcp`
45
- - **Status endpoint:** `http://127.0.0.1:27888/status`
46
-
47
- The skill states: "Streamable HTTP MCP 서버를 `http://127.0.0.1:27888/mcp` 에서 시작"
48
-
49
- Supporting runtime details:
50
- - SQLite WAL DB: `~/.claude/cache/tfx-hub/state.db`
51
- - PID file: `~/.claude/cache/tfx-hub/hub.pid`
52
- - Port can be overridden via env var `TFX_HUB_PORT`; DB path via `TFX_HUB_DB`
53
-
54
- ---
55
-
56
- ## 5. Post-Start Registration Steps
57
-
58
- The skill documents a section titled **"각 CLI 등록 방법"** (How to register with each CLI) describing steps to run after the hub starts. These are not executed automatically by the `start` command — they are listed as manual follow-up actions:
59
-
60
- ```bash
61
- # Codex
62
- codex mcp add tfx-hub --url http://127.0.0.1:27888/mcp
63
-
64
- # Gemini (settings.json)
65
- # mcpServers.tfx-hub.url = "http://127.0.0.1:27888/mcp"
66
-
67
- # Claude
68
- claude mcp add --transport http tfx-hub http://127.0.0.1:27888/mcp
69
- ```
70
-
71
- The `start` command itself only launches `node hub/server.mjs` in the background. Registration with individual CLI agents is a separate, post-start step described in the skill but not triggered automatically. The skill does not indicate these registration calls are part of the `start` flow — they are presented as supplementary instructions under their own heading.
72
-
73
- ---
74
-
75
- ## Summary Table
76
-
77
- | Field | Value |
78
- |-------------------------|--------------------------------------------|
79
- | Routing outcome | Command match (`start`) |
80
- | Fallthrough triggered | No |
81
- | Exact command | `Bash("node hub/server.mjs", run_in_background=true)` |
82
- | run_in_background | `true` |
83
- | Hub port | `27888` |
84
- | MCP endpoint | `http://127.0.0.1:27888/mcp` |
85
- | Status endpoint | `http://127.0.0.1:27888/status` |
86
- | Post-start registration | Manual — not auto-executed by start command |
@@ -1,5 +0,0 @@
1
- {
2
- "total_tokens": 14904,
3
- "duration_ms": 51754,
4
- "total_duration_seconds": 51.8
5
- }
@@ -1,8 +0,0 @@
1
- {
2
- "expectations": [
3
- {"text": "Runs 'node hub/server.mjs' with run_in_background=true", "passed": true, "evidence": "Agent output: 'Bash(\"node hub/server.mjs\", run_in_background=true)'"},
4
- {"text": "Mentions port 27888 and /mcp endpoint", "passed": true, "evidence": "Agent output: 'Port 27888, MCP endpoint at http://127.0.0.1:27888/mcp'"},
5
- {"text": "Does NOT try to run any triage or routing", "passed": true, "evidence": "Agent correctly identified this as a command match (start), not fallthrough to triage"}
6
- ],
7
- "summary": {"passed": 3, "failed": 0, "total": 3, "pass_rate": 1.0}
8
- }
@@ -1,81 +0,0 @@
1
- # Routing Analysis: `/tfx-hub start`
2
-
3
- ## Source
4
- Skill definition: `skills/tfx-hub/SKILL.md`
5
-
6
- ---
7
-
8
- ## 1. Command Match vs. Fallthrough
9
-
10
- **Result: Command match — `start`**
11
-
12
- The skill defines an explicit routing table under "입력 해석 규칙":
13
-
14
- ```
15
- /tfx-hub start → 커맨드 매칭 → 허브 시작
16
- ```
17
-
18
- The argument `start` is listed as a command keyword. The fallthrough rule only applies when the argument does NOT match `start`, `stop`, `status`, or `--port`. Therefore `/tfx-hub start` is handled by the `start` command branch, not the free-form fallthrough.
19
-
20
- ---
21
-
22
- ## 2. Exact Bash Command
23
-
24
- ```bash
25
- Bash("node hub/server.mjs", run_in_background=true)
26
- ```
27
-
28
- Quoted verbatim from the skill's `### start — 허브 시작` section.
29
-
30
- ---
31
-
32
- ## 3. `run_in_background`
33
-
34
- **Set to `true`.**
35
-
36
- The skill explicitly passes `run_in_background=true` in the `start` command call. This is the only command in the skill that uses background execution.
37
-
38
- ---
39
-
40
- ## 4. Port and Endpoint
41
-
42
- - **Port:** `27888` (default; overridable via environment variable `TFX_HUB_PORT`)
43
- - **MCP endpoint:** `http://127.0.0.1:27888/mcp`
44
- - **Status endpoint:** `http://127.0.0.1:27888/status`
45
-
46
- Additional runtime artefacts written on start:
47
- - SQLite WAL DB: `~/.claude/cache/tfx-hub/state.db`
48
- - PID file: `~/.claude/cache/tfx-hub/hub.pid`
49
-
50
- ---
51
-
52
- ## 5. Post-Start Registration Steps
53
-
54
- The skill describes registering the running hub with each CLI agent under "각 CLI 등록 방법":
55
-
56
- ```bash
57
- # Codex
58
- codex mcp add tfx-hub --url http://127.0.0.1:27888/mcp
59
-
60
- # Gemini (settings.json)
61
- # mcpServers.tfx-hub.url = "http://127.0.0.1:27888/mcp"
62
-
63
- # Claude
64
- claude mcp add --transport http tfx-hub http://127.0.0.1:27888/mcp
65
- ```
66
-
67
- These steps are documented but are listed as per-CLI manual registration steps — the skill does not show them being executed automatically as part of the `start` command block itself. The `start` block contains only the single `Bash("node hub/server.mjs", run_in_background=true)` call.
68
-
69
- ---
70
-
71
- ## Summary Table
72
-
73
- | Attribute | Value |
74
- |-----------|-------|
75
- | Routing outcome | Command match (`start`) |
76
- | Fallthrough triggered | No |
77
- | Bash command | `Bash("node hub/server.mjs", run_in_background=true)` |
78
- | `run_in_background` | `true` |
79
- | Port | `27888` |
80
- | MCP endpoint | `http://127.0.0.1:27888/mcp` |
81
- | Post-start registration | Documented (manual, per-CLI); not auto-executed by `start` |
@@ -1,5 +0,0 @@
1
- {
2
- "total_tokens": 14821,
3
- "duration_ms": 47208,
4
- "total_duration_seconds": 47.2
5
- }
@@ -1,12 +0,0 @@
1
- {
2
- "eval_id": 3,
3
- "eval_name": "multi-team-creation",
4
- "prompt": "/tfx-multi 인증 리팩터링 + UI 개선 + 보안 리뷰",
5
- "assertions": [
6
- "Creates exactly one TeamCreate with tfx- prefix naming",
7
- "Creates 3 TaskCreate calls (one per subtask)",
8
- "Spawns 3 Agent wrappers with mode: bypassPermissions",
9
- "Uses tfx-route.sh inside Agent wrapper (not direct codex/gemini)",
10
- "Includes Phase 5 cleanup (TeamDelete)"
11
- ]
12
- }
@@ -1,10 +0,0 @@
1
- {
2
- "expectations": [
3
- {"text": "Creates exactly one TeamCreate with tfx- prefix naming", "passed": true, "evidence": "Agent output: TeamCreate({ team_name: 'tfx-<id>' })"},
4
- {"text": "Creates 3 TaskCreate calls (one per subtask)", "passed": true, "evidence": "Agent output: 'Three TaskCreate calls (one per subtask), preserving taskIds'"},
5
- {"text": "Spawns 3 Agent wrappers with mode: bypassPermissions", "passed": true, "evidence": "Agent output: 'mode: bypassPermissions — included in all 3 Agent calls. Mandatory.'"},
6
- {"text": "Uses tfx-route.sh inside Agent wrapper (not direct codex/gemini)", "passed": true, "evidence": "Agent output: 'all wrappers internally call bash ~/.claude/scripts/tfx-route.sh — never direct codex exec or gemini -y -p'"},
7
- {"text": "Includes Phase 5 cleanup (TeamDelete)", "passed": true, "evidence": "Agent output: 'TeamDelete is called unconditionally (success or failure), with 30-second wait'"}
8
- ],
9
- "summary": {"passed": 5, "failed": 0, "total": 5, "pass_rate": 1.0}
10
- }