oh-my-customcodex 0.3.10 → 0.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (37)
  1. package/README.md +9 -8
  2. package/dist/cli/index.js +2 -9
  3. package/dist/index.js +1 -1
  4. package/package.json +1 -1
  5. package/templates/.claude/agents/mgr-creator.md +11 -0
  6. package/templates/.claude/agents/mgr-sauron.md +1 -1
  7. package/templates/.claude/agents/tracker-checkpoint.md +77 -0
  8. package/templates/.claude/output-styles/korean-engineer.md +24 -0
  9. package/templates/.claude/rules/MUST-agent-design.md +2 -1
  10. package/templates/.claude/rules/MUST-completion-verification.md +13 -0
  11. package/templates/.claude/rules/SHOULD-interaction.md +2 -0
  12. package/templates/.claude/skills/agent-eval-framework/SKILL.md +92 -0
  13. package/templates/.claude/skills/agora/SKILL.md +11 -0
  14. package/templates/.claude/skills/codex-exec/SKILL.md +12 -0
  15. package/templates/.claude/skills/dag-orchestration/SKILL.md +20 -0
  16. package/templates/.claude/skills/evaluator-optimizer/SKILL.md +20 -0
  17. package/templates/.claude/skills/harness-eval/SKILL.md +13 -0
  18. package/templates/.claude/skills/pipeline-guards/SKILL.md +19 -0
  19. package/templates/.claude/skills/roundtable-debate/SKILL.md +60 -0
  20. package/templates/.claude/skills/sauron-watch/SKILL.md +16 -4
  21. package/templates/.claude/skills/sdd-dev/SKILL.md +6 -3
  22. package/templates/.claude/skills/sdd-dev/templates/decision-record.md +45 -0
  23. package/templates/.claude/skills/secretary-routing/SKILL.md +3 -0
  24. package/templates/.github/scripts/verify-fork-list.sh +97 -0
  25. package/templates/AGENTS.md.en +12 -26
  26. package/templates/AGENTS.md.ko +12 -26
  27. package/templates/CLAUDE.md +5 -4
  28. package/templates/CLAUDE.md.en +8 -7
  29. package/templates/CLAUDE.md.ko +8 -7
  30. package/templates/guides/agent-eval/README.md +48 -0
  31. package/templates/guides/agent-eval/index.yaml +6 -0
  32. package/templates/guides/browser-automation/README.md +12 -0
  33. package/templates/guides/index.yaml +12 -0
  34. package/templates/guides/multi-agent-debate-patterns/README.md +26 -0
  35. package/templates/guides/multi-agent-debate-patterns/index.yaml +6 -0
  36. package/templates/manifest.json +5 -5
  37. package/templates/workflows/auto-dev.yaml +7 -1
@@ -0,0 +1,45 @@
1
+ ---
2
+ title: {Decision title}
3
+ date: YYYY-MM-DD
4
+ status: proposed | accepted | superseded | deprecated
5
+ context: guides/harness-engineering/README.md
6
+ decision_makers: [{agent or role}]
7
+ ---
8
+
9
+ # {Decision title}
10
+
11
+ ## Context
12
+
13
+ {What is the problem and why is a decision needed? Include relevant constraints, goals, and the situation that makes this decision necessary.}
14
+
15
+ ## Options Considered
16
+
17
+ 1. **Option A**: {Description}
18
+ - Pros: {benefits}
19
+ - Cons: {drawbacks, trade-offs}
20
+
21
+ 2. **Option B**: {Description}
22
+ - Pros: {benefits}
23
+ - Cons: {drawbacks, trade-offs}
24
+
25
+ 3. **Option C** *(if applicable)*: {Description}
26
+ - Pros: {benefits}
27
+ - Cons: {drawbacks, trade-offs}
28
+
29
+ ## Decision
30
+
31
+ **Chosen**: Option {A|B|C}
32
+
33
+ {Explain the rationale for the choice. Why does this option best satisfy the constraints and goals from the Context section?}
34
+
35
+ ## Consequences
36
+
37
+ - **Positive**: {What improves as a result of this decision}
38
+ - **Negative**: {Trade-offs and costs accepted}
39
+ - **Risks**: {Future considerations, potential issues to monitor}
40
+
41
+ ## References
42
+
43
+ - guides/harness-engineering/README.md
44
+ - {related skill or agent, e.g. .codex/skills/action-validator/SKILL.md}
45
+ - {link to issue or PR if applicable}
@@ -24,6 +24,7 @@ Routes agent management tasks to the appropriate manager agent. This skill conta
24
24
  | mgr-claude-code-bible | Claude Code spec compliance | "spec check", "verify compliance" |
25
25
  | sys-memory-keeper | Memory operations | "save memory", "recall", "memory search" |
26
26
  | sys-naggy | TODO management | "todo", "track tasks", "task list" |
27
+ | tracker-checkpoint | Pipeline checkpoint state | "pipeline resume", "checkpoint", "state restore" |
27
28
 
28
29
  ## Routing Decision (Priority Order)
29
30
 
@@ -51,6 +52,7 @@ verify → mgr-sauron
51
52
  spec → mgr-claude-code-bible
52
53
  memory → sys-memory-keeper
53
54
  todo → sys-naggy
55
+ checkpoint → tracker-checkpoint
54
56
  improve-report → omcodex:improve-report (skill invocation)
55
57
  auto-improve → omcodex:auto-improve (skill invocation)
56
58
  batch → multiple (parallel)
@@ -106,6 +108,7 @@ When command requires multiple independent operations:
106
108
  | mgr-claude-code-bible | sonnet | Spec compliance checks |
107
109
  | sys-memory-keeper | sonnet | Memory operations, search |
108
110
  | sys-naggy | haiku | Simple TODO tracking |
111
+ | tracker-checkpoint | sonnet | Pipeline state recovery |
109
112
 
110
113
  ## No Match Fallback
111
114
 
@@ -0,0 +1,97 @@
1
+ #!/usr/bin/env bash
2
+ # Verify that the R006 Context Fork Criteria line in MUST-agent-design.md (count and skill list) matches the skills whose SKILL.md frontmatter declares `context: fork`.
3
+ # Usage: bash .github/scripts/verify-fork-list.sh
4
+ set -euo pipefail
5
+
6
+ ROOT="$(cd "$(dirname "$0")/../.." && pwd)"
7
+ RULE_FILE="${ROOT}/.codex/rules/MUST-agent-design.md"
8
+ SKILLS_DIR="${ROOT}/.codex/skills"
9
+
10
+ if [[ ! -f "${RULE_FILE}" ]]; then
11
+ echo "error: ${RULE_FILE} not found" >&2
12
+ exit 1
13
+ fi
14
+
15
+ if [[ ! -d "${SKILLS_DIR}" ]]; then
16
+ echo "error: ${SKILLS_DIR} not found" >&2
17
+ exit 1
18
+ fi
19
+
20
+ DOC_LINE="$(grep -E 'Current: [0-9]+/12 \(' "${RULE_FILE}" | head -1 || true)"
21
+
22
+ if [[ -z "${DOC_LINE}" ]]; then
23
+ echo "error: R006 Context Fork Criteria line not found" >&2
24
+ exit 1
25
+ fi
26
+
27
+ DOC_COUNT="$(printf '%s\n' "${DOC_LINE}" | sed -E 's#.*Current: ([0-9]+)/12.*#\1#')"
28
+ DOC_LIST="$(printf '%s\n' "${DOC_LINE}" | sed -E 's#.*Current: [0-9]+/12 \(([^)]*)\).*#\1#' | tr ',' '\n' | sed 's/^ *//; s/ *$//' | sort)"
29
+
30
+ ACTUAL_LIST="$(
31
+ for skill_file in "${SKILLS_DIR}"/*/SKILL.md; do
32
+ [[ -f "${skill_file}" ]] || continue
33
+ if awk '
34
+ BEGIN { in_frontmatter = 0; found = 0 }
35
+ NR == 1 && $0 == "---" { in_frontmatter = 1; next }
36
+ in_frontmatter && $0 == "---" { exit }
37
+ in_frontmatter && $0 ~ /^context:[[:space:]]*fork[[:space:]]*$/ { found = 1 }
38
+ END { exit found ? 0 : 1 }
39
+ ' "${skill_file}"; then
40
+ skill_name="$(awk '
41
+ NR == 1 && $0 == "---" { in_frontmatter = 1; next }
42
+ in_frontmatter && $0 == "---" { exit }
43
+ in_frontmatter && $0 ~ /^name:[[:space:]]*/ {
44
+ sub(/^name:[[:space:]]*/, "")
45
+ gsub(/^"|"$/, "")
46
+ print
47
+ exit
48
+ }
49
+ ' "${skill_file}")"
50
+ if [[ -z "${skill_name}" ]]; then
51
+ echo "error: context: fork skill has no frontmatter name: ${skill_file}" >&2
52
+ exit 1
53
+ fi
54
+ printf '%s\n' "${skill_name}"
55
+ fi
56
+ done | sort
57
+ )"
58
+
59
+ ACTUAL_COUNT="$(printf '%s\n' "${ACTUAL_LIST}" | sed '/^$/d' | wc -l | tr -d ' ')"
60
+ DOC_LIST_COUNT="$(printf '%s\n' "${DOC_LIST}" | sed '/^$/d' | wc -l | tr -d ' ')"
61
+
62
+ DOC_TMP="$(mktemp)"
63
+ ACTUAL_TMP="$(mktemp)"
64
+ trap 'rm -f "${DOC_TMP}" "${ACTUAL_TMP}"' EXIT
65
+
66
+ printf '%s\n' "${DOC_LIST}" | sed '/^$/d' > "${DOC_TMP}"
67
+ printf '%s\n' "${ACTUAL_LIST}" | sed '/^$/d' > "${ACTUAL_TMP}"
68
+
69
+ MISSING="$(comm -23 "${ACTUAL_TMP}" "${DOC_TMP}" || true)"
70
+ EXTRA="$(comm -13 "${ACTUAL_TMP}" "${DOC_TMP}" || true)"
71
+
72
+ echo "R006 documented count: ${DOC_COUNT}"
73
+ echo "R006 listed skills: ${DOC_LIST_COUNT}"
74
+ echo "Actual fork skill count: ${ACTUAL_COUNT}"
75
+ echo ""
76
+ echo "Actual fork skills:"
77
+ sed 's/^/ - /' "${ACTUAL_TMP}"
78
+
79
+ if [[ "${DOC_COUNT}" != "${ACTUAL_COUNT}" || "${DOC_LIST_COUNT}" != "${ACTUAL_COUNT}" || -n "${MISSING}" || -n "${EXTRA}" ]]; then
80
+ echo ""
81
+ echo "ERROR: R006 fork list drift detected"
82
+ [[ "${DOC_COUNT}" != "${ACTUAL_COUNT}" ]] && echo " - documented count ${DOC_COUNT} != actual count ${ACTUAL_COUNT}"
83
+ [[ "${DOC_LIST_COUNT}" != "${ACTUAL_COUNT}" ]] && echo " - listed skill count ${DOC_LIST_COUNT} != actual count ${ACTUAL_COUNT}"
84
+ if [[ -n "${MISSING}" ]]; then
85
+ echo " - missing from R006:"
86
+ printf '%s\n' "${MISSING}" | sed 's/^/ - /'
87
+ fi
88
+ if [[ -n "${EXTRA}" ]]; then
89
+ echo " - extra in R006:"
90
+ printf '%s\n' "${EXTRA}" | sed 's/^/ - /'
91
+ fi
92
+ echo " Fix: update Context Fork Criteria in ${RULE_FILE}"
93
+ exit 1
94
+ fi
95
+
96
+ echo ""
97
+ echo "OK: R006 fork list matches actual SKILL.md frontmatter (${ACTUAL_COUNT}/12)"
@@ -128,7 +128,7 @@ NO EXCEPTIONS. NO EXCUSES.
128
128
  project/
129
129
  +-- AGENTS.md # Entry point
130
130
  +-- .codex/
131
- | +-- agents/ # Subagent definitions (44 files)
131
+ | +-- agents/ # Subagent definitions (49 files)
132
132
  | +-- rules/ # Global rules (R000-R020)
133
133
  | +-- hooks/ # Hook scripts (security, validation, HUD)
134
134
  | +-- contexts/ # Context files (ecomode)
@@ -164,17 +164,18 @@ This is the core oh-my-customcodex philosophy: **"No expert? CREATE one, connect
164
164
  |------|-------|--------|
165
165
  | SW Engineer/Language | 6 | lang-golang-expert, lang-python-expert, lang-rust-expert, lang-kotlin-expert, lang-typescript-expert, lang-java21-expert |
166
166
  | SW Engineer/Backend | 6 | be-fastapi-expert, be-springboot-expert, be-go-backend-expert, be-express-expert, be-nestjs-expert, be-django-expert |
167
- | SW Engineer/Frontend | 4 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent |
167
+ | SW Engineer/Frontend | 5 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent, fe-design-expert |
168
168
  | SW Engineer/Tooling | 3 | tool-npm-expert, tool-optimizer, tool-bun-expert |
169
169
  | DE Engineer | 6 | de-airflow-expert, de-dbt-expert, de-spark-expert, de-kafka-expert, de-snowflake-expert, de-pipeline-expert |
170
- | SW Engineer/Database | 3 | db-supabase-expert, db-postgres-expert, db-redis-expert |
170
+ | SW Engineer/Database | 4 | db-supabase-expert, db-postgres-expert, db-redis-expert, db-alembic-expert |
171
171
  | Security | 1 | sec-codeql-expert |
172
172
  | SW Architect | 2 | arch-documenter, arch-speckit-agent |
173
173
  | Infra Engineer | 2 | infra-docker-expert, infra-aws-expert |
174
174
  | QA Team | 3 | qa-planner, qa-writer, qa-engineer |
175
175
  | Manager | 6 | mgr-creator, mgr-updater, mgr-supplier, mgr-gitnerd, mgr-sauron, mgr-claude-code-bible |
176
- | System | 2 | sys-memory-keeper, sys-naggy |
177
- | **Total** | **44** | |
176
+ | System | 3 | sys-memory-keeper, sys-naggy, tracker-checkpoint |
177
+ | Auxiliary | 2 | slack-cli-expert, wiki-curator |
178
+ | **Total** | **49** | |
178
179
 
179
180
  ## Agent Teams (MUST when enabled)
180
181
 
@@ -219,38 +220,23 @@ Task tool + routing skills remain the fallback for simple/cost-sensitive tasks.
219
220
 
220
221
  ## External Dependencies
221
222
 
222
- ### Required Plugins
223
-
224
- Install via `/plugin install <name>`:
225
-
226
- | Plugin | Source | Purpose |
227
- |--------|--------|---------|
228
- | superpowers | claude-plugins-official | TDD, debugging, collaboration patterns |
229
- | openai-docs | superpowers-marketplace | OpenAI and Codex development documentation |
230
- | elements-of-style | superpowers-marketplace | Writing clarity guidelines |
231
- | obsidian-skills | - | Obsidian markdown support |
232
- | context7 | claude-plugins-official | Library documentation lookup |
233
-
234
- ### Recommended MCP Servers
223
+ ### Recommended Codex MCP Servers
235
224
 
236
225
  | Server | Purpose |
237
226
  |--------|---------|
238
227
  | omx-memory | Session memory persistence (Chroma-based) |
228
+ | context7 | Library documentation lookup MCP server when a project needs it |
239
229
 
240
230
  ### Setup Commands
241
231
 
242
232
  ```bash
243
- # Add marketplace
244
- /plugin marketplace add obra/superpowers-marketplace
245
-
246
- # Install plugins
247
- /plugin install superpowers
248
- /plugin install openai-docs
249
- /plugin install elements-of-style
250
-
251
233
  # MCP setup (omx-memory)
252
234
  npm install -g omx-memory
253
235
  omx-memory setup
254
236
  ```
255
237
 
238
+ ### Claude Code Compatibility Note
239
+
240
+ Projects that run in the Claude Code plugin ecosystem may separately install plugins such as `superpowers`, `openai-docs`, `elements-of-style`, and `context7`. These plugins are not required for Codex initialization.
241
+
256
242
  <!-- omcodex:git-workflow -->
@@ -128,7 +128,7 @@ oh-my-customcodex로 구동됩니다.
128
128
  project/
129
129
  +-- AGENTS.md # 진입점
130
130
  +-- .codex/
131
- | +-- agents/ # 서브에이전트 정의 (44 파일)
131
+ | +-- agents/ # 서브에이전트 정의 (49 파일)
132
132
  | +-- rules/ # 전역 규칙 (R000-R020)
133
133
  | +-- hooks/ # 훅 스크립트 (보안, 검증, HUD)
134
134
  | +-- contexts/ # 컨텍스트 파일 (ecomode)
@@ -164,17 +164,18 @@ project/
164
164
  |------|------|----------|
165
165
  | SW Engineer/Language | 6 | lang-golang-expert, lang-python-expert, lang-rust-expert, lang-kotlin-expert, lang-typescript-expert, lang-java21-expert |
166
166
  | SW Engineer/Backend | 6 | be-fastapi-expert, be-springboot-expert, be-go-backend-expert, be-express-expert, be-nestjs-expert, be-django-expert |
167
- | SW Engineer/Frontend | 4 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent |
167
+ | SW Engineer/Frontend | 5 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent, fe-design-expert |
168
168
  | SW Engineer/Tooling | 3 | tool-npm-expert, tool-optimizer, tool-bun-expert |
169
169
  | DE Engineer | 6 | de-airflow-expert, de-dbt-expert, de-spark-expert, de-kafka-expert, de-snowflake-expert, de-pipeline-expert |
170
- | SW Engineer/Database | 3 | db-supabase-expert, db-postgres-expert, db-redis-expert |
170
+ | SW Engineer/Database | 4 | db-supabase-expert, db-postgres-expert, db-redis-expert, db-alembic-expert |
171
171
  | Security | 1 | sec-codeql-expert |
172
172
  | SW Architect | 2 | arch-documenter, arch-speckit-agent |
173
173
  | Infra Engineer | 2 | infra-docker-expert, infra-aws-expert |
174
174
  | QA Team | 3 | qa-planner, qa-writer, qa-engineer |
175
175
  | Manager | 6 | mgr-creator, mgr-updater, mgr-supplier, mgr-gitnerd, mgr-sauron, mgr-claude-code-bible |
176
- | System | 2 | sys-memory-keeper, sys-naggy |
177
- | **총계** | **44** | |
176
+ | System | 3 | sys-memory-keeper, sys-naggy, tracker-checkpoint |
177
+ | Auxiliary | 2 | slack-cli-expert, wiki-curator |
178
+ | **총계** | **49** | |
178
179
 
179
180
  ## Agent Teams (MUST when enabled)
180
181
 
@@ -219,38 +220,23 @@ Codex CLI의 Agent Teams 기능이 활성화되어 있으면 (`OMCODEX_AGENT_TEA
219
220
 
220
221
  ## 외부 의존성
221
222
 
222
- ### 필수 플러그인
223
-
224
- `/plugin install <이름>`으로 설치:
225
-
226
- | 플러그인 | 소스 | 용도 |
227
- |----------|------|------|
228
- | superpowers | claude-plugins-official | TDD, 디버깅, 협업 패턴 |
229
- | openai-docs | superpowers-marketplace | Codex CLI 개발 문서 |
230
- | elements-of-style | superpowers-marketplace | 글쓰기 명확성 가이드라인 |
231
- | obsidian-skills | - | 옵시디언 마크다운 지원 |
232
- | context7 | claude-plugins-official | 라이브러리 문서 조회 |
233
-
234
- ### 권장 MCP 서버
223
+ ### Codex 권장 MCP 서버
235
224
 
236
225
  | 서버 | 용도 |
237
226
  |------|------|
238
227
  | omx-memory | 세션 메모리 영속성 (Chroma 기반) |
228
+ | context7 | 라이브러리 문서 조회용 MCP 서버 (프로젝트 필요 시 설정) |
239
229
 
240
230
  ### 설치 명령어
241
231
 
242
232
  ```bash
243
- # 마켓플레이스 추가
244
- /plugin marketplace add obra/superpowers-marketplace
245
-
246
- # 플러그인 설치
247
- /plugin install superpowers
248
- /plugin install openai-docs
249
- /plugin install elements-of-style
250
-
251
233
  # MCP 설정 (omx-memory)
252
234
  npm install -g omx-memory
253
235
  omx-memory setup
254
236
  ```
255
237
 
238
+ ### Claude Code 호환 참고
239
+
240
+ Claude Code 플러그인 생태계를 쓰는 프로젝트에서는 `superpowers`, `openai-docs`, `elements-of-style`, `context7` 같은 플러그인을 별도로 설치할 수 있습니다. Codex 초기화의 필수 단계는 아닙니다.
241
+
256
242
  <!-- omcodex:git-workflow -->
@@ -114,7 +114,7 @@ oh-my-customcodex로 구동됩니다.
114
114
  project/
115
115
  +-- AGENTS.md # 진입점
116
116
  +-- .codex/
117
- | +-- agents/ # 서브에이전트 정의 (48 파일)
117
+ | +-- agents/ # 서브에이전트 정의 (49 파일)
118
118
  | +-- rules/ # 전역 규칙 (R000-R022)
119
119
  | +-- hooks/ # 훅 스크립트 (보안, 검증, HUD)
120
120
  | +-- contexts/ # 컨텍스트 파일 (ecomode)
@@ -166,7 +166,7 @@ oh-my-customcodex는 소프트웨어 컴파일과 동일한 구조를 따릅니
166
166
  | SW Engineer/Language | 6 | lang-golang-expert, lang-python-expert, lang-rust-expert, lang-kotlin-expert, lang-typescript-expert, lang-java21-expert |
167
167
  | SW Engineer/Backend | 6 | be-fastapi-expert, be-springboot-expert, be-go-backend-expert, be-express-expert, be-nestjs-expert, be-django-expert |
168
168
  | SW Engineer/Frontend | 5 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent, fe-design-expert |
169
- | SW Engineer/Tooling | 4 | tool-npm-expert, tool-optimizer, tool-bun-expert, slack-cli-expert |
169
+ | SW Engineer/Tooling | 3 | tool-npm-expert, tool-optimizer, tool-bun-expert |
170
170
  | DE Engineer | 6 | de-airflow-expert, de-dbt-expert, de-spark-expert, de-kafka-expert, de-snowflake-expert, de-pipeline-expert |
171
171
  | SW Engineer/Database | 4 | db-supabase-expert, db-postgres-expert, db-redis-expert, db-alembic-expert |
172
172
  | Security | 1 | sec-codeql-expert |
@@ -174,8 +174,9 @@ oh-my-customcodex는 소프트웨어 컴파일과 동일한 구조를 따릅니
174
174
  | Infra Engineer | 2 | infra-docker-expert, infra-aws-expert |
175
175
  | QA Team | 3 | qa-planner, qa-writer, qa-engineer |
176
176
  | Manager | 6 | mgr-creator, mgr-updater, mgr-supplier, mgr-gitnerd, mgr-sauron, mgr-claude-code-bible |
177
- | System | 3 | sys-memory-keeper, sys-naggy, wiki-curator |
178
- | **총계** | **48** | |
177
+ | System | 3 | sys-memory-keeper, sys-naggy, tracker-checkpoint |
178
+ | Auxiliary | 2 | slack-cli-expert, wiki-curator |
179
+ | **총계** | **49** | |
179
180
 
180
181
  ## Agent Teams (MUST when enabled)
181
182
 
@@ -131,7 +131,7 @@ NO EXCEPTIONS. NO EXCUSES.
131
131
  project/
132
132
  +-- AGENTS.md # Entry point
133
133
  +-- .codex/
134
- | +-- agents/ # Subagent definitions (48 files)
134
+ | +-- agents/ # Subagent definitions (49 files)
135
135
  | +-- skills/ # Skills (109 directories)
136
136
  | +-- rules/ # Global rules (22 files)
137
137
  | +-- hooks/ # Hook scripts (security, validation, HUD)
@@ -167,7 +167,7 @@ This is the core oh-my-customcodex philosophy: **"No expert? CREATE one, connect
167
167
  | SW Engineer/Language | 6 | lang-golang-expert, lang-python-expert, lang-rust-expert, lang-kotlin-expert, lang-typescript-expert, lang-java21-expert |
168
168
  | SW Engineer/Backend | 6 | be-fastapi-expert, be-springboot-expert, be-go-backend-expert, be-express-expert, be-nestjs-expert, be-django-expert |
169
169
  | SW Engineer/Frontend | 5 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent, fe-design-expert |
170
- | SW Engineer/Tooling | 4 | tool-npm-expert, tool-optimizer, tool-bun-expert, slack-cli-expert |
170
+ | SW Engineer/Tooling | 3 | tool-npm-expert, tool-optimizer, tool-bun-expert |
171
171
  | DE Engineer | 6 | de-airflow-expert, de-dbt-expert, de-spark-expert, de-kafka-expert, de-snowflake-expert, de-pipeline-expert |
172
172
  | SW Engineer/Database | 4 | db-supabase-expert, db-postgres-expert, db-redis-expert, db-alembic-expert |
173
173
  | Security | 1 | sec-codeql-expert |
@@ -175,8 +175,9 @@ This is the core oh-my-customcodex philosophy: **"No expert? CREATE one, connect
175
175
  | Infra Engineer | 2 | infra-docker-expert, infra-aws-expert |
176
176
  | QA Team | 3 | qa-planner, qa-writer, qa-engineer |
177
177
  | Manager | 6 | mgr-creator, mgr-updater, mgr-supplier, mgr-gitnerd, mgr-sauron, mgr-claude-code-bible |
178
- | System | 3 | sys-memory-keeper, sys-naggy, wiki-curator |
179
- | **Total** | **48** | |
178
+ | System | 3 | sys-memory-keeper, sys-naggy, tracker-checkpoint |
179
+ | Auxiliary | 2 | slack-cli-expert, wiki-curator |
180
+ | **Total** | **49** | |
180
181
 
181
182
  ## Agent Teams (MUST when enabled)
182
183
 
@@ -221,9 +222,9 @@ Task tool + routing skills remain the fallback for simple/cost-sensitive tasks.
221
222
 
222
223
  ## External Dependencies
223
224
 
224
- ### Required Plugins
225
+ ### Claude Code Plugins
225
226
 
226
- Install via `/plugin install <name>`:
227
+ Install in Claude Code via `/plugin install <name>`:
227
228
 
228
229
  | Plugin | Source | Purpose |
229
230
  |--------|--------|---------|
@@ -239,7 +240,7 @@ Install via `/plugin install <name>`:
239
240
  |--------|---------|
240
241
  | omx-memory | Session memory persistence |
241
242
 
242
- ### Setup Commands
243
+ ### Claude Code Setup Commands
243
244
 
244
245
  ```bash
245
246
  # Add marketplace
@@ -131,7 +131,7 @@ oh-my-customcodex로 구동됩니다.
131
131
  project/
132
132
  +-- AGENTS.md # 진입점
133
133
  +-- .codex/
134
- | +-- agents/ # 서브에이전트 정의 (48 파일)
134
+ | +-- agents/ # 서브에이전트 정의 (49 파일)
135
135
  | +-- skills/ # 스킬 (109 디렉토리)
136
136
  | +-- rules/ # 전역 규칙 (22 파일)
137
137
  | +-- hooks/ # 훅 스크립트 (보안, 검증, HUD)
@@ -167,7 +167,7 @@ project/
167
167
  | SW Engineer/Language | 6 | lang-golang-expert, lang-python-expert, lang-rust-expert, lang-kotlin-expert, lang-typescript-expert, lang-java21-expert |
168
168
  | SW Engineer/Backend | 6 | be-fastapi-expert, be-springboot-expert, be-go-backend-expert, be-express-expert, be-nestjs-expert, be-django-expert |
169
169
  | SW Engineer/Frontend | 5 | fe-vercel-agent, fe-vuejs-agent, fe-svelte-agent, fe-flutter-agent, fe-design-expert |
170
- | SW Engineer/Tooling | 4 | tool-npm-expert, tool-optimizer, tool-bun-expert, slack-cli-expert |
170
+ | SW Engineer/Tooling | 3 | tool-npm-expert, tool-optimizer, tool-bun-expert |
171
171
  | DE Engineer | 6 | de-airflow-expert, de-dbt-expert, de-spark-expert, de-kafka-expert, de-snowflake-expert, de-pipeline-expert |
172
172
  | SW Engineer/Database | 4 | db-supabase-expert, db-postgres-expert, db-redis-expert, db-alembic-expert |
173
173
  | Security | 1 | sec-codeql-expert |
@@ -175,8 +175,9 @@ project/
175
175
  | Infra Engineer | 2 | infra-docker-expert, infra-aws-expert |
176
176
  | QA Team | 3 | qa-planner, qa-writer, qa-engineer |
177
177
  | Manager | 6 | mgr-creator, mgr-updater, mgr-supplier, mgr-gitnerd, mgr-sauron, mgr-claude-code-bible |
178
- | System | 3 | sys-memory-keeper, sys-naggy, wiki-curator |
179
- | **총계** | **48** | |
178
+ | System | 3 | sys-memory-keeper, sys-naggy, tracker-checkpoint |
179
+ | Auxiliary | 2 | slack-cli-expert, wiki-curator |
180
+ | **총계** | **49** | |
180
181
 
181
182
  ## Agent Teams (MUST when enabled)
182
183
 
@@ -221,9 +222,9 @@ Codex CLI의 Agent Teams 기능이 활성화되어 있으면 (`OMCODEX_AGENT_TEA
221
222
 
222
223
  ## 외부 의존성
223
224
 
224
- ### 필수 플러그인
225
+ ### Claude Code 플러그인
225
226
 
226
- `/plugin install <이름>`으로 설치:
227
+ Claude Code 환경에서 `/plugin install <이름>`으로 설치:
227
228
 
228
229
  | 플러그인 | 소스 | 용도 |
229
230
  |----------|------|------|
@@ -239,7 +240,7 @@ Codex CLI의 Agent Teams 기능이 활성화되어 있으면 (`OMCODEX_AGENT_TEA
239
240
  |------|------|
240
241
  | omx-memory | 세션 메모리 영속성 |
241
242
 
242
- ### 설치 명령어
243
+ ### Claude Code 설치 명령어
243
244
 
244
245
  ```bash
245
246
  # 마켓플레이스 추가
@@ -0,0 +1,48 @@
1
+ # Agent Eval Guide
2
+
3
+ ## Evaluation Order
4
+
5
+ Agent evaluation uses two phases:
6
+
7
+ 1. **Correctness gate**: verify the task outcome against explicit acceptance criteria.
8
+ 2. **Efficiency review**: compare only correctness-passing runs against an ideal trajectory.
9
+
10
+ Do not optimize step count or latency before correctness is proven.
11
+
12
+ ## Four Metrics
13
+
14
+ | Metric | Definition | Typical Use |
15
+ |--------|------------|-------------|
16
+ | `correctness` | Passed criteria divided by total criteria | Release or completion gate |
17
+ | `step_ratio` | Observed steps divided by ideal steps | Detect avoidable loops |
18
+ | `tool_call_ratio` | Observed tool calls divided by ideal tool calls | Detect noisy retrieval or tool misuse |
19
+ | `latency_ratio` | Observed duration divided by ideal duration | Detect runtime regressions |
20
+
21
+ ## Ideal Trajectory
22
+
23
+ ```yaml
24
+ task: "create a small routing skill"
25
+ capability: "tool_use"
26
+ ideal:
27
+ steps: 5
28
+ tool_calls: 8
29
+ latency_ms: 180000
30
+ acceptance_criteria:
31
+ - "Skill frontmatter is valid"
32
+ - "Routing docs reference the skill"
33
+ - "Tests or static checks pass"
34
+ ```
35
+
36
+ ## Interpreting Ratios
37
+
38
+ - `1.00`: observed matched the ideal.
39
+ - `< 1.00`: faster or shorter than ideal; verify no evidence was skipped.
40
+ - `1.00-1.25`: usually acceptable.
41
+ - `> 1.25`: advisory improvement candidate.
42
+ - correctness below `1.00`: fail regardless of efficiency.
43
+
44
+ ## Integration
45
+
46
+ - Use `agent-eval-framework` for task-level scoring.
47
+ - Use `harness-eval` when running repeatable benchmark suites.
48
+ - Use `omcodex:improve-report` to turn repeated ratio regressions into improvement suggestions.
@@ -0,0 +1,6 @@
1
+ name: agent-eval
2
+ description: Quantitative agent evaluation with correctness-first 4-metric evidence
3
+ source:
4
+ type: internal
5
+ files:
6
+ - README.md
@@ -75,6 +75,18 @@ Capture at least one of:
75
75
 
76
76
  When summarizing evidence for the model, preserve reference tokens and URLs so follow-up steps can still target the right page elements.
77
77
 
78
+ ## Build + Vision + Verify Loop
79
+
80
+ For browser-visible changes, treat a successful build as the start of verification, not the end:
81
+
82
+ 1. Build or start the local app.
83
+ 2. Open the page in the available browser surface.
84
+ 3. Capture screenshot, console, and network evidence.
85
+ 4. Feed concrete failures back to the implementation agent.
86
+ 5. Repeat until build, render, and runtime evidence all pass.
87
+
88
+ This is the Codex Browser Use pattern in portable form. Prefer the in-app Browser Use plugin when available; otherwise use Playwright or the existing browser MCP surface.
89
+
78
90
  ## Design And Strategy Workflows
79
91
 
80
92
  ### Product strategy sessions
@@ -40,6 +40,18 @@ guides:
40
40
  source:
41
41
  type: internal
42
42
 
43
+ - name: agent-eval
44
+ description: Quantitative agent evaluation with correctness-first 4-metric evidence
45
+ path: ./agent-eval/
46
+ source:
47
+ type: internal
48
+
49
+ - name: multi-agent-debate-patterns
50
+ description: Anti-groupthink debate patterns for Agora and roundtable-debate workflows
51
+ path: ./multi-agent-debate-patterns/
52
+ source:
53
+ type: internal
54
+
43
55
  # Languages
44
56
  - name: golang
45
57
  description: Go language reference from Effective Go
@@ -0,0 +1,26 @@
1
+ # Multi-Agent Debate Patterns
2
+
3
+ ## Pattern Choice
4
+
5
+ | Pattern | Goal | Use When |
6
+ |---------|------|----------|
7
+ | `agora` | Reach adversarial consensus | Release gates, design approval, high-risk specs |
8
+ | `roundtable-debate` | Preserve dissent | Strategy choices, tradeoffs, ambiguous product or architecture decisions |
9
+
10
+ ## Failure Modes
11
+
12
+ - **Anchoring**: later reviewers inherit the first opinion.
13
+ - **Groupthink**: reviewers converge because convergence looks productive.
14
+ - **Degeneration of thought**: debate continues without adding new evidence.
15
+
16
+ ## Controls
17
+
18
+ 1. Start with independent parallel analysis.
19
+ 2. Assign a devil's advocate.
20
+ 3. Protect minority findings unless explicitly rejected with evidence.
21
+ 4. Cap debate at two rounds.
22
+ 5. Switch from debate to evidence gathering when facts are missing.
23
+
24
+ ## Decision Record
25
+
26
+ Keep the final recommendation, rejected alternatives, and protected dissent together. Future agents should be able to see not only what was chosen, but also which minority risks remain live.
@@ -0,0 +1,6 @@
1
+ name: multi-agent-debate-patterns
2
+ description: Anti-groupthink debate patterns for Agora and roundtable-debate workflows
3
+ source:
4
+ type: internal
5
+ files:
6
+ - README.md
@@ -1,6 +1,6 @@
1
1
  {
2
- "version": "0.3.10",
3
- "lastUpdated": "2026-04-24T09:10:47.000Z",
2
+ "version": "0.4.1",
3
+ "lastUpdated": "2026-04-27T01:00:00.000Z",
4
4
  "components": [
5
5
  {
6
6
  "name": "rules",
@@ -12,19 +12,19 @@
12
12
  "name": "agents",
13
13
  "path": ".codex/agents",
14
14
  "description": "AI agent definitions (flat .md files with prefixes)",
15
- "files": 48
15
+ "files": 49
16
16
  },
17
17
  {
18
18
  "name": "skills",
19
19
  "path": ".agents/skills",
20
20
  "description": "Reusable skill modules (project-scoped repo skills)",
21
- "files": 112
21
+ "files": 114
22
22
  },
23
23
  {
24
24
  "name": "guides",
25
25
  "path": "guides",
26
26
  "description": "Reference documentation",
27
- "files": 40
27
+ "files": 42
28
28
  },
29
29
  {
30
30
  "name": "hooks",
@@ -29,7 +29,13 @@ steps:
29
29
  foreach: release-group
30
30
 
31
31
  - name: implement
32
- prompt: "Execute implementation plan with appropriate agents"
32
+ prompt: |
33
+ Execute implementation plan with appropriate agents.
34
+
35
+ Codex-native sensitive-path policy:
36
+ - Codex-managed `.codex/` edits use the normal edit/patch flow.
37
+ - Do not adopt upstream Claude-only `/tmp` bypass guidance as the default path.
38
+ - If a port requires `.claude` template parity changes, make the change explicit and verify sensitive-path guard tests.
33
39
  description: Execute implementation plan with appropriate agents
34
40
  foreach: planned-issue
35
41