adi_dev_workflow 1.1.1 → 1.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/index.js +8 -8
- package/frameworks/agents/qa-staff-engineer.md +311 -311
- package/frameworks/agents/qa-validation-expert.md +458 -458
- package/frameworks/agents/tech-review-conformance.md +200 -200
- package/frameworks/commands/ministack/README.md +2 -0
- package/frameworks/commands/ministack/code-review.md +2 -0
- package/frameworks/commands/ministack/generate-intent.md +2 -0
- package/frameworks/commands/ministack/generate-scope.md +2 -0
- package/frameworks/commands/ministack/generate-tasks.md +2 -0
- package/frameworks/commands/ministack/generate-tech-direction.md +2 -0
- package/frameworks/commands/ministack/run-ministack-tasks.md +3 -0
- package/frameworks/commands/ministack/run-ministack-withlinear.md +2 -0
- package/frameworks/commands/ministack/status.md +2 -0
- package/frameworks/commands/sdd/code-review.md +2 -0
- package/frameworks/commands/sdd/generate-prd.md +2 -0
- package/frameworks/commands/sdd/generate-task-plan.md +2 -0
- package/frameworks/commands/sdd/generate-tech-direction.md +2 -0
- package/frameworks/commands/sdd/generate-tech-spec.md +2 -0
- package/frameworks/commands/sdd/generate-tests.md +2 -0
- package/frameworks/commands/sdd/run_tasks.md +3 -0
- package/frameworks/commands/sdd/run_tasks_withlinear.md +2 -0
- package/frameworks/commands/sdd/status.md +2 -0
- package/frameworks/commands/sdd/validate-sdd.md +2 -0
- package/frameworks/commands/sync-tasks-to-linear.md +2 -0
- package/frameworks/commands/taskcard/generate-taskcard.md +2 -0
- package/frameworks/commands/taskcard/run-taskcard.md +2 -0
- package/frameworks/config/ai-framework-config.yaml +112 -0
- package/frameworks/skills/ministack-tasks-expert/SKILL.md +204 -204
- package/frameworks/skills/ministack-tasks-expert/templates/task_plan_template.md +78 -78
- package/frameworks/skills/ministack-tasks-expert/templates/task_template.md +103 -103
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/benchmark.json +99 -99
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/benchmark.md +64 -64
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/eval_metadata.json +12 -12
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/with_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/with_skill/outputs/response.md +134 -134
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/with_skill/outputs/transcript.md +68 -68
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/with_skill/timing.json +5 -5
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/without_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/without_skill/outputs/response.md +525 -525
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/without_skill/outputs/transcript.md +30 -30
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-1-happy-path/without_skill/timing.json +5 -5
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/eval_metadata.json +12 -12
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/with_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/with_skill/outputs/response.md +1126 -1126
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/with_skill/outputs/transcript.md +131 -131
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/with_skill/timing.json +5 -5
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/without_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/without_skill/outputs/response.md +452 -452
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/without_skill/outputs/transcript.md +78 -78
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-2-spec-simples/without_skill/timing.json +5 -5
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/eval_metadata.json +12 -12
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/with_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/with_skill/outputs/response.md +101 -101
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/with_skill/outputs/transcript.md +133 -133
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/with_skill/timing.json +5 -5
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/without_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/without_skill/outputs/response.md +248 -248
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/without_skill/outputs/transcript.md +49 -49
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/eval-3-sem-user-stories/without_skill/timing.json +5 -5
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-1/review.html +1325 -1325
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/benchmark.json +94 -94
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/benchmark.md +67 -67
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/eval_metadata.json +12 -12
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/with_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/with_skill/outputs/response.md +117 -117
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/with_skill/outputs/transcript.md +91 -91
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/with_skill/timing.json +1 -1
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/without_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/without_skill/outputs/response.md +694 -694
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/without_skill/outputs/transcript.md +45 -45
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-1-happy-path/without_skill/timing.json +1 -1
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/eval_metadata.json +12 -12
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/with_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/with_skill/outputs/response.md +1087 -1087
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/with_skill/outputs/transcript.md +124 -124
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/with_skill/timing.json +1 -1
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/without_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/without_skill/outputs/response.md +458 -458
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/without_skill/outputs/transcript.md +84 -84
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-2-spec-simples/without_skill/timing.json +1 -1
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/eval_metadata.json +12 -12
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/with_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/with_skill/outputs/response.md +70 -70
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/with_skill/outputs/transcript.md +148 -148
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/with_skill/timing.json +1 -1
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/without_skill/grading.json +32 -32
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/without_skill/outputs/response.md +249 -249
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/without_skill/outputs/transcript.md +80 -80
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/eval-3-sem-user-stories/without_skill/timing.json +1 -1
- package/frameworks/skills/sdd-task-plan-expert-workspace/iteration-2/review.html +1325 -1325
- package/frameworks/skills/sdd-tech-spec-expert/SKILL.md +317 -317
- package/frameworks/skills/sdd-tech-spec-expert/evals/evals.json +199 -199
- package/frameworks/skills/sdd-tech-spec-expert/templates/spec_tech_template.md +290 -290
- package/frameworks/skills/sdd-tech-spec-expert/templates/tech_direction-template.md +23 -23
- package/package.json +28 -28
- package/src/cli.js +121 -121
- package/src/installer.js +155 -136
- package/src/transformer.js +86 -86
|
@@ -1,91 +1,91 @@
|
|
|
1
|
-
# Transcript -- Tool Calls
|
|
2
|
-
|
|
3
|
-
## 1. Read skill and templates (parallel)
|
|
4
|
-
|
|
5
|
-
| Tool | Parameters |
|
|
6
|
-
|------|-----------|
|
|
7
|
-
| Read | `.claude/skills/sdd-task-plan-expert/SKILL.md` |
|
|
8
|
-
| Read | `.claude/skills/sdd-task-plan-expert/templates/task_plan_template.md` |
|
|
9
|
-
| Read | `.claude/skills/sdd-task-plan-expert/templates/task_template.md` |
|
|
10
|
-
| Read | `docs/feature-user/v1/spec_tech.md` |
|
|
11
|
-
|
|
12
|
-
> SKILL.md was read in full. Templates were read in full. SPEC_TECH triggered persisted-output due to size (49.8KB).
|
|
13
|
-
|
|
14
|
-
## 2. Read full SPEC_TECH (persisted output)
|
|
15
|
-
|
|
16
|
-
| Tool | Parameters |
|
|
17
|
-
|------|-----------|
|
|
18
|
-
| Read | Persisted output file (full SPEC_TECH content) |
|
|
19
|
-
|
|
20
|
-
> Still truncated. Proceeded with offset-based reads.
|
|
21
|
-
|
|
22
|
-
## 3. Read SPEC_TECH in chunks
|
|
23
|
-
|
|
24
|
-
| Tool | Parameters |
|
|
25
|
-
|------|-----------|
|
|
26
|
-
| Read | `docs/feature-user/v1/spec_tech.md`, offset=1, limit=200 |
|
|
27
|
-
| Read | `docs/feature-user/v1/spec_tech.md`, offset=200, limit=300 |
|
|
28
|
-
| Read | `docs/feature-user/v1/spec_tech.md`, offset=498, limit=200 |
|
|
29
|
-
| Read | `docs/feature-user/v1/spec_tech.md`, offset=697, limit=200 |
|
|
30
|
-
|
|
31
|
-
> Sections 1-16 of the SPEC_TECH were fully read.
|
|
32
|
-
|
|
33
|
-
## 4. Passo 1 -- Read ALL project rules
|
|
34
|
-
|
|
35
|
-
Rules already loaded from system-reminder context (CLAUDE.md and all .claude/rules/* files were provided as context). Confirmed reading:
|
|
36
|
-
- `CLAUDE.md`
|
|
37
|
-
- `.claude/rules/code-conventions.md`
|
|
38
|
-
- `.claude/rules/database.md`
|
|
39
|
-
- `.claude/rules/fx-di.md`
|
|
40
|
-
- `.claude/rules/grpc.md`
|
|
41
|
-
- `.claude/rules/protobuf.md`
|
|
42
|
-
- `.claude/rules/repository.md`
|
|
43
|
-
- `.claude/rules/service.md`
|
|
44
|
-
- `.claude/rules/sqlc.md`
|
|
45
|
-
|
|
46
|
-
## 5. Passo 2 -- Explore codebase (parallel)
|
|
47
|
-
|
|
48
|
-
| Tool | Parameters |
|
|
49
|
-
|------|-----------|
|
|
50
|
-
| Glob | pattern=`**/*.go`, path=project root |
|
|
51
|
-
| Glob | pattern=`internal/db/migrations/*`, path=project root |
|
|
52
|
-
| Glob | pattern=`internal/db/queries/*`, path=project root |
|
|
53
|
-
|
|
54
|
-
> Found 24 Go files. Found 2 migration files. No query files in `internal/db/queries/` (queries are in `internal/db/sqlc/queries/`).
|
|
55
|
-
|
|
56
|
-
## 6. Read existing implementation files (parallel)
|
|
57
|
-
|
|
58
|
-
| Tool | Parameters |
|
|
59
|
-
|------|-----------|
|
|
60
|
-
| Read | `internal/repository/user_repository.go` |
|
|
61
|
-
| Read | `internal/service/user_service.go` |
|
|
62
|
-
| Read | `internal/handler/grpc/user_handler.go` |
|
|
63
|
-
| Read | `internal/infra/grpc/interceptors/auth.go` |
|
|
64
|
-
| Read | `internal/infra/config/config.go` |
|
|
65
|
-
| Read | `internal/pkg/identity/identity.go` |
|
|
66
|
-
|
|
67
|
-
> All 6 files read successfully. Confirmed that the entire feature is already implemented.
|
|
68
|
-
|
|
69
|
-
## 7. Create output directory
|
|
70
|
-
|
|
71
|
-
| Tool | Parameters |
|
|
72
|
-
|------|-----------|
|
|
73
|
-
| Bash | `mkdir -p ...outputs/` |
|
|
74
|
-
|
|
75
|
-
## 8. Write output files
|
|
76
|
-
|
|
77
|
-
| Tool | Parameters |
|
|
78
|
-
|------|-----------|
|
|
79
|
-
| Write | `response.md` -- main response with feature name confirmation and macro-phases |
|
|
80
|
-
| Write | `transcript.md` -- this file |
|
|
81
|
-
|
|
82
|
-
---
|
|
83
|
-
|
|
84
|
-
## Summary of Findings
|
|
85
|
-
|
|
86
|
-
- **Feature name extracted**: "Modulo de Usuario -- Vakinha Burger" from SPEC_TECH section 1
|
|
87
|
-
- **Feature directory**: `feature-user` (already exists at `docs/feature-user/v1/`)
|
|
88
|
-
- **Critical finding**: The entire feature is already implemented in the codebase. All files referenced in sections 3.1 and 15 of the SPEC_TECH exist with complete implementations.
|
|
89
|
-
- **Macro-phases proposed**: 5 phases (Fundacao, Dados, Negocio, Apresentacao, Testes) with 11 tasks
|
|
90
|
-
- **User Stories covered**: US-01 through US-04, all mapped to phases
|
|
91
|
-
- **First interaction completed**: Feature name confirmed + macro-phases proposed + awaiting user confirmation
|
|
1
|
+
# Transcript -- Tool Calls
|
|
2
|
+
|
|
3
|
+
## 1. Read skill and templates (parallel)
|
|
4
|
+
|
|
5
|
+
| Tool | Parameters |
|
|
6
|
+
|------|-----------|
|
|
7
|
+
| Read | `.claude/skills/sdd-task-plan-expert/SKILL.md` |
|
|
8
|
+
| Read | `.claude/skills/sdd-task-plan-expert/templates/task_plan_template.md` |
|
|
9
|
+
| Read | `.claude/skills/sdd-task-plan-expert/templates/task_template.md` |
|
|
10
|
+
| Read | `docs/feature-user/v1/spec_tech.md` |
|
|
11
|
+
|
|
12
|
+
> SKILL.md was read in full. Templates were read in full. SPEC_TECH triggered persisted-output due to size (49.8KB).
|
|
13
|
+
|
|
14
|
+
## 2. Read full SPEC_TECH (persisted output)
|
|
15
|
+
|
|
16
|
+
| Tool | Parameters |
|
|
17
|
+
|------|-----------|
|
|
18
|
+
| Read | Persisted output file (full SPEC_TECH content) |
|
|
19
|
+
|
|
20
|
+
> Still truncated. Proceeded with offset-based reads.
|
|
21
|
+
|
|
22
|
+
## 3. Read SPEC_TECH in chunks
|
|
23
|
+
|
|
24
|
+
| Tool | Parameters |
|
|
25
|
+
|------|-----------|
|
|
26
|
+
| Read | `docs/feature-user/v1/spec_tech.md`, offset=1, limit=200 |
|
|
27
|
+
| Read | `docs/feature-user/v1/spec_tech.md`, offset=200, limit=300 |
|
|
28
|
+
| Read | `docs/feature-user/v1/spec_tech.md`, offset=498, limit=200 |
|
|
29
|
+
| Read | `docs/feature-user/v1/spec_tech.md`, offset=697, limit=200 |
|
|
30
|
+
|
|
31
|
+
> Sections 1-16 of the SPEC_TECH were fully read.
|
|
32
|
+
|
|
33
|
+
## 4. Passo 1 -- Read ALL project rules
|
|
34
|
+
|
|
35
|
+
Rules already loaded from system-reminder context (CLAUDE.md and all .claude/rules/* files were provided as context). Confirmed reading:
|
|
36
|
+
- `CLAUDE.md`
|
|
37
|
+
- `.claude/rules/code-conventions.md`
|
|
38
|
+
- `.claude/rules/database.md`
|
|
39
|
+
- `.claude/rules/fx-di.md`
|
|
40
|
+
- `.claude/rules/grpc.md`
|
|
41
|
+
- `.claude/rules/protobuf.md`
|
|
42
|
+
- `.claude/rules/repository.md`
|
|
43
|
+
- `.claude/rules/service.md`
|
|
44
|
+
- `.claude/rules/sqlc.md`
|
|
45
|
+
|
|
46
|
+
## 5. Passo 2 -- Explore codebase (parallel)
|
|
47
|
+
|
|
48
|
+
| Tool | Parameters |
|
|
49
|
+
|------|-----------|
|
|
50
|
+
| Glob | pattern=`**/*.go`, path=project root |
|
|
51
|
+
| Glob | pattern=`internal/db/migrations/*`, path=project root |
|
|
52
|
+
| Glob | pattern=`internal/db/queries/*`, path=project root |
|
|
53
|
+
|
|
54
|
+
> Found 24 Go files. Found 2 migration files. No query files in `internal/db/queries/` (queries are in `internal/db/sqlc/queries/`).
|
|
55
|
+
|
|
56
|
+
## 6. Read existing implementation files (parallel)
|
|
57
|
+
|
|
58
|
+
| Tool | Parameters |
|
|
59
|
+
|------|-----------|
|
|
60
|
+
| Read | `internal/repository/user_repository.go` |
|
|
61
|
+
| Read | `internal/service/user_service.go` |
|
|
62
|
+
| Read | `internal/handler/grpc/user_handler.go` |
|
|
63
|
+
| Read | `internal/infra/grpc/interceptors/auth.go` |
|
|
64
|
+
| Read | `internal/infra/config/config.go` |
|
|
65
|
+
| Read | `internal/pkg/identity/identity.go` |
|
|
66
|
+
|
|
67
|
+
> All 6 files read successfully. Confirmed that the entire feature is already implemented.
|
|
68
|
+
|
|
69
|
+
## 7. Create output directory
|
|
70
|
+
|
|
71
|
+
| Tool | Parameters |
|
|
72
|
+
|------|-----------|
|
|
73
|
+
| Bash | `mkdir -p ...outputs/` |
|
|
74
|
+
|
|
75
|
+
## 8. Write output files
|
|
76
|
+
|
|
77
|
+
| Tool | Parameters |
|
|
78
|
+
|------|-----------|
|
|
79
|
+
| Write | `response.md` -- main response with feature name confirmation and macro-phases |
|
|
80
|
+
| Write | `transcript.md` -- this file |
|
|
81
|
+
|
|
82
|
+
---
|
|
83
|
+
|
|
84
|
+
## Summary of Findings
|
|
85
|
+
|
|
86
|
+
- **Feature name extracted**: "Modulo de Usuario -- Vakinha Burger" from SPEC_TECH section 1
|
|
87
|
+
- **Feature directory**: `feature-user` (already exists at `docs/feature-user/v1/`)
|
|
88
|
+
- **Critical finding**: The entire feature is already implemented in the codebase. All files referenced in sections 3.1 and 15 of the SPEC_TECH exist with complete implementations.
|
|
89
|
+
- **Macro-phases proposed**: 5 phases (Fundacao, Dados, Negocio, Apresentacao, Testes) with 11 tasks
|
|
90
|
+
- **User Stories covered**: US-01 through US-04, all mapped to phases
|
|
91
|
+
- **First interaction completed**: Feature name confirmed + macro-phases proposed + awaiting user confirmation
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"total_tokens": 64193, "duration_ms": 125607, "total_duration_seconds": 125.6}
|
|
1
|
+
{"total_tokens": 64193, "duration_ms": 125607, "total_duration_seconds": 125.6}
|
|
@@ -1,32 +1,32 @@
|
|
|
1
|
-
{
|
|
2
|
-
"eval_id": 1,
|
|
3
|
-
"eval_name": "happy-path-spec-tech-usuario",
|
|
4
|
-
"configuration": "without_skill",
|
|
5
|
-
"expectations": [
|
|
6
|
-
{
|
|
7
|
-
"text": "Extrai o nome da feature do SPEC_TECH e confirma com o usuario antes de prosseguir",
|
|
8
|
-
"passed": false,
|
|
9
|
-
"evidence": "Gerou o task plan completo com 12 tasks sem confirmar o nome da feature com o usuario. Identificou 'Modulo de Usuario v1' mas nao perguntou se estava correto."
|
|
10
|
-
},
|
|
11
|
-
{
|
|
12
|
-
"text": "Faz apenas UMA pergunta por vez (nao bombardeia com multiplas perguntas no mesmo turno)",
|
|
13
|
-
"passed": false,
|
|
14
|
-
"evidence": "Nenhuma pergunta foi feita ao usuario. O output completo (695 linhas) foi gerado de uma vez sem interacao."
|
|
15
|
-
},
|
|
16
|
-
{
|
|
17
|
-
"text": "Propoe macro-fases de alto nivel e aguarda validacao antes de criar tasks",
|
|
18
|
-
"passed": false,
|
|
19
|
-
"evidence": "Pulou diretamente para tasks detalhadas (TASK 01-12) sem propor macro-fases primeiro e aguardar validacao."
|
|
20
|
-
},
|
|
21
|
-
{
|
|
22
|
-
"text": "Le as rules do projeto (.claude/rules/ e CLAUDE.md) ANTES de gerar tasks",
|
|
23
|
-
"passed": false,
|
|
24
|
-
"evidence": "Transcript mostra apenas leitura do SPEC_TECH e arquivos de implementacao. Nenhuma leitura de .claude/rules/ ou CLAUDE.md foi registrada."
|
|
25
|
-
},
|
|
26
|
-
{
|
|
27
|
-
"text": "NAO inicia execucao automatica de tasks — apenas apresenta o plano e aguarda",
|
|
28
|
-
"passed": true,
|
|
29
|
-
"evidence": "Apresentou apenas o plano sem executar nenhuma task."
|
|
30
|
-
}
|
|
31
|
-
]
|
|
32
|
-
}
|
|
1
|
+
{
|
|
2
|
+
"eval_id": 1,
|
|
3
|
+
"eval_name": "happy-path-spec-tech-usuario",
|
|
4
|
+
"configuration": "without_skill",
|
|
5
|
+
"expectations": [
|
|
6
|
+
{
|
|
7
|
+
"text": "Extrai o nome da feature do SPEC_TECH e confirma com o usuario antes de prosseguir",
|
|
8
|
+
"passed": false,
|
|
9
|
+
"evidence": "Gerou o task plan completo com 12 tasks sem confirmar o nome da feature com o usuario. Identificou 'Modulo de Usuario v1' mas nao perguntou se estava correto."
|
|
10
|
+
},
|
|
11
|
+
{
|
|
12
|
+
"text": "Faz apenas UMA pergunta por vez (nao bombardeia com multiplas perguntas no mesmo turno)",
|
|
13
|
+
"passed": false,
|
|
14
|
+
"evidence": "Nenhuma pergunta foi feita ao usuario. O output completo (695 linhas) foi gerado de uma vez sem interacao."
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
"text": "Propoe macro-fases de alto nivel e aguarda validacao antes de criar tasks",
|
|
18
|
+
"passed": false,
|
|
19
|
+
"evidence": "Pulou diretamente para tasks detalhadas (TASK 01-12) sem propor macro-fases primeiro e aguardar validacao."
|
|
20
|
+
},
|
|
21
|
+
{
|
|
22
|
+
"text": "Le as rules do projeto (.claude/rules/ e CLAUDE.md) ANTES de gerar tasks",
|
|
23
|
+
"passed": false,
|
|
24
|
+
"evidence": "Transcript mostra apenas leitura do SPEC_TECH e arquivos de implementacao. Nenhuma leitura de .claude/rules/ ou CLAUDE.md foi registrada."
|
|
25
|
+
},
|
|
26
|
+
{
|
|
27
|
+
"text": "NAO inicia execucao automatica de tasks — apenas apresenta o plano e aguarda",
|
|
28
|
+
"passed": true,
|
|
29
|
+
"evidence": "Apresentou apenas o plano sem executar nenhuma task."
|
|
30
|
+
}
|
|
31
|
+
]
|
|
32
|
+
}
|