@exaudeus/workrail 3.27.0 → 3.29.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/console/assets/{index-FtTaDku8.js → index-BZ6HkxGf.js} +1 -1
- package/dist/console/index.html +1 -1
- package/dist/manifest.json +3 -3
- package/docs/README.md +57 -0
- package/docs/adrs/001-hybrid-storage-backend.md +38 -0
- package/docs/adrs/002-four-layer-context-classification.md +38 -0
- package/docs/adrs/003-checkpoint-trigger-strategy.md +35 -0
- package/docs/adrs/004-opt-in-encryption-strategy.md +36 -0
- package/docs/adrs/005-agent-first-workflow-execution-tokens.md +105 -0
- package/docs/adrs/006-append-only-session-run-event-log.md +76 -0
- package/docs/adrs/007-resume-and-checkpoint-only-sessions.md +51 -0
- package/docs/adrs/008-blocked-nodes-architectural-upgrade.md +178 -0
- package/docs/adrs/009-bridge-mode-single-instance-mcp.md +195 -0
- package/docs/adrs/010-release-pipeline.md +89 -0
- package/docs/architecture/README.md +7 -0
- package/docs/architecture/refactor-audit.md +364 -0
- package/docs/authoring-v2.md +527 -0
- package/docs/authoring.md +873 -0
- package/docs/changelog-recent.md +201 -0
- package/docs/configuration.md +505 -0
- package/docs/ctc-mcp-proposal.md +518 -0
- package/docs/design/README.md +22 -0
- package/docs/design/agent-cascade-protocol.md +96 -0
- package/docs/design/autonomous-console-design-candidates.md +253 -0
- package/docs/design/autonomous-console-design-review.md +111 -0
- package/docs/design/autonomous-platform-mvp-discovery.md +525 -0
- package/docs/design/claude-code-source-deep-dive.md +713 -0
- package/docs/design/console-cyberpunk-ui-discovery.md +504 -0
- package/docs/design/console-execution-trace-candidates-final.md +160 -0
- package/docs/design/console-execution-trace-candidates.md +211 -0
- package/docs/design/console-execution-trace-design-candidates-v2.md +113 -0
- package/docs/design/console-execution-trace-design-review.md +74 -0
- package/docs/design/console-execution-trace-discovery.md +394 -0
- package/docs/design/console-execution-trace-final-review.md +77 -0
- package/docs/design/console-execution-trace-review.md +92 -0
- package/docs/design/console-performance-discovery.md +415 -0
- package/docs/design/console-ui-backlog.md +280 -0
- package/docs/design/daemon-architecture-discovery.md +853 -0
- package/docs/design/daemon-design-candidates.md +318 -0
- package/docs/design/daemon-design-review-findings.md +119 -0
- package/docs/design/daemon-engine-design-candidates.md +210 -0
- package/docs/design/daemon-engine-design-review.md +131 -0
- package/docs/design/daemon-execution-engine-discovery.md +280 -0
- package/docs/design/daemon-gap-analysis.md +554 -0
- package/docs/design/daemon-owns-console-plan.md +168 -0
- package/docs/design/daemon-owns-console-review.md +91 -0
- package/docs/design/daemon-owns-console.md +195 -0
- package/docs/design/data-model-erd.md +11 -0
- package/docs/design/design-candidates-consolidate-dev-staleness.md +98 -0
- package/docs/design/design-candidates-walk-cache-depth-limit.md +80 -0
- package/docs/design/design-review-consolidate-dev-staleness.md +54 -0
- package/docs/design/design-review-walk-cache-depth-limit.md +48 -0
- package/docs/design/implementation-plan-consolidate-dev-staleness.md +142 -0
- package/docs/design/implementation-plan-walk-cache-depth-limit.md +141 -0
- package/docs/design/layer3b-ghost-nodes-design-candidates.md +229 -0
- package/docs/design/layer3b-ghost-nodes-design-review.md +93 -0
- package/docs/design/layer3b-ghost-nodes-implementation-plan.md +219 -0
- package/docs/design/list-workflows-latency-fix-plan.md +128 -0
- package/docs/design/list-workflows-latency-fix-review.md +55 -0
- package/docs/design/list-workflows-latency-fix.md +109 -0
- package/docs/design/native-context-management-api.md +11 -0
- package/docs/design/performance-sweep-2026-04.md +96 -0
- package/docs/design/routines-guide.md +219 -0
- package/docs/design/sequence-diagrams.md +11 -0
- package/docs/design/subagent-design-principles.md +220 -0
- package/docs/design/temporal-patterns-design-candidates.md +312 -0
- package/docs/design/temporal-patterns-design-review-findings.md +163 -0
- package/docs/design/test-isolation-from-config-file.md +335 -0
- package/docs/design/v2-core-design-locks.md +2746 -0
- package/docs/design/v2-lock-registry.json +734 -0
- package/docs/design/workflow-authoring-v2.md +1044 -0
- package/docs/design/workflow-docs-spec.md +218 -0
- package/docs/design/workflow-extension-points.md +687 -0
- package/docs/design/workrail-auto-trigger-system.md +359 -0
- package/docs/design/workrail-config-file-discovery.md +513 -0
- package/docs/docker.md +110 -0
- package/docs/generated/v2-lock-closure-plan.md +26 -0
- package/docs/generated/v2-lock-coverage.json +797 -0
- package/docs/generated/v2-lock-coverage.md +177 -0
- package/docs/ideas/backlog.md +3927 -0
- package/docs/ideas/design-candidates-mcp-resilience.md +208 -0
- package/docs/ideas/design-review-findings-mcp-resilience.md +119 -0
- package/docs/ideas/implementation_plan.md +249 -0
- package/docs/ideas/third-party-workflow-setup-design-thinking.md +1948 -0
- package/docs/implementation/02-architecture.md +316 -0
- package/docs/implementation/04-testing-strategy.md +124 -0
- package/docs/implementation/09-simple-workflow-guide.md +835 -0
- package/docs/implementation/13-advanced-validation-guide.md +874 -0
- package/docs/implementation/README.md +21 -0
- package/docs/integrations/claude-code.md +300 -0
- package/docs/integrations/firebender.md +315 -0
- package/docs/migration/v0.1.0.md +147 -0
- package/docs/naming-conventions.md +45 -0
- package/docs/planning/README.md +104 -0
- package/docs/planning/github-ticketing-playbook.md +195 -0
- package/docs/plans/README.md +24 -0
- package/docs/plans/agent-managed-ticketing-design.md +605 -0
- package/docs/plans/agentic-orchestration-roadmap.md +112 -0
- package/docs/plans/assessment-gates-engine-handoff.md +536 -0
- package/docs/plans/content-coherence-and-references.md +151 -0
- package/docs/plans/library-extraction-plan.md +340 -0
- package/docs/plans/mr-review-workflow-redesign.md +1451 -0
- package/docs/plans/native-context-management-epic.md +11 -0
- package/docs/plans/perf-fixes-design-candidates.md +225 -0
- package/docs/plans/perf-fixes-design-review-findings.md +61 -0
- package/docs/plans/perf-fixes-new-issues-candidates.md +264 -0
- package/docs/plans/perf-fixes-new-issues-review.md +110 -0
- package/docs/plans/prompt-fragments.md +53 -0
- package/docs/plans/ui-ux-workflow-design-candidates.md +120 -0
- package/docs/plans/ui-ux-workflow-discovery.md +100 -0
- package/docs/plans/ui-ux-workflow-review.md +48 -0
- package/docs/plans/v2-followup-enhancements.md +587 -0
- package/docs/plans/workflow-categories-candidates.md +105 -0
- package/docs/plans/workflow-categories-discovery.md +110 -0
- package/docs/plans/workflow-categories-review.md +51 -0
- package/docs/plans/workflow-discovery-model-candidates.md +94 -0
- package/docs/plans/workflow-discovery-model-discovery.md +74 -0
- package/docs/plans/workflow-discovery-model-review.md +48 -0
- package/docs/plans/workflow-source-setup-phase-1.md +245 -0
- package/docs/plans/workflow-source-setup-phase-2.md +361 -0
- package/docs/plans/workflow-staleness-detection-candidates.md +104 -0
- package/docs/plans/workflow-staleness-detection-review.md +58 -0
- package/docs/plans/workflow-staleness-detection.md +80 -0
- package/docs/plans/workflow-v2-design.md +69 -0
- package/docs/plans/workflow-v2-roadmap.md +74 -0
- package/docs/plans/workflow-validation-design.md +98 -0
- package/docs/plans/workflow-validation-roadmap.md +108 -0
- package/docs/plans/workrail-platform-vision.md +420 -0
- package/docs/reference/agent-context-cleaner-snippet.md +94 -0
- package/docs/reference/agent-context-guidance.md +140 -0
- package/docs/reference/context-optimization.md +284 -0
- package/docs/reference/example-workflow-repository-template/.github/workflows/validate.yml +125 -0
- package/docs/reference/example-workflow-repository-template/README.md +268 -0
- package/docs/reference/example-workflow-repository-template/workflows/example-workflow.json +80 -0
- package/docs/reference/external-workflow-repositories.md +916 -0
- package/docs/reference/feature-flags-architecture.md +472 -0
- package/docs/reference/feature-flags.md +349 -0
- package/docs/reference/god-tier-workflow-validation.md +272 -0
- package/docs/reference/loop-optimization.md +209 -0
- package/docs/reference/loop-validation.md +176 -0
- package/docs/reference/loops.md +465 -0
- package/docs/reference/mcp-platform-constraints.md +59 -0
- package/docs/reference/recovery.md +88 -0
- package/docs/reference/releases.md +177 -0
- package/docs/reference/troubleshooting.md +105 -0
- package/docs/reference/workflow-execution-contract.md +998 -0
- package/docs/roadmap/README.md +22 -0
- package/docs/roadmap/legacy-planning-status.md +103 -0
- package/docs/roadmap/now-next-later.md +70 -0
- package/docs/roadmap/open-work-inventory.md +389 -0
- package/docs/tickets/README.md +39 -0
- package/docs/tickets/next-up.md +76 -0
- package/docs/workflow-management.md +317 -0
- package/docs/workflow-templates.md +423 -0
- package/docs/workflow-validation.md +184 -0
- package/docs/workflows.md +254 -0
- package/package.json +3 -1
- package/spec/authoring-spec.json +61 -16
- package/workflows/workflow-for-workflows.json +252 -93
- package/workflows/workflow-for-workflows.v2.json +188 -77
|
@@ -32,7 +32,7 @@
|
|
|
32
32
|
"BASELINE DISCIPLINE: choose both an authoring baseline and an outcome baseline whenever possible. Copy structural patterns, not domain language.",
|
|
33
33
|
"VALIDATION GATE: validate with real validators, not regex approximations. When validator output and authoring assumptions conflict, runtime wins.",
|
|
34
34
|
"DEEP REVIEW: authoring integrity and outcome effectiveness are separate concerns. A workflow is not ready unless both pass.",
|
|
35
|
-
"
|
|
35
|
+
"RIGOR: always run the deepest review path -- state economy audit, execution simulation, adversarial review, and redesign if hard gates fail. There is no reduced-rigor mode.",
|
|
36
36
|
"ARTIFACT STRATEGY: the workflow JSON file is the primary output. Intermediate notes go in output.notesMarkdown. Do not create extra planning artifacts unless the workflow is genuinely complex.",
|
|
37
37
|
"V2 DURABILITY: use output.notesMarkdown as the primary durable record. Do not mirror execution state into CONTEXT.md or markdown checkpoint files.",
|
|
38
38
|
"ANTI-PATTERNS TO AVOID IN AUTHORED WORKFLOWS: no pseudo-function metaGuidance, no learning-path branching, no satisfaction-score loops, no heavy clarification batteries, no regex-as-primary-validation, no celebration phases.",
|
|
@@ -70,7 +70,7 @@
|
|
|
70
70
|
"id": "authoring-guide-v2",
|
|
71
71
|
"title": "Workflow Authoring Guide (v2)",
|
|
72
72
|
"source": "docs/authoring-v2.md",
|
|
73
|
-
"resolveFrom": "
|
|
73
|
+
"resolveFrom": "package",
|
|
74
74
|
"purpose": "Current v2 authoring principles, references guidance, and durable execution patterns.",
|
|
75
75
|
"authoritative": true
|
|
76
76
|
},
|
|
@@ -78,7 +78,7 @@
|
|
|
78
78
|
"id": "workflow-authoring-reference",
|
|
79
79
|
"title": "Workflow Authoring Reference",
|
|
80
80
|
"source": "docs/design/workflow-authoring-v2.md",
|
|
81
|
-
"resolveFrom": "
|
|
81
|
+
"resolveFrom": "package",
|
|
82
82
|
"purpose": "Detailed v2 workflow authoring patterns for loops, conditions, references, and workflow structure.",
|
|
83
83
|
"authoritative": true
|
|
84
84
|
},
|
|
@@ -86,7 +86,7 @@
|
|
|
86
86
|
"id": "routines-guide",
|
|
87
87
|
"title": "Routines Guide",
|
|
88
88
|
"source": "docs/design/routines-guide.md",
|
|
89
|
-
"resolveFrom": "
|
|
89
|
+
"resolveFrom": "package",
|
|
90
90
|
"purpose": "Current guide for deciding when to use delegation, direct execution, or template injection in authored workflows.",
|
|
91
91
|
"authoritative": false
|
|
92
92
|
},
|
|
@@ -141,23 +141,38 @@
|
|
|
141
141
|
],
|
|
142
142
|
"procedure": [
|
|
143
143
|
"Read the schema, authoring spec, v2 authoring guides, and the strongest relevant example workflows.",
|
|
144
|
-
"Decide `authoringMode`: `create` or `modernize_existing`.",
|
|
145
144
|
"Classify the target workflow archetype: `review_audit`, `coding_execution`, `diagnostic_investigation`, `planning_design`, `linear_operational`, or `content_analysis`.",
|
|
146
|
-
"Classify `workflowComplexity`: Simple, Medium, or Complex.
|
|
147
|
-
"Choose an `authoringBaseline` for engine-native authoring quality and an `outcomeBaseline` for the kind of job the authored workflow should perform. If no good baseline exists for one of them, set it to `none` and explain why."
|
|
148
|
-
"If `authoringMode = modernize_existing`, build a value inventory BEFORE forming opinions about what to change. Read the original and classify each meaningful mechanism: (1) enforcement mechanisms (forcing functions, hard gates, required outputs), (2) domain knowledge (problem-specific principles the agent would not otherwise know), (3) behavioral rules (persistent constraints on how the agent works). This inventory is the preservation checklist.",
|
|
149
|
-
"If `authoringMode = modernize_existing`, identify what must stay the same about purpose, what feels stale, and what modernization constraints apply."
|
|
145
|
+
"Classify `workflowComplexity`: Simple, Medium, or Complex.",
|
|
146
|
+
"Choose an `authoringBaseline` for engine-native authoring quality and an `outcomeBaseline` for the kind of job the authored workflow should perform. If no good baseline exists for one of them, set it to `none` and explain why."
|
|
150
147
|
],
|
|
151
148
|
"outputRequired": {
|
|
152
149
|
"notesMarkdown": "Task understanding, baseline choices, patterns to borrow or avoid, and any real open questions.",
|
|
153
|
-
"context": "Capture authoringMode, workflowArchetype, workflowComplexity,
|
|
150
|
+
"context": "Capture authoringMode, workflowArchetype, workflowComplexity, taskDescription, intendedAudience, successCriteria, domainConstraints, targetWorkflowPath, modernizationGoals, authoringBaseline, outcomeBaseline, baselineDecisionRationale, authoringPatternsToBorrow, outcomePatternsToBorrow, patternsToAvoid, openQuestions, and valueInventory (modernize_existing only)."
|
|
154
151
|
},
|
|
155
152
|
"verify": [
|
|
156
153
|
"The task is understood well enough to design the workflow without guessing blindly.",
|
|
157
154
|
"Both authoring and outcome baselines are explicit, or their absence is justified."
|
|
158
155
|
]
|
|
159
156
|
},
|
|
160
|
-
"requireConfirmation": true
|
|
157
|
+
"requireConfirmation": true,
|
|
158
|
+
"promptFragments": [
|
|
159
|
+
{
|
|
160
|
+
"id": "phase-0-modernize-inventory",
|
|
161
|
+
"when": {
|
|
162
|
+
"var": "authoringMode",
|
|
163
|
+
"equals": "modernize_existing"
|
|
164
|
+
},
|
|
165
|
+
"text": "If `authoringMode = modernize_existing`, build a value inventory BEFORE forming opinions about what to change. Read the original and classify each meaningful mechanism: (1) enforcement mechanisms (forcing functions, hard gates, required outputs), (2) domain knowledge (problem-specific principles the agent would not otherwise know), (3) behavioral rules (persistent constraints on how the agent works). This inventory is the preservation checklist."
|
|
166
|
+
},
|
|
167
|
+
{
|
|
168
|
+
"id": "phase-0-modernize-scope",
|
|
169
|
+
"when": {
|
|
170
|
+
"var": "authoringMode",
|
|
171
|
+
"equals": "modernize_existing"
|
|
172
|
+
},
|
|
173
|
|
+
"text": "If `authoringMode = modernize_existing`, identify what must stay the same about purpose, what feels stale, and what modernization constraints apply."
|
|
174
|
+
}
|
|
175
|
+
]
|
|
161
176
|
},
|
|
162
177
|
{
|
|
163
178
|
"id": "phase-1-define-effectiveness-target",
|
|
@@ -187,10 +202,6 @@
|
|
|
187
202
|
{
|
|
188
203
|
"id": "phase-2-design-workflow-architecture",
|
|
189
204
|
"title": "Phase 2: Design the Workflow Architecture",
|
|
190
|
-
"runCondition": {
|
|
191
|
-
"var": "workflowComplexity",
|
|
192
|
-
"not_equals": "Simple"
|
|
193
|
-
},
|
|
194
205
|
"promptBlocks": {
|
|
195
206
|
"goal": "Decide the workflow architecture before you write JSON.",
|
|
196
207
|
"constraints": [
|
|
@@ -200,8 +211,7 @@
|
|
|
200
211
|
"procedure": [
|
|
201
212
|
"Decide the phase list, one-line goal for each phase, and overall ordering.",
|
|
202
213
|
"Design loops with explicit exit rules, bounded maxIterations, and real reasons for another pass.",
|
|
203
|
-
"Decide confirmation gates, delegation vs template injection vs direct execution, promptFragments, references, artifacts, and metaGuidance."
|
|
204
|
-
"If `authoringMode = modernize_existing`, decide preserve-in-place, restructure, or rewrite. For each item in valueInventory, record: `preserved` (structurally present with equivalent enforcement), `replaced` (new mechanism prevents same failure mode -- justify equivalence), or `dropped` (intentionally removed -- justify the loss). Phase-level mapping alone is insufficient; track what was inside each restructured or removed phase."
|
|
214
|
+
"Decide confirmation gates, delegation vs template injection vs direct execution, promptFragments, references, artifacts, and metaGuidance."
|
|
205
215
|
],
|
|
206
216
|
"outputRequired": {
|
|
207
217
|
"notesMarkdown": "Structured workflow outline, loop design, confirmation design, delegation design, artifact plan, and modernization mapping.",
|
|
@@ -212,6 +222,14 @@
|
|
|
212
222
|
]
|
|
213
223
|
},
|
|
214
224
|
"promptFragments": [
|
|
225
|
+
{
|
|
226
|
+
"id": "phase-2-simple-scope",
|
|
227
|
+
"when": {
|
|
228
|
+
"var": "workflowComplexity",
|
|
229
|
+
"equals": "Simple"
|
|
230
|
+
},
|
|
231
|
+
"text": "This is a Simple workflow. Keep the architecture lightweight: a flat phase list, no loops required, minimal confirmations, no delegation. The goal is clarity and direct execution, not structural sophistication."
|
|
232
|
+
},
|
|
215
233
|
{
|
|
216
234
|
"id": "phase-2-simple-direct",
|
|
217
235
|
"when": {
|
|
@@ -219,19 +237,19 @@
|
|
|
219
237
|
"equals": "Simple"
|
|
220
238
|
},
|
|
221
239
|
"text": "For Simple workflows, keep the architecture linear and compact. Do not invent loops or ceremony unless the task truly needs them."
|
|
240
|
+
},
|
|
241
|
+
{
|
|
242
|
+
"id": "phase-2-modernize-mapping",
|
|
243
|
+
"when": {
|
|
244
|
+
"var": "authoringMode",
|
|
245
|
+
"equals": "modernize_existing"
|
|
246
|
+
},
|
|
247
|
+
"text": "If `authoringMode = modernize_existing`, decide preserve-in-place, restructure, or rewrite. For each item in valueInventory, record: `preserved` (structurally present with equivalent enforcement), `replaced` (new mechanism prevents same failure mode -- justify equivalence), or `dropped` (intentionally removed -- justify the loss). Phase-level mapping alone is insufficient; track what was inside each restructured or removed phase."
|
|
222
248
|
}
|
|
223
249
|
],
|
|
224
250
|
"requireConfirmation": {
|
|
225
|
-
"
|
|
226
|
-
|
|
227
|
-
"var": "workflowComplexity",
|
|
228
|
-
"not_equals": "Simple"
|
|
229
|
-
},
|
|
230
|
-
{
|
|
231
|
-
"var": "rigorMode",
|
|
232
|
-
"not_equals": "QUICK"
|
|
233
|
-
}
|
|
234
|
-
]
|
|
251
|
+
"var": "workflowComplexity",
|
|
252
|
+
"not_equals": "Simple"
|
|
235
253
|
}
|
|
236
254
|
},
|
|
237
255
|
{
|
|
@@ -257,18 +275,16 @@
|
|
|
257
275
|
"The authored workflow has an explicit plan for false-confidence resistance and quality review."
|
|
258
276
|
]
|
|
259
277
|
},
|
|
260
|
-
"
|
|
261
|
-
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
"equals": "THOROUGH"
|
|
265
|
-
},
|
|
266
|
-
{
|
|
278
|
+
"promptFragments": [
|
|
279
|
+
{
|
|
280
|
+
"id": "phase-3-simple-scope",
|
|
281
|
+
"when": {
|
|
267
282
|
"var": "workflowComplexity",
|
|
268
|
-
"equals": "
|
|
269
|
-
}
|
|
270
|
-
|
|
271
|
-
|
|
283
|
+
"equals": "Simple"
|
|
284
|
+
},
|
|
285
|
+
"text": "This is a Simple workflow. Quality architecture should be proportional: identify one primary false-confidence mode and one key hard gate. Skip full reviewer family design -- a single self-executed review pass is sufficient."
|
|
286
|
+
}
|
|
287
|
+
]
|
|
272
288
|
},
|
|
273
289
|
{
|
|
274
290
|
"id": "phase-4-draft-or-revise",
|
|
@@ -344,10 +360,6 @@
|
|
|
344
360
|
"promptFragments": [
|
|
345
361
|
{
|
|
346
362
|
"id": "phase-5a-thorough",
|
|
347
|
-
"when": {
|
|
348
|
-
"var": "rigorMode",
|
|
349
|
-
"equals": "THOROUGH"
|
|
350
|
-
},
|
|
351
363
|
"text": "After structural validation passes, also check the workflow manually against required-level authoring-spec rules and fix any failures before moving on."
|
|
352
364
|
}
|
|
353
365
|
],
|
|
@@ -388,13 +400,13 @@
|
|
|
388
400
|
"equals": false
|
|
389
401
|
},
|
|
390
402
|
"promptBlocks": {
|
|
391
|
-
"goal": "
|
|
403
|
+
"goal": "Stop execution. A structurally broken workflow must not proceed to the quality gate loop. Surface the errors and require user intervention.",
|
|
392
404
|
"constraints": [
|
|
393
405
|
"Present the situation honestly."
|
|
394
406
|
],
|
|
395
407
|
"procedure": [
|
|
396
408
|
"List the remaining validation errors and assess their severity.",
|
|
397
|
-
"
|
|
409
|
+
"Stop and require user intervention. Do not proceed into the quality gate loop with a structurally broken workflow. The user must explicitly decide how to resolve each remaining error before this workflow can continue."
|
|
398
410
|
]
|
|
399
411
|
},
|
|
400
412
|
"requireConfirmation": true
|
|
@@ -410,7 +422,7 @@
|
|
|
410
422
|
"contractRef": "wr.contracts.loop_control",
|
|
411
423
|
"loopId": "quality_gate_loop"
|
|
412
424
|
},
|
|
413
|
-
"maxIterations":
|
|
425
|
+
"maxIterations": 3
|
|
414
426
|
},
|
|
415
427
|
"body": [
|
|
416
428
|
{
|
|
@@ -435,7 +447,21 @@
|
|
|
435
447
|
"Weak or unused fields are either wired meaningfully or removed."
|
|
436
448
|
]
|
|
437
449
|
},
|
|
438
|
-
"requireConfirmation": false
|
|
450
|
+
"requireConfirmation": false,
|
|
451
|
+
"assessmentRefs": [
|
|
452
|
+
"state-economy-gate"
|
|
453
|
+
],
|
|
454
|
+
"assessmentConsequences": [
|
|
455
|
+
{
|
|
456
|
+
"when": {
|
|
457
|
+
"anyEqualsLevel": "low"
|
|
458
|
+
},
|
|
459
|
+
"effect": {
|
|
460
|
+
"kind": "require_followup",
|
|
461
|
+
"guidance": "state_economy low -- one or more context fields are unused, weakly consumed, or carry no decision weight. Remove or wire them before proceeding: trace a concrete downstream use for each field, or delete it from the workflow."
|
|
462
|
+
}
|
|
463
|
+
}
|
|
464
|
+
]
|
|
439
465
|
},
|
|
440
466
|
{
|
|
441
467
|
"id": "phase-6b-execution-simulation",
|
|
@@ -463,14 +489,6 @@
|
|
|
463
489
|
]
|
|
464
490
|
},
|
|
465
491
|
"promptFragments": [
|
|
466
|
-
{
|
|
467
|
-
"id": "phase-6b-quick",
|
|
468
|
-
"when": {
|
|
469
|
-
"var": "rigorMode",
|
|
470
|
-
"equals": "QUICK"
|
|
471
|
-
},
|
|
472
|
-
"text": "For QUICK rigor, keep the simulation compact but still answer where the workflow would likely disappoint the user if it disappointed them at all."
|
|
473
|
-
},
|
|
474
492
|
{
|
|
475
493
|
"id": "phase-6b-modernize-check",
|
|
476
494
|
"when": {
|
|
@@ -480,7 +498,21 @@
|
|
|
480
498
|
"text": "For modernize_existing: after tracing the workflow forward, check each item in valueInventory. For each enforcement mechanism and domain knowledge item: would the modernized workflow produce the same behavior? Any item where the answer is no or weaker is a loss -- fix it directly or record the accepted tradeoff with justification."
|
|
481
499
|
}
|
|
482
500
|
],
|
|
483
|
-
"requireConfirmation": false
|
|
501
|
+
"requireConfirmation": false,
|
|
502
|
+
"assessmentRefs": [
|
|
503
|
+
"simulation-outcome-gate"
|
|
504
|
+
],
|
|
505
|
+
"assessmentConsequences": [
|
|
506
|
+
{
|
|
507
|
+
"when": {
|
|
508
|
+
"anyEqualsLevel": "low"
|
|
509
|
+
},
|
|
510
|
+
"effect": {
|
|
511
|
+
"kind": "require_followup",
|
|
512
|
+
"guidance": "simulation_outcome low -- the simulation found likely unsatisfying or false-confidence outputs that were not fixed inline. Address the identified weak steps or degraded-path failures before the adversarial review."
|
|
513
|
+
}
|
|
514
|
+
}
|
|
515
|
+
]
|
|
484
516
|
},
|
|
485
517
|
{
|
|
486
518
|
"id": "phase-6c-adversarial-quality-review",
|
|
@@ -492,11 +524,11 @@
|
|
|
492
524
|
"Reviewer-family or validator output is evidence, not authority."
|
|
493
525
|
],
|
|
494
526
|
"procedure": [
|
|
495
|
-
"Score these dimensions 0-2 with one sentence of evidence each: `voiceClarity`, `ceremonyLevel`, `loopSoundness`, `delegationBoundedness`, `artifactClarity`, `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, `handoffUtility`, `
|
|
496
|
-
"
|
|
527
|
+
"Score these dimensions 0-2 with one sentence of evidence each: `voiceClarity`, `ceremonyLevel`, `loopSoundness`, `delegationBoundedness`, `artifactClarity`, `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, `handoffUtility`, `complexityScaling` (0 = has appropriate fast paths or scope-sensitive branching for simpler inputs; 2 = single-weight, over-engineers simple cases), `enforcementStrength` (0 = behavioral rules have structural teeth; 2 = important rules are prose-only with no enforcement mechanism), and `modernizationDiscipline` (0 = every valueInventory item preserved, equivalently replaced with justification, or dropped with justification; 2 = items missing or replaced with weaker versions without justification -- score 0 for create mode).",
|
|
528
|
+
"Run an adversarial review bundle with these lenses: `engine_native_reviewer`, `task_effectiveness_reviewer`, `state_economy_reviewer`, `false_confidence_reviewer`, `domain_fit_reviewer`, and `maintainer_reviewer`.",
|
|
497
529
|
"Synthesize what the review confirmed, what it challenged, and what changed your mind.",
|
|
498
530
|
"When scoring `falseConfidenceResistance`, explicitly check: do the workflow's quality gates protect edge cases and degraded paths, or only the happy path? A workflow that passes its own checks on ideal input but fails silently on minimal or unexpected input scores 2.",
|
|
499
|
-
"Set hard-gate failures whenever any of these are materially weak: `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, or `handoffUtility
|
|
531
|
+
"Set hard-gate failures whenever any of these are materially weak: `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, `handoffUtility`, or `complexityScaling` (0 = has appropriate fast paths or scope-sensitive branching for simpler inputs; 2 = single-weight, over-engineers simple cases).",
|
|
500
532
|
"Set `authoringIntegrityPassed = true` only if structural and authoring-quality dimensions are all acceptable. Set `outcomeEffectivenessPassed = true` only if the workflow is likely to achieve satisfying results for the user."
|
|
501
533
|
],
|
|
502
534
|
"outputRequired": {
|
|
@@ -509,20 +541,8 @@
|
|
|
509
541
|
},
|
|
510
542
|
"promptFragments": [
|
|
511
543
|
{
|
|
512
|
-
"id": "phase-6c-
|
|
513
|
-
"
|
|
514
|
-
"var": "rigorMode",
|
|
515
|
-
"equals": "STANDARD"
|
|
516
|
-
},
|
|
517
|
-
"text": "For STANDARD rigor, you may keep the review self-executed unless uncertainty remains material. If you do delegate, prefer a small adversarial bundle."
|
|
518
|
-
},
|
|
519
|
-
{
|
|
520
|
-
"id": "phase-6c-thorough",
|
|
521
|
-
"when": {
|
|
522
|
-
"var": "rigorMode",
|
|
523
|
-
"equals": "THOROUGH"
|
|
524
|
-
},
|
|
525
|
-
"text": "For THOROUGH rigor, assume the first review is not enough. Use adversarial reviewer lanes unless a hard limitation makes them impossible."
|
|
544
|
+
"id": "phase-6c-rigor",
|
|
545
|
+
"text": "Always use adversarial reviewer lanes. Assume the first review is not enough -- use the full adversarial bundle unless a hard limitation makes it impossible."
|
|
526
546
|
},
|
|
527
547
|
{
|
|
528
548
|
"id": "phase-6c-heritage-review",
|
|
@@ -533,7 +553,29 @@
|
|
|
533
553
|
"text": "For modernize_existing: add a heritage_reviewer to the adversarial bundle. Its job is to check each valueInventory item and find what was lost or weakened -- it ignores format improvements. It must answer: which enforcement mechanisms are now prose-only? Which domain knowledge items are absent? Which behavioral rules were removed without equivalent replacement? Heritage_reviewer findings drive enforcementStrength and modernizationDiscipline scores."
|
|
534
554
|
}
|
|
535
555
|
],
|
|
536
|
-
"requireConfirmation": false
|
|
556
|
+
"requireConfirmation": false,
|
|
557
|
+
"validationCriteria": [
|
|
558
|
+
{
|
|
559
|
+
"type": "contains",
|
|
560
|
+
"value": "complexityScaling",
|
|
561
|
+
"message": "Review must score complexityScaling"
|
|
562
|
+
}
|
|
563
|
+
],
|
|
564
|
+
"assessmentRefs": [
|
|
565
|
+
"authoring-integrity-gate",
|
|
566
|
+
"outcome-effectiveness-gate"
|
|
567
|
+
],
|
|
568
|
+
"assessmentConsequences": [
|
|
569
|
+
{
|
|
570
|
+
"when": {
|
|
571
|
+
"anyEqualsLevel": "low"
|
|
572
|
+
},
|
|
573
|
+
"effect": {
|
|
574
|
+
"kind": "require_followup",
|
|
575
|
+
"guidance": "authoring_integrity low -- structural or quality dimensions are unacceptable; fix voice, ceremony, loop, delegation, or state problems before this workflow can be trusted. outcome_effectiveness low -- task effectiveness, false-confidence resistance, coverage sharpness, or domain fit are materially weak; redesign, do not patch."
|
|
576
|
+
}
|
|
577
|
+
}
|
|
578
|
+
]
|
|
537
579
|
},
|
|
538
580
|
{
|
|
539
581
|
"id": "phase-6d-redesign-and-revalidate",
|
|
@@ -545,7 +587,6 @@
|
|
|
545
587
|
"If structure changes, re-run real validators before leaving this step."
|
|
546
588
|
],
|
|
547
589
|
"procedure": [
|
|
548
|
-
"If `authoringIntegrityPassed` and `outcomeEffectivenessPassed` are both true and `hardGateFailures` is empty, say that no redesign is needed.",
|
|
549
590
|
"Classify the needed redesign severity as `minor`, `architectural`, or `unsafe_to_ship` and apply the necessary fixes directly to the workflow file.",
|
|
550
591
|
"If the redesign changed structure, run the real validators again and update the validation state before leaving this step."
|
|
551
592
|
],
|
|
@@ -557,7 +598,19 @@
|
|
|
557
598
|
"Structural redesign problems are handled as redesign problems, not cosmetic ones."
|
|
558
599
|
]
|
|
559
600
|
},
|
|
560
|
-
"requireConfirmation": false
|
|
601
|
+
"requireConfirmation": false,
|
|
602
|
+
"runCondition": {
|
|
603
|
+
"or": [
|
|
604
|
+
{
|
|
605
|
+
"var": "authoringIntegrityPassed",
|
|
606
|
+
"equals": false
|
|
607
|
+
},
|
|
608
|
+
{
|
|
609
|
+
"var": "outcomeEffectivenessPassed",
|
|
610
|
+
"equals": false
|
|
611
|
+
}
|
|
612
|
+
]
|
|
613
|
+
}
|
|
561
614
|
},
|
|
562
615
|
{
|
|
563
616
|
"id": "phase-6e-quality-loop-decision",
|
|
@@ -597,7 +650,7 @@
|
|
|
597
650
|
"procedure": [
|
|
598
651
|
"Read spec/workflow-tags.json to see the available tags and their 'when' phrases.",
|
|
599
652
|
"Based on the workflow's purpose and description, select 1-3 tags from the closed set (coding, review_audit, investigation, design, documentation, tickets, learning, routines, authoring).",
|
|
600
|
-
"
|
|
653
|
+
"Check whether the workflow ID already exists in the `workflows` section. If it does, update the existing entry's tags rather than adding a duplicate. If it does not exist, add a new entry under 'workflows' in spec/workflow-tags.json: { \"tags\": [\"<tag1>\"] }.",
|
|
601
654
|
"If the workflow is a test fixture or internal utility not meant for end-user discovery, add 'hidden': true.",
|
|
602
655
|
"Save the tags file. Do not modify any other field.",
|
|
603
656
|
"Write the 'about' field into the workflow JSON: a markdown string (100-400 words) written for a human deciding whether to use this workflow. Cover what it does, when to use it, what it produces, and how to get good results. This is a user-facing surface -- not agent instructions (use metaGuidance for that).",
|
|
@@ -645,5 +698,63 @@
|
|
|
645
698
|
"requireConfirmation": false
|
|
646
699
|
}
|
|
647
700
|
],
|
|
648
|
-
"validatedAgainstSpecVersion": 3
|
|
701
|
+
"validatedAgainstSpecVersion": 3,
|
|
702
|
+
"assessments": [
|
|
703
|
+
{
|
|
704
|
+
"id": "state-economy-gate",
|
|
705
|
+
"purpose": "Every context field in the authored workflow earns its keep: it is set, consumed, and influences a concrete decision or output.",
|
|
706
|
+
"dimensions": [
|
|
707
|
+
{
|
|
708
|
+
"id": "state_economy",
|
|
709
|
+
"purpose": "All context fields have a traceable downstream use. No field is captured speculatively or carried without purpose.",
|
|
710
|
+
"levels": [
|
|
711
|
+
"low",
|
|
712
|
+
"high"
|
|
713
|
+
]
|
|
714
|
+
}
|
|
715
|
+
]
|
|
716
|
+
},
|
|
717
|
+
{
|
|
718
|
+
"id": "simulation-outcome-gate",
|
|
719
|
+
"purpose": "A concrete execution simulation has been completed and identified weak steps, likely unsatisfying outputs, and false-confidence modes -- and any found were fixed inline.",
|
|
720
|
+
"dimensions": [
|
|
721
|
+
{
|
|
722
|
+
"id": "simulation_outcome",
|
|
723
|
+
"purpose": "Simulation completed over at least one happy path and one degraded/edge-case path. Issues found were fixed or explicitly accepted.",
|
|
724
|
+
"levels": [
|
|
725
|
+
"low",
|
|
726
|
+
"high"
|
|
727
|
+
]
|
|
728
|
+
}
|
|
729
|
+
]
|
|
730
|
+
},
|
|
731
|
+
{
|
|
732
|
+
"id": "authoring-integrity-gate",
|
|
733
|
+
"purpose": "The authored workflow is structurally sound and meets authoring quality standards: voice, ceremony, loops, delegation, and state are all acceptable.",
|
|
734
|
+
"dimensions": [
|
|
735
|
+
{
|
|
736
|
+
"id": "authoring_integrity",
|
|
737
|
+
"purpose": "Structural and authoring-quality dimensions passed the adversarial review. No hard gate failure on voice, ceremony, loopSoundness, delegationBoundedness, or stateMinimality.",
|
|
738
|
+
"levels": [
|
|
739
|
+
"low",
|
|
740
|
+
"high"
|
|
741
|
+
]
|
|
742
|
+
}
|
|
743
|
+
]
|
|
744
|
+
},
|
|
745
|
+
{
|
|
746
|
+
"id": "outcome-effectiveness-gate",
|
|
747
|
+
"purpose": "The authored workflow is likely to produce genuinely satisfying results: task effectiveness, false-confidence resistance, coverage sharpness, domain fit, and handoff utility are all acceptable.",
|
|
748
|
+
"dimensions": [
|
|
749
|
+
{
|
|
750
|
+
"id": "outcome_effectiveness",
|
|
751
|
+
"purpose": "The workflow passes adversarial review on task effectiveness, falseConfidenceResistance, coverageSharpness, domainFit, and handoffUtility. No hard gate failure on any outcome dimension.",
|
|
752
|
+
"levels": [
|
|
753
|
+
"low",
|
|
754
|
+
"high"
|
|
755
|
+
]
|
|
756
|
+
}
|
|
757
|
+
]
|
|
758
|
+
}
|
|
759
|
+
]
|
|
649
760
|
}
|