project-iris 0.0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +424 -0
- package/dist/bridge/agent-runner.js +190 -0
- package/dist/bridge/connector-factory.js +31 -0
- package/dist/bridge/connectors/antigravity-connector.js +18 -0
- package/dist/bridge/connectors/cursor-connector.js +31 -0
- package/dist/bridge/connectors/in-process-connector.js +29 -0
- package/dist/bridge/connectors/vscode-connector.js +31 -0
- package/dist/bridge/connectors/windsurf-connector.js +23 -0
- package/dist/bridge/filesystem-connector.js +110 -0
- package/dist/bridge/helper.js +203 -0
- package/dist/bridge/types.js +10 -0
- package/dist/cli.js +38 -0
- package/dist/commands/ask.js +259 -0
- package/dist/commands/bridge.js +88 -0
- package/dist/commands/develop.js +141 -0
- package/dist/commands/doctor.js +102 -0
- package/dist/commands/flow.js +301 -0
- package/dist/commands/framework.js +273 -0
- package/dist/commands/generate.js +59 -0
- package/dist/commands/install.js +73 -0
- package/dist/commands/pack.js +33 -0
- package/dist/commands/phase.js +38 -0
- package/dist/commands/run.js +199 -0
- package/dist/commands/status.js +114 -0
- package/dist/commands/uninstall.js +14 -0
- package/dist/commands/use.js +20 -0
- package/dist/commands/validate.js +102 -0
- package/dist/framework/framework-loader.js +97 -0
- package/dist/framework/framework-paths.js +48 -0
- package/dist/framework/framework-types.js +15 -0
- package/dist/iris/artifact-checker.js +78 -0
- package/dist/iris/artifacts/config.js +68 -0
- package/dist/iris/artifacts/generator.js +88 -0
- package/dist/iris/artifacts/types.js +1 -0
- package/dist/iris/bundle.js +44 -0
- package/dist/iris/doctrine/collector.js +124 -0
- package/dist/iris/fixer.js +149 -0
- package/dist/iris/flows/manifest.js +124 -0
- package/dist/iris/framework-context.js +49 -0
- package/dist/iris/framework-manager.js +215 -0
- package/dist/iris/fs/atomic.js +22 -0
- package/dist/iris/guard.js +38 -0
- package/dist/iris/importers/bmad.js +70 -0
- package/dist/iris/importers/index.js +9 -0
- package/dist/iris/importers/speckit.js +15 -0
- package/dist/iris/importers/specsmd.js +78 -0
- package/dist/iris/importers/types.js +8 -0
- package/dist/iris/importers/writer.js +139 -0
- package/dist/iris/include.js +49 -0
- package/dist/iris/installer.js +334 -0
- package/dist/iris/interactive/env.js +21 -0
- package/dist/iris/interactive/intent-interview.js +345 -0
- package/dist/iris/interactive/intent-schema.js +28 -0
- package/dist/iris/interactive/interview-io.js +22 -0
- package/dist/iris/interview/config.js +71 -0
- package/dist/iris/interview/types.js +16 -0
- package/dist/iris/interview/utils.js +38 -0
- package/dist/iris/manifest.js +54 -0
- package/dist/iris/packer.js +325 -0
- package/dist/iris/parsers/unit-parser.js +43 -0
- package/dist/iris/paths.js +18 -0
- package/dist/iris/policy.js +133 -0
- package/dist/iris/proc.js +56 -0
- package/dist/iris/report.js +53 -0
- package/dist/iris/resolver.js +66 -0
- package/dist/iris/router.js +114 -0
- package/dist/iris/routes.js +189 -0
- package/dist/iris/run-state.js +146 -0
- package/dist/iris/state.js +113 -0
- package/dist/iris/templates.js +70 -0
- package/dist/iris/tmp.js +24 -0
- package/dist/iris/uninstaller.js +181 -0
- package/dist/iris/utils/interpolate.js +42 -0
- package/dist/iris/validator.js +391 -0
- package/dist/iris/workflow/config.js +51 -0
- package/dist/iris/workflow/engine.js +129 -0
- package/dist/iris/workflow/steps.js +448 -0
- package/dist/iris/workflow/types.js +1 -0
- package/dist/lib.js +96 -0
- package/dist/utils/exit-codes.js +7 -0
- package/dist/workflows/bolt-execution.js +238 -0
- package/dist/workflows/bolt-plan.js +192 -0
- package/dist/workflows/intent-inception.js +210 -0
- package/dist/workflows/reporting.js +74 -0
- package/package.json +45 -0
- package/src/iris_bundle/.iris/aidlc/README.md +16 -0
- package/src/iris_bundle/.iris/aidlc/agents/iris-construction-agent.md +35 -0
- package/src/iris_bundle/.iris/aidlc/agents/iris-inception-agent.md +30 -0
- package/src/iris_bundle/.iris/aidlc/agents/iris-master-agent.md +35 -0
- package/src/iris_bundle/.iris/aidlc/agents/iris-operations-agent.md +29 -0
- package/src/iris_bundle/.iris/aidlc/commands/iris-construction-agent.md +18 -0
- package/src/iris_bundle/.iris/aidlc/commands/iris-inception-agent.md +18 -0
- package/src/iris_bundle/.iris/aidlc/commands/iris-master-agent.md +18 -0
- package/src/iris_bundle/.iris/aidlc/commands/iris-operations-agent.md +18 -0
- package/src/iris_bundle/.iris/aidlc/context/context-map.md +25 -0
- package/src/iris_bundle/.iris/aidlc/context/exclusion-rules.md +13 -0
- package/src/iris_bundle/.iris/aidlc/context/load-order.md +25 -0
- package/src/iris_bundle/.iris/aidlc/memory/intent-rules.md +9 -0
- package/src/iris_bundle/.iris/aidlc/memory/log-rules.md +5 -0
- package/src/iris_bundle/.iris/aidlc/memory/memory-bank.yaml +39 -0
- package/src/iris_bundle/.iris/aidlc/memory/unit-rules.md +9 -0
- package/src/iris_bundle/.iris/aidlc/quick-start.md +24 -0
- package/src/iris_bundle/.iris/aidlc/skills/execution/implementation.md +14 -0
- package/src/iris_bundle/.iris/aidlc/skills/execution/refactoring.md +13 -0
- package/src/iris_bundle/.iris/aidlc/skills/execution/scaffold-generation.md +15 -0
- package/src/iris_bundle/.iris/aidlc/skills/governance/escalation.md +13 -0
- package/src/iris_bundle/.iris/aidlc/skills/governance/quality-gates.md +14 -0
- package/src/iris_bundle/.iris/aidlc/skills/governance/stop-conditions.md +11 -0
- package/src/iris_bundle/.iris/aidlc/skills/reasoning/decomposition.md +23 -0
- package/src/iris_bundle/.iris/aidlc/skills/reasoning/risk-analysis.md +14 -0
- package/src/iris_bundle/.iris/aidlc/skills/reasoning/verification.md +21 -0
- package/src/iris_bundle/.iris/aidlc/standards/artifacts-registry.md +38 -0
- package/src/iris_bundle/.iris/aidlc/standards/decision-logging.md +16 -0
- package/src/iris_bundle/.iris/aidlc/standards/doctrine-structure.md +31 -0
- package/src/iris_bundle/.iris/aidlc/standards/documentation-rules.md +15 -0
- package/src/iris_bundle/.iris/aidlc/standards/file-structure.md +21 -0
- package/src/iris_bundle/.iris/aidlc/standards/naming-conventions.md +18 -0
- package/src/iris_bundle/.iris/aidlc/standards/phases-and-gates.md +25 -0
- package/src/iris_bundle/.iris/aidlc/standards/routes-and-routing.md +35 -0
- package/src/iris_bundle/.iris/aidlc/standards/tool-wrappers.md +32 -0
- package/src/iris_bundle/.iris/aidlc/templates/bolt.md +23 -0
- package/src/iris_bundle/.iris/aidlc/templates/doctrine-doc-template.md +33 -0
- package/src/iris_bundle/.iris/aidlc/templates/intent.md +23 -0
- package/src/iris_bundle/.iris/aidlc/templates/log.md +24 -0
- package/src/iris_bundle/.iris/aidlc/templates/review.md +21 -0
- package/src/iris_bundle/.iris/aidlc/templates/unit.md +31 -0
- package/src/iris_bundle/.iris/aidlc/validation/failure-modes.md +16 -0
- package/src/iris_bundle/.iris/aidlc/validation/phase-preconditions.md +21 -0
- package/src/iris_bundle/.iris/aidlc/validation/quality-checklist.md +20 -0
- package/src/iris_bundle/.iris/flows/specs-md/doctrine/templates/requirements.md +18 -0
- package/src/iris_bundle/.iris/flows/specs-md/doctrine/templates/system-context.md +17 -0
- package/src/iris_bundle/.iris/flows/specs-md/doctrine/templates/unit-briefs/construction.md +16 -0
- package/src/iris_bundle/.iris/flows/specs-md/doctrine/templates/unit-briefs/operations.md +14 -0
- package/src/iris_bundle/.iris/flows/specs-md/doctrine/templates/units.md +11 -0
- package/src/iris_bundle/.iris/flows/specs-md/flow.yaml +8 -0
- package/src/iris_bundle/.iris/flows/specs-md/policy.overlay.yaml +26 -0
- package/src/iris_bundle/.iris/flows/specs-md/routes.overlay.yaml +16 -0
- package/src/iris_bundle/.iris/policy.yaml +27 -0
- package/src/iris_bundle/.iris/routes.yaml +98 -0
- package/src/iris_bundle/.iris/state.yaml +7 -0
- package/src/iris_bundle/.iris/tools/claude/.claude/claude.md +9 -0
- package/src/iris_bundle/.iris/tools/claude/.claude/commands/compare-specs.md +203 -0
- package/src/iris_bundle/.iris/tools/claude/.claude/commands/iris-construction-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/claude/.claude/commands/iris-inception-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/claude/.claude/commands/iris-master-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/claude/.claude/commands/iris-operations-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/codex/AGENTS.md +15 -0
- package/src/iris_bundle/.iris/tools/cursor/.cursor/commands/iris-construction-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/cursor/.cursor/commands/iris-inception-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/cursor/.cursor/commands/iris-master-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/cursor/.cursor/commands/iris-operations-agent.md +25 -0
- package/src/iris_bundle/.iris/tools/gemini/.gemini/commands/iris-construction-agent.toml +29 -0
- package/src/iris_bundle/.iris/tools/gemini/.gemini/commands/iris-inception-agent.toml +29 -0
- package/src/iris_bundle/.iris/tools/gemini/.gemini/commands/iris-master-agent.toml +29 -0
- package/src/iris_bundle/.iris/tools/gemini/.gemini/commands/iris-operations-agent.toml +29 -0
- package/src/iris_bundle/frameworks/iris-core/.claude/claude.md +238 -0
- package/src/iris_bundle/frameworks/iris-core/.claude/commands/compare-iris.md +203 -0
- package/src/iris_bundle/frameworks/iris-core/.claude/commands/irismd-construction-agent.md +63 -0
- package/src/iris_bundle/frameworks/iris-core/.claude/commands/irismd-inception-agent.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/.claude/commands/irismd-master-agent.md +47 -0
- package/src/iris_bundle/frameworks/iris-core/.claude/commands/irismd-operations-agent.md +77 -0
- package/src/iris_bundle/frameworks/iris-core/.github/workflows/claude-code-review.yml +57 -0
- package/src/iris_bundle/frameworks/iris-core/.github/workflows/claude.yml +50 -0
- package/src/iris_bundle/frameworks/iris-core/.github/workflows/npm-package-ci.yml +46 -0
- package/src/iris_bundle/frameworks/iris-core/.github/workflows/npm-package-dev.yml +59 -0
- package/src/iris_bundle/frameworks/iris-core/.github/workflows/npm-package-release.yml +107 -0
- package/src/iris_bundle/frameworks/iris-core/.github/workflows/vscode-publish.yml +113 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/README.md +372 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/agents/construction-agent.md +80 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/agents/inception-agent.md +97 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/agents/master-agent.md +61 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/agents/operations-agent.md +89 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/commands/construction-agent.md +63 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/commands/inception-agent.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/commands/master-agent.md +47 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/commands/operations-agent.md +77 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/context-config.yaml +67 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/memory-bank.yaml +104 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/quick-start.md +322 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/construction/bolt-list.md +163 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/construction/bolt-replan.md +345 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/construction/bolt-start.md +442 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/construction/bolt-status.md +185 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/construction/navigator.md +196 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/bolt-plan.md +372 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/context.md +171 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/intent-create.md +211 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/intent-list.md +124 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/navigator.md +207 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/requirements.md +227 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/review.md +248 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/story-create.md +304 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/inception/units.md +278 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/master/analyze-context.md +239 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/master/answer-question.md +141 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/master/explain-flow.md +158 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/master/project-init.md +281 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/master/route-request.md +126 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/operations/build.md +237 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/operations/deploy.md +259 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/operations/monitor.md +265 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/operations/navigator.md +209 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/skills/operations/verify.md +224 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-template.md +226 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/ddd-construction-bolt/adr-template.md +49 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/ddd-construction-bolt/ddd-01-domain-model-template.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/ddd-construction-bolt/ddd-02-technical-design-template.md +67 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/ddd-construction-bolt/ddd-03-test-report-template.md +62 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/ddd-construction-bolt.md +528 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/simple-construction-bolt.md +347 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/bolt-types/spike-bolt.md +240 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/construction-log-template.md +129 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/standards/coding-standards.md +29 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/standards/system-architecture.md +22 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/construction/standards/tech-stack.md +19 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/inception-log-template.md +134 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/project/README.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/requirements-template.md +144 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/stories-template.md +38 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/story-template.md +147 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/system-context-template.md +29 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/unit-brief-template.md +177 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/inception/units-template.md +52 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/standards/catalog.yaml +345 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/standards/coding-standards.guide.md +553 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/standards/data-stack.guide.md +162 -0
- package/src/iris_bundle/frameworks/iris-core/.irismd/aidlc/templates/standards/tech-stack.guide.md +280 -0
- package/src/iris_bundle/frameworks/iris-core/.markdownlint.yaml +142 -0
- package/src/iris_bundle/frameworks/iris-core/LICENSE +21 -0
- package/src/iris_bundle/frameworks/iris-core/PRIVACY.md +38 -0
- package/src/iris_bundle/frameworks/iris-core/README.md +397 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/framework.yaml +4 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/interview.yaml +9 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/pack.yaml +2 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/policy.yaml +27 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/routes.yaml +98 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/templates/bolt.md +23 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/templates/doctrine-doc-template.md +33 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/templates/intent.md +23 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/templates/log.md +24 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/templates/review.md +21 -0
- package/src/iris_bundle/frameworks/iris-core/_iris_legacy/templates/unit.md +31 -0
- package/src/iris_bundle/frameworks/iris-core/artifacts.yaml +78 -0
- package/src/iris_bundle/frameworks/iris-core/dev_release_guide.md +324 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/.claude/skills/frontend-design/SKILL.md +106 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/CLAUDE.md +171 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/README.md +20 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/agents/construction-agent.mdx +358 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/agents/inception-agent.mdx +306 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/agents/master-agent.mdx +230 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/agents/operations-agent.mdx +344 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/agents/overview.mdx +187 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/architecture/flows.mdx +136 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/community.mdx +91 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/compare/overview.mdx +167 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/compare/vs-bmad.mdx +167 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/compare/vs-kiro.mdx +208 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/compare/vs-openspec.mdx +140 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/compare/vs-speckit.mdx +146 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/core-concepts/bolts.mdx +268 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/core-concepts/intents.mdx +164 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/core-concepts/memory-bank.mdx +209 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/core-concepts/standards.mdx +277 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/core-concepts/units.mdx +184 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/docs.json +148 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/faq.mdx +364 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/feedback.mdx +55 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/getting-started/installation.mdx +91 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/getting-started/quick-start.mdx +149 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/getting-started/vscode-extension.mdx +180 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/guides/bolt-types.mdx +182 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/extension-gallery/bolts.jpeg +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/extension-gallery/overview.jpeg +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/extension-gallery/specs.jpeg +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/extension-preview.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/favicon.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/hero-dark.svg +129 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/hero-light.svg +129 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/logo.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/old_favicon.svg +40 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/quickstart.cast +3788 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/images/quickstart.gif +0 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/index.mdx +179 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/methodology/ai-dlc-vs-agile.mdx +138 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/methodology/sdlc-reimagined.mdx +270 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/methodology/three-phases.mdx +225 -0
- package/src/iris_bundle/frameworks/iris-core/docs.iris.md/methodology/what-is-ai-dlc.mdx +96 -0
- package/src/iris_bundle/frameworks/iris-core/framework.yaml +4 -0
- package/src/iris_bundle/frameworks/iris-core/images/763995.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/images/763995.svg +354 -0
- package/src/iris_bundle/frameworks/iris-core/images/favicon-64.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/images/favicon.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/images/logo.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/images/old_favicon.svg +40 -0
- package/src/iris_bundle/frameworks/iris-core/images/specs_md_pixel_logo.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/images/specs_md_pixel_logo_big.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/interview.yaml +48 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/PRFAQ.md +193 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/016-analytics-tracker/bolt.md +122 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/016-analytics-tracker/implementation-plan.md +172 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/016-analytics-tracker/implementation-walkthrough.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/016-analytics-tracker/test-walkthrough.md +96 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/017-privacy-documentation/bolt.md +72 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-1/bolt.md +94 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-1/implementation-plan.md +297 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-1/implementation-walkthrough.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-1/test-walkthrough.md +99 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-2/bolt.md +88 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-2/implementation-plan.md +196 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-2/implementation-walkthrough.md +154 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-artifact-parser-2/test-walkthrough.md +119 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-extension-core-1/bolt.md +99 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-extension-core-1/implementation-plan.md +70 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-extension-core-1/implementation-walkthrough.md +45 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-extension-core-1/test-walkthrough.md +60 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-file-watcher-1/bolt.md +86 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-file-watcher-1/implementation-plan.md +154 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-file-watcher-1/implementation-walkthrough.md +43 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-file-watcher-1/test-walkthrough.md +74 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-1/bolt.md +89 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-1/implementation-plan.md +76 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-1/implementation-walkthrough.md +43 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-1/test-walkthrough.md +70 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-2/bolt.md +90 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-2/implementation-plan.md +93 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-2/implementation-walkthrough.md +44 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-2/test-walkthrough.md +54 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-3/bolt.md +90 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-3/implementation-plan.md +168 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-3/implementation-walkthrough.md +137 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-3/test-walkthrough.md +134 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-4/bolt.md +93 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-4/implementation-plan.md +176 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-4/implementation-walkthrough.md +159 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-4/test-walkthrough.md +105 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-5/bolt.md +104 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-sidebar-provider-5/implementation-plan.md +146 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-1/bolt.md +83 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-1/implementation-plan.md +161 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-1/implementation-walkthrough.md +58 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-1/test-walkthrough.md +104 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-2/bolt.md +83 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-2/implementation-plan.md +179 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-2/implementation-walkthrough.md +124 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-2/test-walkthrough.md +95 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-3/bolt.md +83 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-3/implementation-plan.md +196 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-3/implementation-walkthrough.md +207 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-3/test-walkthrough.md +194 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-4/bolt.md +92 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-4/implementation-plan.md +217 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-4/implementation-walkthrough.md +138 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-4/test-walkthrough.md +196 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-5/bolt.md +89 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-5/implementation-plan.md +181 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-5/implementation-walkthrough.md +160 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-webview-lit-migration-5/test-walkthrough.md +121 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-welcome-view-1/bolt.md +92 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-welcome-view-1/implementation-plan.md +73 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-welcome-view-1/implementation-walkthrough.md +44 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/bolts/bolt-welcome-view-1/test-walkthrough.md +49 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/glossary.md +197 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/requirements.md +129 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/research/approval-gates-simplification.md +839 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/research/archive/approval-gates-analysis.md +331 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/system-context.md +167 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/units/construction-agent/unit-brief.md +111 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/units/inception-agent/unit-brief.md +135 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/units/master-agent/unit-brief.md +580 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/units/operations-agent/unit-brief.md +72 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/001-multi-agent-orchestration/units.md +168 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/requirements.md +96 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/system-context.md +170 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/antigravity-installer/unit-brief.md +156 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/claude-code-installer/unit-brief.md +180 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/cline-installer/unit-brief.md +106 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/codex-installer/unit-brief.md +106 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/copilot-installer/unit-brief.md +139 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/cursor-installer/unit-brief.md +119 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/gemini-installer/unit-brief.md +107 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/installer-core/unit-brief.md +240 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/kilo-installer/unit-brief.md +106 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/kiro-installer/unit-brief.md +108 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/opencode-installer/unit-brief.md +107 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/roo-installer/unit-brief.md +107 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units/windsurf-installer/unit-brief.md +128 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/002-agentic-coding-tool-integration/units.md +188 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/003-memory-bank-system/requirements.md +196 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/003-memory-bank-system/system-context.md +181 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/003-memory-bank-system/units/artifact-storage/unit-brief.md +192 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/003-memory-bank-system/units/configuration-schema/unit-brief.md +204 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/003-memory-bank-system/units/context-loader/unit-brief.md +245 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/003-memory-bank-system/units.md +97 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/004-standards-system/requirements.md +125 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/004-standards-system/system-context.md +158 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/004-standards-system/units/facilitation-guides/unit-brief.md +250 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/004-standards-system/units/standards-catalog/unit-brief.md +355 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/004-standards-system/units/standards-templates/unit-brief.md +394 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/004-standards-system/units.md +110 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/requirements.md +188 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/system-context.md +229 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/units/01-specification-contract-testing/unit-brief.md +197 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/units/02-cli-installer-testing/unit-brief.md +377 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/units/03-golden-dataset-management/unit-brief.md +465 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/units/04-agent-behavior-evaluation/unit-brief.md +459 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/units/05-cicd-integration/unit-brief.md +587 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/005-testing-strategy/units.md +332 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/006-brownfield-support/requirements.md +214 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/requirements.md +308 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/system-context.md +335 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/construction-log.md +52 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/stories/001-initialize-mixpanel.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/stories/002-detect-shell.md +68 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/stories/003-check-telemetry-disabled.md +66 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/stories/004-track-installer-events.md +67 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/stories/005-track-selection-events.md +66 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/stories/006-cli-no-telemetry-flag.md +59 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/001-analytics-tracker/unit-brief.md +191 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/002-privacy-documentation/stories/001-create-privacy-md.md +58 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/002-privacy-documentation/stories/002-add-readme-section.md +61 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units/002-privacy-documentation/unit-brief.md +158 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/007-installer-analytics/units.md +453 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/008-terminal-dashboard/requirements.md +222 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/008-terminal-dashboard/system-context.md +198 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/008-terminal-dashboard/units.md +275 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/009-versioning-strategy/requirements.md +308 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/009-versioning-strategy/system-context.md +273 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/009-versioning-strategy/units.md +312 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/010-smart-unit-decomposition/requirements.md +111 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/010-smart-unit-decomposition/system-context.md +154 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/010-smart-unit-decomposition/units.md +102 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/inception-log.md +101 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/requirements.md +282 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/system-context.md +114 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/construction-log.md +57 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/stories/001-memory-bank-schema.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/stories/002-project-detection.md +54 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/stories/003-artifact-parsing.md +57 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/stories/004-frontmatter-parser.md +61 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/stories/005-bolt-dependencies.md +58 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/stories/006-activity-feed-derivation.md +70 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/artifact-parser/unit-brief.md +223 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/extension-core/construction-log.md +59 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/extension-core/stories/001-extension-activation.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/extension-core/stories/002-command-registration.md +54 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/extension-core/stories/003-file-operation-commands.md +57 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/extension-core/unit-brief.md +224 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/file-watcher/construction-log.md +52 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/file-watcher/stories/001-file-system-watcher.md +57 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/file-watcher/stories/002-debounced-refresh.md +53 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/file-watcher/unit-brief.md +173 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/construction-log.md +63 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/001-tree-data-provider.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/002-intent-unit-story-tree.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/003-bolt-tree.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/004-status-icons.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/005-pixel-logo-footer.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/006-webview-tab-architecture.md +62 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/007-command-center-bolts-tab.md +65 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/008-current-focus-card.md +62 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/009-up-next-queue.md +61 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/010-activity-feed-ui.md +63 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/011-filewatcher-statestore-integration.md +49 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/012-next-actions-ui.md +57 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/013-start-bolt-action.md +72 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/014-intent-selection-strategies.md +54 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/015-persist-expanded-state.md +56 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/016-bolt-filtering.md +72 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/017-activity-open-button.md +50 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/018-specs-view.md +63 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/stories/019-overview-view.md +84 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/sidebar-provider/unit-brief.md +305 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/020-fix-infinite-rerender.md +144 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/021-remove-duplicate-files.md +94 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/022-setup-esbuild.md +156 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/023-lit-scaffold.md +202 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/024-tabs-component.md +161 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/025-bolts-view-components.md +182 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/026-specs-view-components.md +223 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/027-overview-view-components.md +391 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/028-state-context.md +317 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/stories/029-ipc-typed-messaging.md +396 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/webview-lit-migration/unit-brief.md +133 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/welcome-view/construction-log.md +58 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/welcome-view/stories/001-welcome-view-ui.md +57 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/welcome-view/stories/002-install-button-flow.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/welcome-view/stories/003-post-installation-detection.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units/welcome-view/unit-brief.md +211 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/intents/011-vscode-extension/units.md +129 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/maintenance-log.md +21 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/project.yaml +16 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/research/test_strategy/promptfoo-specsmd-tutorial.md +911 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/research/test_strategy/promptfoo-tutorial.md +796 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/research/test_strategy/testing-strategy.md +1057 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/research/unified-modernization-model.md +559 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/research/vibe-to-production-academic-research.md +578 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/research/vibe-to-spec-flow-options.md +547 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/standards/coding-standards.md +217 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/standards/output-formatting.md +202 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/standards/skill-template.md +308 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/standards/system-architecture.md +177 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/standards/tech-stack.md +88 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/story-index.md +154 -0
- package/src/iris_bundle/frameworks/iris-core/memory-bank/term-mappings.md +121 -0
- package/src/iris_bundle/frameworks/iris-core/pack.yaml +2 -0
- package/src/iris_bundle/frameworks/iris-core/package.json +11 -0
- package/src/iris_bundle/frameworks/iris-core/policy.yaml +73 -0
- package/src/iris_bundle/frameworks/iris-core/resources/ai-dlc-specification.md +286 -0
- package/src/iris_bundle/frameworks/iris-core/resources/aidlc.pdf +0 -0
- package/src/iris_bundle/frameworks/iris-core/resources/images/aidlc-core-framework.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/resources/images/aidlc-phases-detail.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/resources/images/aidlc-workflow-steps.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/routes.yaml +98 -0
- package/src/iris_bundle/frameworks/iris-core/src/README.md +322 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/schemas/agent.schema.yaml +20 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/schemas/catalog.schema.yaml +60 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/schemas/context-config.schema.yaml +24 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/schemas/memory-bank.schema.yaml +61 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/schemas/skill.schema.yaml +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/analytics/analytics.test.ts +240 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/architecture/bolt-type-agnostic.test.ts +282 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/flow-consistency/code-examples.test.ts +93 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/flow-consistency/helpers.ts +79 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/flow-consistency/placeholder-consistency.test.ts +76 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/flow-consistency/reference-integrity.test.ts +92 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/flow-consistency/terminology-consistency.test.ts +72 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/schema-validation/markdown-schema.test.ts +55 -0
- package/src/iris_bundle/frameworks/iris-core/src/__tests__/unit/schema-validation/yaml-config-schema.test.ts +53 -0
- package/src/iris_bundle/frameworks/iris-core/src/bin/cli.js +21 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/README.md +372 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/agents/construction-agent.md +80 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/agents/inception-agent.md +97 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/agents/master-agent.md +61 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/agents/operations-agent.md +89 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/commands/construction-agent.md +63 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/commands/inception-agent.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/commands/master-agent.md +47 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/commands/operations-agent.md +77 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/context-config.yaml +67 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/memory-bank.yaml +104 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/quick-start.md +322 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/construction/bolt-list.md +163 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/construction/bolt-replan.md +345 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/construction/bolt-start.md +442 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/construction/bolt-status.md +185 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/construction/navigator.md +196 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/bolt-plan.md +372 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/context.md +171 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/intent-create.md +211 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/intent-list.md +124 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/navigator.md +207 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/requirements.md +227 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/review.md +248 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/story-create.md +304 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/inception/units.md +278 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/master/analyze-context.md +239 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/master/answer-question.md +141 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/master/explain-flow.md +158 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/master/project-init.md +281 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/master/route-request.md +126 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/operations/build.md +237 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/operations/deploy.md +259 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/operations/monitor.md +265 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/operations/navigator.md +209 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/skills/operations/verify.md +224 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-template.md +226 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/ddd-construction-bolt/adr-template.md +49 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/ddd-construction-bolt/ddd-01-domain-model-template.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/ddd-construction-bolt/ddd-02-technical-design-template.md +67 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/ddd-construction-bolt/ddd-03-test-report-template.md +62 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/ddd-construction-bolt.md +528 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/simple-construction-bolt.md +347 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/bolt-types/spike-bolt.md +240 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/construction-log-template.md +129 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/standards/coding-standards.md +29 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/standards/system-architecture.md +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/construction/standards/tech-stack.md +19 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/inception-log-template.md +134 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/project/README.md +55 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/requirements-template.md +144 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/stories-template.md +38 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/story-template.md +147 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/system-context-template.md +29 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/unit-brief-template.md +177 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/inception/units-template.md +52 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/standards/catalog.yaml +345 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/standards/coding-standards.guide.md +553 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/standards/data-stack.guide.md +162 -0
- package/src/iris_bundle/frameworks/iris-core/src/flows/aidlc/templates/standards/tech-stack.guide.md +280 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/InstallerFactory.js +36 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/analytics/env-detector.js +92 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/analytics/index.js +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/analytics/machine-id.js +33 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/analytics/tracker.js +232 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/cli-utils.js +342 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/constants.js +32 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installer.js +402 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/AntigravityInstaller.js +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/ClaudeInstaller.js +85 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/ClineInstaller.js +21 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/CodexInstaller.js +21 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/CopilotInstaller.js +113 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/CursorInstaller.js +63 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/GeminiInstaller.js +75 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/KiroInstaller.js +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/OpenCodeInstaller.js +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/RooInstaller.js +22 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/ToolInstaller.js +73 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/installers/WindsurfInstaller.js +76 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/markdown-validator.ts +175 -0
- package/src/iris_bundle/frameworks/iris-core/src/lib/yaml-validator.ts +99 -0
- package/src/iris_bundle/frameworks/iris-core/src/package-lock.json +9922 -0
- package/src/iris_bundle/frameworks/iris-core/src/package.json +118 -0
- package/src/iris_bundle/frameworks/iris-core/src/scripts/artifact-validator.js +594 -0
- package/src/iris_bundle/frameworks/iris-core/src/scripts/bolt-complete.js +606 -0
- package/src/iris_bundle/frameworks/iris-core/src/scripts/status-integrity.js +598 -0
- package/src/iris_bundle/frameworks/iris-core/src/specs_md_pixel_logo.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/src/tsconfig.json +16 -0
- package/src/iris_bundle/frameworks/iris-core/src/vitest.config.ts +12 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/.claude/skills/frontend-design/SKILL.md +42 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/.mocharc.json +5 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/.vscodeignore +17 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/DEVGUIDE.md +103 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/LICENSE +21 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/README.md +198 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/index.html +635 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-1-metrics-dashboard.html +542 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-10-dual-view-focus.html +1105 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-11-dual-view-grouped.html +2304 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-12-dependency-graph.html +1400 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-13-hierarchy-explorer.html +1278 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-14-swimlane-deps.html +1370 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-2-pipeline-flow.html +673 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-3-focus-mode.html +898 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-4-kanban-board.html +858 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-5-timeline.html +890 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-6-activity-feed.html +923 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-7-heatmap-grid.html +932 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-8-2-spec.md +657 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-8-2.html +2098 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-8-command-center.html +2043 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-8a-command-center-timeline.html +1222 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/design-mockups/variation-9-dual-view.html +1101 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/esbuild.webview.mjs +70 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/eslint.config.mjs +36 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/package-lock.json +5712 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/package.json +116 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/resources/extension-preview.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/resources/extension_icon.svg +40 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/resources/favicon-64.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/resources/favicon.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/resources/favicon.svg +40 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/resources/logo.png +0 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/extension.ts +142 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/activityFeed.ts +184 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/artifactParser.ts +477 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/boltTypeParser.ts +191 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/dependencyComputation.ts +157 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/frontmatterParser.ts +144 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/index.ts +93 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/memoryBankSchema.ts +140 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/projectDetection.ts +132 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/parser/types.ts +241 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/iconHelper.ts +82 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/index.ts +85 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/treeBuilder.ts +289 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/treeProvider.ts +225 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/types.ts +254 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/webviewMessaging.ts +306 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/sidebar/webviewProvider.ts +866 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/state/index.ts +114 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/state/selectors.ts +652 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/state/stateStore.ts +419 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/state/types.ts +311 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/parser/activityFeed.test.ts +269 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/parser/artifactParser.test.ts +440 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/parser/dependencyComputation.test.ts +288 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/parser/frontmatterParser.test.ts +191 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/parser/memoryBankSchema.test.ts +185 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/parser/projectDetection.test.ts +146 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/runTest.ts +20 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/sidebar/treeBuilder.test.ts +329 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/sidebar/types.test.ts +239 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/sidebar/webviewContent.test.ts +67 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/sidebar/webviewMessaging.test.ts +369 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/sidebar/webviewProvider.test.ts +282 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/state/selectors.test.ts +457 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/state/stateStore.test.ts +622 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/watcher/debounce.test.ts +155 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/test/watcher/fileWatcher.test.ts +77 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/watcher/debounce.ts +70 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/watcher/fileWatcher.ts +147 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/watcher/index.ts +39 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/watcher/types.ts +43 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/app.ts +870 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/activity-feed.ts +232 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/activity-item.ts +208 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/bolts-view.ts +201 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/completion-item.ts +299 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/completions-section.ts +197 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/current-bolts.ts +184 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/focus-card.ts +431 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/focus-section.ts +179 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/queue-item.ts +306 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/queue-section.ts +198 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/bolts/stories-list.ts +151 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/shared/base-element.ts +29 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/shared/empty-state.ts +82 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/shared/progress-bar.ts +120 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/shared/progress-ring.ts +100 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/shared/stage-pipeline.ts +133 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/components/tabs/view-tabs.ts +127 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/html.ts +542 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/index.ts +104 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/lit/index.ts +16 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/scripts.ts +241 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/styles/theme.ts +50 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/styles.ts +1194 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/types/messages.ts +40 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/types/vscode.ts +13 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/utils/messaging.ts +57 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/utils.ts +16 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/webview/vscode-api.ts +14 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/welcome/WelcomeViewProvider.ts +254 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/welcome/index.ts +9 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/src/welcome/installHandler.ts +82 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/tsconfig.json +30 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/tsconfig.test.json +26 -0
- package/src/iris_bundle/frameworks/iris-core/vs-code-extension/tsconfig.webview.json +23 -0
|
@@ -0,0 +1,911 @@
|
|
|
1
|
+
# Testing irismd Agents with Promptfoo
|
|
2
|
+
|
|
3
|
+
A practical guide to testing AI-DLC agents using Promptfoo, including test setup, golden datasets, and free model recommendations.
|
|
4
|
+
|
|
5
|
+
---
|
|
6
|
+
|
|
7
|
+
## Table of Contents
|
|
8
|
+
|
|
9
|
+
1. [Golden Datasets Explained](#golden-datasets-explained)
|
|
10
|
+
2. [Test Setup and Fixtures](#test-setup-and-fixtures)
|
|
11
|
+
3. [Free Coding Models on OpenRouter](#free-coding-models-on-openrouter)
|
|
12
|
+
4. [Testing Each Agent](#testing-each-agent)
|
|
13
|
+
5. [Complete Example Configuration](#complete-example-configuration)
|
|
14
|
+
|
|
15
|
+
---
|
|
16
|
+
|
|
17
|
+
## Golden Datasets Explained
|
|
18
|
+
|
|
19
|
+
### What is a Golden Dataset?
|
|
20
|
+
|
|
21
|
+
A **golden dataset** is a curated collection of **known-good input/output pairs** that serve as your quality baseline. Think of it as "these are examples of what correct agent behavior looks like."
|
|
22
|
+
|
|
23
|
+
```text
|
|
24
|
+
┌─────────────────────────────────────────────────────────────────────────┐
|
|
25
|
+
│ GOLDEN DATASET │
|
|
26
|
+
├─────────────────────────────────────────────────────────────────────────┤
|
|
27
|
+
│ │
|
|
28
|
+
│ INPUT (What user asks) OUTPUT (What agent should produce) │
|
|
29
|
+
│ ───────────────────── ───────────────────────────────── │
|
|
30
|
+
│ │
|
|
31
|
+
│ "Create an intent for → # Intent: User Authentication │
|
|
32
|
+
│ user authentication" ## Problem Statement │
|
|
33
|
+
│ Users need secure login... │
|
|
34
|
+
│ ## Success Criteria │
|
|
35
|
+
│ - 99.9% uptime... │
|
|
36
|
+
│ │
|
|
37
|
+
│ This is a GOLDEN EXAMPLE - we verified this is high quality │
|
|
38
|
+
│ Future outputs are compared against this baseline │
|
|
39
|
+
│ │
|
|
40
|
+
└─────────────────────────────────────────────────────────────────────────┘
|
|
41
|
+
```
|
|
42
|
+
|
|
43
|
+
### Why Golden Datasets Matter
|
|
44
|
+
|
|
45
|
+
| Problem | How Golden Datasets Solve It |
|
|
46
|
+
|---------|------------------------------|
|
|
47
|
+
| LLM outputs vary each run | Compare to known-good baseline using similarity |
|
|
48
|
+
| "Is this output good?" is subjective | Golden examples define what "good" looks like |
|
|
49
|
+
| Regressions are hard to detect | If similarity drops, something broke |
|
|
50
|
+
| New team members don't know the quality bar | Golden examples document expectations |
|
|
51
|
+
|
|
52
|
+
### Golden Dataset Structure
|
|
53
|
+
|
|
54
|
+
```text
|
|
55
|
+
__tests__/
|
|
56
|
+
├── golden-datasets/
|
|
57
|
+
│ ├── inception-agent/
|
|
58
|
+
│ │ ├── inputs/
|
|
59
|
+
│ │ │ ├── 001-simple-auth.txt # User request
|
|
60
|
+
│ │ │ ├── 002-payment-system.txt
|
|
61
|
+
│ │ │ └── 003-refactoring-legacy.txt
|
|
62
|
+
│ │ ├── outputs/
|
|
63
|
+
│ │ │ ├── 001-simple-auth.md # Expected output
|
|
64
|
+
│ │ │ ├── 002-payment-system.md
|
|
65
|
+
│ │ │ └── 003-refactoring-legacy.md
|
|
66
|
+
│ │ └── context/ # Required state (fixtures)
|
|
67
|
+
│ │ ├── 001-simple-auth/
|
|
68
|
+
│ │ │ └── memory-bank/ # Memory bank state for test
|
|
69
|
+
│ │ └── 002-payment-system/
|
|
70
|
+
│ │
|
|
71
|
+
│ ├── construction-agent/
|
|
72
|
+
│ │ ├── inputs/
|
|
73
|
+
│ │ ├── outputs/
|
|
74
|
+
│ │ └── context/ # Pre-populated memory bank
|
|
75
|
+
│ │ ├── 001-start-bolt/
|
|
76
|
+
│ │ │ └── memory-bank/
|
|
77
|
+
│ │ │ ├── intents/
|
|
78
|
+
│ │ │ │ └── 001-user-auth/
|
|
79
|
+
│ │ │ ├── bolts/
|
|
80
|
+
│ │ │ │ └── bolt-auth-1.md
|
|
81
|
+
│ │ │ └── standards/
|
|
82
|
+
│ │ └── 002-continue-bolt/
|
|
83
|
+
│ │
|
|
84
|
+
│ └── master-agent/
|
|
85
|
+
│ ├── inputs/
|
|
86
|
+
│ ├── outputs/
|
|
87
|
+
│ └── context/
|
|
88
|
+
```
|
|
89
|
+
|
|
90
|
+
### Building Golden Examples
|
|
91
|
+
|
|
92
|
+
**Step 1: Run the agent and capture output**
|
|
93
|
+
|
|
94
|
+
```bash
|
|
95
|
+
# Run agent, save output
|
|
96
|
+
promptfoo eval --output captured.json
|
|
97
|
+
```
|
|
98
|
+
|
|
99
|
+
**Step 2: Human review**
|
|
100
|
+
|
|
101
|
+
- Is this output high quality?
|
|
102
|
+
- Does it follow our formatting rules?
|
|
103
|
+
- Would we be happy if users saw this?
|
|
104
|
+
|
|
105
|
+
**Step 3: If yes, promote to golden**
|
|
106
|
+
|
|
107
|
+
```bash
|
|
108
|
+
# Save the reviewed response text (extracted from captured.json) as a golden example
|
|
109
|
+
cp captured-output.md __tests__/golden-datasets/inception-agent/outputs/001-auth.md
|
|
110
|
+
```
|
|
111
|
+
|
|
112
|
+
**Step 4: Use in regression tests**
|
|
113
|
+
|
|
114
|
+
```yaml
|
|
115
|
+
# promptfoo.yaml
|
|
116
|
+
tests:
|
|
117
|
+
- vars:
|
|
118
|
+
request: file://golden-datasets/inception-agent/inputs/001-auth.txt
|
|
119
|
+
assert:
|
|
120
|
+
- type: similar
|
|
121
|
+
value: file://golden-datasets/inception-agent/outputs/001-auth.md
|
|
122
|
+
threshold: 0.85 # 85% similarity required
|
|
123
|
+
```
|
|
124
|
+
|
|
125
|
+
### Similarity Thresholds
|
|
126
|
+
|
|
127
|
+
| Threshold | Meaning | When to Use |
|
|
128
|
+
|-----------|---------|-------------|
|
|
129
|
+
| 0.95+ | Nearly identical | Exact format matters (templates) |
|
|
130
|
+
| 0.85-0.95 | Same content, minor variations | Most agent tests |
|
|
131
|
+
| 0.75-0.85 | Same concepts, different wording | Creative outputs |
|
|
132
|
+
| <0.75 | Significant difference | Likely a regression |
|
|
133
|
+
|
|
134
|
+
---
|
|
135
|
+
|
|
136
|
+
## Test Setup and Fixtures
|
|
137
|
+
|
|
138
|
+
### The Problem: Agents Need State
|
|
139
|
+
|
|
140
|
+
Each agent expects the memory bank to be in a specific state:
|
|
141
|
+
|
|
142
|
+
```text
|
|
143
|
+
┌─────────────────────────────────────────────────────────────────────────┐
|
|
144
|
+
│ AGENT STATE REQUIREMENTS │
|
|
145
|
+
├─────────────────────────────────────────────────────────────────────────┤
|
|
146
|
+
│ │
|
|
147
|
+
│ MASTER AGENT │
|
|
148
|
+
│ └── Needs: memory-bank.yaml exists │
|
|
149
|
+
│ └── Can work with: empty project OR existing intents │
|
|
150
|
+
│ │
|
|
151
|
+
│ INCEPTION AGENT │
|
|
152
|
+
│ └── Needs: memory-bank.yaml, standards/ (optional) │
|
|
153
|
+
│ └── Can work with: new intent OR continue existing │
|
|
154
|
+
│ │
|
|
155
|
+
│ CONSTRUCTION AGENT ← Most state requirements │
|
|
156
|
+
│ └── Needs: memory-bank.yaml │
|
|
157
|
+
│ └── Needs: intents/{intent}/ with requirements, units │
|
|
158
|
+
│ └── Needs: bolts/{bolt-id}/ with bolt files │
|
|
159
|
+
│ └── Needs: standards/ (tech-stack, coding-standards) │
|
|
160
|
+
│ │
|
|
161
|
+
│ OPERATIONS AGENT │
|
|
162
|
+
│ └── Needs: completed bolts │
|
|
163
|
+
│ └── Needs: deployment config │
|
|
164
|
+
│ │
|
|
165
|
+
└─────────────────────────────────────────────────────────────────────────┘
|
|
166
|
+
```
|
|
167
|
+
|
|
168
|
+
### Solution: Test Fixtures
|
|
169
|
+
|
|
170
|
+
**Fixtures** are pre-configured memory bank states that tests can load before running.
|
|
171
|
+
|
|
172
|
+
```text
|
|
173
|
+
__tests__/
|
|
174
|
+
└── fixtures/
|
|
175
|
+
└── memory-bank-states/
|
|
176
|
+
│
|
|
177
|
+
├── 01-empty-project/ # Fresh install
|
|
178
|
+
│ └── .irismd/
|
|
179
|
+
│ └── aidlc/
|
|
180
|
+
│ └── memory-bank.yaml
|
|
181
|
+
│
|
|
182
|
+
├── 02-initialized-project/ # After project-init
|
|
183
|
+
│ └── memory-bank/
|
|
184
|
+
│ ├── standards/
|
|
185
|
+
│ │ ├── tech-stack.md
|
|
186
|
+
│ │ └── coding-standards.md
|
|
187
|
+
│ └── project.yaml
|
|
188
|
+
│
|
|
189
|
+
├── 03-inception-started/ # Intent created, no units
|
|
190
|
+
│ └── memory-bank/
|
|
191
|
+
│ ├── standards/
|
|
192
|
+
│ └── intents/
|
|
193
|
+
│ └── 001-user-auth/
|
|
194
|
+
│ ├── requirements.md
|
|
195
|
+
│ └── system-context.md
|
|
196
|
+
│
|
|
197
|
+
├── 04-inception-complete/ # Ready for Construction
|
|
198
|
+
│ └── memory-bank/
|
|
199
|
+
│ ├── standards/
|
|
200
|
+
│ ├── intents/
|
|
201
|
+
│ │ └── 001-user-auth/
|
|
202
|
+
│ │ ├── requirements.md
|
|
203
|
+
│ │ ├── system-context.md
|
|
204
|
+
│ │ ├── units.md
|
|
205
|
+
│ │ └── units/
|
|
206
|
+
│ │ └── auth-service/
|
|
207
|
+
│ │ ├── unit-brief.md
|
|
208
|
+
│ │ └── stories/
|
|
209
|
+
│ │ ├── 001-auth-service.md
|
|
210
|
+
│ │ └── 002-auth-service.md
|
|
211
|
+
│ └── bolts/
|
|
212
|
+
│ ├── bolt-auth-service-1/
|
|
213
|
+
│ │ └── bolt.md # status: planned
|
|
214
|
+
│ └── bolt-auth-service-2/
|
|
215
|
+
│ └── bolt.md # status: planned
|
|
216
|
+
│
|
|
217
|
+
├── 05-construction-in-progress/ # Bolt partially complete
|
|
218
|
+
│ └── memory-bank/
|
|
219
|
+
│ ├── ... (all above)
|
|
220
|
+
│ └── bolts/
|
|
221
|
+
│ └── bolt-auth-service-1/
|
|
222
|
+
│ ├── bolt.md # status: in-progress, stage: design
|
|
223
|
+
│ └── ddd-01-domain-model.md # Completed artifact
|
|
224
|
+
│
|
|
225
|
+
└── 06-construction-complete/ # Ready for Operations
|
|
226
|
+
└── memory-bank/
|
|
227
|
+
├── ... (all above)
|
|
228
|
+
└── bolts/
|
|
229
|
+
└── bolt-auth-service-1/
|
|
230
|
+
├── bolt.md # status: completed
|
|
231
|
+
├── ddd-01-domain-model.md
|
|
232
|
+
├── ddd-02-technical-design.md
|
|
233
|
+
└── ddd-03-test-report.md
|
|
234
|
+
```
|
|
235
|
+
|
|
236
|
+
### Using Fixtures in Tests
|
|
237
|
+
|
|
238
|
+
#### Option 1: Copy Fixture Before Test (Recommended)
|
|
239
|
+
|
|
240
|
+
```yaml
|
|
241
|
+
# promptfoo.yaml
|
|
242
|
+
tests:
|
|
243
|
+
- description: "Construction agent continues bolt"
|
|
244
|
+
setup: |
|
|
245
|
+
# Copy fixture to test directory
|
|
246
|
+
rm -rf ./test-workspace
|
|
247
|
+
cp -r ./__tests__/fixtures/memory-bank-states/05-construction-in-progress ./test-workspace
|
|
248
|
+
vars:
|
|
249
|
+
workspace: ./test-workspace
|
|
250
|
+
command: "bolt-start --bolt-id=bolt-auth-service-1"
|
|
251
|
+
assert:
|
|
252
|
+
- type: contains
|
|
253
|
+
value: "Stage: design"
|
|
254
|
+
```
|
|
255
|
+
|
|
256
|
+
#### Option 2: Include State in Prompt Context
|
|
257
|
+
|
|
258
|
+
```yaml
|
|
259
|
+
# promptfoo.yaml
|
|
260
|
+
prompts:
|
|
261
|
+
- |
|
|
262
|
+
You are the Construction Agent.
|
|
263
|
+
|
|
264
|
+
## Current Memory Bank State
|
|
265
|
+
{{memory_bank_state}}
|
|
266
|
+
|
|
267
|
+
## User Request
|
|
268
|
+
{{request}}
|
|
269
|
+
|
|
270
|
+
tests:
|
|
271
|
+
- description: "Construction agent with pre-loaded state"
|
|
272
|
+
vars:
|
|
273
|
+
memory_bank_state: file://fixtures/memory-bank-states/05-construction-in-progress/state.md
|
|
274
|
+
request: "Continue bolt-auth-service-1"
|
|
275
|
+
```
|
|
276
|
+
|
|
277
|
+
#### Option 3: JavaScript Setup/Teardown
|
|
278
|
+
|
|
279
|
+
```javascript
|
|
280
|
+
// promptfoo.config.js
|
|
281
|
+
const fs = require('fs-extra');
|
|
282
|
+
const path = require('path');
|
|
283
|
+
|
|
284
|
+
module.exports = {
|
|
285
|
+
prompts: ['file://prompts/construction-agent.txt'],
|
|
286
|
+
|
|
287
|
+
providers: ['openrouter:meta-llama/llama-3.3-70b-instruct:free'],
|
|
288
|
+
|
|
289
|
+
tests: [
|
|
290
|
+
{
|
|
291
|
+
description: 'Start bolt from inception-complete state',
|
|
292
|
+
|
|
293
|
+
// Setup: Copy fixture before test
|
|
294
|
+
setup: async () => {
|
|
295
|
+
const fixture = path.join(__dirname, 'fixtures/memory-bank-states/04-inception-complete');
|
|
296
|
+
const workspace = path.join(__dirname, 'test-workspace');
|
|
297
|
+
await fs.remove(workspace);
|
|
298
|
+
await fs.copy(fixture, workspace);
|
|
299
|
+
return { workspace };
|
|
300
|
+
},
|
|
301
|
+
|
|
302
|
+
// Teardown: Clean up after test
|
|
303
|
+
teardown: async ({ workspace }) => {
|
|
304
|
+
await fs.remove(workspace);
|
|
305
|
+
},
|
|
306
|
+
|
|
307
|
+
vars: {
|
|
308
|
+
command: 'bolt-start --bolt-id=bolt-auth-service-1',
|
|
309
|
+
},
|
|
310
|
+
|
|
311
|
+
assert: [
|
|
312
|
+
{ type: 'contains', value: 'Stage 1: Domain Model' },
|
|
313
|
+
{ type: 'contains', value: '## Activities' },
|
|
314
|
+
],
|
|
315
|
+
},
|
|
316
|
+
],
|
|
317
|
+
};
|
|
318
|
+
```
|
|
319
|
+
|
|
320
|
+
### State Transition Testing
|
|
321
|
+
|
|
322
|
+
Test that agents correctly transition between states:
|
|
323
|
+
|
|
324
|
+
```yaml
|
|
325
|
+
# state-transition-tests.yaml
|
|
326
|
+
tests:
|
|
327
|
+
# Test: Inception creates correct state for Construction
|
|
328
|
+
- description: "Inception → Construction transition"
|
|
329
|
+
vars:
|
|
330
|
+
initial_state: file://fixtures/03-inception-started/
|
|
331
|
+
command: "bolt-plan"
|
|
332
|
+
assert:
|
|
333
|
+
- type: llm-rubric
|
|
334
|
+
value: |
|
|
335
|
+
The output should create bolt files that Construction Agent can execute.
|
|
336
|
+
Check:
|
|
337
|
+
1. Bolt files have correct frontmatter (id, unit, type, status: planned)
|
|
338
|
+
2. Stories are assigned to bolts
|
|
339
|
+
3. Dependencies are specified
|
|
340
|
+
Return PASS if Construction Agent could start these bolts.
|
|
341
|
+
|
|
342
|
+
# Test: Construction completes to Operations-ready state
|
|
343
|
+
- description: "Construction → Operations transition"
|
|
344
|
+
vars:
|
|
345
|
+
initial_state: file://fixtures/05-construction-in-progress/
|
|
346
|
+
command: "bolt-start --bolt-id=bolt-auth-service-1"
|
|
347
|
+
# Simulate completing all stages
|
|
348
|
+
assert:
|
|
349
|
+
- type: llm-rubric
|
|
350
|
+
value: |
|
|
351
|
+
After bolt completion, verify:
|
|
352
|
+
1. Bolt status is "completed"
|
|
353
|
+
2. All stage artifacts exist
|
|
354
|
+
3. Test report shows passing tests
|
|
355
|
+
Return PASS if Operations Agent could deploy this.
|
|
356
|
+
```
|
|
357
|
+
|
|
358
|
+
---
|
|
359
|
+
|
|
360
|
+
## Free Coding Models on OpenRouter
|
|
361
|
+
|
|
362
|
+
Since irismd agents are used by AI coding tools, here are the best **free** models for testing agents and for serving as an LLM-as-judge:
|
|
363
|
+
|
|
364
|
+
### Recommended Free Models
|
|
365
|
+
|
|
366
|
+
| Model ID | Context | Best For | Speed |
|
|
367
|
+
|----------|---------|----------|-------|
|
|
368
|
+
| `x-ai/grok-4.1-fast:free` | 2M | **Coding, tool calling, agentic** | Very Fast |
|
|
369
|
+
| `meta-llama/llama-4-maverick:free` | 1M | General + coding, multimodal | Fast |
|
|
370
|
+
| `meta-llama/llama-3.3-70b-instruct:free` | 128k | High quality reasoning | Medium |
|
|
371
|
+
| `qwen/qwen3-coder:free` | 256k | **Code-specialized** | Fast |
|
|
372
|
+
| `qwen/qwen3-235b-a22b:free` | 128k | Large MoE, general | Medium |
|
|
373
|
+
| `google/gemma-3-27b-it:free` | 128k | Good quality, fast | Fast |
|
|
374
|
+
| `mistralai/mistral-small-3.1-24b-instruct:free` | 128k | Balanced | Fast |
|
|
375
|
+
|
|
376
|
+
### Coding-Focused Recommendations
|
|
377
|
+
|
|
378
|
+
```yaml
|
|
379
|
+
# For testing coding agents (Construction Agent)
|
|
380
|
+
providers:
|
|
381
|
+
# Best free coding model - xAI optimized for agentic coding
|
|
382
|
+
- id: openrouter:x-ai/grok-4.1-fast:free
|
|
383
|
+
label: grok-coding-free
|
|
384
|
+
config:
|
|
385
|
+
temperature: 0
|
|
386
|
+
|
|
387
|
+
# Qwen's code-specialized model
|
|
388
|
+
- id: openrouter:qwen/qwen3-coder:free
|
|
389
|
+
label: qwen-coder-free
|
|
390
|
+
config:
|
|
391
|
+
temperature: 0
|
|
392
|
+
|
|
393
|
+
# Llama 4 Maverick - huge context, good at code
|
|
394
|
+
- id: openrouter:meta-llama/llama-4-maverick:free
|
|
395
|
+
label: llama4-maverick-free
|
|
396
|
+
config:
|
|
397
|
+
temperature: 0
|
|
398
|
+
```
|
|
399
|
+
|
|
400
|
+
### Model Selection by Test Type
|
|
401
|
+
|
|
402
|
+
```yaml
|
|
403
|
+
# evaluation-config.yaml
|
|
404
|
+
model_selection:
|
|
405
|
+
|
|
406
|
+
# Structure/format checks - use fast model
|
|
407
|
+
format_validation:
|
|
408
|
+
model: openrouter:google/gemma-3-27b-it:free
|
|
409
|
+
reason: "Fast, good at pattern matching"
|
|
410
|
+
|
|
411
|
+
# Code quality evaluation - use coding model
|
|
412
|
+
code_review:
|
|
413
|
+
model: openrouter:x-ai/grok-4.1-fast:free
|
|
414
|
+
reason: "Optimized for code understanding"
|
|
415
|
+
|
|
416
|
+
# Reasoning/logic checks - use large model
|
|
417
|
+
reasoning_validation:
|
|
418
|
+
model: openrouter:meta-llama/llama-3.3-70b-instruct:free
|
|
419
|
+
reason: "Best reasoning in free tier"
|
|
420
|
+
|
|
421
|
+
# General quality - balanced choice
|
|
422
|
+
general_quality:
|
|
423
|
+
model: openrouter:qwen/qwen3-235b-a22b:free
|
|
424
|
+
reason: "Large MoE, good all-around"
|
|
425
|
+
```
|
|
426
|
+
|
|
427
|
+
### Provider Configuration
|
|
428
|
+
|
|
429
|
+
```yaml
|
|
430
|
+
# promptfoo.yaml - Full provider setup
|
|
431
|
+
providers:
|
|
432
|
+
# PRIMARY: For most tests (fast, free, good at code)
|
|
433
|
+
- id: openrouter:x-ai/grok-4.1-fast:free
|
|
434
|
+
label: primary-free
|
|
435
|
+
config:
|
|
436
|
+
temperature: 0
|
|
437
|
+
headers:
|
|
438
|
+
HTTP-Referer: https://iris.md
|
|
439
|
+
|
|
440
|
+
# JUDGE: For LLM-as-judge evaluations
|
|
441
|
+
- id: openrouter:meta-llama/llama-3.3-70b-instruct:free
|
|
442
|
+
label: judge-free
|
|
443
|
+
config:
|
|
444
|
+
temperature: 0
|
|
445
|
+
headers:
|
|
446
|
+
HTTP-Referer: https://iris.md
|
|
447
|
+
|
|
448
|
+
# CODING: For code-specific tests
|
|
449
|
+
- id: openrouter:qwen/qwen3-coder:free
|
|
450
|
+
label: coding-free
|
|
451
|
+
config:
|
|
452
|
+
temperature: 0
|
|
453
|
+
headers:
|
|
454
|
+
HTTP-Referer: https://iris.md
|
|
455
|
+
|
|
456
|
+
# FALLBACK: If primary is rate-limited
|
|
457
|
+
- id: openrouter:google/gemma-3-27b-it:free
|
|
458
|
+
label: fallback-free
|
|
459
|
+
config:
|
|
460
|
+
temperature: 0
|
|
461
|
+
```
|
|
462
|
+
|
|
463
|
+
---
|
|
464
|
+
|
|
465
|
+
## Testing Each Agent
|
|
466
|
+
|
|
467
|
+
### Testing Master Agent
|
|
468
|
+
|
|
469
|
+
**State Required**: Minimal - just memory-bank.yaml
|
|
470
|
+
|
|
471
|
+
```yaml
|
|
472
|
+
# master-agent-tests.yaml
|
|
473
|
+
description: "Master Agent Routing Tests"
|
|
474
|
+
|
|
475
|
+
prompts:
|
|
476
|
+
- file://prompts/master-agent-system.txt
|
|
477
|
+
|
|
478
|
+
providers:
|
|
479
|
+
- openrouter:x-ai/grok-4.1-fast:free
|
|
480
|
+
|
|
481
|
+
defaultTest:
|
|
482
|
+
assert:
|
|
483
|
+
- type: not-contains
|
|
484
|
+
value: "ERROR"
|
|
485
|
+
|
|
486
|
+
tests:
|
|
487
|
+
# Routing to Inception
|
|
488
|
+
- description: "Routes new feature to Inception"
|
|
489
|
+
vars:
|
|
490
|
+
project_state: file://fixtures/02-initialized-project/state-summary.md
|
|
491
|
+
request: "I want to add user authentication"
|
|
492
|
+
assert:
|
|
493
|
+
- type: contains
|
|
494
|
+
value: "Inception"
|
|
495
|
+
- type: llm-rubric
|
|
496
|
+
value: "Does the response correctly identify this needs Inception phase?"
|
|
497
|
+
|
|
498
|
+
# Routing to Construction
|
|
499
|
+
- description: "Routes to Construction when bolts exist"
|
|
500
|
+
vars:
|
|
501
|
+
project_state: file://fixtures/04-inception-complete/state-summary.md
|
|
502
|
+
request: "Let's start building"
|
|
503
|
+
assert:
|
|
504
|
+
- type: contains
|
|
505
|
+
value: "Construction"
|
|
506
|
+
- type: contains
|
|
507
|
+
value: "bolt"
|
|
508
|
+
|
|
509
|
+
# Routing to Operations
|
|
510
|
+
- description: "Routes to Operations when ready to deploy"
|
|
511
|
+
vars:
|
|
512
|
+
project_state: file://fixtures/06-construction-complete/state-summary.md
|
|
513
|
+
request: "Deploy to staging"
|
|
514
|
+
assert:
|
|
515
|
+
- type: contains
|
|
516
|
+
value: "Operations"
|
|
517
|
+
```
|
|
518
|
+
|
|
519
|
+
### Testing Inception Agent
|
|
520
|
+
|
|
521
|
+
**State Required**: Initialized project with standards
|
|
522
|
+
|
|
523
|
+
```yaml
|
|
524
|
+
# inception-agent-tests.yaml
|
|
525
|
+
description: "Inception Agent Tests"
|
|
526
|
+
|
|
527
|
+
prompts:
|
|
528
|
+
- file://prompts/inception-agent-system.txt
|
|
529
|
+
|
|
530
|
+
providers:
|
|
531
|
+
- openrouter:meta-llama/llama-3.3-70b-instruct:free
|
|
532
|
+
|
|
533
|
+
tests:
|
|
534
|
+
# Intent Creation
|
|
535
|
+
- description: "Creates well-structured intent"
|
|
536
|
+
vars:
|
|
537
|
+
project_state: file://fixtures/02-initialized-project/state-summary.md
|
|
538
|
+
skill: "intent-create"
|
|
539
|
+
request: "User authentication with OAuth and MFA"
|
|
540
|
+
assert:
|
|
541
|
+
# Structure checks
|
|
542
|
+
- type: contains
|
|
543
|
+
value: "## Problem Statement"
|
|
544
|
+
- type: contains
|
|
545
|
+
value: "## Success Criteria"
|
|
546
|
+
# No ASCII tables (our formatting rule)
|
|
547
|
+
- type: not-contains
|
|
548
|
+
value: "|---|"
|
|
549
|
+
# Quality check
|
|
550
|
+
- type: llm-rubric
|
|
551
|
+
provider: openrouter:x-ai/grok-4.1-fast:free
|
|
552
|
+
value: |
|
|
553
|
+
Evaluate this intent:
|
|
554
|
+
1. Is the problem statement specific (not vague)?
|
|
555
|
+
2. Are success criteria measurable?
|
|
556
|
+
3. Does it follow numbered list format for options?
|
|
557
|
+
Return PASS if all criteria met.
|
|
558
|
+
|
|
559
|
+
# Requirements Gathering
|
|
560
|
+
- description: "Asks clarifying questions first"
|
|
561
|
+
vars:
|
|
562
|
+
project_state: file://fixtures/03-inception-started/state-summary.md
|
|
563
|
+
skill: "requirements"
|
|
564
|
+
request: "Add the requirements for auth"
|
|
565
|
+
assert:
|
|
566
|
+
- type: llm-rubric
|
|
567
|
+
value: |
|
|
568
|
+
The agent should ask clarifying questions before generating requirements.
|
|
569
|
+
Check if output contains questions like:
|
|
570
|
+
- Authentication method preference?
|
|
571
|
+
- Security requirements?
|
|
572
|
+
- Integration needs?
|
|
573
|
+
Return PASS if agent seeks clarification first.
|
|
574
|
+
```
|
|
575
|
+
|
|
576
|
+
### Testing Construction Agent
|
|
577
|
+
|
|
578
|
+
**State Required**: Completed inception with planned bolts
|
|
579
|
+
|
|
580
|
+
```yaml
|
|
581
|
+
# construction-agent-tests.yaml
|
|
582
|
+
description: "Construction Agent Tests"
|
|
583
|
+
|
|
584
|
+
prompts:
|
|
585
|
+
- file://prompts/construction-agent-system.txt
|
|
586
|
+
|
|
587
|
+
providers:
|
|
588
|
+
# Use coding-focused model
|
|
589
|
+
- openrouter:x-ai/grok-4.1-fast:free
|
|
590
|
+
|
|
591
|
+
tests:
|
|
592
|
+
# Bolt Start
|
|
593
|
+
- description: "Starts bolt with correct stage"
|
|
594
|
+
vars:
|
|
595
|
+
project_state: file://fixtures/04-inception-complete/state-summary.md
|
|
596
|
+
bolt_state: file://fixtures/04-inception-complete/memory-bank/bolts/bolt-auth-service-1/bolt.md
|
|
597
|
+
skill: "bolt-start"
|
|
598
|
+
bolt_id: "bolt-auth-service-1"
|
|
599
|
+
assert:
|
|
600
|
+
- type: contains
|
|
601
|
+
value: "Stage 1"
|
|
602
|
+
- type: contains
|
|
603
|
+
value: "Domain Model"
|
|
604
|
+
# Check it reads bolt type
|
|
605
|
+
- type: llm-rubric
|
|
606
|
+
value: "Does the agent reference the bolt type definition for stage activities?"
|
|
607
|
+
|
|
608
|
+
# Stage Completion
|
|
609
|
+
- description: "Stops at human gate after stage"
|
|
610
|
+
vars:
|
|
611
|
+
project_state: file://fixtures/05-construction-in-progress/state-summary.md
|
|
612
|
+
skill: "bolt-start"
|
|
613
|
+
bolt_id: "bolt-auth-service-1"
|
|
614
|
+
assert:
|
|
615
|
+
# Must stop and wait
|
|
616
|
+
- type: contains
|
|
617
|
+
value: "Human Validation"
|
|
618
|
+
- type: llm-rubric
|
|
619
|
+
value: |
|
|
620
|
+
Check that the agent:
|
|
621
|
+
1. Presents stage completion summary
|
|
622
|
+
2. Asks for confirmation before proceeding
|
|
623
|
+
3. Does NOT auto-advance to next stage
|
|
624
|
+
Return PASS if human gate is enforced.
|
|
625
|
+
|
|
626
|
+
# Code Generation Quality
|
|
627
|
+
- description: "Generates code following standards"
|
|
628
|
+
vars:
|
|
629
|
+
project_state: file://fixtures/05-construction-in-progress/state-summary.md
|
|
630
|
+
standards: file://fixtures/05-construction-in-progress/memory-bank/standards/
|
|
631
|
+
skill: "bolt-start"
|
|
632
|
+
stage: "implement"
|
|
633
|
+
assert:
|
|
634
|
+
- type: llm-rubric
|
|
635
|
+
provider: openrouter:qwen/qwen3-coder:free # Use code model for code review
|
|
636
|
+
value: |
|
|
637
|
+
Evaluate the generated code:
|
|
638
|
+
1. Does it follow the tech-stack standards?
|
|
639
|
+
2. Is naming consistent with coding-standards?
|
|
640
|
+
3. Is error handling included?
|
|
641
|
+
4. Are there appropriate comments?
|
|
642
|
+
Return PASS if code quality is acceptable.
|
|
643
|
+
```
|
|
644
|
+
|
|
645
|
+
### Testing Operations Agent
|
|
646
|
+
|
|
647
|
+
**State Required**: Completed construction with all bolts done
|
|
648
|
+
|
|
649
|
+
```yaml
|
|
650
|
+
# __tests__/evaluation/agents/operations-agent.yaml
|
|
651
|
+
description: "Operations Agent Tests"
|
|
652
|
+
|
|
653
|
+
prompts:
|
|
654
|
+
- file://prompts/operations-agent-system.txt
|
|
655
|
+
|
|
656
|
+
providers:
|
|
657
|
+
- openrouter:x-ai/grok-4.1-fast:free
|
|
658
|
+
|
|
659
|
+
tests:
|
|
660
|
+
# Deployment Progression
|
|
661
|
+
- description: "Enforces dev → staging → prod progression"
|
|
662
|
+
vars:
|
|
663
|
+
project_state: file://fixtures/06-construction-complete/state-summary.md
|
|
664
|
+
skill: "deploy"
|
|
665
|
+
request: "Deploy to production"
|
|
666
|
+
assert:
|
|
667
|
+
- type: llm-rubric
|
|
668
|
+
value: |
|
|
669
|
+
Agent should NOT allow direct production deployment.
|
|
670
|
+
Check that it:
|
|
671
|
+
1. Asks about dev/staging deployment status
|
|
672
|
+
2. Requires progression through environments
|
|
673
|
+
3. Warns about skipping stages
|
|
674
|
+
Return PASS if it blocks direct prod deployment.
|
|
675
|
+
|
|
676
|
+
# Production Approval Gate
|
|
677
|
+
- description: "Requires explicit approval for production"
|
|
678
|
+
vars:
|
|
679
|
+
project_state: file://fixtures/06-construction-complete/state-summary.md
|
|
680
|
+
deployment_state: "dev: deployed, staging: deployed, verified"
|
|
681
|
+
skill: "deploy"
|
|
682
|
+
request: "Deploy to production"
|
|
683
|
+
assert:
|
|
684
|
+
- type: contains
|
|
685
|
+
value: "APPROVAL"
|
|
686
|
+
- type: contains
|
|
687
|
+
value: "yes/no"
|
|
688
|
+
- type: llm-rubric
|
|
689
|
+
value: "Does the agent require explicit human approval before production deployment?"
|
|
690
|
+
```
|
|
691
|
+
|
|
692
|
+
---
|
|
693
|
+
|
|
694
|
+
## Complete Example Configuration
|
|
695
|
+
|
|
696
|
+
### Directory Structure
|
|
697
|
+
|
|
698
|
+
```text
|
|
699
|
+
irismd/
|
|
700
|
+
├── __tests__/
|
|
701
|
+
│ ├── evaluation/
|
|
702
|
+
│ │ ├── promptfoo.yaml # Main config
|
|
703
|
+
│ │ ├── providers.yaml # Model definitions
|
|
704
|
+
│ │ │
|
|
705
|
+
│ │ ├── agents/ # Per-agent tests
|
|
706
|
+
│ │ │ ├── master-agent.yaml
|
|
707
|
+
│ │ │ ├── inception-agent.yaml
|
|
708
|
+
│ │ │ ├── construction-agent.yaml
|
|
709
|
+
│ │ │ └── operations-agent.yaml
|
|
710
|
+
│ │ │
|
|
711
|
+
│ │ ├── rubrics/ # Reusable assertions
|
|
712
|
+
│ │ │ ├── output-formatting.yaml
|
|
713
|
+
│ │ │ ├── human-gates.yaml
|
|
714
|
+
│ │ │ └── code-quality.yaml
|
|
715
|
+
│ │ │
|
|
716
|
+
│ │ └── prompts/ # Agent system prompts
|
|
717
|
+
│ │ ├── master-agent-system.txt
|
|
718
|
+
│ │ ├── inception-agent-system.txt
|
|
719
|
+
│ │ ├── construction-agent-system.txt
|
|
720
|
+
│ │ └── operations-agent-system.txt
|
|
721
|
+
│ │
|
|
722
|
+
│ ├── golden-datasets/ # Known-good examples
|
|
723
|
+
│ │ ├── inception-agent/
|
|
724
|
+
│ │ ├── construction-agent/
|
|
725
|
+
│ │ └── master-agent/
|
|
726
|
+
│ │
|
|
727
|
+
│ └── fixtures/ # Test state setup
|
|
728
|
+
│ └── memory-bank-states/
|
|
729
|
+
│ ├── 01-empty-project/
|
|
730
|
+
│ ├── 02-initialized-project/
|
|
731
|
+
│ ├── 03-inception-started/
|
|
732
|
+
│ ├── 04-inception-complete/
|
|
733
|
+
│ ├── 05-construction-in-progress/
|
|
734
|
+
│ └── 06-construction-complete/
|
|
735
|
+
│
|
|
736
|
+
└── package.json
|
|
737
|
+
```
|
|
738
|
+
|
|
739
|
+
### Main Configuration
|
|
740
|
+
|
|
741
|
+
```yaml
|
|
742
|
+
# __tests__/evaluation/promptfoo.yaml
|
|
743
|
+
description: "irismd Agent Evaluation Suite"
|
|
744
|
+
|
|
745
|
+
# Import providers
|
|
746
|
+
providers: file://providers.yaml
|
|
747
|
+
|
|
748
|
+
# Import all agent tests
|
|
749
|
+
tests:
|
|
750
|
+
- file://agents/master-agent.yaml
|
|
751
|
+
- file://agents/inception-agent.yaml
|
|
752
|
+
- file://agents/construction-agent.yaml
|
|
753
|
+
- file://agents/operations-agent.yaml
|
|
754
|
+
|
|
755
|
+
# Shared assertions for all tests
|
|
756
|
+
defaultTest:
|
|
757
|
+
assert:
|
|
758
|
+
# Output formatting rules (defaultTest assertions are applied to every test)
|
|
759
|
+
- type: not-contains
|
|
760
|
+
value: "|---|"
|
|
761
|
+
description: "No ASCII tables"
|
|
762
|
+
- type: javascript
|
|
763
|
+
value: |
|
|
764
|
+
// Check for status indicators
|
|
765
|
+
const hasIndicators =
|
|
766
|
+
output.includes('✅') ||
|
|
767
|
+
output.includes('⏳') ||
|
|
768
|
+
output.includes('[ ]');
|
|
769
|
+
return hasIndicators || output.length < 100; // Short outputs exempt
|
|
770
|
+
```
|
|
771
|
+
|
|
772
|
+
### Provider Configuration
|
|
773
|
+
|
|
774
|
+
```yaml
|
|
775
|
+
# __tests__/evaluation/providers.yaml
|
|
776
|
+
|
|
777
|
+
# Fast coding model - primary choice
|
|
778
|
+
- id: openrouter:x-ai/grok-4.1-fast:free
|
|
779
|
+
label: grok-fast
|
|
780
|
+
config:
|
|
781
|
+
temperature: 0
|
|
782
|
+
headers:
|
|
783
|
+
HTTP-Referer: https://iris.md
|
|
784
|
+
|
|
785
|
+
# High-quality reasoning - for complex tests
|
|
786
|
+
- id: openrouter:meta-llama/llama-3.3-70b-instruct:free
|
|
787
|
+
label: llama-70b
|
|
788
|
+
config:
|
|
789
|
+
temperature: 0
|
|
790
|
+
|
|
791
|
+
# Code specialist - for code review assertions
|
|
792
|
+
- id: openrouter:qwen/qwen3-coder:free
|
|
793
|
+
label: qwen-coder
|
|
794
|
+
config:
|
|
795
|
+
temperature: 0
|
|
796
|
+
|
|
797
|
+
# Fast fallback
|
|
798
|
+
- id: openrouter:google/gemma-3-27b-it:free
|
|
799
|
+
label: gemma-fast
|
|
800
|
+
config:
|
|
801
|
+
temperature: 0
|
|
802
|
+
```
|
|
803
|
+
|
|
804
|
+
### Reusable Rubrics
|
|
805
|
+
|
|
806
|
+
```yaml
|
|
807
|
+
# __tests__/evaluation/rubrics/output-formatting.yaml
|
|
808
|
+
- name: no-ascii-tables
|
|
809
|
+
assert:
|
|
810
|
+
- type: not-contains
|
|
811
|
+
value: "|---|"
|
|
812
|
+
- type: not-contains
|
|
813
|
+
value: "+---+"
|
|
814
|
+
|
|
815
|
+
- name: numbered-list-format
|
|
816
|
+
assert:
|
|
817
|
+
- type: llm-rubric
|
|
818
|
+
provider: openrouter:google/gemma-3-27b-it:free
|
|
819
|
+
value: "Are options presented as numbered lists (1 - **Option**: Description) rather than as tables?"
|
|
820
|
+
|
|
821
|
+
- name: status-indicators
|
|
822
|
+
assert:
|
|
823
|
+
- type: javascript
|
|
824
|
+
value: |
|
|
825
|
+
const indicators = ['✅', '⏳', '[ ]', '🚫'];
|
|
826
|
+
return indicators.some(i => output.includes(i));
|
|
827
|
+
|
|
828
|
+
- name: suggested-next-step
|
|
829
|
+
assert:
|
|
830
|
+
- type: contains
|
|
831
|
+
value: "Suggested Next Step"
|
|
832
|
+
- type: contains
|
|
833
|
+
value: "→"
|
|
834
|
+
```
|
|
835
|
+
|
|
836
|
+
```yaml
|
|
837
|
+
# __tests__/evaluation/rubrics/human-gates.yaml
|
|
838
|
+
- name: stops-at-validation
|
|
839
|
+
assert:
|
|
840
|
+
- type: llm-rubric
|
|
841
|
+
value: |
|
|
842
|
+
Check that the agent stops and waits for human input.
|
|
843
|
+
Signs of proper human gate:
|
|
844
|
+
- Contains "Validation Required" or "Approval Required"
|
|
845
|
+
- Asks a question and waits
|
|
846
|
+
- Does NOT auto-continue to next step
|
|
847
|
+
Return PASS if human gate is enforced.
|
|
848
|
+
|
|
849
|
+
- name: does-not-auto-advance
|
|
850
|
+
assert:
|
|
851
|
+
- type: not-contains
|
|
852
|
+
value: "Proceeding to"
|
|
853
|
+
- type: not-contains
|
|
854
|
+
value: "Moving on to"
|
|
855
|
+
- type: not-contains
|
|
856
|
+
value: "Automatically"
|
|
857
|
+
```
|
|
858
|
+
|
|
859
|
+
### Package.json Scripts
|
|
860
|
+
|
|
861
|
+
```json
|
|
862
|
+
{
|
|
863
|
+
"scripts": {
|
|
864
|
+
"eval": "cd __tests__/evaluation && promptfoo eval",
|
|
865
|
+
"eval:master": "cd __tests__/evaluation && promptfoo eval -c agents/master-agent.yaml",
|
|
866
|
+
"eval:inception": "cd __tests__/evaluation && promptfoo eval -c agents/inception-agent.yaml",
|
|
867
|
+
"eval:construction": "cd __tests__/evaluation && promptfoo eval -c agents/construction-agent.yaml",
|
|
868
|
+
"eval:operations": "cd __tests__/evaluation && promptfoo eval -c agents/operations-agent.yaml",
|
|
869
|
+
"eval:view": "cd __tests__/evaluation && promptfoo view",
|
|
870
|
+
"eval:ci": "cd __tests__/evaluation && promptfoo eval --ci",
|
|
871
|
+
"eval:baseline": "cd __tests__/evaluation && promptfoo eval --output baseline.json"
|
|
872
|
+
}
|
|
873
|
+
}
|
|
874
|
+
```
|
|
875
|
+
|
|
876
|
+
---
|
|
877
|
+
|
|
878
|
+
## Quick Start
|
|
879
|
+
|
|
880
|
+
```bash
|
|
881
|
+
# 1. Install promptfoo
|
|
882
|
+
npm install -g promptfoo
|
|
883
|
+
|
|
884
|
+
# 2. Set API key (free!)
|
|
885
|
+
export OPENROUTER_API_KEY=sk-or-...
|
|
886
|
+
|
|
887
|
+
# 3. Run all tests
|
|
888
|
+
npm run eval
|
|
889
|
+
|
|
890
|
+
# 4. View results
|
|
891
|
+
npm run eval:view
|
|
892
|
+
|
|
893
|
+
# 5. Run specific agent
|
|
894
|
+
npm run eval:construction
|
|
895
|
+
```
|
|
896
|
+
|
|
897
|
+
---
|
|
898
|
+
|
|
899
|
+
## Summary
|
|
900
|
+
|
|
901
|
+
| Concept | Purpose |
|
|
902
|
+
|---------|---------|
|
|
903
|
+
| **Golden Dataset** | Known-good input/output pairs for regression testing |
|
|
904
|
+
| **Fixtures** | Pre-configured memory bank states for test setup |
|
|
905
|
+
| **LLM-as-Judge** | Use free models to evaluate output quality |
|
|
906
|
+
| **Free Coding Models** | Grok 4.1 Fast, Qwen Coder, Llama 3.3 70B |
|
|
907
|
+
|
|
908
|
+
---
|
|
909
|
+
|
|
910
|
+
*Document created: 2025-12-10*
|
|
911
|
+
*Status: Tutorial / Reference*
|