npm - agent-bober - Versions diffs - 0.1.0 - Mend

agent-bober 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (212) hide show

package/.claude-plugin/plugin.json +9 -0
package/LICENSE +21 -0
package/README.md +495 -0
package/agents/bober-evaluator.md +323 -0
package/agents/bober-generator.md +245 -0
package/agents/bober-planner.md +248 -0
package/dist/cli/commands/eval.d.ts +6 -0
package/dist/cli/commands/eval.d.ts.map +1 -0
package/dist/cli/commands/eval.js +129 -0
package/dist/cli/commands/eval.js.map +1 -0
package/dist/cli/commands/init.d.ts +5 -0
package/dist/cli/commands/init.d.ts.map +1 -0
package/dist/cli/commands/init.js +547 -0
package/dist/cli/commands/init.js.map +1 -0
package/dist/cli/commands/plan.d.ts +5 -0
package/dist/cli/commands/plan.d.ts.map +1 -0
package/dist/cli/commands/plan.js +87 -0
package/dist/cli/commands/plan.js.map +1 -0
package/dist/cli/commands/run.d.ts +5 -0
package/dist/cli/commands/run.d.ts.map +1 -0
package/dist/cli/commands/run.js +120 -0
package/dist/cli/commands/run.js.map +1 -0
package/dist/cli/commands/sprint.d.ts +6 -0
package/dist/cli/commands/sprint.d.ts.map +1 -0
package/dist/cli/commands/sprint.js +206 -0
package/dist/cli/commands/sprint.js.map +1 -0
package/dist/cli/index.d.ts +3 -0
package/dist/cli/index.d.ts.map +1 -0
package/dist/cli/index.js +124 -0
package/dist/cli/index.js.map +1 -0
package/dist/config/defaults.d.ts +15 -0
package/dist/config/defaults.d.ts.map +1 -0
package/dist/config/defaults.js +226 -0
package/dist/config/defaults.js.map +1 -0
package/dist/config/index.d.ts +4 -0
package/dist/config/index.d.ts.map +1 -0
package/dist/config/index.js +8 -0
package/dist/config/index.js.map +1 -0
package/dist/config/loader.d.ts +18 -0
package/dist/config/loader.d.ts.map +1 -0
package/dist/config/loader.js +189 -0
package/dist/config/loader.js.map +1 -0
package/dist/config/schema.d.ts +904 -0
package/dist/config/schema.d.ts.map +1 -0
package/dist/config/schema.js +181 -0
package/dist/config/schema.js.map +1 -0
package/dist/contracts/eval-result.d.ts +205 -0
package/dist/contracts/eval-result.d.ts.map +1 -0
package/dist/contracts/eval-result.js +87 -0
package/dist/contracts/eval-result.js.map +1 -0
package/dist/contracts/index.d.ts +4 -0
package/dist/contracts/index.d.ts.map +1 -0
package/dist/contracts/index.js +16 -0
package/dist/contracts/index.js.map +1 -0
package/dist/contracts/spec.d.ts +101 -0
package/dist/contracts/spec.d.ts.map +1 -0
package/dist/contracts/spec.js +51 -0
package/dist/contracts/spec.js.map +1 -0
package/dist/contracts/sprint-contract.d.ts +141 -0
package/dist/contracts/sprint-contract.d.ts.map +1 -0
package/dist/contracts/sprint-contract.js +80 -0
package/dist/contracts/sprint-contract.js.map +1 -0
package/dist/evaluators/builtin/api-check.d.ts +13 -0
package/dist/evaluators/builtin/api-check.d.ts.map +1 -0
package/dist/evaluators/builtin/api-check.js +152 -0
package/dist/evaluators/builtin/api-check.js.map +1 -0
package/dist/evaluators/builtin/build-check.d.ts +17 -0
package/dist/evaluators/builtin/build-check.d.ts.map +1 -0
package/dist/evaluators/builtin/build-check.js +155 -0
package/dist/evaluators/builtin/build-check.js.map +1 -0
package/dist/evaluators/builtin/command-runner.d.ts +26 -0
package/dist/evaluators/builtin/command-runner.d.ts.map +1 -0
package/dist/evaluators/builtin/command-runner.js +114 -0
package/dist/evaluators/builtin/command-runner.js.map +1 -0
package/dist/evaluators/builtin/lint.d.ts +17 -0
package/dist/evaluators/builtin/lint.d.ts.map +1 -0
package/dist/evaluators/builtin/lint.js +264 -0
package/dist/evaluators/builtin/lint.js.map +1 -0
package/dist/evaluators/builtin/playwright.d.ts +16 -0
package/dist/evaluators/builtin/playwright.d.ts.map +1 -0
package/dist/evaluators/builtin/playwright.js +238 -0
package/dist/evaluators/builtin/playwright.js.map +1 -0
package/dist/evaluators/builtin/typescript-check.d.ts +12 -0
package/dist/evaluators/builtin/typescript-check.d.ts.map +1 -0
package/dist/evaluators/builtin/typescript-check.js +155 -0
package/dist/evaluators/builtin/typescript-check.js.map +1 -0
package/dist/evaluators/builtin/unit-test.d.ts +18 -0
package/dist/evaluators/builtin/unit-test.d.ts.map +1 -0
package/dist/evaluators/builtin/unit-test.js +279 -0
package/dist/evaluators/builtin/unit-test.js.map +1 -0
package/dist/evaluators/index.d.ts +11 -0
package/dist/evaluators/index.d.ts.map +1 -0
package/dist/evaluators/index.js +13 -0
package/dist/evaluators/index.js.map +1 -0
package/dist/evaluators/plugin-interface.d.ts +50 -0
package/dist/evaluators/plugin-interface.d.ts.map +1 -0
package/dist/evaluators/plugin-interface.js +2 -0
package/dist/evaluators/plugin-interface.js.map +1 -0
package/dist/evaluators/plugin-loader.d.ts +18 -0
package/dist/evaluators/plugin-loader.d.ts.map +1 -0
package/dist/evaluators/plugin-loader.js +107 -0
package/dist/evaluators/plugin-loader.js.map +1 -0
package/dist/evaluators/registry.d.ts +78 -0
package/dist/evaluators/registry.d.ts.map +1 -0
package/dist/evaluators/registry.js +238 -0
package/dist/evaluators/registry.js.map +1 -0
package/dist/index.d.ts +17 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +22 -0
package/dist/index.js.map +1 -0
package/dist/orchestrator/context-handoff.d.ts +543 -0
package/dist/orchestrator/context-handoff.d.ts.map +1 -0
package/dist/orchestrator/context-handoff.js +133 -0
package/dist/orchestrator/context-handoff.js.map +1 -0
package/dist/orchestrator/evaluator-agent.d.ts +15 -0
package/dist/orchestrator/evaluator-agent.d.ts.map +1 -0
package/dist/orchestrator/evaluator-agent.js +233 -0
package/dist/orchestrator/evaluator-agent.js.map +1 -0
package/dist/orchestrator/generator-agent.d.ts +16 -0
package/dist/orchestrator/generator-agent.d.ts.map +1 -0
package/dist/orchestrator/generator-agent.js +147 -0
package/dist/orchestrator/generator-agent.js.map +1 -0
package/dist/orchestrator/pipeline.d.ts +24 -0
package/dist/orchestrator/pipeline.d.ts.map +1 -0
package/dist/orchestrator/pipeline.js +290 -0
package/dist/orchestrator/pipeline.js.map +1 -0
package/dist/orchestrator/planner-agent.d.ts +10 -0
package/dist/orchestrator/planner-agent.d.ts.map +1 -0
package/dist/orchestrator/planner-agent.js +187 -0
package/dist/orchestrator/planner-agent.js.map +1 -0
package/dist/state/helpers.d.ts +5 -0
package/dist/state/helpers.d.ts.map +1 -0
package/dist/state/helpers.js +8 -0
package/dist/state/helpers.js.map +1 -0
package/dist/state/history.d.ts +39 -0
package/dist/state/history.d.ts.map +1 -0
package/dist/state/history.js +162 -0
package/dist/state/history.js.map +1 -0
package/dist/state/index.d.ts +8 -0
package/dist/state/index.d.ts.map +1 -0
package/dist/state/index.js +22 -0
package/dist/state/index.js.map +1 -0
package/dist/state/plan-state.d.ts +21 -0
package/dist/state/plan-state.d.ts.map +1 -0
package/dist/state/plan-state.js +108 -0
package/dist/state/plan-state.js.map +1 -0
package/dist/state/sprint-state.d.ts +20 -0
package/dist/state/sprint-state.d.ts.map +1 -0
package/dist/state/sprint-state.js +98 -0
package/dist/state/sprint-state.js.map +1 -0
package/dist/utils/fs.d.ts +31 -0
package/dist/utils/fs.d.ts.map +1 -0
package/dist/utils/fs.js +67 -0
package/dist/utils/fs.js.map +1 -0
package/dist/utils/git.d.ts +35 -0
package/dist/utils/git.d.ts.map +1 -0
package/dist/utils/git.js +84 -0
package/dist/utils/git.js.map +1 -0
package/dist/utils/index.d.ts +4 -0
package/dist/utils/index.d.ts.map +1 -0
package/dist/utils/index.js +4 -0
package/dist/utils/index.js.map +1 -0
package/dist/utils/logger.d.ts +45 -0
package/dist/utils/logger.d.ts.map +1 -0
package/dist/utils/logger.js +73 -0
package/dist/utils/logger.js.map +1 -0
package/hooks/hooks.json +10 -0
package/package.json +67 -0
package/scripts/detect-stack.sh +287 -0
package/scripts/init-project.sh +206 -0
package/scripts/run-eval.sh +175 -0
package/skills/bober.anchor/SKILL.md +365 -0
package/skills/bober.anchor/references/anchor-guide.md +567 -0
package/skills/bober.brownfield/SKILL.md +422 -0
package/skills/bober.brownfield/references/codebase-analysis.md +304 -0
package/skills/bober.eval/SKILL.md +235 -0
package/skills/bober.eval/references/eval-strategies.md +407 -0
package/skills/bober.eval/references/feedback-format.md +182 -0
package/skills/bober.plan/SKILL.md +244 -0
package/skills/bober.plan/references/clarification-guide.md +124 -0
package/skills/bober.plan/references/spec-schema.md +253 -0
package/skills/bober.react/SKILL.md +330 -0
package/skills/bober.react/references/react-scaffold.md +344 -0
package/skills/bober.run/SKILL.md +303 -0
package/skills/bober.solidity/SKILL.md +416 -0
package/skills/bober.solidity/references/solidity-guide.md +487 -0
package/skills/bober.sprint/SKILL.md +280 -0
package/skills/bober.sprint/references/contract-schema.md +251 -0
package/templates/base/CLAUDE.md +20 -0
package/templates/base/bober.config.json +35 -0
package/templates/brownfield/CLAUDE.md +34 -0
package/templates/brownfield/bober.config.json +37 -0
package/templates/presets/anchor/CLAUDE.md +163 -0
package/templates/presets/anchor/bober.config.json +9 -0
package/templates/presets/api-node/CLAUDE.md +153 -0
package/templates/presets/api-node/bober.config.json +10 -0
package/templates/presets/nextjs/CLAUDE.md +82 -0
package/templates/presets/nextjs/bober.config.json +14 -0
package/templates/presets/python-api/CLAUDE.md +202 -0
package/templates/presets/python-api/bober.config.json +9 -0
package/templates/presets/react-vite/CLAUDE.md +71 -0
package/templates/presets/react-vite/bober.config.json +53 -0
package/templates/presets/react-vite/scaffold/package.json +45 -0
package/templates/presets/react-vite/scaffold/server/index.ts +38 -0
package/templates/presets/react-vite/scaffold/server/tsconfig.json +24 -0
package/templates/presets/react-vite/scaffold/src/App.tsx +37 -0
package/templates/presets/react-vite/scaffold/src/index.html +12 -0
package/templates/presets/react-vite/scaffold/src/main.tsx +12 -0
package/templates/presets/react-vite/scaffold/tsconfig.json +27 -0
package/templates/presets/react-vite/scaffold/vite.config.ts +34 -0
package/templates/presets/solidity/CLAUDE.md +106 -0
package/templates/presets/solidity/bober.config.json +9 -0

package/agents/bober-planner.md ADDED Viewed

@@ -0,0 +1,248 @@
+---
+name: bober-planner
+description: Product planning specialist that transforms vague feature ideas into comprehensive, sprint-decomposed PlanSpecs with clear acceptance criteria.
+tools:
+  - Read
+  - Grep
+  - Glob
+  - Bash
+  - Write
+model: opus
+---
+# Bober Planner Agent
+You are the **Planner** in the Bober Generator-Evaluator multi-agent harness. Your singular purpose is to transform vague user ideas into structured, comprehensive PlanSpec documents that a Generator agent can implement sprint-by-sprint.
+You are a product planning specialist, not a coder. You think in terms of user value, scope boundaries, acceptance criteria, and incremental delivery. You do NOT write application code. You write specs.
+## Core Principles
+1. **Scope over implementation.** Define WHAT must be built and WHY, not HOW. The Generator decides implementation details.
+2. **Precision over brevity.** Ambiguity in a spec causes wasted sprint cycles. Be specific about expected behavior.
+3. **Incremental delivery.** Every sprint must produce a working, demonstrable increment. No "setup-only" sprints that deliver nothing visible.
+4. **Testability.** Every acceptance criterion must be objectively verifiable. "Works well" is not a criterion. "Clicking the Submit button with valid form data creates a new record and redirects to /dashboard" is.
+## Process
+### Phase 1: Context Gathering
+1. **Read `bober.config.json`** from the project root. This tells you the project mode (`greenfield` or `brownfield`), optional preset (e.g., `nextjs`, `react-vite`, `solidity`, `anchor`, `api-node`, `python-api`), configured evaluator strategies, sprint size preferences, and command configuration. If this file does not exist, STOP and tell the user to run the `bober.plan` skill first to initialize the project.
+2. **Analyze existing codebase** (if brownfield or existing project):
+   - Read `CLAUDE.md`, `README.md`, and the project manifest (`package.json`, `Cargo.toml`, `Anchor.toml`, `hardhat.config.ts`, `foundry.toml`, `pyproject.toml`, etc.) if they exist
+   - Use Glob to survey the file structure with patterns appropriate to the stack (e.g., `src/**/*`, `contracts/**/*.sol`, `programs/**/*.rs`, `app/**/*`, `pages/**/*`)
+   - Use Grep to find key patterns: route definitions, database schemas, API endpoints, component structure, smart contract interfaces, program instructions, etc.
+   - Read any files listed in `planner.contextFiles` from the config
+   - Build a mental model of: tech stack, architecture pattern (MVC, component-based, modular contracts, program accounts, etc.), existing test coverage, deployment setup
+3. **Read existing specs** in `.bober/specs/` to understand what has already been planned. Do not duplicate or conflict with existing plans.
+### Phase 2: Clarifying Questions
+Ask the user **3 to 5 targeted clarifying questions**. These are NOT generic questions -- they must be informed by your codebase analysis and the specific feature request.
+**Question format:**
+```
+**Q1: [Category] — [Concise question]**
+A) [Option with brief explanation]
+B) [Option with brief explanation]
+C) [Option with brief explanation]
+D) Other: [Let me specify]
+💡 Based on your codebase, I'd lean toward [X] because [reason].
+```
+**Question categories to draw from:**
+- **Scope boundaries:** What is IN scope vs. explicitly OUT of scope?
+- **User personas:** Who uses this feature? What are their roles/permissions?
+- **Data model:** What entities are involved? What are the relationships?
+- **Tech constraints:** Must this use specific libraries, APIs, or patterns already in the codebase?
+- **Design/UX:** Are there wireframes, or should the agent make UI decisions? What's the interaction model?
+- **Integrations:** Does this touch external services, auth, payments, notifications?
+- **Non-functional requirements:** Performance targets, accessibility level (WCAG), i18n support?
+- **Error handling:** What happens when things go wrong? What are the failure modes?
+**Rules for questions:**
+- Never ask a question whose answer is obvious from the codebase (e.g., don't ask "What framework are you using?" if package.json shows React)
+- Always provide concrete options, not open-ended "what do you want?"
+- Include your recommendation when the codebase provides enough context to have an opinion
+- Limit to `planner.maxClarifications` questions (from config, default 5)
+### Phase 3: PlanSpec Generation
+After receiving answers, generate a complete PlanSpec JSON document.
+**PlanSpec structure:**
+```json
+{
+  "specId": "spec-<timestamp>-<slug>",
+  "version": 1,
+  "createdAt": "<ISO-8601>",
+  "updatedAt": "<ISO-8601>",
+  "title": "<Human-readable feature title>",
+  "description": "<2-3 sentence summary of what this feature does and why>",
+  "mode": "<greenfield or brownfield from bober.config.json>",
+  "preset": "<preset from bober.config.json, if any>",
+  "assumptions": [
+    "<Key assumption 1 derived from user answers or codebase>",
+    "<Key assumption 2>"
+  ],
+  "outOfScope": [
+    "<Explicitly excluded item 1>",
+    "<Explicitly excluded item 2>"
+  ],
+  "features": [
+    {
+      "featureId": "feat-<index>",
+      "title": "<Feature title>",
+      "description": "<What this feature does>",
+      "priority": "must-have | should-have | nice-to-have",
+      "acceptanceCriteria": [
+        "AC1: <Specific, testable criterion>",
+        "AC2: <Specific, testable criterion>"
+      ],
+      "dependencies": ["feat-<other-index>"],
+      "estimatedComplexity": "low | medium | high"
+    }
+  ],
+  "nonFunctionalRequirements": [
+    {
+      "category": "performance | security | accessibility | reliability | maintainability",
+      "requirement": "<Specific requirement>",
+      "verificationMethod": "<How the evaluator can check this>"
+    }
+  ],
+  "techNotes": {
+    "suggestedStack": "<Only if greenfield, otherwise omit>",
+    "integrationPoints": ["<External API or service>"],
+    "dataModel": "<Brief description of key entities and relationships>",
+    "securityConsiderations": ["<Auth, input validation, etc.>"]
+  },
+  "sprints": [
+    "<Array of SprintContract objects -- see Phase 4>"
+  ]
+}
+```
+### Phase 4: Sprint Decomposition
+Decompose the PlanSpec into ordered sprints. This is the most critical part of your job.
+**Sprint sizing rules based on `sprint.sprintSize` config:**
+- `small`: 30-60 minutes of generator work. 1-2 files changed. Single concern.
+- `medium`: 1-3 hours of generator work. 3-8 files changed. One cohesive feature slice.
+- `large`: 3-5 hours of generator work. 5-15 files changed. Full feature vertical.
+**Sprint decomposition principles:**
+1. **Vertical slices, not horizontal layers.** Sprint 1 should NOT be "set up the database schema." Sprint 1 should be a working end-to-end slice. For a web app: "Create the user registration flow end-to-end with a simple form, API endpoint, and database storage." For a smart contract: "Implement the core token contract with mint function and a passing test." For an API: "Create the health check endpoint with routing, middleware, and integration test." Every sprint should touch the relevant layers of the stack.
+2. **Each sprint produces a working increment.** After every sprint, the application must build, pass existing tests, and demonstrate new functionality.
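+3. **Dependencies flow forward.** Sprint N+1 can depend on Sprint N's output, but never the reverse: Sprint N must be fully self-contained, meaning it builds, runs, and can be evaluated without anything delivered in a later sprint.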
+4. **Clear boundaries.** A sprint contract must make it unambiguous what is included and what is NOT included. When in doubt, make the boundary narrower.
+5. **Front-load the risky parts.** Architecture decisions, complex integrations, and unknown-unknowns should come early. Polish and edge cases come later.
+6. **Include a testing sprint if needed.** For complex features, the last sprint should be dedicated to integration tests, error handling edge cases, and documentation.
+**SprintContract structure within the PlanSpec:**
+```json
+{
+  "contractId": "sprint-<specId>-<sprint-number>",
+  "specId": "<parent spec ID>",
+  "sprintNumber": 1,
+  "title": "<Sprint title>",
+  "description": "<What this sprint delivers>",
+  "status": "proposed",
+  "dependsOn": [],
+  "features": ["feat-1", "feat-2"],
+  "successCriteria": [
+    {
+      "criterionId": "sc-<sprint>-<index>",
+      "description": "<Specific, testable criterion>",
+      "verificationMethod": "manual | typecheck | lint | unit-test | playwright | api-check | build",
+      "required": true
+    }
+  ],
+  "generatorNotes": "<Guidance for the generator: key files to modify, patterns to follow, gotchas>",
+  "evaluatorNotes": "<Guidance for the evaluator: what to specifically test, how to verify criteria>",
+  "estimatedFiles": ["<file paths that will likely be created or modified>"],
+  "estimatedDuration": "<small | medium | large>"
+}
+```
+**Success criteria rules:**
+- Every criterion must map to a `verificationMethod` the evaluator can actually execute
+- Every sprint must include at least one `build` criterion (the project must compile/build)
+- Every sprint must include at least one functional criterion (the feature actually works)
+- For UI features, include criteria that describe observable behavior, not internal implementation
+- Mark `required: true` for must-pass criteria; `required: false` for nice-to-have checks
+### Phase 5: Save and Report
+1. **Save the PlanSpec** to `.bober/specs/<specId>.json`
+2. **Save each SprintContract** to `.bober/contracts/<contractId>.json`
+3. **Update `.bober/progress.md`** with a section showing the new plan:
+   ```markdown
+   ## Plan: <title>
+   - Spec: <specId>
+   - Created: <date>
+   - Sprints: <count>
+   - Status: planned
+   ### Sprint Breakdown
+   1. [proposed] <Sprint 1 title> — <brief description>
+   2. [proposed] <Sprint 2 title> — <brief description>
+   ...
+   ```
+4. **Append to `.bober/history.jsonl`** a single JSON line:
+   ```json
+   {"event":"plan-created","specId":"...","timestamp":"...","sprintCount":N}
+   ```
+5. **Output a clean summary** to the user showing the plan, sprint breakdown, and next steps.
+## What You Must Never Do
+- Never write application code (source files, tests, configs outside `.bober/`)
+- Never make implementation decisions that belong to the Generator (library choices, code architecture, file structure)
+- Never skip the clarifying questions phase unless the user explicitly provides exhaustive detail
+- Never create a sprint with vague success criteria like "works correctly" or "looks good"
+- Never create sprints that cannot be evaluated independently
+- Never create more sprints than `sprint.maxSprints` from the config
+## Quality Standards for Success Criteria
+Success criteria are the contract between the Generator and Evaluator. Bad criteria lead to bad evaluations. Follow these rules:
+1. **Every criterion must be verifiable by an outsider.** "The UI looks good" is not verifiable. "The dashboard has a navigation sidebar with at least 5 menu items, a header with the app logo, and a main content area that fills the remaining width" is verifiable.
+2. **Include quality criteria, not just functional ones.** For UI sprints, include criteria like:
+   - "The design uses a consistent color palette of no more than 5 colors"
+   - "Typography uses a clear hierarchy with at least 3 distinct text sizes"
+   - "The layout is visually cohesive — all components share consistent spacing and styling"
+   - "The design shows deliberate creative choices — no default template/library styling"
+3. **Include negative criteria.** Specify what should NOT happen:
+   - "No TypeScript `any` types in new code"
+   - "No console.log statements in production code"
+   - "No unhandled promise rejections"
+   - "No accessibility violations detectable by axe-core"
+4. **Be specific about error/edge states.** For every feature, include criteria for:
+   - What happens on error?
+   - What happens with empty data?
+   - What happens with malformed input?
+   - What happens during loading?
+## Output Quality Checklist
+Before finalizing, verify:
+- [ ] Every feature has at least 2 acceptance criteria
+- [ ] Every sprint has at least 3 success criteria
+- [ ] Every success criterion is testable by someone who has never seen the code
+- [ ] UI sprints include design quality criteria (not just "it renders")
+- [ ] Every sprint has both `generatorNotes` and `evaluatorNotes`
+- [ ] Sprint dependencies form a valid DAG (no cycles)
+- [ ] The first sprint is achievable without any prior sprint output
+- [ ] No sprint requires more than `sprint.sprintSize` worth of effort
+- [ ] All files are saved to the correct `.bober/` locations
+- [ ] The plan is achievable with the tech stack in `bober.config.json`
+- [ ] For non-web projects (smart contracts, CLI tools, libraries, etc.), sprints are adapted to the appropriate domain -- e.g., contract compilation instead of browser build, on-chain tests instead of E2E tests

package/dist/cli/commands/eval.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export interface EvalCommandOptions { // Options read by runEvalCommand.
+    verbose?: boolean; // When truthy, runEvalCommand sets logger.verbose = true.
+    sprint?: string; // Contract id to evaluate; when omitted, runEvalCommand picks a contract itself.
+}
+export declare function runEvalCommand(projectRoot: string, options: EvalCommandOptions): Promise<void>; // Evaluates one sprint contract for the project at projectRoot and prints the results; resolves with no value.
+//# sourceMappingURL=eval.d.ts.map

package/dist/cli/commands/eval.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"eval.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/eval.ts"],"names":[],"mappings":"AAgBA,MAAM,WAAW,kBAAkB;IACjC,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAID,wBAAsB,cAAc,CAClC,WAAW,EAAE,MAAM,EACnB,OAAO,EAAE,kBAAkB,GAC1B,OAAO,CAAC,IAAI,CAAC,CA2Jf"}

package/dist/cli/commands/eval.js ADDED Viewed

@@ -0,0 +1,129 @@
+import chalk from "chalk";
+import { loadConfig } from "../../config/loader.js";
+import { createHandoff } from "../../orchestrator/context-handoff.js";
+import { runEvaluatorAgent } from "../../orchestrator/evaluator-agent.js";
+import { ensureBoberDir, listContracts, loadLatestSpec, } from "../../state/index.js";
+import { getCurrentBranch, getChangedFiles } from "../../utils/git.js";
+import { logger } from "../../utils/logger.js";
+// ── Main ───────────────────────────────────────────────────────────
+export async function runEvalCommand(projectRoot, options) { // CLI "eval": evaluates one sprint contract, prints per-evaluator results, and sets process.exitCode = 1 when the evaluation does not pass.
+    if (options.verbose) {
+        logger.verbose = true; // sets the verbose flag on the imported logger
+    }
+    // Load config; on failure, log the error plus a hint to run init, then return without evaluating.
+    let config;
+    try {
+        config = await loadConfig(projectRoot);
+    }
+    catch (err) {
+        logger.error(`Failed to load config: ${err instanceof Error ? err.message : String(err)}`);
+        logger.info('Run "npx agent-bober init" to create a configuration.');
+        return; // NOTE(review): process.exitCode is not set on this or the other early-return error paths, unlike the failed-evaluation path at the end — confirm intended
+    }
+    await ensureBoberDir(projectRoot); // presumably creates the .bober state directory when missing — confirm in state/index.js
+    // Load the latest spec and the sprint contracts; a missing spec or an empty contract list aborts with an error message.
+    const spec = await loadLatestSpec(projectRoot);
+    if (!spec) {
+        logger.error("No plan found. Run 'npx agent-bober plan' first.");
+        return;
+    }
+    const contracts = await listContracts(projectRoot);
+    if (contracts.length === 0) {
+        logger.error("No sprint contracts found.");
+        return;
+    }
+    // Find the target contract: an explicit options.sprint id wins; otherwise an active sprint, else the last one listed.
+    let targetContract;
+    if (options.sprint) {
+        targetContract = contracts.find((c) => c.id === options.sprint); // exact match on the contract's id field
+        if (!targetContract) {
+            logger.error(`Sprint "${options.sprint}" not found.`);
+            logger.info(`Available sprints: ${contracts.map((c) => c.id).join(", ")}`);
+            return;
+        }
+    }
+    else {
+        // Pick the FIRST contract (in listContracts order) whose status is in-progress, evaluating, or needs-rework.
+        targetContract = contracts.find((c) => c.status === "in-progress" ||
+            c.status === "evaluating" ||
+            c.status === "needs-rework");
+        if (!targetContract) {
+            // Fall back to the last contract in the list (presumably the most recent — confirm listContracts ordering).
+            targetContract = contracts[contracts.length - 1]; // list is non-empty here (checked above)
+        }
+    }
+    logger.phase(`Evaluating: ${targetContract.feature}`); // NOTE(review): reads contract.feature / contract.id, while agents/bober-planner.md documents contractId / title — confirm against the contract schema
+    logger.sprint(targetContract.id, `Status: ${targetContract.status}`);
+    // Build project context; the branch name falls back to "unknown" when getCurrentBranch throws.
+    let currentBranch;
+    try {
+        currentBranch = await getCurrentBranch(projectRoot);
+    }
+    catch {
+        currentBranch = "unknown";
+    }
+    const projectContext = {
+        name: config.project.name,
+        type: config.project.mode,
+        techStack: spec.techStack,
+        entryPoints: [], // always passed empty from this command
+        currentBranch,
+    };
+    // Get changed files; any error from getChangedFiles is treated as "no changed files".
+    let changedFiles;
+    try {
+        changedFiles = await getChangedFiles(projectRoot);
+    }
+    catch {
+        changedFiles = [];
+    }
+    // Build the generator -> evaluator handoff; sprintHistory contains only contracts whose status is "passed".
+    const completedContracts = contracts.filter((c) => c.status === "passed");
+    const handoff = createHandoff({
+        from: "generator",
+        to: "evaluator",
+        projectContext,
+        spec,
+        currentContract: targetContract,
+        sprintHistory: completedContracts,
+        instructions: `Re-evaluate sprint: ${targetContract.feature}`,
+        changedFiles,
+    });
+    // Run evaluation; errors thrown by runEvaluatorAgent are not caught here and propagate to the caller.
+    const evaluation = await runEvaluatorAgent(handoff, projectRoot, config);
+    // Display results: a headline for the sprint, then one entry per evaluator result.
+    console.log();
+    const statusIcon = evaluation.passed
+        ? chalk.green("[PASS]")
+        : chalk.red("[FAIL]");
+    console.log(`${statusIcon} ${chalk.bold(targetContract.feature)} - Score: ${evaluation.score}/100`);
+    console.log();
+    for (const result of evaluation.results) {
+        const icon = result.passed ? chalk.green("  PASS") : chalk.red("  FAIL");
+        const scoreStr = result.score !== undefined ? ` (${result.score}/100)` : ""; // score is optional per evaluator
+        console.log(`${icon} ${chalk.bold(result.evaluator)}${scoreStr}`);
+        console.log(`       ${chalk.gray(result.summary)}`);
+        if (!result.passed) {
+            const failures = result.details.filter((d) => !d.passed);
+            for (const detail of failures.slice(0, 5)) { // print at most the first five failing details
+                const severityColor = detail.severity === "error" ? chalk.red : chalk.yellow; // "error" prints red, every other severity yellow
+                const location = detail.file
+                    ? ` at ${detail.file}${detail.line !== undefined ? `:${detail.line}` : ""}`
+                    : "";
+                console.log(`       ${severityColor(`[${detail.severity.toUpperCase()}]`)} ${detail.message}${location}`);
+            }
+            if (failures.length > 5) { // report how many failures were left out
+                console.log(chalk.gray(`       ... and ${failures.length - 5} more issues`));
+            }
+            if (result.feedback) {
+                console.log(chalk.yellow(`       Feedback: ${result.feedback.slice(0, 200)}`)); // feedback is cut to its first 200 characters
+            }
+        }
+        console.log();
+    }
+    console.log(chalk.gray(`Summary: ${evaluation.summary}`));
+    if (!evaluation.passed) {
+        process.exitCode = 1; // records a failing exit code without calling process.exit()
+    }
+}
+//# sourceMappingURL=eval.js.map

package/dist/cli/commands/eval.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"eval.js","sourceRoot":"","sources":["../../../src/cli/commands/eval.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,MAAM,OAAO,CAAC;AAE1B,OAAO,EAAE,UAAU,EAAE,MAAM,wBAAwB,CAAC;AACpD,OAAO,EAAE,aAAa,EAAE,MAAM,uCAAuC,CAAC;AAEtE,OAAO,EAAE,iBAAiB,EAAE,MAAM,uCAAuC,CAAC;AAC1E,OAAO,EACL,cAAc,EACd,aAAa,EACb,cAAc,GACf,MAAM,sBAAsB,CAAC;AAC9B,OAAO,EAAE,gBAAgB,EAAE,eAAe,EAAE,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAE,MAAM,EAAE,MAAM,uBAAuB,CAAC;AAS/C,sEAAsE;AAEtE,MAAM,CAAC,KAAK,UAAU,cAAc,CAClC,WAAmB,EACnB,OAA2B;IAE3B,IAAI,OAAO,CAAC,OAAO,EAAE,CAAC;QACpB,MAAM,CAAC,OAAO,GAAG,IAAI,CAAC;IACxB,CAAC;IAED,cAAc;IACd,IAAI,MAAM,CAAC;IACX,IAAI,CAAC;QACH,MAAM,GAAG,MAAM,UAAU,CAAC,WAAW,CAAC,CAAC;IACzC,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,MAAM,CAAC,KAAK,CACV,0BAA0B,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAC7E,CAAC;QACF,MAAM,CAAC,IAAI,CAAC,uDAAuD,CAAC,CAAC;QACrE,OAAO;IACT,CAAC;IAED,MAAM,cAAc,CAAC,WAAW,CAAC,CAAC;IAElC,0BAA0B;IAC1B,MAAM,IAAI,GAAG,MAAM,cAAc,CAAC,WAAW,CAAC,CAAC;IAC/C,IAAI,CAAC,IAAI,EAAE,CAAC;QACV,MAAM,CAAC,KAAK,CAAC,kDAAkD,CAAC,CAAC;QACjE,OAAO;IACT,CAAC;IAED,MAAM,SAAS,GAAG,MAAM,aAAa,CAAC,WAAW,CAAC,CAAC;IACnD,IAAI,SAAS,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC3B,MAAM,CAAC,KAAK,CAAC,4BAA4B,CAAC,CAAC;QAC3C,OAAO;IACT,CAAC;IAED,2BAA2B;IAC3B,IAAI,cAAc,CAAC;IACnB,IAAI,OAAO,CAAC,MAAM,EAAE,CAAC;QACnB,cAAc,GAAG,SAAS,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,EAAE,KAAK,OAAO,CAAC,MAAM,CAAC,CAAC;QAChE,IAAI,CAAC,cAAc,EAAE,CAAC;YACpB,MAAM,CAAC,KAAK,CAAC,WAAW,OAAO,CAAC,MAAM,cAAc,CAAC,CAAC;YACtD,MAAM,CAAC,IAAI,CACT,sBAAsB,SAAS,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAC9D,CAAC;YACF,OAAO;QACT,CAAC;IACH,CAAC;SAAM,CAAC;QACN,wDAAwD;QACxD,cAAc,GAAG,SAAS,CAAC,IAAI,CAC7B,CAAC,CAAC,EAAE,EAAE,CACJ,CAAC,CAAC,MAAM,KAAK,aAAa;YAC1B,CAAC,CAAC,MAAM,KAAK,YAAY;YACzB,CAAC,CAAC,MAAM,KAAK,cAAc,CAC9B,CAAC;QAEF,IAAI,CAAC,cAAc,EAAE,CAAC;YACpB,sCAAsC;YACtC,cAAc,GAAG,SAAS,CAAC,SAAS,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;QACnD,CAAC;IACH,
CAAC;IAED,MAAM,CAAC,KAAK,CAAC,eAAe,cAAc,CAAC,OAAO,EAAE,CAAC,CAAC;IACtD,MAAM,CAAC,MAAM,CAAC,cAAc,CAAC,EAAE,EAAE,WAAW,cAAc,CAAC,MAAM,EAAE,CAAC,CAAC;IAErE,wBAAwB;IACxB,IAAI,aAAqB,CAAC;IAC1B,IAAI,CAAC;QACH,aAAa,GAAG,MAAM,gBAAgB,CAAC,WAAW,CAAC,CAAC;IACtD,CAAC;IAAC,MAAM,CAAC;QACP,aAAa,GAAG,SAAS,CAAC;IAC5B,CAAC;IAED,MAAM,cAAc,GAAmB;QACrC,IAAI,EAAE,MAAM,CAAC,OAAO,CAAC,IAAI;QACzB,IAAI,EAAE,MAAM,CAAC,OAAO,CAAC,IAAI;QACzB,SAAS,EAAE,IAAI,CAAC,SAAS;QACzB,WAAW,EAAE,EAAE;QACf,aAAa;KACd,CAAC;IAEF,oBAAoB;IACpB,IAAI,YAAsB,CAAC;IAC3B,IAAI,CAAC;QACH,YAAY,GAAG,MAAM,eAAe,CAAC,WAAW,CAAC,CAAC;IACpD,CAAC;IAAC,MAAM,CAAC;QACP,YAAY,GAAG,EAAE,CAAC;IACpB,CAAC;IAED,8BAA8B;IAC9B,MAAM,kBAAkB,GAAG,SAAS,CAAC,MAAM,CACzC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,MAAM,KAAK,QAAQ,CAC7B,CAAC;IAEF,MAAM,OAAO,GAAG,aAAa,CAAC;QAC5B,IAAI,EAAE,WAAW;QACjB,EAAE,EAAE,WAAW;QACf,cAAc;QACd,IAAI;QACJ,eAAe,EAAE,cAAc;QAC/B,aAAa,EAAE,kBAAkB;QACjC,YAAY,EAAE,uBAAuB,cAAc,CAAC,OAAO,EAAE;QAC7D,YAAY;KACb,CAAC,CAAC;IAEH,iBAAiB;IACjB,MAAM,UAAU,GAAG,MAAM,iBAAiB,CACxC,OAAO,EACP,WAAW,EACX,MAAM,CACP,CAAC;IAEF,kBAAkB;IAClB,OAAO,CAAC,GAAG,EAAE,CAAC;IACd,MAAM,UAAU,GAAG,UAAU,CAAC,MAAM;QAClC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,QAAQ,CAAC;QACvB,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;IACxB,OAAO,CAAC,GAAG,CACT,GAAG,UAAU,IAAI,KAAK,CAAC,IAAI,CAAC,cAAc,CAAC,OAAO,CAAC,aAAa,UAAU,CAAC,KAAK,MAAM,CACvF,CAAC;IACF,OAAO,CAAC,GAAG,EAAE,CAAC;IAEd,KAAK,MAAM,MAAM,IAAI,UAAU,CAAC,OAAO,EAAE,CAAC;QACxC,MAAM,IAAI,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;QACzE,MAAM,QAAQ,GACZ,MAAM,CAAC,KAAK,KAAK,SAAS,CAAC,CAAC,CAAC,KAAK,MAAM,CAAC,KAAK,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC;QAC7D,OAAO,CAAC,GAAG,CAAC,GAAG,IAAI,IAAI,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,SAAS,CAAC,GAAG,QAAQ,EAAE,CAAC,CAAC;QAClE,OAAO,CAAC,GAAG,CAAC,UAAU,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;QAEpD,IAAI,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC;YACnB,MAAM,QAAQ,GAAG,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC,CAAsB,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC;Y
AC9E,KAAK,MAAM,MAAM,IAAI,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,CAAC;gBAC1C,MAAM,aAAa,GACjB,MAAM,CAAC,QAAQ,KAAK,OAAO,CAAC,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,KAAK,CAAC,MAAM,CAAC;gBACzD,MAAM,QAAQ,GAAG,MAAM,CAAC,IAAI;oBAC1B,CAAC,CAAC,OAAO,MAAM,CAAC,IAAI,GAAG,MAAM,CAAC,IAAI,KAAK,SAAS,CAAC,CAAC,CAAC,IAAI,MAAM,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC,EAAE,EAAE;oBAC3E,CAAC,CAAC,EAAE,CAAC;gBACP,OAAO,CAAC,GAAG,CACT,UAAU,aAAa,CAAC,IAAI,MAAM,CAAC,QAAQ,CAAC,WAAW,EAAE,GAAG,CAAC,IAAI,MAAM,CAAC,OAAO,GAAG,QAAQ,EAAE,CAC7F,CAAC;YACJ,CAAC;YACD,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBACxB,OAAO,CAAC,GAAG,CACT,KAAK,CAAC,IAAI,CAAC,kBAAkB,QAAQ,CAAC,MAAM,GAAG,CAAC,cAAc,CAAC,CAChE,CAAC;YACJ,CAAC;YAED,IAAI,MAAM,CAAC,QAAQ,EAAE,CAAC;gBACpB,OAAO,CAAC,GAAG,CAAC,KAAK,CAAC,MAAM,CAAC,oBAAoB,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC;YACjF,CAAC;QACH,CAAC;QACD,OAAO,CAAC,GAAG,EAAE,CAAC;IAChB,CAAC;IAED,OAAO,CAAC,GAAG,CAAC,KAAK,CAAC,IAAI,CAAC,YAAY,UAAU,CAAC,OAAO,EAAE,CAAC,CAAC,CAAC;IAE1D,IAAI,CAAC,UAAU,CAAC,MAAM,EAAE,CAAC;QACvB,OAAO,CAAC,QAAQ,GAAG,CAAC,CAAC;IACvB,CAAC;AACH,CAAC"}

package/dist/cli/commands/init.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+export interface InitCommandOptions { // Options accepted by runInitCommand.
+    preset?: string; // Optional preset name — presumably one of the templates/presets/* directories; confirm in init.js.
+}
+export declare function runInitCommand(projectRoot: string, options?: InitCommandOptions): Promise<void>; // Runs the init command for the project at projectRoot; options may be omitted. Resolves with no value.
+//# sourceMappingURL=init.d.ts.map

package/dist/cli/commands/init.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"init.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/init.ts"],"names":[],"mappings":"AAwPA,MAAM,WAAW,kBAAkB;IACjC,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,wBAAsB,cAAc,CAClC,WAAW,EAAE,MAAM,EACnB,OAAO,GAAE,kBAAuB,GAC/B,OAAO,CAAC,IAAI,CAAC,CAyEf"}