npm - @event4u/agent-config - Versions diffs - 1.14.0 → 1.16.0 - Mend

@event4u/agent-config 1.14.0 → 1.16.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (293) hide show

package/.agent-src/commands/agent-handoff.md +1 -1
package/.agent-src/commands/bug-fix.md +3 -3
package/.agent-src/commands/bug-investigate.md +2 -2
package/.agent-src/commands/chat-history-checkpoint.md +3 -3
package/.agent-src/commands/chat-history-clear.md +2 -2
package/.agent-src/commands/chat-history-resume.md +2 -2
package/.agent-src/commands/chat-history.md +3 -3
package/.agent-src/commands/check-current-md.md +44 -33
package/.agent-src/commands/commit-in-chunks.md +43 -23
package/.agent-src/commands/compress.md +34 -2
package/.agent-src/commands/council-design.md +96 -0
package/.agent-src/commands/council-optimize.md +115 -0
package/.agent-src/commands/council-pr.md +123 -0
package/.agent-src/commands/council.md +219 -0
package/.agent-src/commands/create-pr.md +23 -0
package/.agent-src/commands/do-and-judge.md +3 -3
package/.agent-src/commands/do-in-steps.md +4 -4
package/.agent-src/commands/e2e-heal.md +1 -1
package/.agent-src/commands/e2e-plan.md +1 -1
package/.agent-src/commands/feature-dev.md +8 -0
package/.agent-src/commands/feature-explore.md +6 -1
package/.agent-src/commands/feature-plan.md +33 -2
package/.agent-src/commands/feature-refactor.md +5 -0
package/.agent-src/commands/feature-roadmap.md +8 -3
package/.agent-src/commands/feature.md +58 -0
package/.agent-src/commands/fix-ci.md +5 -0
package/.agent-src/commands/fix-portability.md +7 -2
package/.agent-src/commands/fix-pr-bot-comments.md +5 -0
package/.agent-src/commands/fix-pr-comments.md +5 -0
package/.agent-src/commands/fix-pr-developer-comments.md +5 -0
package/.agent-src/commands/fix-references.md +5 -0
package/.agent-src/commands/fix-seeder.md +5 -0
package/.agent-src/commands/fix.md +60 -0
package/.agent-src/commands/jira-ticket.md +1 -1
package/.agent-src/commands/judge.md +1 -1
package/.agent-src/commands/memory-add.md +3 -3
package/.agent-src/commands/memory-full.md +2 -2
package/.agent-src/commands/memory-promote.md +2 -2
package/.agent-src/commands/mode.md +5 -5
package/.agent-src/commands/onboard.md +17 -8
package/.agent-src/commands/optimize-agents.md +6 -1
package/.agent-src/commands/optimize-augmentignore.md +14 -0
package/.agent-src/commands/optimize-rtk-filters.md +5 -0
package/.agent-src/commands/optimize-skills.md +6 -1
package/.agent-src/commands/optimize.md +54 -0
package/.agent-src/commands/propose-memory.md +2 -2
package/.agent-src/commands/refine-ticket.md +9 -7
package/.agent-src/commands/review-changes.md +61 -9
package/.agent-src/commands/review-routing.md +1 -1
package/.agent-src/commands/roadmap-create.md +42 -4
package/.agent-src/commands/roadmap-execute.md +9 -7
package/.agent-src/commands/set-cost-profile.md +11 -3
package/.agent-src/commands/sync-agent-settings.md +11 -2
package/.agent-src/commands/tests-create.md +1 -1
package/.agent-src/commands/tests-execute.md +2 -3
package/.agent-src/commands/upstream-contribute.md +1 -1
package/.agent-src/contexts/authority/commit-mechanics.md +57 -0
package/.agent-src/contexts/authority/destructive-mechanics.md +66 -0
package/.agent-src/contexts/authority/scope-mechanics.md +87 -0
package/.agent-src/contexts/execution/autonomy-detection.md +54 -0
package/.agent-src/contexts/execution/autonomy-examples.md +90 -0
package/.agent-src/contexts/execution/autonomy-mechanics.md +29 -0
package/.agent-src/contexts/execution/verification-mechanics.md +80 -0
package/.agent-src/personas/README.md +1 -1
package/.agent-src/rules/agent-authority.md +24 -0
package/.agent-src/rules/architecture.md +1 -1
package/.agent-src/rules/artifact-drafting-protocol.md +1 -1
package/.agent-src/rules/artifact-engagement-recording.md +2 -2
package/.agent-src/rules/ask-when-uncertain.md +1 -1
package/.agent-src/rules/augment-portability.md +56 -37
package/.agent-src/rules/autonomous-execution.md +78 -114
package/.agent-src/rules/capture-learnings.md +1 -1
package/.agent-src/rules/chat-history-cadence.md +109 -0
package/.agent-src/rules/chat-history-ownership.md +123 -0
package/.agent-src/rules/chat-history-visibility.md +96 -0
package/.agent-src/rules/cli-output-handling.md +1 -1
package/.agent-src/rules/{command-suggestion.md → command-suggestion-policy.md} +10 -9
package/.agent-src/rules/commit-conventions.md +1 -1
package/.agent-src/rules/commit-policy.md +43 -61
package/.agent-src/rules/context-hygiene.md +3 -3
package/.agent-src/rules/direct-answers.md +2 -2
package/.agent-src/rules/docs-sync.md +1 -1
package/.agent-src/rules/e2e-testing.md +1 -1
package/.agent-src/rules/guidelines.md +4 -4
package/.agent-src/rules/improve-before-implement.md +2 -2
package/.agent-src/rules/language-and-tone.md +41 -96
package/.agent-src/rules/minimal-safe-diff.md +3 -3
package/.agent-src/rules/model-recommendation.md +4 -4
package/.agent-src/rules/no-cheap-questions.md +89 -0
package/.agent-src/rules/non-destructive-by-default.md +25 -59
package/.agent-src/rules/onboarding-gate.md +5 -5
package/.agent-src/rules/review-routing-awareness.md +9 -9
package/.agent-src/rules/roadmap-progress-sync.md +132 -80
package/.agent-src/rules/role-mode-adherence.md +3 -3
package/.agent-src/rules/scope-control.md +65 -46
package/.agent-src/rules/security-sensitive-stop.md +2 -2
package/.agent-src/rules/size-enforcement.md +3 -2
package/.agent-src/rules/think-before-action.md +5 -5
package/.agent-src/rules/token-efficiency.md +4 -4
package/.agent-src/rules/{ui-audit-before-build.md → ui-audit-gate.md} +3 -3
package/.agent-src/rules/user-interaction.md +31 -7
package/.agent-src/rules/verify-before-complete.md +12 -67
package/.agent-src/scripts/update_roadmap_progress.py +65 -8
package/.agent-src/skills/ai-council/SKILL.md +333 -0
package/.agent-src/skills/api-endpoint/SKILL.md +2 -2
package/.agent-src/skills/blade-ui/SKILL.md +30 -11
package/.agent-src/skills/blast-radius-analyzer/SKILL.md +1 -1
package/.agent-src/skills/bug-analyzer/SKILL.md +1 -1
package/.agent-src/skills/command-routing/SKILL.md +1 -1
package/.agent-src/skills/command-writing/SKILL.md +16 -5
package/.agent-src/skills/conventional-commits-writing/SKILL.md +1 -1
package/.agent-src/skills/copilot-agents-optimization/SKILL.md +2 -2
package/.agent-src/skills/developer-like-execution/SKILL.md +2 -2
package/.agent-src/skills/existing-ui-audit/SKILL.md +24 -9
package/.agent-src/skills/fe-design/SKILL.md +20 -15
package/.agent-src/skills/file-editor/SKILL.md +9 -0
package/.agent-src/skills/flux/SKILL.md +1 -1
package/.agent-src/skills/git-workflow/SKILL.md +1 -1
package/.agent-src/skills/guideline-writing/SKILL.md +11 -11
package/.agent-src/skills/learning-to-rule-or-skill/SKILL.md +4 -4
package/.agent-src/skills/livewire/SKILL.md +27 -8
package/.agent-src/skills/override-management/SKILL.md +2 -2
package/.agent-src/skills/php-coder/SKILL.md +1 -1
package/.agent-src/skills/playwright-testing/SKILL.md +2 -2
package/.agent-src/skills/readme-reviewer/SKILL.md +1 -1
package/.agent-src/skills/readme-writing/SKILL.md +1 -1
package/.agent-src/skills/readme-writing-package/SKILL.md +1 -1
package/.agent-src/skills/receiving-code-review/SKILL.md +1 -1
package/.agent-src/skills/refine-ticket/SKILL.md +30 -24
package/.agent-src/skills/review-routing/SKILL.md +2 -2
package/.agent-src/skills/roadmap-management/SKILL.md +22 -16
package/.agent-src/skills/rule-writing/SKILL.md +1 -1
package/.agent-src/skills/skill-reviewer/SKILL.md +1 -1
package/.agent-src/skills/skill-writing/SKILL.md +6 -6
package/.agent-src/skills/subagent-orchestration/SKILL.md +1 -0
package/.agent-src/skills/systematic-debugging/SKILL.md +1 -1
package/.agent-src/skills/upstream-contribute/SKILL.md +3 -3
package/.agent-src/skills/validate-feature-fit/SKILL.md +2 -2
package/.agent-src/skills/{verify-before-complete → verify-completion-evidence}/SKILL.md +2 -2
package/.agent-src/templates/agent-settings.md +9 -9
package/.agent-src/templates/contexts/auth-model.md +1 -1
package/.agent-src/templates/roadmaps.md +9 -8
package/.agent-src/templates/scripts/README.md +2 -2
package/.agent-src/templates/scripts/memory_lookup.py +1 -1
package/.agent-src/templates/scripts/telemetry/aggregator.py +16 -1
package/.agent-src/templates/scripts/telemetry/engagement.py +59 -0
package/.agent-src/templates/scripts/telemetry/report_renderer.py +28 -1
package/.agent-src/templates/scripts/telemetry_record.py +14 -1
package/.agent-src/templates/scripts/work_engine/__init__.py +2 -2
package/.agent-src/templates/scripts/work_engine/cli.py +64 -461
package/.agent-src/templates/scripts/work_engine/cli_args.py +116 -0
package/.agent-src/templates/scripts/work_engine/delivery_state.py +3 -3
package/.agent-src/templates/scripts/work_engine/directives/backend/__init__.py +1 -1
package/.agent-src/templates/scripts/work_engine/directives/backend/implement.py +1 -1
package/.agent-src/templates/scripts/work_engine/directives/backend/memory.py +1 -1
package/.agent-src/templates/scripts/work_engine/directives/backend/plan.py +1 -1
package/.agent-src/templates/scripts/work_engine/directives/backend/report.py +1 -1
package/.agent-src/templates/scripts/work_engine/dispatcher.py +1 -1
package/.agent-src/templates/scripts/work_engine/emitters.py +43 -0
package/.agent-src/templates/scripts/work_engine/errors.py +19 -0
package/.agent-src/templates/scripts/work_engine/hook_bootstrap.py +76 -0
package/.agent-src/templates/scripts/work_engine/input_builders.py +163 -0
package/.agent-src/templates/scripts/work_engine/migration/v0_to_v1.py +34 -2
package/.agent-src/templates/scripts/work_engine/persona_policy.py +1 -1
package/.agent-src/templates/scripts/work_engine/resolvers/prompt.py +1 -1
package/.agent-src/templates/scripts/work_engine/state_io.py +202 -0
package/.claude-plugin/marketplace.json +10 -2
package/AGENTS.md +16 -12
package/CHANGELOG.md +206 -9
package/README.md +51 -52
package/config/agent-settings.template.yml +58 -1
package/config/gitignore-block.txt +3 -0
package/docs/MIGRATION.md +122 -0
package/docs/architecture.md +83 -34
package/docs/catalog.md +331 -0
package/docs/contracts/STABILITY.md +134 -0
package/docs/contracts/adr-chat-history-split.md +132 -0
package/docs/contracts/adr-command-suggestion.md +146 -0
package/docs/contracts/adr-implement-ticket-runtime.md +122 -0
package/docs/contracts/adr-product-ui-track.md +384 -0
package/docs/contracts/adr-prompt-driven-execution.md +187 -0
package/docs/contracts/agent-memory-contract.md +149 -0
package/docs/contracts/artifact-engagement-flow.md +262 -0
package/docs/contracts/command-clusters.md +126 -0
package/docs/contracts/command-suggestion-flow.md +148 -0
package/docs/contracts/implement-ticket-flow.md +628 -0
package/docs/contracts/linear-ai-rules-inclusion.md +143 -0
package/docs/contracts/linear-ai-three-layers.md +131 -0
package/docs/contracts/load-context-schema.md +186 -0
package/docs/contracts/rule-interactions.md +107 -0
package/docs/contracts/rule-interactions.yml +238 -0
package/docs/contracts/rule-priority-hierarchy.md +87 -0
package/docs/contracts/ui-stack-extension.md +236 -0
package/docs/contracts/ui-track-flow.md +338 -0
package/docs/customization.md +14 -0
package/docs/end-to-end-walkthroughs.md +165 -0
package/docs/getting-started.md +27 -9
package/docs/github-topics.md +12 -3
package/docs/guidelines/agent-infra/language-and-tone-examples.md +79 -0
package/{.agent-src → docs}/guidelines/docs/readme-size-and-splitting.md +26 -25
package/docs/guidelines/php/git.md +164 -0
package/docs/installation.md +42 -6
package/docs/migrations/commands-1.15.0.md +112 -0
package/docs/showcase.md +9 -4
package/docs/skills-catalog.md +14 -8
package/docs/ui-track-mental-model.md +121 -0
package/llms.txt +13 -7
package/package.json +1 -1
package/scripts/agent-config +23 -0
package/scripts/ai_council/__init__.py +39 -0
package/scripts/ai_council/_default_prices.py +41 -0
package/scripts/ai_council/_one_off_rebalancing_audit.py +149 -0
package/scripts/ai_council/_one_off_roundtrip.py +106 -0
package/scripts/ai_council/budget_guard.py +172 -0
package/scripts/ai_council/bundler.py +261 -0
package/scripts/ai_council/clients.py +381 -0
package/scripts/ai_council/modes.py +127 -0
package/scripts/ai_council/orchestrator.py +350 -0
package/scripts/ai_council/pricing.py +213 -0
package/scripts/ai_council/project_context.py +159 -0
package/scripts/ai_council/prompts.py +232 -0
package/scripts/ai_council/session.py +144 -0
package/scripts/build_linear_digest.py +4 -4
package/scripts/check_always_budget.py +126 -0
package/scripts/check_augmentignore.py +69 -0
package/scripts/check_command_count_messaging.py +120 -0
package/scripts/check_portability.py +57 -0
package/scripts/check_public_catalog_links.py +122 -0
package/scripts/check_public_links.py +185 -0
package/scripts/check_references.py +5 -1
package/scripts/check_roadmap_trackable.py +111 -0
package/scripts/command_suggester/cooldown.py +1 -1
package/scripts/generate_index.py +266 -0
package/scripts/install_anthropic_key.sh +5 -0
package/scripts/install_openai_key.sh +106 -0
package/scripts/lint_load_context.py +163 -0
package/scripts/lint_no_new_atomic_commands.py +179 -0
package/scripts/lint_rule_interactions.py +149 -0
package/scripts/memory_lookup.py +1 -1
package/scripts/release.py +297 -64
package/scripts/schemas/command.schema.json +20 -0
package/scripts/schemas/rule.schema.json +10 -0
package/scripts/skill_linter.py +26 -4
package/scripts/sync_agent_settings.py +1 -1
package/scripts/update_counts.py +19 -4
package/scripts/update_prices.py +124 -0
package/.agent-src/guidelines/php/git.md +0 -96
package/.agent-src/rules/chat-history.md +0 -200
/package/.agent-src/rules/{slash-commands.md → slash-command-routing-policy.md} +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/agent-interaction-and-decision-quality.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/break-glass-usage.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/developer-judgment.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/engineering-memory-data-format.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/layered-settings.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/memory-access.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/naming.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/output-patterns.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/review-routing-data-format.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/role-contracts.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/role-mode-router.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/runtime-layer.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/self-improvement-pipeline.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/size-and-scope.md +0 -0
/package/{.agent-src → docs}/guidelines/agent-infra/tool-integration.md +0 -0
/package/{.agent-src → docs}/guidelines/e2e/playwright.md +0 -0
/package/{.agent-src → docs}/guidelines/php/api-design.md +0 -0
/package/{.agent-src → docs}/guidelines/php/artisan-commands.md +0 -0
/package/{.agent-src → docs}/guidelines/php/blade-ui.md +0 -0
/package/{.agent-src → docs}/guidelines/php/controllers.md +0 -0
/package/{.agent-src → docs}/guidelines/php/database.md +0 -0
/package/{.agent-src → docs}/guidelines/php/eloquent.md +0 -0
/package/{.agent-src → docs}/guidelines/php/flux.md +0 -0
/package/{.agent-src → docs}/guidelines/php/general.md +0 -0
/package/{.agent-src → docs}/guidelines/php/jobs.md +0 -0
/package/{.agent-src → docs}/guidelines/php/livewire.md +0 -0
/package/{.agent-src → docs}/guidelines/php/logging.md +0 -0
/package/{.agent-src → docs}/guidelines/php/naming.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/dependency-injection.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/dtos.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/events.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/factory.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/pipelines.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/policies.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/repositories.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/service-layer.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns/strategy.md +0 -0
/package/{.agent-src → docs}/guidelines/php/patterns.md +0 -0
/package/{.agent-src → docs}/guidelines/php/performance.md +0 -0
/package/{.agent-src → docs}/guidelines/php/resources.md +0 -0
/package/{.agent-src → docs}/guidelines/php/security.md +0 -0
/package/{.agent-src → docs}/guidelines/php/sql.md +0 -0
/package/{.agent-src → docs}/guidelines/php/validations.md +0 -0
/package/{.agent-src → docs}/guidelines/php/websocket.md +0 -0

package/scripts/ai_council/orchestrator.py ADDED Viewed

@@ -0,0 +1,350 @@
+"""Council orchestrator — fan out one question to multiple members.
+v2 contract (sequential + interactive overrun prompt):
+- Members are called **sequentially** in input order. The previous
+  parallel ThreadPoolExecutor was traded for predictable mid-flow
+  user prompts; with 2-3 council members the latency cost is small.
+- `estimate(question, members, table)` returns a pre-call cost preview
+  (input tokens + max-output ceiling + USD per member). The host
+  agent shows this before invoking `consult()`.
+- `consult(..., on_overrun=...)` invokes the callback BEFORE each
+  member's actual API call when the projected total cost would push
+  past the cost budget. The callback decides whether to proceed for
+  this single member; the next member triggers the callback again.
+Failure normalisation (one member's exception → `error`-set
+CouncilResponse, never raise) is unchanged.
+"""
+from __future__ import annotations
+from dataclasses import dataclass
+from typing import Callable
+from scripts.ai_council.budget_guard import (
+    record_spend as _record_daily_spend,
+    today_spend_usd as _today_spend_usd,
+    would_exceed as _would_exceed_daily,
+)
+from scripts.ai_council.clients import CouncilResponse, ExternalAIClient
+from scripts.ai_council.pricing import (
+    CostEstimate,
+    PriceTable,
+    estimate_cost,
+    estimate_input_tokens,
+)
+from scripts.ai_council.project_context import ProjectContext
+from scripts.ai_council.prompts import system_prompt_for
+@dataclass
+class CostBudget:
+    """Spending caps applied while a question is fanned out to the council.
+
+    `consult()` builds a default instance when the caller passes no budget.
+    Token and USD totals are compared against these caps before each
+    billable member is called.
+    """
+    # Cap on cumulative input tokens (already spent + projected next call).
+    max_input_tokens: int = 50_000
+    # Cap on cumulative output tokens (already spent + projected next call).
+    max_output_tokens: int = 20_000
+    # `consult()` raises ValueError when the member list is longer than this.
+    max_calls: int = 10
+    max_total_usd: float = 0.0  # 0 = USD ceiling disabled (token caps still apply)
+    daily_limit_usd: float = 0.0  # 0 = rolling 24h cap disabled (D3)
+@dataclass
+class CouncilQuestion:
+    """One question put to the council: a mode plus the artefact text.
+
+    `mode` selects the system prompt (it is passed to `system_prompt_for`);
+    `user_prompt` and `max_tokens` are handed to each member's `ask()` call.
+    """
+    mode: str  # one of: prompt, roadmap, diff, files
+    user_prompt: str  # bundled artefact text
+    # Also used as the output-token figure when estimating cost up front.
+    max_tokens: int = 1024
+@dataclass
+class OverrunEvent:
+    """Passed to `on_overrun` when projected spend exceeds the budget.
+
+    Built just before a billable member would be called, so every
+    `spent_*` field describes totals that exclude that member.
+    """
+    member_index: int  # position of the member in the `members` list
+    member: ExternalAIClient
+    next_estimate: CostEstimate  # this member's projected cost
+    spent_input_tokens: int  # already-billed totals BEFORE this member
+    spent_output_tokens: int
+    spent_usd: float
+    projected_total_usd: float  # spent_usd + next_estimate.total_usd
+    daily_spent_usd: float = 0.0  # rolling 24h spend BEFORE this member (D3)
+    daily_limit_usd: float = 0.0  # the configured daily cap (0 = disabled)
+    # When several caps are breached at once, "tokens" is reported in
+    # preference to "daily", and "daily" in preference to "session".
+    breach_kind: str = "session"  # "session" | "daily" | "tokens"
+# Callback signature: receives the OverrunEvent for the member that is about
+# to be called. Return True to proceed with that call, or False to skip the
+# member (its slot in the results is then filled with an error-tagged response).
+OnOverrunCallback = Callable[[OverrunEvent], bool]
+def estimate(
+    question: CouncilQuestion,
+    members: list[ExternalAIClient],
+    table: PriceTable,
+    *,
+    project: ProjectContext | None = None,
+    original_ask: str = "",
+) -> list[CostEstimate]:
+    """Return a pre-call cost estimate per member, in input order.
+    `project` and `original_ask` are passed through to
+    `system_prompt_for()` so the estimate covers the handoff preamble
+    bytes too. Both default to v1-shape (no preamble extension).
+    """
+    sys_prompt = system_prompt_for(
+        question.mode, project=project, original_ask=original_ask,
+    )
+    input_tokens = estimate_input_tokens(question.user_prompt) + estimate_input_tokens(sys_prompt)
+    return [
+        estimate_cost(m.name, m.model, input_tokens, question.max_tokens, table)
+        for m in members
+    ]
+def consult(
+    members: list[ExternalAIClient],
+    question: CouncilQuestion,
+    budget: CostBudget | None = None,
+    *,
+    table: PriceTable | None = None,
+    on_overrun: OnOverrunCallback | None = None,
+    project: ProjectContext | None = None,
+    original_ask: str = "",
+    rounds: int = 1,
+    on_round_complete: Callable[[int, list[CouncilResponse]], None] | None = None,
+) -> list[CouncilResponse]:
+    """Sequentially fan out `question` to every enabled member.
+    - If `table` is provided, USD spend is tracked against
+      `budget.max_total_usd` (when > 0). Without `table`, only the
+      token caps apply (back-compat with v1 callers).
+    - When the projected next-member spend would breach any cap,
+      `on_overrun` is consulted. Returning False marks that member as
+      `cost_budget_exceeded`; True proceeds with the call.
+    - Without `on_overrun`, breaching caps short-circuits remaining
+      members with `cost_budget_exceeded` (v1 behaviour preserved).
+    - `project` + `original_ask` flow into `handoff_preamble()` so the
+      council member receives a neutral context-handoff alongside the
+      artefact. Both default to v1 shape (no preamble extension).
+    - `rounds >= 2` enables multi-round debate (D1). Each subsequent
+      round augments the user prompt with anonymised prior-round
+      responses (provider/model identity stripped). Token + USD caps
+      accumulate across rounds. Returns the FINAL round's responses;
+      use `on_round_complete(round_idx, responses)` to capture
+      intermediate rounds.
+    """
+    if rounds < 1:
+        raise ValueError(f"rounds must be >= 1 (got {rounds})")
+    if not members:
+        return []
+    budget = budget or CostBudget()
+    if len(members) > budget.max_calls:
+        raise ValueError(
+            f"Council has {len(members)} members but budget caps at "
+            f"{budget.max_calls} calls."
+        )
+    spent: dict[str, float] = {"input": 0, "output": 0, "usd": 0.0}
+    last_results: list[CouncilResponse] = []
+    current_user_prompt = question.user_prompt
+    for round_idx in range(rounds):
+        round_question = (
+            question if round_idx == 0
+            else CouncilQuestion(
+                mode=question.mode,
+                user_prompt=current_user_prompt,
+                max_tokens=question.max_tokens,
+            )
+        )
+        last_results = _run_round(
+            members, round_question, budget, spent,
+            table=table, on_overrun=on_overrun,
+            project=project, original_ask=original_ask,
+        )
+        if on_round_complete is not None:
+            on_round_complete(round_idx, last_results)
+        if round_idx + 1 < rounds:
+            current_user_prompt = _augment_for_next_round(
+                question.user_prompt, last_results, round_idx + 2,
+            )
+    return last_results
+def _run_round(
+    members: list[ExternalAIClient],
+    question: CouncilQuestion,
+    budget: CostBudget,
+    spent: dict[str, float],
+    *,
+    table: PriceTable | None,
+    on_overrun: OnOverrunCallback | None,
+    project: ProjectContext | None,
+    original_ask: str,
+) -> list[CouncilResponse]:
+    """Run a single round; mutate `spent` with cumulative totals.
+
+    Members are asked in list order and the result list holds exactly one
+    response per member, in that same order. An exception raised by a
+    member's `ask()` is converted into a response whose `error` is set.
+
+    `spent` carries the keys "input", "output" and "usd" and is updated in
+    place after every call, so the caller sees the running totals.
+
+    Before each billable member is called, the projected totals are
+    compared against `budget`. On a breach, `on_overrun` decides whether
+    to proceed; if there is no callback (or no price table to build an
+    estimate from), this member and all remaining ones are marked as
+    aborted and the round ends.
+    """
+    system_prompt = system_prompt_for(
+        question.mode, project=project, original_ask=original_ask,
+    )
+    results: list[CouncilResponse] = []
+    # Without a price table there is nothing to project: the gate below
+    # then only compares tokens that were already spent against the caps.
+    estimates = (
+        estimate(question, members, table, project=project, original_ask=original_ask)
+        if table is not None
+        else None
+    )
+    for idx, member in enumerate(members):
+        # ── non-billable members skip the cost gate entirely ─────────
+        # ManualClient (and future PlaywrightClient) cost us $0; their
+        # token counts are still tracked from the response below for
+        # observability, but no projection / budget breach can apply.
+        if not getattr(member, "billable", True):
+            try:
+                response = member.ask(system_prompt, question.user_prompt, question.max_tokens)
+            except Exception as exc:  # noqa: BLE001 - last-resort safety net
+                response = CouncilResponse(
+                    provider=member.name, model=member.model, text="",
+                    error=f"{type(exc).__name__}: {exc}",
+                )
+            results.append(response)
+            spent["input"] += response.input_tokens
+            spent["output"] += response.output_tokens
+            continue
+        # ── projected spend check ────────────────────────────────────
+        proj_input = spent["input"] + (estimates[idx].input_tokens if estimates else 0)
+        proj_output = spent["output"] + (estimates[idx].output_tokens if estimates else 0)
+        proj_usd = spent["usd"] + (estimates[idx].total_usd if estimates else 0.0)
+        next_call_usd = estimates[idx].total_usd if estimates else 0.0
+        breaches_tokens = (
+            proj_input > budget.max_input_tokens
+            or proj_output > budget.max_output_tokens
+        )
+        breaches_usd = budget.max_total_usd > 0 and proj_usd > budget.max_total_usd
+        breaches_daily = (
+            budget.daily_limit_usd > 0
+            and _would_exceed_daily(budget.daily_limit_usd, next_call_usd)
+        )
+        if breaches_tokens or breaches_usd or breaches_daily:
+            # Only one kind is reported; precedence is tokens, then
+            # daily, then session.
+            breach_kind = (
+                "tokens" if breaches_tokens
+                else "daily" if breaches_daily
+                else "session"
+            )
+            error_tag = (
+                "daily_budget_exceeded" if breach_kind == "daily"
+                else "cost_budget_exceeded"
+            )
+            # The event needs this member's estimate, so the callback is
+            # only consulted when a price table was supplied.
+            if on_overrun is not None and estimates is not None:
+                event = OverrunEvent(
+                    member_index=idx,
+                    member=member,
+                    next_estimate=estimates[idx],
+                    spent_input_tokens=int(spent["input"]),
+                    spent_output_tokens=int(spent["output"]),
+                    spent_usd=spent["usd"],
+                    projected_total_usd=proj_usd,
+                    daily_spent_usd=(
+                        _today_spend_usd() if budget.daily_limit_usd > 0 else 0.0
+                    ),
+                    daily_limit_usd=budget.daily_limit_usd,
+                    breach_kind=breach_kind,
+                )
+                if not on_overrun(event):
+                    # Declined: skip this member only; later members are
+                    # still evaluated (and may trigger the callback again).
+                    results.append(_aborted(member, error_tag))
+                    continue
+                # Approved: fall through to the actual call below.
+            else:
+                # v1 behaviour: short-circuit all remaining members.
+                for left in members[idx:]:
+                    results.append(_aborted(left, error_tag))
+                return results
+        # ── actual call ──────────────────────────────────────────────
+        try:
+            response = member.ask(system_prompt, question.user_prompt, question.max_tokens)
+        except Exception as exc:  # noqa: BLE001 - last-resort safety net
+            response = CouncilResponse(
+                provider=member.name, model=member.model, text="",
+                error=f"{type(exc).__name__}: {exc}",
+            )
+        results.append(response)
+        spent["input"] += response.input_tokens
+        spent["output"] += response.output_tokens
+        if estimates is not None and table is not None:
+            # Bill the actual output against the budget using the
+            # member's per-1M output rate. Re-use estimate_cost with
+            # the *real* token count.
+            actual = estimate_cost(
+                member.name, member.model,
+                response.input_tokens, response.output_tokens, table,
+            )
+            spent["usd"] += actual.total_usd
+            # Persist to the rolling 24h ledger when the daily cap is
+            # active. Errors are swallowed inside record_spend.
+            # Responses that carry an error are not written to the ledger.
+            if budget.daily_limit_usd > 0 and not response.error:
+                _record_daily_spend(
+                    actual.total_usd, member.name, member.model,
+                )
+    return results
+def _aborted(member: ExternalAIClient, reason: str) -> CouncilResponse:
+    return CouncilResponse(
+        provider=member.name, model=member.model, text="", error=reason,
+    )
+def _augment_for_next_round(
+    original_prompt: str,
+    prior_responses: list[CouncilResponse],
+    next_round_number: int,
+) -> str:
+    """Build the round-N user prompt: original artefact + anonymised prior round.
+    Provider/model identifiers are stripped (Iron Law of Neutrality §
+    multi-round). Reviewers are labelled "Reviewer A / B / C…" in the
+    order they appeared. Errors are skipped — they reveal nothing
+    useful and can leak provider error formats.
+    """
+    blocks: list[str] = []
+    label_idx = 0
+    for r in prior_responses:
+        if r.error or not r.text.strip():
+            continue
+        label = chr(ord("A") + label_idx)
+        label_idx += 1
+        blocks.append(f"### Reviewer {label}\n\n{r.text.strip()}")
+    if not blocks:
+        return original_prompt
+    prior_block = "\n\n".join(blocks)
+    return (
+        f"{original_prompt}\n\n"
+        f"---\n\n"
+        f"## Prior round critiques (round {next_round_number - 1})\n\n"
+        f"You are now in round {next_round_number}. Below are anonymised\n"
+        f"critiques from independent reviewers in the previous round.\n"
+        f"You do NOT know which model produced which critique. Read them,\n"
+        f"then respond with:\n\n"
+        f"1. Which prior points you agree with (cite reviewer label).\n"
+        f"2. Which you disagree with and why.\n"
+        f"3. New points or refinements not raised in round 1.\n\n"
+        f"{prior_block}"
+    )
+def render(responses: list[CouncilResponse]) -> str:
+    """Render stacked sections + a Convergence/Divergence summary slot."""
+    blocks: list[str] = []
+    for r in responses:
+        header = f"## {r.provider} · {r.model}"
+        if r.error:
+            blocks.append(f"{header}\n\n*ERROR:* `{r.error}`")
+            continue
+        meta = (
+            f"*tokens: {r.input_tokens} in / {r.output_tokens} out · "
+            f"{r.latency_ms} ms*"
+        )
+        blocks.append(f"{header}\n\n{meta}\n\n{r.text}")
+    blocks.append("## Convergence / Divergence\n\n*to be summarised by the host agent*")
+    return "\n\n---\n\n".join(blocks)

package/scripts/ai_council/pricing.py ADDED Viewed

@@ -0,0 +1,213 @@
+"""Runtime pricing layer for the AI Council.
+Reads `.agent-prices.md` from the repo root, parses YAML frontmatter
+and the Markdown table, and exposes:
+- `load_prices()`           — parse `.agent-prices.md` (bootstraps if missing)
+- `estimate_input_tokens()` — chars / 4 heuristic
+- `estimate_cost()`         — input + output USD for a single member
+- `is_stale()`              — True if `last_updated` is older than the
+                              most recent UTC Monday 00:00
+- `bootstrap_from_defaults()` — write a fresh `.agent-prices.md` from
+                              `_default_prices.DEFAULT_PRICES`
+The orchestrator never reads `_default_prices` directly. It always
+goes through `load_prices()` so user edits to `.agent-prices.md` win.
+"""
+from __future__ import annotations
+import datetime as _dt
+from dataclasses import dataclass
+from pathlib import Path
+from scripts.ai_council._default_prices import DEFAULT_PRICES, LAST_UPDATED, as_rows
# Third ancestor of this module's resolved path; the prices file lives there.
REPO_ROOT = Path(__file__).resolve().parents[2]
PRICES_FILE = REPO_ROOT.joinpath(".agent-prices.md")

# Token estimate heuristic: roughly four characters of English text per
# token. OpenAI's tiktoken would be more accurate, but it is a heavy
# dependency that is deliberately avoided here.
_CHARS_PER_TOKEN = 4
@dataclass
class Price:
    """Price entry for one ``(provider, model)`` pair.

    The two rates are named as USD per one million tokens, separately for
    input and output.
    """

    # Identity of the priced model.
    provider: str
    model: str
    # Rates per one million tokens.
    input_per_1m_usd: float
    output_per_1m_usd: float
@dataclass
class PriceTable:
    """Metadata fields plus the per-model prices of one price table."""

    last_updated: str  # YYYY-MM-DD
    currency: str
    unit: str  # "per_1M_tokens"
    source: str
    # Entries keyed by (provider, model).
    prices: dict[tuple[str, str], Price]

    def lookup(self, provider: str, model: str) -> Price | None:
        """Return the entry stored for ``(provider, model)``, or ``None`` if absent."""
        key = (provider, model)
        return self.prices.get(key)
@dataclass
class CostEstimate:
    """Estimated cost of one call to one ``(provider, model)`` member."""

    provider: str
    model: str
    input_tokens: int
    output_tokens: int  # max_tokens budget — worst-case ceiling
    input_usd: float
    output_usd: float

    @property
    def total_usd(self) -> float:
        """Sum of the input and output cost."""
        combined = self.input_usd + self.output_usd
        return combined
+# ── token + cost arithmetic ────────────────────────────────────────
def estimate_input_tokens(text: str) -> int:
    """Estimate the token count of ``text`` from its character length.

    Empty (falsy) input yields 0. Any other input yields the length divided
    by ``_CHARS_PER_TOKEN`` (floor), but never less than 1.
    """
    if text:
        approx = len(text) // _CHARS_PER_TOKEN
        return approx if approx >= 1 else 1
    return 0
def estimate_cost(
    provider: str,
    model: str,
    input_tokens: int,
    max_output_tokens: int,
    table: PriceTable,
) -> CostEstimate:
    """Estimate the cost of one call for a single ``(provider, model)`` pair.

    The output side is priced at ``max_output_tokens``. When the table has
    no entry for the pair, both costs are 0.0 and the caller decides what
    to do (warn, skip, ...); a price is never made up here.
    """
    price = table.lookup(provider, model)
    if price is not None:
        input_usd = (input_tokens / 1_000_000) * price.input_per_1m_usd
        output_usd = (max_output_tokens / 1_000_000) * price.output_per_1m_usd
    else:
        # Unknown model: zero-cost estimate rather than an invented price.
        input_usd = output_usd = 0.0
    return CostEstimate(
        provider, model, input_tokens, max_output_tokens, input_usd, output_usd
    )
+# ── staleness ──────────────────────────────────────────────────────
def last_monday_utc(now: _dt.datetime | None = None) -> _dt.date:
    """Return the date of the most recent Monday on the UTC calendar.

    Args:
        now: Reference instant. Defaults to the current UTC time. A
            timezone-aware value is converted to UTC first; a naive value
            is taken as already expressed in UTC.

    Returns:
        The date of the Monday on or before ``now``.
    """
    if now is None:
        now = _dt.datetime.now(_dt.timezone.utc)
    elif now.utcoffset() is not None:
        # Take weekday and date from the UTC calendar, not the caller's
        # local one; near a week boundary the two can differ by a week.
        now = now.astimezone(_dt.timezone.utc)
    days_since_monday = now.weekday()  # Mon=0 ... Sun=6
    return (now - _dt.timedelta(days=days_since_monday)).date()
def is_stale(table: PriceTable, now: _dt.datetime | None = None) -> bool:
    """Report whether the table predates the most recent UTC Monday.

    A ``last_updated`` value that is not a valid ISO date counts as stale.
    """
    try:
        stamped = _dt.date.fromisoformat(table.last_updated)
    except ValueError:
        # Unparseable date: treat the table as stale.
        return True
    else:
        cutoff = last_monday_utc(now)
        return stamped < cutoff
+# ── parser + bootstrap ─────────────────────────────────────────────
def load_prices(path: Path = PRICES_FILE) -> PriceTable:
    """Read and parse the prices file at ``path``.

    If the file does not exist it is first written from the shipped
    defaults, then read back and parsed like any other file.
    """
    missing = not path.exists()
    if missing:
        bootstrap_from_defaults(path)
    raw = path.read_text(encoding="utf-8")
    return _parse(raw)
def bootstrap_from_defaults(path: Path = PRICES_FILE) -> None:
    """Write the shipped default prices to ``path`` as a fresh prices file.

    The file is rendered from ``as_rows()`` with ``LAST_UPDATED`` as its
    date and ``shipped-default`` as its source, encoded as UTF-8.
    """
    content = _render_markdown(LAST_UPDATED, "shipped-default", as_rows())
    path.write_text(content, encoding="utf-8")
def _render_markdown(
    last_updated: str,
    source: str,
    rows: list[tuple[str, str, float, float]],
) -> str:
    """Render the prices file: frontmatter, heading and a Markdown table.

    Args:
        last_updated: Value written to the ``last_updated`` frontmatter key.
        source: Value written to the ``source`` frontmatter key.
        rows: ``(provider, model, input_price, output_price)`` tuples, one
            per table row, emitted in the given order.

    Returns:
        The file content, ending with a newline. Prices print with two
        decimals when that is exact and with full precision otherwise, so
        the text parses back to the same numbers.
    """
    lines = [
        "---",
        f"last_updated: {last_updated}",
        "currency: USD",
        "unit: per_1M_tokens",
        f"source: {source}",
        "---",
        "",
        "# Agent prices",
        "",
        "| provider  | model               | input  | output |",
        "|-----------|---------------------|--------|--------|",
    ]
    lines.extend(
        f"| {provider:<9} | {model:<19} | "
        f"{_format_price(inp):>6} | {_format_price(outp):>6} |"
        for provider, model, inp, outp in rows
    )
    lines.append("")  # trailing newline after the join
    return "\n".join(lines)


def _format_price(value: float) -> str:
    """Format a price with two decimals unless that would change its value."""
    text = f"{value:.2f}"
    if float(text) != value:
        # Sub-cent rates (e.g. 0.075) must not be rounded away on disk.
        text = repr(float(value))
    return text
def _parse(text: str) -> PriceTable:
    """Build a ``PriceTable`` from the full text of a prices file.

    Frontmatter keys that are absent fall back to fixed defaults; the price
    entries come from the Markdown table in the remaining body.
    """
    front, body = _split_frontmatter(text)
    meta = _parse_frontmatter(front)
    fallbacks = {
        "last_updated": "1970-01-01",
        "currency": "USD",
        "unit": "per_1M_tokens",
        "source": "unknown",
    }
    header = {key: meta.get(key, default) for key, default in fallbacks.items()}
    return PriceTable(prices=_parse_table(body), **header)
def _split_frontmatter(text: str) -> tuple[str, str]:
    """Split ``text`` into ``(frontmatter, body)`` at the ``---`` fences.

    The text must start with ``---`` and contain a later line that begins
    with ``---``; otherwise there is no frontmatter and ``("", text)`` is
    returned. The closing fence is only recognised at the start of a line,
    so a ``---`` inside a frontmatter value does not end the frontmatter.

    Returns:
        The text between the fences (without the fences themselves) and the
        text after the closing fence.
    """
    fence = "---"
    if not text.startswith(fence):
        return "", text
    # Search past the opening fence for a fence that starts a line.
    closing = text.find("\n" + fence, len(fence))
    if closing == -1:
        return "", text
    front = text[len(fence):closing + 1]
    body = text[closing + 1 + len(fence):]
    return front, body
def _parse_frontmatter(front: str) -> dict[str, str]:
    """Parse flat ``key: value`` frontmatter lines into a dict.

    Lines without a colon (including blank lines) are ignored. Each line is
    split at its first colon, so values may contain further colons. Keys and
    values are stripped of surrounding whitespace, and one pair of matching
    single or double quotes around a value is removed, so a quoted scalar
    such as ``"2025-01-06"`` yields the bare text.

    Returns:
        Mapping of key to value; a repeated key keeps its last value.
    """
    out: dict[str, str] = {}
    for raw in front.splitlines():
        key, sep, value = raw.strip().partition(":")
        if not sep:
            continue
        value = value.strip()
        if len(value) >= 2 and value[0] == value[-1] and value[0] in "\"'":
            # Quoted scalar: keep the content, drop the quotes.
            value = value[1:-1]
        out[key.strip()] = value
    return out
def _parse_table(body: str) -> dict[tuple[str, str], Price]:
    """Collect price entries from the Markdown table rows in ``body``.

    Only lines that start with ``|`` and have exactly four cells are
    considered. Separator rows, the header row and rows whose price cells
    are not numbers are skipped. Entries are keyed by ``(provider, model)``;
    a repeated key keeps the last row.
    """
    prices: dict[tuple[str, str], Price] = {}
    for raw in body.splitlines():
        row = raw.strip()
        # Not a table row, or the |---| separator row.
        if not row.startswith("|") or row.startswith("|-"):
            continue
        cells = [cell.strip() for cell in row.strip("|").split("|")]
        if len(cells) != 4:
            continue
        provider, model, raw_in, raw_out = cells
        if provider == "provider":  # header row
            continue
        try:
            entry = Price(provider, model, float(raw_in), float(raw_out))
        except ValueError:
            # Non-numeric price cell: ignore the row.
            continue
        prices[(provider, model)] = entry
    return prices
# Names exported by ``from ... import *``.
__all__ = [
    # data types
    "Price",
    "PriceTable",
    "CostEstimate",
    # constants
    "PRICES_FILE",
    "DEFAULT_PRICES",
    # loading
    "load_prices",
    "bootstrap_from_defaults",
    # estimation
    "estimate_input_tokens",
    "estimate_cost",
    # staleness
    "last_monday_utc",
    "is_stale",
]