npm - agentera - Versions diffs - 0.0.0 → 3.0.0-dev.1 - Mend

agentera 0.0.0 → 3.0.0-dev.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (256) hide show

package/README.md +6 -45
package/bundle/.agentera-npx-bundle.json +4 -0
package/bundle/references/adapters/cursor.md +213 -0
package/bundle/references/adapters/opencode.md +530 -0
package/bundle/references/adapters/package-manifest-interface-model.yaml +337 -0
package/bundle/references/adapters/package-registry.yaml +247 -0
package/bundle/references/adapters/package-surface-characterization.md +48 -0
package/bundle/references/adapters/runtime-adapter-characterization.md +79 -0
package/bundle/references/adapters/runtime-adapter-interface-model.yaml +200 -0
package/bundle/references/adapters/runtime-adapter-registry.yaml +548 -0
package/bundle/references/adapters/runtime-feature-parity.md +189 -0
package/bundle/references/analysis/benchmark.md +267 -0
package/bundle/references/analysis/startup-measurement-contract.yaml +424 -0
package/bundle/references/artifacts/artifact-registry-interface-model.yaml +288 -0
package/bundle/references/cli/agent-ready-state-contract.yaml +950 -0
package/bundle/references/cli/app-lifecycle-vocabulary.yaml +241 -0
package/bundle/references/cli/audience-namespace-cli-migration.yaml +355 -0
package/bundle/references/cli/bundle-skill-vocabulary.yaml +278 -0
package/bundle/references/cli/capability-instruction-contract.yaml +123 -0
package/bundle/references/cli/capability-tool-classification.yaml +53 -0
package/bundle/references/cli/routing-execution-vocabulary.yaml +281 -0
package/bundle/references/cli/update-channels.yaml +147 -0
package/bundle/references/cli/vocabulary-index.yaml +160 -0
package/bundle/references/cli/vocabulary.md +566 -0
package/bundle/references/meta/documentation-inventory.md +43 -0
package/bundle/references/v1-section-mapping.md +47 -0
package/bundle/registry.json +39 -0
package/bundle/skills/agentera/.claude-plugin/plugin.json +27 -0
package/bundle/skills/agentera/SKILL.md +470 -0
package/bundle/skills/agentera/agents/dokumentera.toml +6 -0
package/bundle/skills/agentera/agents/hej.toml +6 -0
package/bundle/skills/agentera/agents/inspektera.toml +6 -0
package/bundle/skills/agentera/agents/inspirera.toml +6 -0
package/bundle/skills/agentera/agents/optimera.toml +6 -0
package/bundle/skills/agentera/agents/orkestrera.toml +6 -0
package/bundle/skills/agentera/agents/planera.toml +6 -0
package/bundle/skills/agentera/agents/profilera.toml +6 -0
package/bundle/skills/agentera/agents/realisera.toml +6 -0
package/bundle/skills/agentera/agents/resonera.toml +6 -0
package/bundle/skills/agentera/agents/visionera.toml +6 -0
package/bundle/skills/agentera/agents/visualisera.toml +6 -0
package/bundle/skills/agentera/capabilities/dokumentera/instructions.md +428 -0
package/bundle/skills/agentera/capabilities/dokumentera/schemas/artifacts.yaml +73 -0
package/bundle/skills/agentera/capabilities/dokumentera/schemas/exit.yaml +35 -0
package/bundle/skills/agentera/capabilities/dokumentera/schemas/triggers.yaml +35 -0
package/bundle/skills/agentera/capabilities/dokumentera/schemas/validation.yaml +139 -0
package/bundle/skills/agentera/capabilities/hej/instructions.md +331 -0
package/bundle/skills/agentera/capabilities/hej/schemas/artifacts.yaml +69 -0
package/bundle/skills/agentera/capabilities/hej/schemas/exit.yaml +32 -0
package/bundle/skills/agentera/capabilities/hej/schemas/triggers.yaml +58 -0
package/bundle/skills/agentera/capabilities/hej/schemas/validation.yaml +55 -0
package/bundle/skills/agentera/capabilities/inspektera/instructions.md +514 -0
package/bundle/skills/agentera/capabilities/inspektera/schemas/artifacts.yaml +76 -0
package/bundle/skills/agentera/capabilities/inspektera/schemas/exit.yaml +36 -0
package/bundle/skills/agentera/capabilities/inspektera/schemas/triggers.yaml +38 -0
package/bundle/skills/agentera/capabilities/inspektera/schemas/validation.yaml +113 -0
package/bundle/skills/agentera/capabilities/inspirera/instructions.md +280 -0
package/bundle/skills/agentera/capabilities/inspirera/schemas/artifacts.yaml +24 -0
package/bundle/skills/agentera/capabilities/inspirera/schemas/exit.yaml +33 -0
package/bundle/skills/agentera/capabilities/inspirera/schemas/triggers.yaml +34 -0
package/bundle/skills/agentera/capabilities/inspirera/schemas/validation.yaml +58 -0
package/bundle/skills/agentera/capabilities/optimera/instructions.md +437 -0
package/bundle/skills/agentera/capabilities/optimera/schemas/artifacts.yaml +69 -0
package/bundle/skills/agentera/capabilities/optimera/schemas/exit.yaml +35 -0
package/bundle/skills/agentera/capabilities/optimera/schemas/triggers.yaml +39 -0
package/bundle/skills/agentera/capabilities/optimera/schemas/validation.yaml +91 -0
package/bundle/skills/agentera/capabilities/orkestrera/instructions.md +433 -0
package/bundle/skills/agentera/capabilities/orkestrera/schemas/artifacts.yaml +64 -0
package/bundle/skills/agentera/capabilities/orkestrera/schemas/exit.yaml +34 -0
package/bundle/skills/agentera/capabilities/orkestrera/schemas/triggers.yaml +42 -0
package/bundle/skills/agentera/capabilities/orkestrera/schemas/validation.yaml +107 -0
package/bundle/skills/agentera/capabilities/planera/instructions.md +368 -0
package/bundle/skills/agentera/capabilities/planera/schemas/artifacts.yaml +62 -0
package/bundle/skills/agentera/capabilities/planera/schemas/exit.yaml +33 -0
package/bundle/skills/agentera/capabilities/planera/schemas/triggers.yaml +34 -0
package/bundle/skills/agentera/capabilities/planera/schemas/validation.yaml +61 -0
package/bundle/skills/agentera/capabilities/profilera/instructions.md +419 -0
package/bundle/skills/agentera/capabilities/profilera/schemas/artifacts.yaml +18 -0
package/bundle/skills/agentera/capabilities/profilera/schemas/exit.yaml +34 -0
package/bundle/skills/agentera/capabilities/profilera/schemas/triggers.yaml +45 -0
package/bundle/skills/agentera/capabilities/profilera/schemas/validation.yaml +57 -0
package/bundle/skills/agentera/capabilities/realisera/instructions.md +403 -0
package/bundle/skills/agentera/capabilities/realisera/schemas/artifacts.yaml +80 -0
package/bundle/skills/agentera/capabilities/realisera/schemas/exit.yaml +35 -0
package/bundle/skills/agentera/capabilities/realisera/schemas/triggers.yaml +39 -0
package/bundle/skills/agentera/capabilities/realisera/schemas/validation.yaml +110 -0
package/bundle/skills/agentera/capabilities/resonera/instructions.md +329 -0
package/bundle/skills/agentera/capabilities/resonera/schemas/artifacts.yaml +47 -0
package/bundle/skills/agentera/capabilities/resonera/schemas/exit.yaml +35 -0
package/bundle/skills/agentera/capabilities/resonera/schemas/triggers.yaml +46 -0
package/bundle/skills/agentera/capabilities/resonera/schemas/validation.yaml +77 -0
package/bundle/skills/agentera/capabilities/visionera/instructions.md +309 -0
package/bundle/skills/agentera/capabilities/visionera/schemas/artifacts.yaml +57 -0
package/bundle/skills/agentera/capabilities/visionera/schemas/exit.yaml +35 -0
package/bundle/skills/agentera/capabilities/visionera/schemas/triggers.yaml +41 -0
package/bundle/skills/agentera/capabilities/visionera/schemas/validation.yaml +74 -0
package/bundle/skills/agentera/capabilities/visualisera/instructions.md +400 -0
package/bundle/skills/agentera/capabilities/visualisera/schemas/artifacts.yaml +44 -0
package/bundle/skills/agentera/capabilities/visualisera/schemas/exit.yaml +34 -0
package/bundle/skills/agentera/capabilities/visualisera/schemas/triggers.yaml +33 -0
package/bundle/skills/agentera/capabilities/visualisera/schemas/validation.yaml +80 -0
package/bundle/skills/agentera/capability_schema_contract.yaml +385 -0
package/bundle/skills/agentera/protocol.yaml +463 -0
package/bundle/skills/agentera/references/contract.md +1039 -0
package/bundle/skills/agentera/schemas/artifacts/changelog.yaml +60 -0
package/bundle/skills/agentera/schemas/artifacts/decisions.yaml +461 -0
package/bundle/skills/agentera/schemas/artifacts/design.yaml +55 -0
package/bundle/skills/agentera/schemas/artifacts/docs.yaml +402 -0
package/bundle/skills/agentera/schemas/artifacts/experiments.yaml +373 -0
package/bundle/skills/agentera/schemas/artifacts/health.yaml +484 -0
package/bundle/skills/agentera/schemas/artifacts/objective.yaml +399 -0
package/bundle/skills/agentera/schemas/artifacts/plan.yaml +342 -0
package/bundle/skills/agentera/schemas/artifacts/progress.yaml +325 -0
package/bundle/skills/agentera/schemas/artifacts/todo.yaml +110 -0
package/bundle/skills/agentera/schemas/artifacts/vision.yaml +262 -0
package/bundle/skills/hej/.claude-plugin/plugin.json +6 -0
package/bundle/skills/hej/SKILL.md +69 -0
package/bundle/skills/hej/agents/hej.toml +11 -0
package/bundle/skills/hej/agents/openai.yaml +8 -0
package/dist/analytics/extractCorpus.js +1791 -0
package/dist/analytics/extractCorpus.js.map +1 -0
package/dist/analytics/usageStats.js +487 -0
package/dist/analytics/usageStats.js.map +1 -0
package/dist/bin/agentera.js +4 -0
package/dist/bin/agentera.js.map +1 -0
package/dist/cli/appContext.js +226 -0
package/dist/cli/appContext.js.map +1 -0
package/dist/cli/argvalidate.js +41 -0
package/dist/cli/argvalidate.js.map +1 -0
package/dist/cli/capabilityContext.js +2421 -0
package/dist/cli/capabilityContext.js.map +1 -0
package/dist/cli/commands/backfill.js +84 -0
package/dist/cli/commands/backfill.js.map +1 -0
package/dist/cli/commands/capability.js +44 -0
package/dist/cli/commands/capability.js.map +1 -0
package/dist/cli/commands/compact.js +148 -0
package/dist/cli/commands/compact.js.map +1 -0
package/dist/cli/commands/doctor.js +180 -0
package/dist/cli/commands/doctor.js.map +1 -0
package/dist/cli/commands/lint.js +179 -0
package/dist/cli/commands/lint.js.map +1 -0
package/dist/cli/commands/prime.js +544 -0
package/dist/cli/commands/prime.js.map +1 -0
package/dist/cli/commands/query.js +346 -0
package/dist/cli/commands/query.js.map +1 -0
package/dist/cli/commands/report.js +210 -0
package/dist/cli/commands/report.js.map +1 -0
package/dist/cli/commands/schema.js +306 -0
package/dist/cli/commands/schema.js.map +1 -0
package/dist/cli/commands/state.js +1012 -0
package/dist/cli/commands/state.js.map +1 -0
package/dist/cli/commands/upgrade.js +48 -0
package/dist/cli/commands/upgrade.js.map +1 -0
package/dist/cli/commands/validate.js +519 -0
package/dist/cli/commands/validate.js.map +1 -0
package/dist/cli/commands/verify.js +204 -0
package/dist/cli/commands/verify.js.map +1 -0
package/dist/cli/dispatch.js +958 -0
package/dist/cli/dispatch.js.map +1 -0
package/dist/cli/orientation.js +595 -0
package/dist/cli/orientation.js.map +1 -0
package/dist/cli/prime-blob.js +3 -0
package/dist/cli/prime-blob.js.map +1 -0
package/dist/cli/stateQuery.js +292 -0
package/dist/cli/stateQuery.js.map +1 -0
package/dist/cli/structured.js +18 -0
package/dist/cli/structured.js.map +1 -0
package/dist/core/difflib.js +274 -0
package/dist/core/difflib.js.map +1 -0
package/dist/core/git.js +43 -0
package/dist/core/git.js.map +1 -0
package/dist/core/paths.js +50 -0
package/dist/core/paths.js.map +1 -0
package/dist/core/pyjson.js +101 -0
package/dist/core/pyjson.js.map +1 -0
package/dist/core/sourceRoot.js +72 -0
package/dist/core/sourceRoot.js.map +1 -0
package/dist/core/toml.js +11 -0
package/dist/core/toml.js.map +1 -0
package/dist/core/yaml.js +25 -0
package/dist/core/yaml.js.map +1 -0
package/dist/eval/evalSkills.js +258 -0
package/dist/eval/evalSkills.js.map +1 -0
package/dist/eval/semanticEval.js +148 -0
package/dist/eval/semanticEval.js.map +1 -0
package/dist/eval/semanticFixtures.js +227 -0
package/dist/eval/semanticFixtures.js.map +1 -0
package/dist/hooks/common.js +160 -0
package/dist/hooks/common.js.map +1 -0
package/dist/hooks/compaction.js +935 -0
package/dist/hooks/compaction.js.map +1 -0
package/dist/hooks/cursorPreToolUse.js +19 -0
package/dist/hooks/cursorPreToolUse.js.map +1 -0
package/dist/hooks/cursorSessionStart.js +71 -0
package/dist/hooks/cursorSessionStart.js.map +1 -0
package/dist/hooks/sessionStart.js +209 -0
package/dist/hooks/sessionStart.js.map +1 -0
package/dist/hooks/sessionStop.js +212 -0
package/dist/hooks/sessionStop.js.map +1 -0
package/dist/hooks/validateArtifact.js +933 -0
package/dist/hooks/validateArtifact.js.map +1 -0
package/dist/registries/artifactRegistry.js +206 -0
package/dist/registries/artifactRegistry.js.map +1 -0
package/dist/registries/capabilityContract.js +310 -0
package/dist/registries/capabilityContract.js.map +1 -0
package/dist/registries/packageRegistry.js +641 -0
package/dist/registries/packageRegistry.js.map +1 -0
package/dist/registries/runtimeAdapterRegistry.js +315 -0
package/dist/registries/runtimeAdapterRegistry.js.map +1 -0
package/dist/setup/codex.js +1056 -0
package/dist/setup/codex.js.map +1 -0
package/dist/setup/copilot.js +227 -0
package/dist/setup/copilot.js.map +1 -0
package/dist/setup/cursor.js +127 -0
package/dist/setup/cursor.js.map +1 -0
package/dist/setup/doctor.js +1276 -0
package/dist/setup/doctor.js.map +1 -0
package/dist/state/installRoot.js +279 -0
package/dist/state/installRoot.js.map +1 -0
package/dist/state/progressCommit.js +289 -0
package/dist/state/progressCommit.js.map +1 -0
package/dist/state/startupAnalysis.js +1953 -0
package/dist/state/startupAnalysis.js.map +1 -0
package/dist/upgrade/appModel.js +189 -0
package/dist/upgrade/appModel.js.map +1 -0
package/dist/upgrade/channels.js +208 -0
package/dist/upgrade/channels.js.map +1 -0
package/dist/upgrade/compatibility.js +201 -0
package/dist/upgrade/compatibility.js.map +1 -0
package/dist/upgrade/doctor.js +373 -0
package/dist/upgrade/doctor.js.map +1 -0
package/dist/upgrade/migrateArtifactsV2ToV3.js +332 -0
package/dist/upgrade/migrateArtifactsV2ToV3.js.map +1 -0
package/dist/upgrade/runtimeMigration.js +484 -0
package/dist/upgrade/runtimeMigration.js.map +1 -0
package/dist/upgrade/upgradeCommands.js +36 -0
package/dist/upgrade/upgradeCommands.js.map +1 -0
package/dist/upgrade/upgradeOrchestrator.js +299 -0
package/dist/upgrade/upgradeOrchestrator.js.map +1 -0
package/dist/upgrade/versionResolution.js +179 -0
package/dist/upgrade/versionResolution.js.map +1 -0
package/dist/validate/appHomeContract.js +150 -0
package/dist/validate/appHomeContract.js.map +1 -0
package/dist/validate/capability.js +412 -0
package/dist/validate/capability.js.map +1 -0
package/dist/validate/crossCapability.js +145 -0
package/dist/validate/crossCapability.js.map +1 -0
package/dist/validate/lifecycleAdapters.js +772 -0
package/dist/validate/lifecycleAdapters.js.map +1 -0
package/dist/validate/selfAudit.js +107 -0
package/dist/validate/selfAudit.js.map +1 -0
package/package.json +28 -8
package/LICENSE +0 -201
package/bin/agentera.mjs +0 -50
package/lib/exec.mjs +0 -116
package/lib/resolve.mjs +0 -129

package/bundle/skills/agentera/capabilities/optimera/instructions.md ADDED Viewed

@@ -0,0 +1,437 @@
+# OPTIMERA
+**Objective Pursuit: Targeted Iterative Measurement. Experiment, Record, Advance.**
+Metric-driven optimization: improve any measurable property one experiment at a time. User defines the objective, agent writes an eval harness, harness becomes the immutable judge. Improve + pass regression = keep; everything else is discarded.
+Each invocation = one experiment. `/loop` handles recurrence.
+---
+## Visual identity
+Glyph: **⎘** (protocol ref: SG7). Used in the mandatory exit marker.
+---
+## State artifacts
+Three artifacts per objective, under `.agentera/optimera/<objective-name>/`, bootstrapped if absent.
+| Artifact | Purpose | Bootstrap |
+|----------|---------|-----------|
+| `.agentera/optimera/<objective-name>/objective.yaml` | What we're optimizing, why, how we measure it, and what "done" looks like. | Via inline brainstorm session with the user (see below). |
+| `.agentera/optimera/<objective-name>/harness` | Eval script that measures the metric. Locked after user approval. | Written by the agent during brainstorm, approved by the user. |
+| `.agentera/optimera/<objective-name>/experiments.yaml` | Log of every experiment: what was tried, what the metric said, kept or discarded. | First experiment entry in YAML form. |
+### Artifact path resolution
+Before reading or writing any artifact, check if `.agentera/docs.yaml` exists. If it has an Artifact Mapping section, use the path specified for each canonical filename. If `.agentera/docs.yaml` doesn't exist or has no mapping for a given artifact, use the default layout: TODO.md, CHANGELOG.md, and DESIGN.md at the project root; canonical VISION.md at `.agentera/vision.yaml`; other agent-facing artifacts at `.agentera/*.yaml`. This applies to all artifact references in this capability, including cross-capability reads (`.agentera/decisions.yaml`). objective.yaml and experiments.yaml are NOT resolved via the docs.yaml mapping; they always live under `.agentera/optimera/<objective-name>/` for whichever objective is active.
+### Contract
+Before starting, read `references/contract.md` (at v2 skill location `skills/agentera/references/contract.md`) for authoritative values: token budgets, severity levels, format contracts, and other shared conventions referenced in the steps below. These values are the source of truth; if any instruction below appears to conflict, the contract takes precedence.
+### Benchmark context source contract
+For benchmark-oriented optimization work, start from:
+```bash
+agentera prime --context optimera --format json
+```
+Use `benchmark_context` before direct retained startup benchmark file access. If `benchmark_context.source_contract.complete_for_benchmark_context` is true, do not read `latest-report.json`, `latest-report.md`, or `runs.jsonl` during normal Optimera startup. Use the bounded fields in `benchmark_context.latest_report`, `benchmark_context.history_summary`, `benchmark_context.runtime_coverage`, `benchmark_context.state_access_metrics`, `benchmark_context.token_impact`, `benchmark_context.comparison`, `benchmark_context.recommendation`, and `benchmark_context.manual_refresh` instead.
+If `benchmark_context` is incomplete, follow `benchmark_context.fallback_commands` and `benchmark_context.manual_refresh` first. Direct reads of retained benchmark files are last-resort diagnostics only, and must preserve the context caveats rather than reconstructing hidden state. Never run `mage bench:startupState` automatically; it is manual-only.
+When reporting benchmark evidence, preserve caveats about manual-only execution, missing or malformed retained evidence, empty local history, runtime coverage degradation, missing token estimates, non-comparable previous rows, and privacy boundaries. Do not expose raw transcripts, raw corpus files, raw intermediates, raw runtime store paths, raw session IDs, private salts, generated salted hashes, raw benchmark report bodies, or full local benchmark paths.
+### objective.yaml
+Evergreen. Created via brainstorm on first run, refined only when the user explicitly asks. Outside those two cases, the agent reads it but never writes it. Typical structure:
+```yaml
+target: Optimization target name
+status: active
+objective: >-
+  Precise metric, current value, and target value, for example reduce p95
+  latency of /api/search from 320ms to under 100ms.
+why: >-
+  What changes when the target is hit, who benefits, and what tradeoffs matter.
+measurement:
+  command: .agentera/optimera/<objective-name>/harness
+  metric: p95_latency_ms
+  direction: lower
+  baseline: 320
+  target: 100
+  budget:
+    runs: 5
+    time_limit: 10m
+constraints:
+  - Existing tests must pass.
+  - Public API must not change.
+scope:
+  included: [api/search]
+  excluded: [public_api]
+```
+The objective must be precise enough to measure, constraints clear enough to enforce, and scope defined enough to prevent wandering.
+Fixed budgets are part of the measurement contract, not experiment strategy. Keep them in objective.yaml and the locked harness. Do not store budget state in root artifacts, registries, symlinks, or DOCS.md mappings. experiments.yaml records the budget actually used only when that evidence matters to interpret the result.
+### `.agentera/optimera/<objective-name>/harness`
+Script that measures the metric and outputs structured JSON. Written during brainstorm, approved by the user, then **locked**. Never modified during optimization cycles.
+Wraps the project's own tooling (test runners, benchmarks, linters) and translates output into a consistent format. The project's tooling is the source of truth.
+**Before writing a harness**, inspect the project's existing test, benchmark, lint, or measurement commands. The Agentera app currently ships only the shared contract reference, so harness specifics come from project tooling and the objective's measurement fields.
+**Output contract** (minimal):
+```json
+{"metric": <number>, "direction": "higher"|"lower"}
+```
+**Output contract** (with optional fields for richer signal):
+```json
+{"metric": 85.5, "direction": "higher", "unit": "%", "detail": "42/50 tests passing", "breakdown": [{"name": "unit", "value": 95.0}, {"name": "integration", "value": 60.0}]}
+```
+The harness is the **immutable ground truth**, separating measurement from optimization. If wrong, the user must explicitly ask to rebuild it.
+### experiments.yaml
+When presenting experiment results, open with your interpretation of what happened before the structured data. "Here's what I tried and what it told us"; then the metrics table backs it up. Call out surprises, dead ends, and what the result changes about the approach.
+```yaml
+experiments:
+  - number: N
+    timestamp: YYYY-MM-DD HH:MM
+    hypothesis: What we expected to improve and why.
+    method: The approach taken to test the hypothesis.
+    change: One-line summary of the code change.
+    metric:
+      before: 320
+      after: 250
+      direction: lower
+      verdict: better
+    regression: pass
+    status: kept
+    commit: <hash>
+    inspiration: External source, if any.
+    conclusion: What the experiment taught.
+    next: What the result suggests trying next.
+```
+Closure entries are appended once when the objective reaches its target:
+```yaml
+closure:
+  timestamp: YYYY-MM-DDTHH:MM:SSZ
+  final_value: <value>
+  target: <target>
+  reason: already met at startup
+```
+The `next` field from the previous experiment is a suggestion, not a mandate. Re-evaluate fresh each cycle based on the full experiment history.
+### Experiment history analyzer contract
+`npx -y agentera experiments` is the read-only summary layer for rich experiments.yaml records. It must inspect the active objective directory only. The command never creates root objective artifacts, registries, symlinks, DOCS.md fixed mappings, or sidecar ledgers.
+---
+## Brainstorm: bootstrapping or refining the objective
+This runs in two situations:
+1. **objective.yaml doesn't exist**: the first time optimera runs on a project
+2. **User explicitly asks** to refine the objective (e.g., "change the target", "update objective.yaml")
+In all other cases, skip straight to the cycle.
+### How the brainstorm works
+Act as the sharp colleague figuring out what to optimize. Ask one question at a time, push for precision, and push back on vague targets. Call out when an objective is too fuzzy to measure or when constraints are missing.
+1. **Objective**: "What metric, current value, target?" If code exists, run existing test/bench/lint commands first.
+2. **Motivation**: "Why does this matter? What breaks at current value? What's possible at target?"
+3. **Constraints**: "What must NOT break? Off-limits files? Resource limits?" If a decision profile exists, propose constraints from it.
+4. **Scope**: "Which parts to focus on? Where are the biggest gains?" Read codebase to propose informed boundaries.
+5. **Pre-write self-audit**: run `agentera lint --artifact <ARTIFACT> --text "<DRAFT>"` (or `--file <PATH>`; schema names such as `decisions` auto-resolve the artifact file when no input is given) on the draft entry to check verbosity overruns, abstraction creep, and filler accumulation. Max 3 revision attempts. Flag with [post-audit-flagged] if still failing.
+6. **Write objective.yaml**: synthesize into a precise charter. Write to `.agentera/optimera/<objective-name>/objective.yaml`. Present for approval.
+7. **Write the eval harness**: use the project's own tooling and the objective's measurement fields. Write `.agentera/optimera/<objective-name>/harness` so it outputs JSON with at least `metric` and `direction`. Present, explain, get approval, run once to establish baseline.
+Artifact writing follows contract Artifact Writing Conventions: banned verbosity patterns, 25-word sentence cap, preferred vocabulary, and lead-with-conclusion structure.
+When **refining**, read current objective.yaml, show proposed changes with rationale, get confirmation. If the harness changes, the user must approve the new version. After brainstorm, proceed to experiment 1.
+---
+## The cycle
+Skill introduction: `─── ⎘ optimera · experiment N ───`
+Step markers: display `── step N/8: verb` before each step.
+Steps: orient, analyze, hypothesize, implement, measure, decide, audit, log.
+### Step 1: Orient
+**Benchmark context**: for benchmark-oriented work, use `benchmark_context` from `agentera prime --context optimera --format json` before direct retained benchmark files. Raw benchmark file reads are last-resort diagnostics.
+**Active-objective inference**: before reading any per-objective artifact, determine which objective is active by inspecting `.agentera/optimera/`:
+- If no objective subdirectories exist, keep the existing new-objective path: run the brainstorm.
+- For each objective subdirectory with an objective.yaml, classify it as closed before any active selection when `status: closed`. Do not reopen closed objectives.
+- If the user explicitly names a closed objective, load its objective.yaml and experiments.yaml read-only for context, summarize that it is closed, and ask before defining successor work.
+- If one or more objective subdirectories exist and all are closed, ask the user for a successor objective.
+- If only one non-closed subdirectory exists, use it.
+- If multiple non-closed subdirectories exist, run `git log -1 --format=%aI -- .agentera/optimera/<name>/experiments.yaml` for each and pick the one whose experiments.yaml has the most recent commit timestamp (author date).
+- If the result is ambiguous, ask the user to specify the active objective by name.
+All subsequent references to objective.yaml, experiments.yaml, and harness refer to the files under `.agentera/optimera/<active-objective-name>/`.
+1. **experiments.yaml**: last 5 experiments only (check for plateau patterns)
+2. **objective.yaml**: the metric, target, constraints, and scope
+3. **Decision profile**: read `$PROFILERA_PROFILE_DIR/PROFILE.md` directly when it exists. Apply confidence thresholds per contract profile consumption conventions. If missing, proceed without persona grounding but flag it.
+4. **Project discovery** (experiment 1 or when unfamiliar): map directory structure within scope, read dependency manifests, and read README.md, CLAUDE.md, AGENTS.md.
+5. `git log --oneline -20` for recent changes
+Before experimenting: in your response, list the current baseline, target, status, and constraints from objective.yaml.
+**Objective closure procedure**: when closing an objective, update objective.yaml with canonical closed state: `status: closed`, `closed_at: <ISO-8601 UTC timestamp>`, `final_value: <value>`, `target: <target>`, and `reason: <reason>`. Append one experiments.yaml closure entry. Do not append duplicates.
+**Exit-early stop condition**: If objective.yaml or experiments.yaml evidence shows the target is already met and the objective is not already closed, run the objective closure procedure with reason `already met at startup`, report exit signal `complete: objective achieved`, and stop before Analyze.
+### Step 2: Analyze
+Run two things:
+**2a. Experiment history analysis**: if experiments.yaml has prior entries, run:
+```bash
+npx -y agentera experiments
+```
+Outputs recent experiment status counts, metric deltas, conclusions, and next-step notes.
+**2b. Current metric**: run the eval harness to get the baseline for this experiment:
+```bash
+chmod +x .agentera/optimera/<objective-name>/harness && .agentera/optimera/<objective-name>/harness
+```
+Parse the JSON output. Record the current metric as the baseline.
+**Plateau detection**: if `plateau_detected: true` (no improvement in 3+ experiments), flag explicitly. Consider a radically different approach, ⬚ inspirera, or escalate to the user.
+### Step 3: Hypothesize
+Formulate a single, focused hypothesis.
+Effort-bias check: if one hypothesis took more effort to construct, reset before selection. Choose by experiment history, expected metric impact, risk, constraints, and smallest falsifiable test; construction effort is not evidence.
+1. **Review history**: what's been tried, what worked, what failed?
+2. **Seek inspiration**: for non-trivial domains, 2-3 targeted web queries for techniques, libraries, or patterns.
+3. **Formulate**: "I expect [change] to improve the metric because [reasoning]." Must be falsifiable.
+Be conservative early; escalate if conservative approaches plateau.
+### Step 4: Implement
+**Pre-spawn Git commit**: before creating the worktree, commit any pending artifact changes so the subagent branches from current state.
+1. Run `git status --porcelain`. If empty, skip to spawn.
+2. Stage only the artifact files this session wrote.
+3. Commit with `chore(optimera): checkpoint before worktree dispatch`. Do not pass `--no-verify`.
+4. If pre-commit hooks reject the commit: fix and retry. If retry also fails, abort the spawn.
+**Stale-base awareness**: some harnesses create the worktree branch from `origin/main` rather than local `HEAD`. Before spawning, run `git rev-list --count origin/main..HEAD`. If the count is greater than zero, the worktree will be based on a stale commit. Proceed with spawn, but in Step 5 do NOT merge the worktree branch: fetch the diff and apply it to the main checkout. Re-run the eval harness in the main checkout.
+Runtime subagent mechanisms:
+| Runtime | Substrate | Limitation |
+|---------|-----------|------------|
+| Claude Code | Task tool with worktree-aware prompt | Native in-session spawn. |
+| OpenCode | `@<capability>` descriptors from `~/.config/opencode/agents/*.md` or a host Task subagent | Same working tree unless this step explicitly creates and targets a manual git worktree. |
+| Codex CLI | `~/.codex/agents/*.toml` descriptors plus `[agents]` limits | Agentera setup installs descriptor files; do not write legacy `[agents.<name>]` config blocks. |
+| Copilot CLI | User-driven `/fleet` or equivalent host action | No guaranteed programmatic in-session spawn. |
+Never spawn workers by running unsupported capability-name CLI commands such as `agentera optimera`; use the runtime-native subagent surface with the experiment prompt below.
+Spawn an implementation sub-agent in a worktree (`isolation: "worktree"`) with:
+- The hypothesis from step 3
+- Relevant context files (objective.yaml, recent experiments, source files being modified)
+- Clear constraint: implement the hypothesis and nothing else
+```
+You are implementing one optimization experiment for [project].
+## Hypothesis
+[The hypothesis]
+## Context
+- Current metric: [value] ([unit])
+- Target: [target value]
+- Scope: [files/modules in scope from objective.yaml]
+## Constraints
+- Implement ONLY what the hypothesis describes. No scope creep.
+- Do NOT modify the eval harness at .agentera/optimera/<objective-name>/harness.
+- Do NOT modify objective.yaml or experiments.yaml.
+- Follow existing code patterns and conventions.
+- Read the files you are modifying before changing them.
+- Keep the change as small as possible while testing the hypothesis.
+- If you encounter a bug unrelated to your task, note it but do not fix it.
+```
+Wait for the implementation agent to complete before proceeding.
+### Step 5: Measure
+After implementation completes, run two checks in sequence:
+**5a. Regression check**: run the project's existing test/build/lint suite. If the regression check fails, **stop here**. The experiment is discarded. Do not run the eval harness. Log the regression failure and move to Step 7.
+**5b. Metric measurement**: run the eval harness. Parse the JSON output. Compare the new metric against the baseline from Step 2.
+### Step 6: Decide
+Present the decision conversationally: what the numbers say and what you'd recommend, then the structured gate below makes it official.
+Apply the decision gate. **Both conditions must be true** to keep an experiment:
+1. **Regression check passed** (from Step 5a)
+2. **Metric improved**: the new value is strictly better than the baseline, in the direction declared by the harness (lower for "lower", higher for "higher")
+If both pass: **keep**. Merge the worktree branch into the current branch. Commit with a conventional commit message:
+```
+perf(scope): summary of what improved the metric
+Metric: <before> → <after> ⮉ (<unit>)
+```
+If either fails: **discard**. The worktree is abandoned. No merge. No commit.
+If the kept experiment's new metric also meets the target in the harness direction, mark the objective as ready for closure after the experiment entry is logged in Step 8.
+### Step 7: Pre-write self-audit
+Pre-write self-audit: run `agentera lint --artifact <ARTIFACT> --text "<DRAFT>"` (or `--file <PATH>`; schema names such as `decisions` auto-resolve the artifact file when no input is given) on the draft entry to check verbosity overruns (per-artifact budget), abstraction creep (>=1 concrete anchor), and filler accumulation (banned patterns table). Max 3 revision attempts. Flag with [post-audit-flagged] if still failing.
+Narration voice (riff, don't script):
+"Tightening this up..." · "Cutting the filler first..." · "One more pass..."
+### Step 8: Log
+Summarize the experiment for the user before writing the log: what moved, what didn't, and what it suggests trying next. Then write the structured record.
+Update **experiments.yaml**: append the experiment entry. Output constraint per contract token budgets.
+If Step 6 marked the objective as ready for closure, immediately run the objective closure procedure with reason `experiment met target`. This closure is part of the same log step, after the experiment result is recorded.
+When appending a new experiment entry to experiments.yaml, apply the schema COMPACTION rules before writing if thresholds are exceeded: keep 10 full experiments, keep up to 40 one-line archive entries, and drop beyond 50 total.
+Artifact writing follows contract Artifact Writing Conventions: banned verbosity patterns, 25-word sentence cap, preferred vocabulary, and lead-with-conclusion structure.
+Then stop. One experiment complete.
+---
+## Safety rails
+<critical>
+- NEVER push to any remote. Local commits only.
+- NEVER modify the eval harness (`.agentera/optimera/<objective-name>/harness`) during an optimization cycle. Only touch it during a brainstorm (bootstrap or user-requested refinement).
+- NEVER modify objective.yaml during a cycle except to record canonical closure when the target is met. Other objective.yaml edits only happen during brainstorm or refine.
+- NEVER bypass the project's test/lint/build suite. Regression check before every metric measurement. Regression failure = automatic discard.
+- NEVER modify git config or skip git hooks.
+- NEVER force push, amend published commits, or run destructive git operations.
+- NEVER keep an experiment that causes a regression, even if the metric improved.
+- NEVER add placeholder data or functionality. All code must be real and functional.
+- NEVER modify files outside the scope declared in objective.yaml (when scope is declared).
+- One experiment per invocation. Do not attempt multiple experiments.
+</critical>
+---
+## Handling blocked experiments
+If blocked (missing dependency, ambiguous constraint, too risky):
+1. Log blocked hypothesis in experiments.yaml with context and decision needed
+2. Formulate a different hypothesis and complete a full experiment on that instead
+---
+## Exit signals
+Report one of these statuses at workflow completion (protocol refs: EX1-EX4).
+Format: `─── ⎘ optimera · status ───` followed by a summary sentence.
+For flagged, stuck, and waiting: add `▸` bullet details below the summary.
+- **complete** (EX1): One experiment completed the full cycle: hypothesis formulated, implementation dispatched, regression check passed, metric measured, decision made (kept or discarded), and experiments.yaml updated.
+- **flagged** (EX2): The experiment cycle completed but with issues worth noting: the metric did not improve after multiple attempts, a plateau was detected, or the experiment had to be discarded due to a regression.
+- **stuck** (EX3): Cannot proceed because objective.yaml is missing and the brainstorm cannot be completed without user input, the eval harness is broken and cannot be repaired without user approval, or the regression check infrastructure is unavailable.
+- **waiting** (EX4): The optimization objective is too vague to experiment against, the metric cannot be measured by any available tooling, or the scope is undefined and cannot be safely inferred.
+Before reporting any status, inspect the last 3 entries in PROGRESS.md. If all 3 entries record failed or discarded experiments, this constitutes 3 consecutive failures: **stop the cycle**, log the failure pattern to TODO.md, and surface the situation to the user with a recommended course of action. Do not attempt a 4th consecutive experiment on the same problem.
+---
+## Cross-capability integration
+Optimera is part of a twelve-capability suite. Each capability can invoke the others when the work calls for it.
+### Optimera invokes ⬚ inspirera
+When the Hypothesize step needs external techniques (especially after a plateau), search for approaches the way ⬚ inspirera would. Read the source deeply, extract transferable patterns, and fold them into the next hypothesis.
+### Realisera invokes ⎘ optimera
+When realisera picks work that is optimization-shaped (e.g., "improve test performance by 20%", "reduce build time", "increase coverage"), it can delegate to optimera. Realisera provides the context; optimera runs the optimization loop.
+### Optimera reads ♾ profilera output
+Every experiment reads `$PROFILERA_PROFILE_DIR/PROFILE.md` when it exists and applies confidence thresholds per contract profile consumption conventions. Effective confidence weighting ensures stale preferences don't over-constrain experiments.
+### Optimera uses ❈ resonera for objective decisions
+When the brainstorm session surfaces ambiguity about what to optimize (competing metrics, unclear constraints, or tradeoffs between measurement approaches), suggest ❈ resonera to deliberate first. Resonera can produce or refine objective.yaml directly, and its DECISIONS.md entries give optimera context for why the objective was chosen. During Orient, use `agentera decisions --format json` for prior deliberation context and preserve returned `missing_fields`, `compacted`, `caveats`, and `satisfaction.review_needed` pressure instead of raw-reading missing historical context.
+### Inspektera feeds ⎘ optimera
+When an inspektera audit reveals a poor dimension grade with a clearly measurable improvement path (test coverage, complexity score, dependency count), the finding can become an optimization objective. ⛶ inspektera may suggest ⎘ optimera when the metric and direction are clear.
+---
+## Getting started
+### First optimization
+1. `/agentera profile`: generate or refresh the decision profile (skip if recent)
+2. `/agentera optimize`: the first run detects no objective.yaml, runs a brainstorm with you to define the objective and write the eval harness, then proceeds to experiment 1
+3. Host loop + `/agentera optimize`: set up continuous optimization where supported
+### Resuming optimization
+1. `/agentera optimize`: if objective.yaml and the eval harness exist, starts experimenting immediately. Reads experiments.yaml to understand what's been tried.
+### Changing the target
+Edit objective.yaml directly to adjust the target value or constraints, or tell optimera to "refine the objective" for a guided session. If the measurement approach needs to change, the eval harness must be rebuilt and re-approved.
+### Optimera is fed by ≡ planera
+When a plan includes optimization-shaped tasks (improving a measurable metric), planera can delegate those tasks to optimera. The plan's acceptance criteria inform the optimization objective.
+### Drawing in external techniques
+Run `/agentera research <url>` with a relevant article, repo, or resource. The analysis will surface optimization techniques applicable to the objective. The next experiment picks them up naturally from the inspiration analysis.

package/bundle/skills/agentera/capabilities/optimera/schemas/artifacts.yaml ADDED Viewed

@@ -0,0 +1,69 @@
+ARTIFACTS:
+  1:
+    id: A1
+    artifact_id: objective
+    local_role: produces_and_consumes
+    description: >-
+      Optimization target definition: metric, current value, target, constraints,
+      scope, and measurement approach. Optimera writes this during brainstorm
+      and reads it every cycle. Written to only during brainstorm, refine, or
+      canonical closure.
+  2:
+    id: A2
+    artifact_id: optimera_harness
+    local_role: produces
+    description: >-
+      Eval script that measures the metric and outputs structured JSON. Written
+      during brainstorm, approved by user, then locked.
+      Never modified during optimization cycles.
+  3:
+    id: A3
+    artifact_id: experiments
+    local_role: produces_and_consumes
+    description: >-
+      Log of every experiment: hypothesis, method, change, metric before/after,
+      regression result, status (kept/discarded/error), conclusion, and next
+      suggestion. Optimera appends to this each cycle.
+  4:
+    id: A4
+    artifact_id: progress
+    local_role: consumes
+    description: >-
+      Optimera inspects the last 3 entries to detect 3 consecutive failures
+      before reporting exit status.
+  5:
+    id: A5
+    artifact_id: todo
+    local_role: produces
+    description: >-
+      Optimera writes to this when logging a failure pattern after 3
+      consecutive failures.
+  6:
+    id: A6
+    artifact_id: decisions
+    local_role: consumes
+    description: >-
+      Optimera reads this during Orient for context on prior deliberations
+      about the optimization objective.
+  7:
+    id: A7
+    artifact_id: profile
+    local_role: consumes
+    description: >-
+      Optimera reads this to modulate experiment aggressiveness and constraint
+      tolerance based on user preferences.
+  8:
+    id: A8
+    artifact_id: docs
+    local_role: consumes
+    description: >-
+      Optimera reads this first to resolve project-local artifact mappings
+      before accessing other artifacts.
+  9:
+    id: A9
+    artifact_id: benchmark_context
+    local_role: consumes
+    description: >-
+      CLI-provided startup benchmark summary from `agentera prime --context
+      optimera --format json`. Optimera consumes this before any direct
+      latest-report.json, latest-report.md, or runs.jsonl diagnostic read.

package/bundle/skills/agentera/capabilities/optimera/schemas/exit.yaml ADDED Viewed

@@ -0,0 +1,35 @@
+EXIT_CONDITIONS:
+  1:
+    id: E1
+    condition: complete
+    description: >-
+      One experiment completed the full cycle: hypothesis formulated,
+      implementation dispatched, regression check passed, metric measured,
+      decision made (kept or discarded), and experiments.yaml updated.
+    exit_signal: complete
+  2:
+    id: E2
+    condition: flagged
+    description: >-
+      The experiment cycle completed but with issues worth noting: the metric
+      did not improve after multiple attempts, a plateau was detected, or the
+      experiment had to be discarded due to a regression. Each concern is
+      listed explicitly.
+    exit_signal: flagged
+  3:
+    id: E3
+    condition: stuck
+    description: >-
+      Cannot proceed because objective.yaml is missing and the brainstorm cannot
+      be completed without user input, the eval harness is broken and cannot
+      be repaired without user approval, or the regression check infrastructure
+      is unavailable.
+    exit_signal: stuck
+  4:
+    id: E4
+    condition: waiting
+    description: >-
+      The optimization objective is too vague to experiment against, the metric
+      cannot be measured by any available tooling, or the scope is undefined
+      and cannot be safely inferred.
+    exit_signal: waiting

package/bundle/skills/agentera/capabilities/optimera/schemas/triggers.yaml ADDED Viewed

@@ -0,0 +1,39 @@
+TRIGGERS:
+  1:
+    id: T1
+    description: >-
+      Direct invocation by name or slash command. Matches when the user
+      explicitly requests optimera.
+    priority: high
+    patterns:
+      - "optimera"
+      - "/optimera"
+  2:
+    id: T2
+    description: >-
+      Metric-driven optimization requests. Matches when the user wants to
+      improve a concrete, quantifiable property of their codebase.
+    priority: medium
+    patterns:
+      - "optimize"
+      - "improve performance"
+      - "reduce latency"
+      - "increase test coverage"
+      - "lower bundle size"
+      - "speed up"
+      - "make faster"
+      - "make smaller"
+      - "get the score up"
+      - "hit the target"
+      - "improve the metric"
+  3:
+    id: T3
+    description: >-
+      Iterative experimentation requests. Matches when the user wants to
+      run experiments, benchmark, or iterate on a measurable objective.
+    priority: medium
+    patterns:
+      - "benchmark and iterate"
+      - "run experiments"
+      - "tune"
+      - "experiment until"

package/bundle/skills/agentera/capabilities/optimera/schemas/validation.yaml ADDED Viewed

@@ -0,0 +1,91 @@
+VALIDATION:
+  1:
+    id: V1
+    rule: harness_locked_during_cycle
+    description: >-
+      The eval harness MUST NOT be modified during an optimization cycle.
+      It may only be written during brainstorm (bootstrap) or user-requested
+      refinement. This ensures measurement consistency across experiments.
+    severity: critical
+    checks:
+      - "Harness file is not modified between Step 1 and Step 8"
+  2:
+    id: V2
+    rule: regression_first
+    description: >-
+      The regression check MUST pass before the eval harness runs. If the
+      project's test/build/lint suite fails, the experiment is automatically
+      discarded. Metric improvement does not override regression failure.
+    severity: critical
+    checks:
+      - "Regression check runs before metric measurement"
+      - "Regression failure results in experiment discard"
+  3:
+    id: V3
+    rule: objective_readonly_during_cycle
+    description: >-
+      objective.yaml MUST NOT be modified during a cycle except for canonical
+      closure when the target is met. Other edits only happen during
+      brainstorm or refine.
+    severity: critical
+    checks:
+      - "objective.yaml only modified for closure during cycle"
+  4:
+    id: V4
+    rule: one_experiment_per_invocation
+    description: >-
+      Each optimera invocation performs exactly one experiment. Multiple
+      experiments require multiple invocations or /loop setup.
+    severity: critical
+    checks:
+      - "At most one experiment logged per invocation"
+  5:
+    id: V5
+    rule: decision_gate_both_conditions
+    description: >-
+      An experiment is kept only when BOTH conditions are true:
+      (1) regression check passed, and (2) metric improved in the declared
+      direction. If either fails, the experiment is discarded.
+    severity: critical
+    checks:
+      - "Kept experiments have both regression pass and metric improvement"
+  6:
+    id: V6
+    rule: exit_marker_required
+    description: >-
+      Every optimera invocation MUST emit an exit marker. The marker uses
+      the canonical glyph ⎘ (SG7) in the format ⎘ optimera · <status>
+      where status is one of complete, flagged, stuck, or waiting (EX1-EX4).
+    severity: critical
+    checks:
+      - "Exit marker present after experiment"
+      - "Exit marker uses glyph ⎘ (SG7)"
+      - "Exit marker status is one of complete, flagged, stuck, waiting"
+  7:
+    id: V7
+    rule: benchmark_context_first
+    description: >-
+      For benchmark-oriented startup, Optimera MUST start from `agentera prime
+      --context optimera --format json` and consume complete
+      benchmark_context before direct retained benchmark file reads. Direct
+      latest-report.json, latest-report.md, or runs.jsonl reads are last-resort
+      diagnostics only when the CLI context is incomplete.
+    severity: critical
+    checks:
+      - "Optimera startup uses benchmark_context before direct retained benchmark files"
+      - "Incomplete benchmark_context follows listed CLI fallback and manual refresh guidance"
+      - "Direct benchmark file reads are treated as last-resort diagnostics"
+  8:
+    id: V8
+    rule: benchmark_caveat_preservation
+    description: >-
+      Benchmark caveats from benchmark_context MUST be preserved when Optimera
+      reports measurement evidence. Agents must not hide, upgrade, reconstruct,
+      or infer away caveats for manual-only execution, missing local history,
+      runtime coverage degradation, missing token estimates, non-comparable
+      previous rows, or privacy boundaries.
+    severity: critical
+    checks:
+      - "Manual-only benchmark execution caveats are reported"
+      - "Missing or malformed retained evidence remains incomplete"
+      - "Runtime coverage, token-impact, comparison, and privacy caveats are preserved"