selftune 0.2.23 → 0.2.24
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +6 -0
- package/README.md +93 -15
- package/apps/local-dashboard/dist/assets/index-DgY2KGP-.css +1 -0
- package/apps/local-dashboard/dist/assets/index-Dmx7LPVX.js +15 -0
- package/apps/local-dashboard/dist/assets/vendor-react-C5oyHiV1.js +11 -0
- package/apps/local-dashboard/dist/assets/{vendor-table-BIiI3YhS.js → vendor-table-Bc_bbKd8.js} +1 -1
- package/apps/local-dashboard/dist/assets/vendor-ui-B3BPIYy7.js +1 -0
- package/apps/local-dashboard/dist/index.html +5 -5
- package/cli/selftune/adapters/codex/install.ts +310 -78
- package/cli/selftune/adapters/opencode/install.ts +3 -4
- package/cli/selftune/alpha-upload/build-payloads.ts +3 -3
- package/cli/selftune/alpha-upload/stage-canonical.ts +17 -11
- package/cli/selftune/auto-update.ts +200 -8
- package/cli/selftune/canonical-export.ts +55 -25
- package/cli/selftune/command-surface.ts +397 -0
- package/cli/selftune/contribute/contribute.ts +64 -13
- package/cli/selftune/contribution-config.ts +57 -3
- package/cli/selftune/contribution-preferences.ts +117 -0
- package/cli/selftune/contribution-signals.ts +8 -4
- package/cli/selftune/contribution-staging.ts +13 -2
- package/cli/selftune/contributions.ts +55 -121
- package/cli/selftune/creator-contributions.ts +29 -10
- package/cli/selftune/cron/setup.ts +7 -3
- package/cli/selftune/dashboard-contract.ts +73 -0
- package/cli/selftune/dashboard-server.ts +168 -17
- package/cli/selftune/dashboard.ts +350 -17
- package/cli/selftune/eval/baseline.ts +21 -5
- package/cli/selftune/eval/execution-eval.ts +170 -0
- package/cli/selftune/eval/family-overlap.ts +2 -2
- package/cli/selftune/eval/hooks-to-evals.ts +228 -82
- package/cli/selftune/eval/import-skillsbench.ts +2 -2
- package/cli/selftune/eval/invocation-classifier.ts +56 -0
- package/cli/selftune/eval/synthetic-evals.ts +5 -3
- package/cli/selftune/eval/unit-test-cli.ts +7 -4
- package/cli/selftune/evolution/apply-proposal.ts +295 -0
- package/cli/selftune/evolution/engines/replay-engine.ts +79 -57
- package/cli/selftune/evolution/evolve-body.ts +100 -39
- package/cli/selftune/evolution/evolve.ts +244 -52
- package/cli/selftune/evolution/rollback.ts +0 -1
- package/cli/selftune/evolution/validate-body.ts +68 -42
- package/cli/selftune/evolution/validate-host-replay.ts +510 -60
- package/cli/selftune/evolution/validate-proposal.ts +11 -150
- package/cli/selftune/evolution/validate-routing.ts +43 -41
- package/cli/selftune/evolution/validation-contract.ts +91 -0
- package/cli/selftune/grading/auto-grade.ts +11 -7
- package/cli/selftune/grading/grade-session.ts +10 -16
- package/cli/selftune/index.ts +35 -10
- package/cli/selftune/ingestors/claude-replay.ts +15 -10
- package/cli/selftune/ingestors/codex-wrapper.ts +3 -3
- package/cli/selftune/ingestors/opencode-ingest.ts +2 -2
- package/cli/selftune/ingestors/pi-ingest.ts +3 -2
- package/cli/selftune/init.ts +27 -3
- package/cli/selftune/localdb/direct-write.ts +35 -1
- package/cli/selftune/localdb/queries/cron.ts +34 -0
- package/cli/selftune/localdb/queries/dashboard.ts +834 -0
- package/cli/selftune/localdb/queries/evolution.ts +158 -0
- package/cli/selftune/localdb/queries/execution.ts +133 -0
- package/cli/selftune/localdb/queries/json.ts +18 -0
- package/cli/selftune/localdb/queries/monitoring.ts +263 -0
- package/cli/selftune/localdb/queries/raw.ts +95 -0
- package/cli/selftune/localdb/queries/staging.ts +270 -0
- package/cli/selftune/localdb/queries/trust.ts +392 -0
- package/cli/selftune/localdb/queries.ts +60 -2288
- package/cli/selftune/localdb/schema.ts +21 -0
- package/cli/selftune/monitoring/watch.ts +96 -29
- package/cli/selftune/normalization.ts +3 -0
- package/cli/selftune/observability.ts +4 -2
- package/cli/selftune/orchestrate/cli.ts +161 -0
- package/cli/selftune/orchestrate/execute.ts +295 -0
- package/cli/selftune/orchestrate/finalize.ts +157 -0
- package/cli/selftune/orchestrate/locks.ts +40 -0
- package/cli/selftune/orchestrate/plan.ts +131 -0
- package/cli/selftune/orchestrate/post-run.ts +59 -0
- package/cli/selftune/orchestrate/prepare.ts +334 -0
- package/cli/selftune/orchestrate/report.ts +182 -0
- package/cli/selftune/orchestrate/runtime.ts +120 -0
- package/cli/selftune/orchestrate/signals.ts +48 -0
- package/cli/selftune/orchestrate.ts +150 -1173
- package/cli/selftune/repair/skill-usage.ts +5 -2
- package/cli/selftune/routes/overview.ts +5 -2
- package/cli/selftune/routes/skill-report.ts +15 -2
- package/cli/selftune/schedule.ts +5 -5
- package/cli/selftune/status.ts +39 -2
- package/cli/selftune/testing-readiness.ts +597 -0
- package/cli/selftune/types.ts +44 -4
- package/cli/selftune/uninstall.ts +2 -1
- package/cli/selftune/utils/canonical-log.ts +1 -9
- package/cli/selftune/utils/cli-error.ts +9 -0
- package/cli/selftune/utils/llm-call.ts +126 -6
- package/cli/selftune/utils/skill-discovery.ts +2 -0
- package/cli/selftune/workflows/proposals.ts +184 -0
- package/cli/selftune/workflows/skill-scaffold.ts +241 -0
- package/cli/selftune/workflows/workflows.ts +100 -26
- package/node_modules/@selftune/telemetry-contract/fixtures/complete-push.ts +1 -1
- package/node_modules/@selftune/telemetry-contract/fixtures/evidence-only-push.ts +1 -1
- package/node_modules/@selftune/telemetry-contract/fixtures/partial-push-no-sessions.ts +1 -1
- package/node_modules/@selftune/telemetry-contract/fixtures/partial-push-unresolved-parents.ts +1 -1
- package/node_modules/@selftune/telemetry-contract/src/schemas.ts +41 -1
- package/node_modules/@selftune/telemetry-contract/src/types.ts +103 -2
- package/package.json +25 -9
- package/packages/dashboard-core/AGENTS.md +18 -0
- package/packages/dashboard-core/README.md +30 -0
- package/packages/dashboard-core/index.ts +3 -0
- package/packages/dashboard-core/package.json +39 -0
- package/packages/dashboard-core/src/chrome/DashboardChrome.tsx +74 -0
- package/packages/dashboard-core/src/chrome/DashboardHeader.tsx +200 -0
- package/packages/dashboard-core/src/chrome/DashboardSidebar.tsx +219 -0
- package/packages/dashboard-core/src/chrome/RuntimeBadge.tsx +46 -0
- package/packages/dashboard-core/src/chrome/index.ts +14 -0
- package/packages/dashboard-core/src/chrome/types.ts +81 -0
- package/packages/dashboard-core/src/chrome/utils.ts +23 -0
- package/packages/dashboard-core/src/gates/FeatureGate.tsx +11 -0
- package/packages/dashboard-core/src/gates/LockedRoute.tsx +29 -0
- package/packages/dashboard-core/src/gates/UpgradeCard.tsx +89 -0
- package/packages/dashboard-core/src/gates/index.ts +3 -0
- package/packages/dashboard-core/src/host/DashboardHostProvider.tsx +62 -0
- package/packages/dashboard-core/src/host/adapter.ts +47 -0
- package/packages/dashboard-core/src/host/capabilities.ts +55 -0
- package/packages/dashboard-core/src/host/index.ts +3 -0
- package/packages/dashboard-core/src/models/analytics.ts +39 -0
- package/packages/dashboard-core/src/models/index.ts +4 -0
- package/packages/dashboard-core/src/models/overview.ts +98 -0
- package/packages/dashboard-core/src/models/runtime.ts +7 -0
- package/packages/dashboard-core/src/models/skills.ts +34 -0
- package/packages/dashboard-core/src/routes/index.ts +2 -0
- package/packages/dashboard-core/src/routes/manifest.test.ts +70 -0
- package/packages/dashboard-core/src/routes/manifest.ts +451 -0
- package/packages/dashboard-core/src/routes/types.ts +39 -0
- package/packages/dashboard-core/src/screens/analytics/AnalyticsScreen.tsx +278 -0
- package/packages/dashboard-core/src/screens/analytics/index.ts +1 -0
- package/packages/dashboard-core/src/screens/index.ts +37 -0
- package/packages/dashboard-core/src/screens/overview/OverviewComparisonSurface.test.ts +101 -0
- package/packages/dashboard-core/src/screens/overview/OverviewComparisonSurface.tsx +393 -0
- package/packages/dashboard-core/src/screens/overview/OverviewCompositionSurface.test.tsx +113 -0
- package/packages/dashboard-core/src/screens/overview/OverviewCompositionSurface.tsx +72 -0
- package/packages/dashboard-core/src/screens/overview/OverviewCoreSurface.tsx +71 -0
- package/packages/dashboard-core/src/screens/overview/OverviewOnboardingBanner.tsx +90 -0
- package/packages/dashboard-core/src/screens/overview/OverviewRunSummary.tsx +40 -0
- package/packages/dashboard-core/src/screens/overview/index.ts +16 -0
- package/packages/dashboard-core/src/screens/overview/types.ts +13 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportDailyBreakdownSection.tsx +99 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportDataQualityTabContent.tsx +35 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportEvidenceRail.tsx +71 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportEvidenceSection.tsx +63 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportEvidenceTabContent.tsx +25 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportInvocationsSection.tsx +24 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportMissedQueriesSection.tsx +79 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportScaffold.tsx +150 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportSections.test.tsx +224 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportTabs.test.tsx +76 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportTabs.tsx +88 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportTrendSection.tsx +33 -0
- package/packages/dashboard-core/src/screens/skill-report/SkillReportTrustBadge.tsx +67 -0
- package/packages/dashboard-core/src/screens/skill-report/index.ts +45 -0
- package/packages/dashboard-core/src/screens/skills/SkillsLibraryScreen.tsx +162 -0
- package/packages/dashboard-core/src/screens/skills/index.ts +6 -0
- package/packages/telemetry-contract/fixtures/complete-push.ts +1 -1
- package/packages/telemetry-contract/fixtures/evidence-only-push.ts +1 -1
- package/packages/telemetry-contract/fixtures/partial-push-no-sessions.ts +1 -1
- package/packages/telemetry-contract/fixtures/partial-push-unresolved-parents.ts +1 -1
- package/packages/telemetry-contract/src/schemas.ts +41 -1
- package/packages/telemetry-contract/src/types.ts +103 -2
- package/packages/ui/src/components/EvidenceViewer.tsx +80 -25
- package/packages/ui/src/components/OverviewPanels.tsx +67 -26
- package/packages/ui/src/primitives/tabs.tsx +7 -6
- package/packages/ui/src/types.ts +10 -0
- package/skill/SKILL.md +130 -332
- package/skill/agents/diagnosis-analyst.md +3 -3
- package/skill/agents/evolution-reviewer.md +3 -3
- package/skill/agents/integration-guide.md +3 -3
- package/skill/agents/pattern-analyst.md +2 -2
- package/skill/references/cli-quick-reference.md +89 -0
- package/skill/references/creator-playbook.md +131 -0
- package/skill/references/examples.md +48 -0
- package/skill/references/troubleshooting.md +47 -0
- package/skill/references/version-history.md +1 -1
- package/skill/selftune.contribute.json +11 -0
- package/skill/{Workflows → workflows}/Baseline.md +20 -1
- package/skill/{Workflows → workflows}/Contribute.md +23 -10
- package/skill/{Workflows → workflows}/Contributions.md +13 -5
- package/skill/workflows/CreateTestDeploy.md +170 -0
- package/skill/{Workflows → workflows}/CreatorContributions.md +18 -6
- package/skill/{Workflows → workflows}/Cron.md +1 -1
- package/skill/{Workflows → workflows}/Dashboard.md +20 -0
- package/skill/{Workflows → workflows}/Doctor.md +1 -1
- package/skill/{Workflows → workflows}/Evals.md +67 -2
- package/skill/{Workflows → workflows}/Evolve.md +119 -30
- package/skill/{Workflows → workflows}/EvolveBody.md +41 -1
- package/skill/{Workflows → workflows}/Grade.md +1 -1
- package/skill/{Workflows → workflows}/Initialize.md +8 -4
- package/skill/{Workflows → workflows}/Orchestrate.md +13 -3
- package/skill/{Workflows → workflows}/Schedule.md +3 -3
- package/skill/workflows/SignalsDashboard.md +87 -0
- package/skill/{Workflows → workflows}/UnitTest.md +19 -0
- package/skill/{Workflows → workflows}/Watch.md +42 -2
- package/skill/{Workflows → workflows}/Workflows.md +39 -2
- package/apps/local-dashboard/dist/assets/index-CwOtTrUS.css +0 -1
- package/apps/local-dashboard/dist/assets/index-f1HQpbeH.js +0 -59
- package/apps/local-dashboard/dist/assets/vendor-react-CKkiCskZ.js +0 -11
- package/apps/local-dashboard/dist/assets/vendor-ui-jVSaIZey.js +0 -12
- /package/skill/{Workflows → workflows}/AlphaUpload.md +0 -0
- /package/skill/{Workflows → workflows}/AutoActivation.md +0 -0
- /package/skill/{Workflows → workflows}/Badge.md +0 -0
- /package/skill/{Workflows → workflows}/Composability.md +0 -0
- /package/skill/{Workflows → workflows}/EvolutionMemory.md +0 -0
- /package/skill/{Workflows → workflows}/ExportCanonical.md +0 -0
- /package/skill/{Workflows → workflows}/Hook.md +0 -0
- /package/skill/{Workflows → workflows}/ImportSkillsBench.md +0 -0
- /package/skill/{Workflows → workflows}/Ingest.md +0 -0
- /package/skill/{Workflows → workflows}/PlatformHooks.md +0 -0
- /package/skill/{Workflows → workflows}/Quickstart.md +0 -0
- /package/skill/{Workflows → workflows}/Recover.md +0 -0
- /package/skill/{Workflows → workflows}/Registry.md +0 -0
- /package/skill/{Workflows → workflows}/RepairSkillUsage.md +0 -0
- /package/skill/{Workflows → workflows}/Replay.md +0 -0
- /package/skill/{Workflows → workflows}/Rollback.md +0 -0
- /package/skill/{Workflows → workflows}/Sync.md +0 -0
- /package/skill/{Workflows → workflows}/Telemetry.md +0 -0
- /package/skill/{Workflows → workflows}/Uninstall.md +0 -0
|
@@ -7,19 +7,22 @@
|
|
|
7
7
|
* Gate 3 (quality): Student model rates body clarity/completeness 0.0-1.0
|
|
8
8
|
*
|
|
9
9
|
* Gate 2 now supports replay-backed validation (via replay engine) in addition
|
|
10
|
-
* to LLM-judge-based checking. When replay
|
|
11
|
-
* the replay path is preferred. Falls back to LLM judge otherwise.
|
|
10
|
+
* to LLM-judge-based checking. When real host/runtime replay is available and
|
|
11
|
+
* succeeds, the replay path is preferred. Falls back to LLM judge otherwise.
|
|
12
12
|
*/
|
|
13
13
|
|
|
14
14
|
import type {
|
|
15
15
|
BodyEvolutionProposal,
|
|
16
16
|
BodyValidationResult,
|
|
17
17
|
EvalEntry,
|
|
18
|
+
RoutingReplayEntryResult,
|
|
19
|
+
ValidationGate,
|
|
18
20
|
ValidationMode,
|
|
19
21
|
} from "../types.js";
|
|
20
22
|
import { callLlm, stripMarkdownFences } from "../utils/llm-call.js";
|
|
21
23
|
import { runJudgeValidation } from "./engines/judge-engine.js";
|
|
22
|
-
import { runReplayValidation, type ReplayValidationOptions } from "./engines/replay-engine.js";
|
|
24
|
+
import type { ReplayValidationOptions } from "./engines/replay-engine.js";
|
|
25
|
+
import { runValidationContract, type ValidationStrategy } from "./validation-contract.js";
|
|
23
26
|
|
|
24
27
|
// ---------------------------------------------------------------------------
|
|
25
28
|
// Types
|
|
@@ -28,6 +31,8 @@ import { runReplayValidation, type ReplayValidationOptions } from "./engines/rep
|
|
|
28
31
|
export interface BodyValidationOptions {
|
|
29
32
|
/** Replay options for Gate 2 trigger accuracy. */
|
|
30
33
|
replay?: ReplayValidationOptions;
|
|
34
|
+
mode?: ValidationStrategy;
|
|
35
|
+
onReplayFallback?: (reason?: string) => void;
|
|
31
36
|
}
|
|
32
37
|
|
|
33
38
|
// ---------------------------------------------------------------------------
|
|
@@ -83,7 +88,7 @@ export function validateBodyStructure(proposedBody: string): { valid: boolean; r
|
|
|
83
88
|
* Run trigger checks on the eval set using the proposed body content.
|
|
84
89
|
* Returns before/after pass rates.
|
|
85
90
|
*
|
|
86
|
-
* When replay options are provided, attempts replay
|
|
91
|
+
* When replay options are provided, attempts host/runtime replay first.
|
|
87
92
|
* Falls back to LLM judge when replay is unavailable or no options given.
|
|
88
93
|
*/
|
|
89
94
|
export async function validateBodyTriggerAccuracy(
|
|
@@ -99,6 +104,9 @@ export async function validateBodyTriggerAccuracy(
|
|
|
99
104
|
improved: boolean;
|
|
100
105
|
regressions: string[];
|
|
101
106
|
validation_mode: ValidationMode;
|
|
107
|
+
validation_agent?: string;
|
|
108
|
+
validation_fixture_id?: string;
|
|
109
|
+
validation_fallback_reason?: string;
|
|
102
110
|
per_entry_results?: import("../types.js").RoutingReplayEntryResult[];
|
|
103
111
|
before_entry_results?: import("../types.js").RoutingReplayEntryResult[];
|
|
104
112
|
}> {
|
|
@@ -109,48 +117,64 @@ export async function validateBodyTriggerAccuracy(
|
|
|
109
117
|
improved: false,
|
|
110
118
|
regressions: [],
|
|
111
119
|
validation_mode: "llm_judge",
|
|
120
|
+
validation_agent: agent,
|
|
112
121
|
};
|
|
113
122
|
}
|
|
114
123
|
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
|
|
123
|
-
|
|
124
|
-
|
|
125
|
-
|
|
126
|
-
|
|
127
|
-
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
regressions: [],
|
|
131
|
-
validation_mode: replayResult.validation_mode,
|
|
132
|
-
per_entry_results: replayResult.per_entry_results,
|
|
133
|
-
before_entry_results: replayResult.before_entry_results,
|
|
134
|
-
};
|
|
135
|
-
}
|
|
136
|
-
}
|
|
137
|
-
|
|
138
|
-
// Fall back to LLM judge
|
|
139
|
-
const judgeResult = await runJudgeValidation(
|
|
140
|
-
originalBody,
|
|
141
|
-
proposedBody,
|
|
124
|
+
const { result, fallbackReason } = await runValidationContract<{
|
|
125
|
+
before_pass_rate: number;
|
|
126
|
+
after_pass_rate: number;
|
|
127
|
+
improved: boolean;
|
|
128
|
+
regressions: string[];
|
|
129
|
+
validation_mode: ValidationMode;
|
|
130
|
+
validation_agent?: string;
|
|
131
|
+
validation_fixture_id?: string;
|
|
132
|
+
validation_fallback_reason?: string;
|
|
133
|
+
per_entry_results?: RoutingReplayEntryResult[];
|
|
134
|
+
before_entry_results?: RoutingReplayEntryResult[];
|
|
135
|
+
}>({
|
|
136
|
+
mode: options?.mode ?? "auto",
|
|
137
|
+
originalContent: originalBody,
|
|
138
|
+
proposedContent: proposedBody,
|
|
142
139
|
evalSet,
|
|
143
140
|
agent,
|
|
144
|
-
|
|
145
|
-
|
|
141
|
+
replayOptions: options?.replay,
|
|
142
|
+
runJudge: async () => {
|
|
143
|
+
const judgeResult = await runJudgeValidation(
|
|
144
|
+
originalBody,
|
|
145
|
+
proposedBody,
|
|
146
|
+
evalSet,
|
|
147
|
+
agent,
|
|
148
|
+
modelFlag,
|
|
149
|
+
);
|
|
146
150
|
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
151
|
+
return {
|
|
152
|
+
result: {
|
|
153
|
+
before_pass_rate: judgeResult.before_pass_rate,
|
|
154
|
+
after_pass_rate: judgeResult.after_pass_rate,
|
|
155
|
+
improved: judgeResult.improved,
|
|
156
|
+
regressions: judgeResult.regressions,
|
|
157
|
+
validation_mode: judgeResult.validation_mode,
|
|
158
|
+
validation_agent: judgeResult.validation_agent,
|
|
159
|
+
},
|
|
160
|
+
modeUsed: judgeResult.validation_mode,
|
|
161
|
+
};
|
|
162
|
+
},
|
|
163
|
+
onReplayFallback: options?.onReplayFallback,
|
|
164
|
+
adaptReplayResult: (replayResult) => ({
|
|
165
|
+
before_pass_rate: replayResult.before_pass_rate,
|
|
166
|
+
after_pass_rate: replayResult.after_pass_rate,
|
|
167
|
+
improved: replayResult.improved,
|
|
168
|
+
regressions: [],
|
|
169
|
+
validation_mode: replayResult.validation_mode,
|
|
170
|
+
validation_agent: replayResult.validation_agent,
|
|
171
|
+
validation_fixture_id: replayResult.validation_fixture_id,
|
|
172
|
+
per_entry_results: replayResult.per_entry_results,
|
|
173
|
+
before_entry_results: replayResult.before_entry_results,
|
|
174
|
+
}),
|
|
175
|
+
});
|
|
176
|
+
|
|
177
|
+
return fallbackReason ? { ...result, validation_fallback_reason: fallbackReason } : result;
|
|
154
178
|
}
|
|
155
179
|
|
|
156
180
|
// ---------------------------------------------------------------------------
|
|
@@ -224,7 +248,7 @@ export async function validateBodyProposal(
|
|
|
224
248
|
qualityThreshold = QUALITY_THRESHOLD,
|
|
225
249
|
options?: BodyValidationOptions,
|
|
226
250
|
): Promise<BodyValidationResult> {
|
|
227
|
-
const gateResults: Array<{ gate:
|
|
251
|
+
const gateResults: Array<{ gate: ValidationGate; passed: boolean; reason: string }> = [];
|
|
228
252
|
|
|
229
253
|
// Gate 1: Structural validation (pure code)
|
|
230
254
|
const structural = validateBodyStructure(proposal.proposed_body);
|
|
@@ -287,7 +311,9 @@ export async function validateBodyProposal(
|
|
|
287
311
|
improved: gatesPassed === 3,
|
|
288
312
|
regressions: accuracy.regressions,
|
|
289
313
|
validation_mode: accuracy.validation_mode,
|
|
290
|
-
validation_agent: agent,
|
|
314
|
+
validation_agent: accuracy.validation_agent ?? agent,
|
|
315
|
+
validation_fallback_reason: accuracy.validation_fallback_reason,
|
|
316
|
+
validation_fixture_id: accuracy.validation_fixture_id,
|
|
291
317
|
...(evalSet.length > 0
|
|
292
318
|
? {
|
|
293
319
|
before_pass_rate: accuracy.before_pass_rate,
|