@thinkhive/sdk 3.1.0 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,250 @@
1
+ /**
2
+ * ThinkHive SDK v3.0 - Evaluation Health API
3
+ *
4
+ * API for eval saturation monitoring, regression detection, and health reports
5
+ */
6
+ export type SaturationType = 'ceiling' | 'floor' | 'healthy';
7
+ export type HealthStatus = 'healthy' | 'warning' | 'critical';
8
+ export type RegressionSeverity = 'minor' | 'moderate' | 'severe';
9
+ export interface EvalHealthSnapshot {
10
+ id: string;
11
+ companyId: string;
12
+ agentId: string;
13
+ criterionId?: string;
14
+ snapshotDate: string;
15
+ passRate?: string;
16
+ evalCount?: number;
17
+ meanScore?: string;
18
+ saturationType?: SaturationType;
19
+ daysAtSaturation?: number;
20
+ trendDirection?: string;
21
+ trendStrength?: string;
22
+ healthStatus?: HealthStatus;
23
+ healthScore?: string;
24
+ createdAt: string;
25
+ }
26
+ export interface EvalRegression {
27
+ id: string;
28
+ companyId: string;
29
+ agentId: string;
30
+ criterionId?: string;
31
+ severity: RegressionSeverity;
32
+ baselinePassRate: string;
33
+ currentPassRate: string;
34
+ delta: string;
35
+ deltaPercent?: string;
36
+ baselinePeriodStart: string;
37
+ baselinePeriodEnd: string;
38
+ currentPeriodStart: string;
39
+ currentPeriodEnd: string;
40
+ baselineEvalCount?: number;
41
+ currentEvalCount?: number;
42
+ suspectedCauses?: unknown[];
43
+ isSignificant?: boolean;
44
+ isResolved: boolean;
45
+ isAcknowledged: boolean;
46
+ resolvedAt?: string;
47
+ resolvedBy?: string;
48
+ resolutionType?: string;
49
+ resolutionNotes?: string;
50
+ acknowledgedAt?: string;
51
+ acknowledgedBy?: string;
52
+ detectedAt: string;
53
+ createdAt: string;
54
+ }
55
+ export interface HealthReport {
56
+ agentId: string;
57
+ generatedAt: string;
58
+ overallHealth: HealthStatus;
59
+ overallScore: number;
60
+ passRate: number;
61
+ evalCount: number;
62
+ saturationStatus: {
63
+ type: SaturationType;
64
+ daysAtSaturation: number;
65
+ recommendation: string;
66
+ };
67
+ regressionCount: number;
68
+ activeRegressions: EvalRegression[];
69
+ trend: {
70
+ direction: 'improving' | 'stable' | 'declining';
71
+ strength: number;
72
+ description: string;
73
+ };
74
+ recommendations: string[];
75
+ }
76
+ export interface CreateSnapshotOptions {
77
+ agentId: string;
78
+ criterionId?: string;
79
+ snapshotDate: string;
80
+ passRate?: string;
81
+ evalCount?: number;
82
+ meanScore?: string;
83
+ saturationType?: SaturationType;
84
+ daysAtSaturation?: number;
85
+ trendDirection?: string;
86
+ trendStrength?: string;
87
+ healthStatus?: HealthStatus;
88
+ healthScore?: string;
89
+ }
90
+ export interface CreateRegressionOptions {
91
+ agentId: string;
92
+ criterionId?: string;
93
+ severity: RegressionSeverity;
94
+ baselinePassRate: string;
95
+ currentPassRate: string;
96
+ delta: string;
97
+ deltaPercent?: string;
98
+ baselinePeriodStart: string;
99
+ baselinePeriodEnd: string;
100
+ currentPeriodStart: string;
101
+ currentPeriodEnd: string;
102
+ baselineEvalCount?: number;
103
+ currentEvalCount?: number;
104
+ suspectedCauses?: unknown[];
105
+ isSignificant?: boolean;
106
+ detectedAt?: string;
107
+ }
108
+ export interface ResolveRegressionOptions {
109
+ resolutionType: string;
110
+ notes?: string;
111
+ }
112
+ export interface GetSnapshotsOptions {
113
+ agentId: string;
114
+ criterionId?: string;
115
+ startDate?: string;
116
+ endDate?: string;
117
+ }
118
+ /**
119
+ * Evaluation Health API client for monitoring eval quality and detecting regressions
120
+ */
121
+ export declare const evalHealth: {
122
+ /**
123
+ * Get comprehensive health report for an agent
124
+ *
125
+ * @example
126
+ * ```typescript
127
+ * const report = await evalHealth.getReport('agent_123');
128
+ * console.log(`Overall health: ${report.overallHealth}`);
129
+ * console.log(`Active regressions: ${report.regressionCount}`);
130
+ * ```
131
+ */
132
+ getReport(agentId: string): Promise<HealthReport>;
133
+ /**
134
+ * Get historical health snapshots
135
+ *
136
+ * @example
137
+ * ```typescript
138
+ * const snapshots = await evalHealth.getSnapshots({
139
+ * agentId: 'agent_123',
140
+ * startDate: '2024-01-01T00:00:00Z',
141
+ * endDate: '2024-01-31T23:59:59Z',
142
+ * });
143
+ * ```
144
+ */
145
+ getSnapshots(options: GetSnapshotsOptions): Promise<EvalHealthSnapshot[]>;
146
+ /**
147
+ * Get latest health snapshot
148
+ *
149
+ * @example
150
+ * ```typescript
151
+ * const snapshot = await evalHealth.getLatestSnapshot('agent_123');
152
+ * ```
153
+ */
154
+ getLatestSnapshot(agentId: string, criterionId?: string): Promise<EvalHealthSnapshot | null>;
155
+ /**
156
+ * Record a health snapshot
157
+ *
158
+ * @example
159
+ * ```typescript
160
+ * const snapshot = await evalHealth.recordSnapshot({
161
+ * agentId: 'agent_123',
162
+ * snapshotDate: new Date().toISOString(),
163
+ * passRate: '0.85',
164
+ * evalCount: 150,
165
+ * healthStatus: 'healthy',
166
+ * });
167
+ * ```
168
+ */
169
+ recordSnapshot(options: CreateSnapshotOptions): Promise<EvalHealthSnapshot>;
170
+ /**
171
+ * Get unresolved regressions for an agent
172
+ *
173
+ * @example
174
+ * ```typescript
175
+ * const regressions = await evalHealth.getRegressions('agent_123');
176
+ * for (const regression of regressions) {
177
+ * console.log(`${regression.severity}: ${regression.delta}% drop`);
178
+ * }
179
+ * ```
180
+ */
181
+ getRegressions(agentId: string): Promise<EvalRegression[]>;
182
+ /**
183
+ * Record a new regression
184
+ *
185
+ * @example
186
+ * ```typescript
187
+ * const regression = await evalHealth.recordRegression({
188
+ * agentId: 'agent_123',
189
+ * severity: 'moderate',
190
+ * baselinePassRate: '0.92',
191
+ * currentPassRate: '0.78',
192
+ * delta: '-0.14',
193
+ * baselinePeriodStart: '2024-01-01T00:00:00Z',
194
+ * baselinePeriodEnd: '2024-01-15T23:59:59Z',
195
+ * currentPeriodStart: '2024-01-16T00:00:00Z',
196
+ * currentPeriodEnd: '2024-01-31T23:59:59Z',
197
+ * });
198
+ * ```
199
+ */
200
+ recordRegression(options: CreateRegressionOptions): Promise<EvalRegression>;
201
+ /**
202
+ * Resolve a regression
203
+ *
204
+ * @example
205
+ * ```typescript
206
+ * await evalHealth.resolveRegression('regression_123', {
207
+ * resolutionType: 'fixed',
208
+ * notes: 'Updated prompt template to address quality issues',
209
+ * });
210
+ * ```
211
+ */
212
+ resolveRegression(regressionId: string, options: ResolveRegressionOptions): Promise<void>;
213
+ /**
214
+ * Acknowledge a regression
215
+ *
216
+ * @example
217
+ * ```typescript
218
+ * await evalHealth.acknowledgeRegression('regression_123');
219
+ * ```
220
+ */
221
+ acknowledgeRegression(regressionId: string): Promise<void>;
222
+ };
223
+ /**
224
+ * Check if health status indicates an issue
225
+ *
226
+ * @param status - Health status to check
227
+ * @returns Whether the status indicates a problem
228
+ */
229
+ export declare function hasHealthIssue(status: HealthStatus): boolean;
230
+ /**
231
+ * Get severity level as numeric value for sorting
232
+ *
233
+ * @param severity - Regression severity
234
+ * @returns Numeric severity (1-3, higher is worse)
235
+ */
236
+ export declare function getSeverityLevel(severity: RegressionSeverity): number;
237
+ /**
238
+ * Check if evaluation is saturated
239
+ *
240
+ * @param snapshot - Health snapshot to check
241
+ * @returns Whether evaluation is at ceiling or floor
242
+ */
243
+ export declare function isSaturated(snapshot: EvalHealthSnapshot): boolean;
244
+ /**
245
+ * Get recommendation for saturation type
246
+ *
247
+ * @param saturationType - Type of saturation
248
+ * @returns Recommendation string
249
+ */
250
+ export declare function getSaturationRecommendation(saturationType: SaturationType): string;
@@ -0,0 +1,224 @@
1
+ "use strict";
2
+ /**
3
+ * ThinkHive SDK v3.0 - Evaluation Health API
4
+ *
5
+ * API for eval saturation monitoring, regression detection, and health reports
6
+ */
7
+ Object.defineProperty(exports, "__esModule", { value: true });
8
+ exports.evalHealth = void 0;
9
+ exports.hasHealthIssue = hasHealthIssue;
10
+ exports.getSeverityLevel = getSeverityLevel;
11
+ exports.isSaturated = isSaturated;
12
+ exports.getSaturationRecommendation = getSaturationRecommendation;
13
+ const client_1 = require("../core/client");
14
+ // ============================================================================
15
+ // EVAL HEALTH API CLIENT
16
+ // ============================================================================
17
+ /**
18
+ * Evaluation Health API client for monitoring eval quality and detecting regressions
19
+ */
20
+ exports.evalHealth = {
21
+ /**
22
+ * Get comprehensive health report for an agent
23
+ *
24
+ * @example
25
+ * ```typescript
26
+ * const report = await evalHealth.getReport('agent_123');
27
+ * console.log(`Overall health: ${report.overallHealth}`);
28
+ * console.log(`Active regressions: ${report.regressionCount}`);
29
+ * ```
30
+ */
31
+ async getReport(agentId) {
32
+ return (0, client_1.apiRequestWithData)(`/eval-health/report?agentId=${agentId}`, { apiVersion: 'v1' });
33
+ },
34
+ // ---------------------------------------------------------------------------
35
+ // SNAPSHOTS
36
+ // ---------------------------------------------------------------------------
37
+ /**
38
+ * Get historical health snapshots
39
+ *
40
+ * @example
41
+ * ```typescript
42
+ * const snapshots = await evalHealth.getSnapshots({
43
+ * agentId: 'agent_123',
44
+ * startDate: '2024-01-01T00:00:00Z',
45
+ * endDate: '2024-01-31T23:59:59Z',
46
+ * });
47
+ * ```
48
+ */
49
+ async getSnapshots(options) {
50
+ const params = new URLSearchParams();
51
+ params.set('agentId', options.agentId);
52
+ if (options.criterionId)
53
+ params.set('criterionId', options.criterionId);
54
+ if (options.startDate)
55
+ params.set('startDate', options.startDate);
56
+ if (options.endDate)
57
+ params.set('endDate', options.endDate);
58
+ return (0, client_1.apiRequestWithData)(`/eval-health/snapshots?${params.toString()}`, { apiVersion: 'v1' });
59
+ },
60
+ /**
61
+ * Get latest health snapshot
62
+ *
63
+ * @example
64
+ * ```typescript
65
+ * const snapshot = await evalHealth.getLatestSnapshot('agent_123');
66
+ * ```
67
+ */
68
+ async getLatestSnapshot(agentId, criterionId) {
69
+ const params = new URLSearchParams();
70
+ params.set('agentId', agentId);
71
+ if (criterionId)
72
+ params.set('criterionId', criterionId);
73
+ return (0, client_1.apiRequestWithData)(`/eval-health/snapshots/latest?${params.toString()}`, { apiVersion: 'v1' });
74
+ },
75
+ /**
76
+ * Record a health snapshot
77
+ *
78
+ * @example
79
+ * ```typescript
80
+ * const snapshot = await evalHealth.recordSnapshot({
81
+ * agentId: 'agent_123',
82
+ * snapshotDate: new Date().toISOString(),
83
+ * passRate: '0.85',
84
+ * evalCount: 150,
85
+ * healthStatus: 'healthy',
86
+ * });
87
+ * ```
88
+ */
89
+ async recordSnapshot(options) {
90
+ return (0, client_1.apiRequestWithData)('/eval-health/snapshots', {
91
+ method: 'POST',
92
+ body: options,
93
+ apiVersion: 'v1',
94
+ });
95
+ },
96
+ // ---------------------------------------------------------------------------
97
+ // REGRESSIONS
98
+ // ---------------------------------------------------------------------------
99
+ /**
100
+ * Get unresolved regressions for an agent
101
+ *
102
+ * @example
103
+ * ```typescript
104
+ * const regressions = await evalHealth.getRegressions('agent_123');
105
+ * for (const regression of regressions) {
106
+ * console.log(`${regression.severity}: ${regression.delta}% drop`);
107
+ * }
108
+ * ```
109
+ */
110
+ async getRegressions(agentId) {
111
+ return (0, client_1.apiRequestWithData)(`/eval-health/regressions?agentId=${agentId}`, { apiVersion: 'v1' });
112
+ },
113
+ /**
114
+ * Record a new regression
115
+ *
116
+ * @example
117
+ * ```typescript
118
+ * const regression = await evalHealth.recordRegression({
119
+ * agentId: 'agent_123',
120
+ * severity: 'moderate',
121
+ * baselinePassRate: '0.92',
122
+ * currentPassRate: '0.78',
123
+ * delta: '-0.14',
124
+ * baselinePeriodStart: '2024-01-01T00:00:00Z',
125
+ * baselinePeriodEnd: '2024-01-15T23:59:59Z',
126
+ * currentPeriodStart: '2024-01-16T00:00:00Z',
127
+ * currentPeriodEnd: '2024-01-31T23:59:59Z',
128
+ * });
129
+ * ```
130
+ */
131
+ async recordRegression(options) {
132
+ return (0, client_1.apiRequestWithData)('/eval-health/regressions', {
133
+ method: 'POST',
134
+ body: options,
135
+ apiVersion: 'v1',
136
+ });
137
+ },
138
+ /**
139
+ * Resolve a regression
140
+ *
141
+ * @example
142
+ * ```typescript
143
+ * await evalHealth.resolveRegression('regression_123', {
144
+ * resolutionType: 'fixed',
145
+ * notes: 'Updated prompt template to address quality issues',
146
+ * });
147
+ * ```
148
+ */
149
+ async resolveRegression(regressionId, options) {
150
+ await (0, client_1.apiRequest)(`/eval-health/regressions/${regressionId}/resolve`, {
151
+ method: 'POST',
152
+ body: options,
153
+ apiVersion: 'v1',
154
+ });
155
+ },
156
+ /**
157
+ * Acknowledge a regression
158
+ *
159
+ * @example
160
+ * ```typescript
161
+ * await evalHealth.acknowledgeRegression('regression_123');
162
+ * ```
163
+ */
164
+ async acknowledgeRegression(regressionId) {
165
+ await (0, client_1.apiRequest)(`/eval-health/regressions/${regressionId}/acknowledge`, {
166
+ method: 'POST',
167
+ apiVersion: 'v1',
168
+ });
169
+ },
170
+ };
171
+ // ============================================================================
172
+ // HELPER FUNCTIONS
173
+ // ============================================================================
174
+ /**
175
+ * Check if health status indicates an issue
176
+ *
177
+ * @param status - Health status to check
178
+ * @returns Whether the status indicates a problem
179
+ */
180
+ function hasHealthIssue(status) {
181
+ return status === 'warning' || status === 'critical';
182
+ }
183
+ /**
184
+ * Get severity level as numeric value for sorting
185
+ *
186
+ * @param severity - Regression severity
187
+ * @returns Numeric severity (1-3, higher is worse)
188
+ */
189
+ function getSeverityLevel(severity) {
190
+ switch (severity) {
191
+ case 'minor': return 1;
192
+ case 'moderate': return 2;
193
+ case 'severe': return 3;
194
+ default: return 0;
195
+ }
196
+ }
197
+ /**
198
+ * Check if evaluation is saturated
199
+ *
200
+ * @param snapshot - Health snapshot to check
201
+ * @returns Whether evaluation is at ceiling or floor
202
+ */
203
+ function isSaturated(snapshot) {
204
+ return snapshot.saturationType === 'ceiling' || snapshot.saturationType === 'floor';
205
+ }
206
+ /**
207
+ * Get recommendation for saturation type
208
+ *
209
+ * @param saturationType - Type of saturation
210
+ * @returns Recommendation string
211
+ */
212
+ function getSaturationRecommendation(saturationType) {
213
+ switch (saturationType) {
214
+ case 'ceiling':
215
+ return 'Evaluation criteria may be too lenient. Consider adding stricter checks or more challenging test cases.';
216
+ case 'floor':
217
+ return 'Evaluation criteria may be too strict. Consider relaxing thresholds or reviewing criteria for accuracy.';
218
+ case 'healthy':
219
+ return 'Evaluation is operating within healthy parameters.';
220
+ default:
221
+ return 'Unable to determine saturation status.';
222
+ }
223
+ }
224
+ //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"eval-health.js","sourceRoot":"","sources":["../../src/api/eval-health.ts"],"names":[],"mappings":";AAAA;;;;GAIG;;;AA4TH,wCAEC;AAQD,4CAOC;AAQD,kCAEC;AAQD,kEAWC;AAxWD,2CAAgE;AA8HhE,+EAA+E;AAC/E,yBAAyB;AACzB,+EAA+E;AAE/E;;GAEG;AACU,QAAA,UAAU,GAAG;IACxB;;;;;;;;;OASG;IACH,KAAK,CAAC,SAAS,CAAC,OAAe;QAC7B,OAAO,IAAA,2BAAkB,EACvB,+BAA+B,OAAO,EAAE,EACxC,EAAE,UAAU,EAAE,IAAI,EAAE,CACrB,CAAC;IACJ,CAAC;IAED,8EAA8E;IAC9E,YAAY;IACZ,8EAA8E;IAE9E;;;;;;;;;;;OAWG;IACH,KAAK,CAAC,YAAY,CAAC,OAA4B;QAC7C,MAAM,MAAM,GAAG,IAAI,eAAe,EAAE,CAAC;QACrC,MAAM,CAAC,GAAG,CAAC,SAAS,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;QACvC,IAAI,OAAO,CAAC,WAAW;YAAE,MAAM,CAAC,GAAG,CAAC,aAAa,EAAE,OAAO,CAAC,WAAW,CAAC,CAAC;QACxE,IAAI,OAAO,CAAC,SAAS;YAAE,MAAM,CAAC,GAAG,CAAC,WAAW,EAAE,OAAO,CAAC,SAAS,CAAC,CAAC;QAClE,IAAI,OAAO,CAAC,OAAO;YAAE,MAAM,CAAC,GAAG,CAAC,SAAS,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;QAE5D,OAAO,IAAA,2BAAkB,EACvB,0BAA0B,MAAM,CAAC,QAAQ,EAAE,EAAE,EAC7C,EAAE,UAAU,EAAE,IAAI,EAAE,CACrB,CAAC;IACJ,CAAC;IAED;;;;;;;OAOG;IACH,KAAK,CAAC,iBAAiB,CAAC,OAAe,EAAE,WAAoB;QAC3D,MAAM,MAAM,GAAG,IAAI,eAAe,EAAE,CAAC;QACrC,MAAM,CAAC,GAAG,CAAC,SAAS,EAAE,OAAO,CAAC,CAAC;QAC/B,IAAI,WAAW;YAAE,MAAM,CAAC,GAAG,CAAC,aAAa,EAAE,WAAW,CAAC,CAAC;QAExD,OAAO,IAAA,2BAAkB,EACvB,iCAAiC,MAAM,CAAC,QAAQ,EAAE,EAAE,EACpD,EAAE,UAAU,EAAE,IAAI,EAAE,CACrB,CAAC;IACJ,CAAC;IAED;;;;;;;;;;;;;OAaG;IACH,KAAK,CAAC,cAAc,CAAC,OAA8B;QACjD,OAAO,IAAA,2BAAkB,EAAqB,wBAAwB,EAAE;YACtE,MAAM,EAAE,MAAM;YACd,IAAI,EAAE,OAAO;YACb,UAAU,EAAE,IAAI;SACjB,CAAC,CAAC;IACL,CAAC;IAED,8EAA8E;IAC9E,cAAc;IACd,8EAA8E;IAE9E;;;;;;;;;;OAUG;IACH,KAAK,CAAC,cAAc,CAAC,OAAe;QAClC,OAAO,IAAA,2BAAkB,EACvB,oCAAoC,OAAO,EAAE,EAC7C,EAAE,UAAU,EAAE,IAAI,EAAE,CACrB,CAAC;IACJ,CAAC;IAED;;;;;;;;;;;;;;;;;OAiBG;IACH,KAAK,CAAC,gBAAgB,CAAC,OAAgC;QACrD,OAAO,IAAA,2BAAkB,EAAiB,0BAA0B,EAAE;YACpE,MAAM,EAAE,MAAM;YACd,IAAI,EAAE,OAAO;YACb,UAAU,EAAE,IAAI;SACjB,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;;;OAUG;IACH,KAAK,CAAC,iBAAiB,CAAC,YAAoB,EAAE,OAAiC;QAC7E,MAAM,IAAA,mBAAU,EAAC,4BAA4B,YAAY,UAAU,EAAE;YACnE,MAAM,EAAE,MAAM;YACd,IAAI,EAAE,OAAO;YACb,UAAU,EAAE,IAAI;SACjB,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;OAOG;IACH,KAAK,CAAC,qBAAqB,CAAC,YAAoB;QAC9C,MAAM,IAAA,mBAAU,EAAC,4BAA4B,YAAY,cAAc,EAAE;YACvE,MAAM,EAAE,MAAM;YACd,UAAU,EAAE,IAAI;SACjB,CAAC,CAAC;IACL,CAAC;CACF,CAAC;AAEF,+EAA+E;AAC/E,mBAAmB;AACnB,+EAA+E;AAE/E;;;;;GAKG;AACH,SAAgB,cAAc,CAAC,MAAoB;IACjD,OAAO,MAAM,KAAK,SAAS,IAAI,MAAM,KAAK,UAAU,CAAC;AACvD,CAAC;AAED;;;;;GAKG;AACH,SAAgB,gBAAgB,CAAC,QAA4B;IAC3D,QAAQ,QAAQ,EAAE,CAAC;QACjB,KAAK,OAAO,CAAC,CAAC,OAAO,CAAC,CAAC;QACvB,KAAK,UAAU,CAAC,CAAC,OAAO,CAAC,CAAC;QAC1B,KAAK,QAAQ,CAAC,CAAC,OAAO,CAAC,CAAC;QACxB,OAAO,CAAC,CAAC,OAAO,CAAC,CAAC;IACpB,CAAC;AACH,CAAC;AAED;;;;;GAKG;AACH,SAAgB,WAAW,CAAC,QAA4B;IACtD,OAAO,QAAQ,CAAC,cAAc,KAAK,SAAS,IAAI,QAAQ,CAAC,cAAc,KAAK,OAAO,CAAC;AACtF,CAAC;AAED;;;;;GAKG;AACH,SAAgB,2BAA2B,CAAC,cAA8B;IACxE,QAAQ,cAAc,EAAE,CAAC;QACvB,KAAK,SAAS;YACZ,OAAO,yGAAyG,CAAC;QACnH,KAAK,OAAO;YACV,OAAO,yGAAyG,CAAC;QACnH,KAAK,SAAS;YACZ,OAAO,oDAAoD,CAAC;QAC9D;YACE,OAAO,wCAAwC,CAAC;IACpD,CAAC;AACH,CAAC","sourcesContent":["/**\n * ThinkHive SDK v3.0 - Evaluation Health API\n *\n * API for eval saturation monitoring, regression detection, and health reports\n */\n\nimport { apiRequest, apiRequestWithData } from '../core/client';\n\n// ============================================================================\n// TYPES\n// ============================================================================\n\nexport type SaturationType = 'ceiling' | 'floor' | 'healthy';\nexport type HealthStatus = 'healthy' | 'warning' | 'critical';\nexport type RegressionSeverity = 'minor' | 'moderate' | 'severe';\n\nexport interface EvalHealthSnapshot {\n  id: string;\n  companyId: string;\n  agentId: string;\n  criterionId?: string;\n  snapshotDate: string;\n  passRate?: string;\n  evalCount?: number;\n  meanScore?: string;\n  saturationType?: SaturationType;\n  daysAtSaturation?: number;\n  trendDirection?: string;\n  trendStrength?: string;\n  healthStatus?: HealthStatus;\n  healthScore?: string;\n  createdAt: string;\n}\n\nexport interface EvalRegression {\n  id: string;\n  companyId: string;\n  agentId: string;\n  criterionId?: string;\n  severity: RegressionSeverity;\n  baselinePassRate: string;\n  currentPassRate: string;\n  delta: string;\n  deltaPercent?: string;\n  baselinePeriodStart: string;\n  baselinePeriodEnd: string;\n  currentPeriodStart: string;\n  currentPeriodEnd: string;\n  baselineEvalCount?: number;\n  currentEvalCount?: number;\n  suspectedCauses?: unknown[];\n  isSignificant?: boolean;\n  isResolved: boolean;\n  isAcknowledged: boolean;\n  resolvedAt?: string;\n  resolvedBy?: string;\n  resolutionType?: string;\n  resolutionNotes?: string;\n  acknowledgedAt?: string;\n  acknowledgedBy?: string;\n  detectedAt: string;\n  createdAt: string;\n}\n\nexport interface HealthReport {\n  agentId: string;\n  generatedAt: string;\n  overallHealth: HealthStatus;\n  overallScore: number;\n  passRate: number;\n  evalCount: number;\n  saturationStatus: {\n    type: SaturationType;\n    daysAtSaturation: number;\n    recommendation: string;\n  };\n  regressionCount: number;\n  activeRegressions: EvalRegression[];\n  trend: {\n    direction: 'improving' | 'stable' | 'declining';\n    strength: number;\n    description: string;\n  };\n  recommendations: string[];\n}\n\nexport interface CreateSnapshotOptions {\n  agentId: string;\n  criterionId?: string;\n  snapshotDate: string;\n  passRate?: string;\n  evalCount?: number;\n  meanScore?: string;\n  saturationType?: SaturationType;\n  daysAtSaturation?: number;\n  trendDirection?: string;\n  trendStrength?: string;\n  healthStatus?: HealthStatus;\n  healthScore?: string;\n}\n\nexport interface CreateRegressionOptions {\n  agentId: string;\n  criterionId?: string;\n  severity: RegressionSeverity;\n  baselinePassRate: string;\n  currentPassRate: string;\n  delta: string;\n  deltaPercent?: string;\n  baselinePeriodStart: string;\n  baselinePeriodEnd: string;\n  currentPeriodStart: string;\n  currentPeriodEnd: string;\n  baselineEvalCount?: number;\n  currentEvalCount?: number;\n  suspectedCauses?: unknown[];\n  isSignificant?: boolean;\n  detectedAt?: string;\n}\n\nexport interface ResolveRegressionOptions {\n  resolutionType: string;\n  notes?: string;\n}\n\nexport interface GetSnapshotsOptions {\n  agentId: string;\n  criterionId?: string;\n  startDate?: string;\n  endDate?: string;\n}\n\n// ============================================================================\n// EVAL HEALTH API CLIENT\n// ============================================================================\n\n/**\n * Evaluation Health API client for monitoring eval quality and detecting regressions\n */\nexport const evalHealth = {\n  /**\n   * Get comprehensive health report for an agent\n   *\n   * @example\n   * ```typescript\n   * const report = await evalHealth.getReport('agent_123');\n   * console.log(`Overall health: ${report.overallHealth}`);\n   * console.log(`Active regressions: ${report.regressionCount}`);\n   * ```\n   */\n  async getReport(agentId: string): Promise<HealthReport> {\n    return apiRequestWithData<HealthReport>(\n      `/eval-health/report?agentId=${agentId}`,\n      { apiVersion: 'v1' }\n    );\n  },\n\n  // ---------------------------------------------------------------------------\n  // SNAPSHOTS\n  // ---------------------------------------------------------------------------\n\n  /**\n   * Get historical health snapshots\n   *\n   * @example\n   * ```typescript\n   * const snapshots = await evalHealth.getSnapshots({\n   *   agentId: 'agent_123',\n   *   startDate: '2024-01-01T00:00:00Z',\n   *   endDate: '2024-01-31T23:59:59Z',\n   * });\n   * ```\n   */\n  async getSnapshots(options: GetSnapshotsOptions): Promise<EvalHealthSnapshot[]> {\n    const params = new URLSearchParams();\n    params.set('agentId', options.agentId);\n    if (options.criterionId) params.set('criterionId', options.criterionId);\n    if (options.startDate) params.set('startDate', options.startDate);\n    if (options.endDate) params.set('endDate', options.endDate);\n\n    return apiRequestWithData<EvalHealthSnapshot[]>(\n      `/eval-health/snapshots?${params.toString()}`,\n      { apiVersion: 'v1' }\n    );\n  },\n\n  /**\n   * Get latest health snapshot\n   *\n   * @example\n   * ```typescript\n   * const snapshot = await evalHealth.getLatestSnapshot('agent_123');\n   * ```\n   */\n  async getLatestSnapshot(agentId: string, criterionId?: string): Promise<EvalHealthSnapshot | null> {\n    const params = new URLSearchParams();\n    params.set('agentId', agentId);\n    if (criterionId) params.set('criterionId', criterionId);\n\n    return apiRequestWithData<EvalHealthSnapshot | null>(\n      `/eval-health/snapshots/latest?${params.toString()}`,\n      { apiVersion: 'v1' }\n    );\n  },\n\n  /**\n   * Record a health snapshot\n   *\n   * @example\n   * ```typescript\n   * const snapshot = await evalHealth.recordSnapshot({\n   *   agentId: 'agent_123',\n   *   snapshotDate: new Date().toISOString(),\n   *   passRate: '0.85',\n   *   evalCount: 150,\n   *   healthStatus: 'healthy',\n   * });\n   * ```\n   */\n  async recordSnapshot(options: CreateSnapshotOptions): Promise<EvalHealthSnapshot> {\n    return apiRequestWithData<EvalHealthSnapshot>('/eval-health/snapshots', {\n      method: 'POST',\n      body: options,\n      apiVersion: 'v1',\n    });\n  },\n\n  // ---------------------------------------------------------------------------\n  // REGRESSIONS\n  // ---------------------------------------------------------------------------\n\n  /**\n   * Get unresolved regressions for an agent\n   *\n   * @example\n   * ```typescript\n   * const regressions = await evalHealth.getRegressions('agent_123');\n   * for (const regression of regressions) {\n   *   console.log(`${regression.severity}: ${regression.delta}% drop`);\n   * }\n   * ```\n   */\n  async getRegressions(agentId: string): Promise<EvalRegression[]> {\n    return apiRequestWithData<EvalRegression[]>(\n      `/eval-health/regressions?agentId=${agentId}`,\n      { apiVersion: 'v1' }\n    );\n  },\n\n  /**\n   * Record a new regression\n   *\n   * @example\n   * ```typescript\n   * const regression = await evalHealth.recordRegression({\n   *   agentId: 'agent_123',\n   *   severity: 'moderate',\n   *   baselinePassRate: '0.92',\n   *   currentPassRate: '0.78',\n   *   delta: '-0.14',\n   *   baselinePeriodStart: '2024-01-01T00:00:00Z',\n   *   baselinePeriodEnd: '2024-01-15T23:59:59Z',\n   *   currentPeriodStart: '2024-01-16T00:00:00Z',\n   *   currentPeriodEnd: '2024-01-31T23:59:59Z',\n   * });\n   * ```\n   */\n  async recordRegression(options: CreateRegressionOptions): Promise<EvalRegression> {\n    return apiRequestWithData<EvalRegression>('/eval-health/regressions', {\n      method: 'POST',\n      body: options,\n      apiVersion: 'v1',\n    });\n  },\n\n  /**\n   * Resolve a regression\n   *\n   * @example\n   * ```typescript\n   * await evalHealth.resolveRegression('regression_123', {\n   *   resolutionType: 'fixed',\n   *   notes: 'Updated prompt template to address quality issues',\n   * });\n   * ```\n   */\n  async resolveRegression(regressionId: string, options: ResolveRegressionOptions): Promise<void> {\n    await apiRequest(`/eval-health/regressions/${regressionId}/resolve`, {\n      method: 'POST',\n      body: options,\n      apiVersion: 'v1',\n    });\n  },\n\n  /**\n   * Acknowledge a regression\n   *\n   * @example\n   * ```typescript\n   * await evalHealth.acknowledgeRegression('regression_123');\n   * ```\n   */\n  async acknowledgeRegression(regressionId: string): Promise<void> {\n    await apiRequest(`/eval-health/regressions/${regressionId}/acknowledge`, {\n      method: 'POST',\n      apiVersion: 'v1',\n    });\n  },\n};\n\n// ============================================================================\n// HELPER FUNCTIONS\n// ============================================================================\n\n/**\n * Check if health status indicates an issue\n *\n * @param status - Health status to check\n * @returns Whether the status indicates a problem\n */\nexport function hasHealthIssue(status: HealthStatus): boolean {\n  return status === 'warning' || status === 'critical';\n}\n\n/**\n * Get severity level as numeric value for sorting\n *\n * @param severity - Regression severity\n * @returns Numeric severity (1-3, higher is worse)\n */\nexport function getSeverityLevel(severity: RegressionSeverity): number {\n  switch (severity) {\n    case 'minor': return 1;\n    case 'moderate': return 2;\n    case 'severe': return 3;\n    default: return 0;\n  }\n}\n\n/**\n * Check if evaluation is saturated\n *\n * @param snapshot - Health snapshot to check\n * @returns Whether evaluation is at ceiling or floor\n */\nexport function isSaturated(snapshot: EvalHealthSnapshot): boolean {\n  return snapshot.saturationType === 'ceiling' || snapshot.saturationType === 'floor';\n}\n\n/**\n * Get recommendation for saturation type\n *\n * @param saturationType - Type of saturation\n * @returns Recommendation string\n */\nexport function getSaturationRecommendation(saturationType: SaturationType): string {\n  switch (saturationType) {\n    case 'ceiling':\n      return 'Evaluation criteria may be too lenient. Consider adding stricter checks or more challenging test cases.';\n    case 'floor':\n      return 'Evaluation criteria may be too strict. Consider relaxing thresholds or reviewing criteria for accuracy.';\n    case 'healthy':\n      return 'Evaluation is operating within healthy parameters.';\n    default:\n      return 'Unable to determine saturation status.';\n  }\n}\n"]}