vibeostheog 0.22.16 → 0.22.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,440 +0,0 @@
1
- {
2
- "meta": {
3
- "generated_at": "2026-05-22T07:46:33.046Z",
4
- "version": "2.0",
5
- "schema": "vibeos-mode-calibration-v2"
6
- },
7
- "active_models": {
8
- "brain": "deepseek/deepseek-v4-pro",
9
- "medium": "deepseek/deepseek-v4-flash",
10
- "cheap": "deepseek/deepseek-chat"
11
- },
12
- "tier_collisions": [],
13
- "pricing_estimates": {
14
- "deepseek-v4-pro": {
15
- "prompt": 1.25,
16
- "completion": 8
17
- },
18
- "deepseek-v4-flash": {
19
- "prompt": 0.25,
20
- "completion": 1
21
- },
22
- "deepseek-chat": {
23
- "prompt": 0.14,
24
- "completion": 0.56
25
- },
26
- "deepseek-reasoner": {
27
- "prompt": 0.55,
28
- "completion": 2.19
29
- },
30
- "gpt-4o": {
31
- "prompt": 2.5,
32
- "completion": 10
33
- },
34
- "gpt-4o-mini": {
35
- "prompt": 0.15,
36
- "completion": 0.6
37
- },
38
- "claude-sonnet-4": {
39
- "prompt": 3,
40
- "completion": 15
41
- },
42
- "default": {
43
- "prompt": 1,
44
- "completion": 4
45
- }
46
- },
47
- "mode_configs": {
48
- "balanced": {
49
- "tier": "auto",
50
- "thinking": "auto",
51
- "enforcement": "normal",
52
- "flow": "normal",
53
- "tdd": "normal",
54
- "stress": 1,
55
- "loop_threshold": 0.6,
56
- "api_enrichment": true,
57
- "outcome_detection": true,
58
- "_empirical": {
59
- "brain": {
60
- "avg_latency_ms": 329,
61
- "avg_tps": 7564,
62
- "total_tok_out": 36892,
63
- "total_cost": 0.295821,
64
- "runs": 15
65
- },
66
- "medium": {
67
- "avg_latency_ms": 308,
68
- "avg_tps": 6686,
69
- "total_tok_out": 29542,
70
- "total_cost": 0.029679,
71
- "runs": 15
72
- },
73
- "cheap": {
74
- "avg_latency_ms": 391,
75
- "avg_tps": 5344,
76
- "total_tok_out": 13215,
77
- "total_cost": 0.007441560000000001,
78
- "runs": 8
79
- }
80
- }
81
- },
82
- "budget": {
83
- "tier": "cheap",
84
- "thinking": "off",
85
- "enforcement": "relaxed",
86
- "flow": "audit",
87
- "tdd": "lazy",
88
- "stress": 1,
89
- "loop_threshold": 0.6,
90
- "api_enrichment": false,
91
- "outcome_detection": false,
92
- "_empirical": {
93
- "avg_latency_ms": 391,
94
- "avg_tps": 5344,
95
- "total_tok_out": 13215,
96
- "total_cost": 0.007441560000000001,
97
- "runs": 8
98
- }
99
- },
100
- "quality": {
101
- "tier": "brain",
102
- "thinking": "full",
103
- "enforcement": "strict",
104
- "flow": "normal",
105
- "tdd": "strict",
106
- "stress": 1,
107
- "loop_threshold": 0.4,
108
- "api_enrichment": true,
109
- "outcome_detection": true,
110
- "_empirical": {
111
- "avg_latency_ms": 329,
112
- "avg_tps": 7564,
113
- "total_tok_out": 36892,
114
- "total_cost": 0.295821,
115
- "runs": 15
116
- }
117
- },
118
- "speed": {
119
- "tier": "medium",
120
- "thinking": "off",
121
- "enforcement": "relaxed",
122
- "flow": "audit",
123
- "tdd": "lazy",
124
- "stress": 1,
125
- "loop_threshold": 0.7,
126
- "api_enrichment": false,
127
- "outcome_detection": false,
128
- "_empirical": {
129
- "avg_latency_ms": 308,
130
- "avg_tps": 6686,
131
- "total_tok_out": 29542,
132
- "total_cost": 0.029679,
133
- "runs": 15
134
- }
135
- },
136
- "longrun": {
137
- "tier": "brain",
138
- "thinking": "brief",
139
- "enforcement": "normal",
140
- "flow": "normal",
141
- "tdd": "normal",
142
- "stress": 1,
143
- "loop_threshold": 0.5,
144
- "api_enrichment": true,
145
- "outcome_detection": true,
146
- "_empirical": {
147
- "avg_latency_ms": 329,
148
- "avg_tps": 7564,
149
- "total_tok_out": 36892,
150
- "total_cost": 0.295821,
151
- "runs": 15
152
- }
153
- },
154
- "forensic": {
155
- "tier": "brain",
156
- "thinking": "full",
157
- "enforcement": "strict",
158
- "flow": "strict",
159
- "tdd": "strict",
160
- "stress": 1.5,
161
- "loop_threshold": 0.3,
162
- "api_enrichment": true,
163
- "outcome_detection": true,
164
- "_empirical": {
165
- "avg_latency_ms": 329,
166
- "avg_tps": 7564,
167
- "total_tok_out": 36892,
168
- "total_cost": 0.295821,
169
- "runs": 15,
170
- "context7_urgency": "high",
171
- "wbp_verbosity": "verbose",
172
- "use_cases": [
173
- "debugging",
174
- "root cause analysis",
175
- "security audit",
176
- "bug investigation"
177
- ],
178
- "loop_protection": "aggressive"
179
- }
180
- },
181
- "web-research": {
182
- "tier": "medium",
183
- "thinking": "full",
184
- "enforcement": "audit",
185
- "flow": "audit",
186
- "tdd": "lazy",
187
- "stress": 1,
188
- "loop_threshold": 0.7,
189
- "api_enrichment": true,
190
- "outcome_detection": true,
191
- "_empirical": {
192
- "avg_latency_ms": 308,
193
- "avg_tps": 6686,
194
- "total_tok_out": 29542,
195
- "total_cost": 0.029679,
196
- "runs": 15,
197
- "context7_urgency": "required",
198
- "wbp_verbosity": "concise",
199
- "use_cases": [
200
- "web research",
201
- "exploration",
202
- "competitive analysis",
203
- "documentation lookup"
204
- ],
205
- "loop_protection": "lenient"
206
- }
207
- }
208
- },
209
- "mode_breakdown": {
210
- "balanced": {
211
- "sessions": 5,
212
- "cost": 0,
213
- "deleg_savings": 0.11000000000000001,
214
- "cache_savings": 0,
215
- "warns": 12,
216
- "tool_calls": 0,
217
- "stress_sum": 0.68,
218
- "stress_count": 5,
219
- "scratchpad_hits": 0,
220
- "total_session_ms": 0,
221
- "context7_bypass": 0,
222
- "ledger_entries": 0,
223
- "task_calls": 0,
224
- "task_success": 0,
225
- "regime_changes": 0,
226
- "cost_per_turn": 0,
227
- "savings_ratio": 0,
228
- "warn_per_session": 2.4,
229
- "stress_avg": 0.14,
230
- "cache_hit_rate": 0,
231
- "cost_per_success": 0,
232
- "thinking_roi": 0,
233
- "speed_to_cost": 0,
234
- "avg_cost_per_session": 0,
235
- "est_prompt_tokens": 0,
236
- "est_completion_tokens": 0,
237
- "est_total_tokens": 0,
238
- "est_tok_per_session": 0
239
- },
240
- "budget": {
241
- "sessions": 0,
242
- "cost": 0,
243
- "deleg_savings": 0,
244
- "cache_savings": 0,
245
- "warns": 0,
246
- "tool_calls": 0,
247
- "stress_sum": 0,
248
- "stress_count": 0,
249
- "scratchpad_hits": 0,
250
- "total_session_ms": 0,
251
- "context7_bypass": 0,
252
- "ledger_entries": 0,
253
- "task_calls": 0,
254
- "task_success": 0,
255
- "regime_changes": 0,
256
- "cost_per_turn": 0,
257
- "savings_ratio": 0,
258
- "warn_per_session": 0,
259
- "stress_avg": 0,
260
- "cache_hit_rate": 0,
261
- "cost_per_success": 0,
262
- "thinking_roi": 0,
263
- "speed_to_cost": 0,
264
- "avg_cost_per_session": 0,
265
- "est_prompt_tokens": 0,
266
- "est_completion_tokens": 0,
267
- "est_total_tokens": 0,
268
- "est_tok_per_session": 0
269
- },
270
- "quality": {
271
- "sessions": 0,
272
- "cost": 0,
273
- "deleg_savings": 0,
274
- "cache_savings": 0,
275
- "warns": 0,
276
- "tool_calls": 0,
277
- "stress_sum": 0,
278
- "stress_count": 0,
279
- "scratchpad_hits": 0,
280
- "total_session_ms": 0,
281
- "context7_bypass": 0,
282
- "ledger_entries": 0,
283
- "task_calls": 0,
284
- "task_success": 0,
285
- "regime_changes": 0,
286
- "cost_per_turn": 0,
287
- "savings_ratio": 0,
288
- "warn_per_session": 0,
289
- "stress_avg": 0,
290
- "cache_hit_rate": 0,
291
- "cost_per_success": 0,
292
- "thinking_roi": 0,
293
- "speed_to_cost": 0,
294
- "avg_cost_per_session": 0,
295
- "est_prompt_tokens": 0,
296
- "est_completion_tokens": 0,
297
- "est_total_tokens": 0,
298
- "est_tok_per_session": 0
299
- },
300
- "speed": {
301
- "sessions": 0,
302
- "cost": 0,
303
- "deleg_savings": 0,
304
- "cache_savings": 0,
305
- "warns": 0,
306
- "tool_calls": 0,
307
- "stress_sum": 0,
308
- "stress_count": 0,
309
- "scratchpad_hits": 0,
310
- "total_session_ms": 0,
311
- "context7_bypass": 0,
312
- "ledger_entries": 0,
313
- "task_calls": 0,
314
- "task_success": 0,
315
- "regime_changes": 0,
316
- "cost_per_turn": 0,
317
- "savings_ratio": 0,
318
- "warn_per_session": 0,
319
- "stress_avg": 0,
320
- "cache_hit_rate": 0,
321
- "cost_per_success": 0,
322
- "thinking_roi": 0,
323
- "speed_to_cost": 0,
324
- "avg_cost_per_session": 0,
325
- "est_prompt_tokens": 0,
326
- "est_completion_tokens": 0,
327
- "est_total_tokens": 0,
328
- "est_tok_per_session": 0
329
- },
330
- "longrun": {
331
- "sessions": 0,
332
- "cost": 0,
333
- "deleg_savings": 0,
334
- "cache_savings": 0,
335
- "warns": 0,
336
- "tool_calls": 0,
337
- "stress_sum": 0,
338
- "stress_count": 0,
339
- "scratchpad_hits": 0,
340
- "total_session_ms": 0,
341
- "context7_bypass": 0,
342
- "ledger_entries": 0,
343
- "task_calls": 0,
344
- "task_success": 0,
345
- "regime_changes": 0,
346
- "cost_per_turn": 0,
347
- "savings_ratio": 0,
348
- "warn_per_session": 0,
349
- "stress_avg": 0,
350
- "cache_hit_rate": 0,
351
- "cost_per_success": 0,
352
- "thinking_roi": 0,
353
- "speed_to_cost": 0,
354
- "avg_cost_per_session": 0,
355
- "est_prompt_tokens": 0,
356
- "est_completion_tokens": 0,
357
- "est_total_tokens": 0,
358
- "est_tok_per_session": 0
359
- }
360
- },
361
- "regime_distribution": {
362
- "UNKNOWN": 20
363
- },
364
- "regime_mode_map": {
365
- "UNKNOWN": {
366
- "balanced": 20
367
- }
368
- },
369
- "learning_stats": {
370
- "exploratory_words": 24,
371
- "task_first_words": 122,
372
- "ml_graph": "present",
373
- "ml_cache": "present",
374
- "cross_project_patterns": 58
375
- },
376
- "calibration_flags": [],
377
- "expected_rankings": {
378
- "cost_ranking": [
379
- "balanced"
380
- ],
381
- "cost_valid": false,
382
- "savings_ranking": [
383
- "balanced"
384
- ],
385
- "warning_ranking": [
386
- "balanced"
387
- ]
388
- },
389
- "lifetime": {
390
- "total_savings_usd": 0.366,
391
- "cache_savings_usd": 0,
392
- "missed_context7_usd": 0,
393
- "scratchpad_hits": 0,
394
- "warn_count": 22,
395
- "session_count": 5,
396
- "cost_sum": 0
397
- },
398
- "checklist": {
399
- "speed_is_fastest_unverified": false,
400
- "budget_is_cheapest_unverified": true,
401
- "quality_best_output_unverified": true,
402
- "longrun_appropriate_unverified": true,
403
- "auto_mode_sensible_unverified": true,
404
- "ttft_needs_live_bench": false,
405
- "token_throughput_needs_live_bench": true,
406
- "first_attempt_success_needs_live_bench": true,
407
- "rework_cycles_needs_live_bench": true,
408
- "compile_pass_rate_needs_live_bench": true,
409
- "user_override_rate_needs_live_bench": true,
410
- "balanced_empirically_verified": true,
411
- "speed_latency_measured": "308ms avg",
412
- "brain_latency_measured": "329ms avg",
413
- "cheap_latency_measured": "391ms avg",
414
- "tier_parity_confirmed": "brain ~= medium (within 8%)",
415
- "forensic_mode_added": true,
416
- "web_research_mode_added": true,
417
- "calibration_date": "2026-05-23T07:07:08.679Z"
418
- },
419
- "verification": {
420
- "tier_benchmark_completed": true,
421
- "total_api_runs": 38,
422
- "total_cost": 0.3329415600000001,
423
- "human_flow_simulations": [
424
- "delete-record-saving@72s",
425
- "rename-sync-control@30s",
426
- "fix-savings-field@95s"
427
- ],
428
- "modes_implemented": [
429
- "balanced",
430
- "budget",
431
- "quality",
432
- "speed",
433
- "longrun",
434
- "forensic",
435
- "web-research"
436
- ],
437
- "auto_select_mode_fixed": true,
438
- "compute_control_vector_active": true
439
- }
440
- }
@@ -1,89 +0,0 @@
1
- {
2
- "meta": {
3
- "generated_at": "2026-05-23T06:59:30.473Z",
4
- "type": "mode-signal-analysis",
5
- "version": "1.0"
6
- },
7
- "mode_projections": [
8
- {
9
- "mode": "balanced",
10
- "tier": "brain",
11
- "thinking": "off",
12
- "avg_lat_ms": 309,
13
- "avg_tps": 8898,
14
- "cost_per_run": 0.020487833333333334,
15
- "tok_eff": 0.008016629711751664
16
- },
17
- {
18
- "mode": "budget",
19
- "tier": "cheap",
20
- "thinking": "off",
21
- "avg_lat_ms": 330,
22
- "avg_tps": 1109,
23
- "cost_per_run": 0.00022820000000000002,
24
- "tok_eff": 0.000569077306733167
25
- },
26
- {
27
- "mode": "quality",
28
- "tier": "brain",
29
- "thinking": "full",
30
- "avg_lat_ms": 355,
31
- "avg_tps": 7817,
32
- "cost_per_run": 0.019018499999999997,
33
- "tok_eff": 0.008017917369308599
34
- },
35
- {
36
- "mode": "speed",
37
- "tier": "medium",
38
- "thinking": "off",
39
- "avg_lat_ms": 283,
40
- "avg_tps": 5442,
41
- "cost_per_run": 0.0015545000000000001,
42
- "tok_eff": 0.001005498059508409
43
- },
44
- {
45
- "mode": "longrun",
46
- "tier": "brain",
47
- "thinking": "brief",
48
- "avg_lat_ms": 332,
49
- "avg_tps": 6040,
50
- "cost_per_run": 0.017647833333333335,
51
- "tok_eff": 0.008019312329597092
52
- }
53
- ],
54
- "gaps_found": [
55
- {
56
- "id": "TURBO",
57
- "priority": "low",
58
- "description": "Cheap + off thinking, already covered by budget"
59
- },
60
- {
61
- "id": "FORENSIC",
62
- "priority": "high",
63
- "description": "Brain + full thinking + strict flow — no existing mode covers debugging"
64
- },
65
- {
66
- "id": "WEB_RESEARCH",
67
- "priority": "high",
68
- "description": "Medium + full thinking + context7 — fills exploration gap"
69
- },
70
- {
71
- "id": "CODE_REVIEW",
72
- "priority": "medium",
73
- "description": "Brain + full thinking + strict TDD — partially covered by quality"
74
- }
75
- ],
76
- "key_insights": [
77
- "Brain and medium have nearly identical latency (~320ms avg) — medium is not meaningfully faster",
78
- "Medium is 8x cheaper than brain for equivalent throughput",
79
- "First cheap request is 2.6x slower than subsequent (cold start: 981ms vs ~370ms)",
80
- "All modes except 'balanced' have 0 real sessions in calibration data",
81
- "Calibration checklist marks all mode hypotheses as 'unverified'"
82
- ],
83
- "recommendations": [
84
- "Add FORENSIC mode for debugging/sleuthing workflows",
85
- "Add WEB_RESEARCH mode for exploration tasks",
86
- "Recalibrate auto mode selection since brain=medium in latency",
87
- "Run forced mode sessions to populate calibration data for non-balanced modes"
88
- ]
89
- }