rafcode 2.2.0 → 2.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/RAF/ahtahs-token-reaper/decisions.md +37 -0
- package/RAF/ahtahs-token-reaper/input.md +20 -0
- package/RAF/ahtahs-token-reaper/outcomes/01-extend-token-tracker-data-model.md +42 -0
- package/RAF/ahtahs-token-reaper/outcomes/02-accumulate-usage-in-retry-loop.md +31 -0
- package/RAF/ahtahs-token-reaper/outcomes/03-per-attempt-display-formatting.md +60 -0
- package/RAF/ahtahs-token-reaper/outcomes/04-add-model-name-to-claude-call-logs.md +57 -0
- package/RAF/ahtahs-token-reaper/outcomes/05-handle-invalid-config-in-raf-config.md +46 -0
- package/RAF/ahtahs-token-reaper/outcomes/06-fix-verbose-toggle-timer-display.md +38 -0
- package/RAF/ahtahs-token-reaper/plans/01-extend-token-tracker-data-model.md +36 -0
- package/RAF/ahtahs-token-reaper/plans/02-accumulate-usage-in-retry-loop.md +36 -0
- package/RAF/ahtahs-token-reaper/plans/03-per-attempt-display-formatting.md +43 -0
- package/RAF/ahtahs-token-reaper/plans/04-add-model-name-to-claude-call-logs.md +38 -0
- package/RAF/ahtahs-token-reaper/plans/05-handle-invalid-config-in-raf-config.md +36 -0
- package/RAF/ahtahs-token-reaper/plans/06-fix-verbose-toggle-timer-display.md +40 -0
- package/dist/commands/config.d.ts.map +1 -1
- package/dist/commands/config.js +27 -5
- package/dist/commands/config.js.map +1 -1
- package/dist/commands/do.js +17 -10
- package/dist/commands/do.js.map +1 -1
- package/dist/commands/plan.js +3 -2
- package/dist/commands/plan.js.map +1 -1
- package/dist/core/pull-request.d.ts.map +1 -1
- package/dist/core/pull-request.js +3 -1
- package/dist/core/pull-request.js.map +1 -1
- package/dist/utils/config.d.ts +6 -0
- package/dist/utils/config.d.ts.map +1 -1
- package/dist/utils/config.js +21 -0
- package/dist/utils/config.js.map +1 -1
- package/dist/utils/terminal-symbols.d.ts +8 -4
- package/dist/utils/terminal-symbols.d.ts.map +1 -1
- package/dist/utils/terminal-symbols.js +31 -6
- package/dist/utils/terminal-symbols.js.map +1 -1
- package/dist/utils/token-tracker.d.ts +11 -1
- package/dist/utils/token-tracker.d.ts.map +1 -1
- package/dist/utils/token-tracker.js +37 -2
- package/dist/utils/token-tracker.js.map +1 -1
- package/package.json +1 -1
- package/src/commands/config.ts +30 -4
- package/src/commands/do.ts +17 -10
- package/src/commands/plan.ts +3 -2
- package/src/core/pull-request.ts +3 -1
- package/src/utils/config.ts +22 -0
- package/src/utils/terminal-symbols.ts +42 -7
- package/src/utils/token-tracker.ts +44 -2
- package/tests/unit/config-command.test.ts +80 -1
- package/tests/unit/config.test.ts +24 -0
- package/tests/unit/terminal-symbols.test.ts +121 -33
- package/tests/unit/timer-verbose-integration.test.ts +170 -0
- package/tests/unit/token-tracker.test.ts +350 -17
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { TokenTracker, CostBreakdown } from '../../src/utils/token-tracker.js';
|
|
1
|
+
import { TokenTracker, CostBreakdown, accumulateUsage } from '../../src/utils/token-tracker.js';
|
|
2
2
|
import { UsageData, PricingConfig, DEFAULT_CONFIG } from '../../src/types/config.js';
|
|
3
3
|
|
|
4
4
|
function makeUsage(overrides: Partial<UsageData> = {}): UsageData {
|
|
@@ -178,7 +178,7 @@ describe('TokenTracker', () => {
|
|
|
178
178
|
it('should accumulate usage across multiple tasks', () => {
|
|
179
179
|
const tracker = new TokenTracker(testPricing);
|
|
180
180
|
|
|
181
|
-
tracker.addTask('01', makeUsage({
|
|
181
|
+
tracker.addTask('01', [makeUsage({
|
|
182
182
|
inputTokens: 500_000,
|
|
183
183
|
outputTokens: 200_000,
|
|
184
184
|
modelUsage: {
|
|
@@ -189,9 +189,9 @@ describe('TokenTracker', () => {
|
|
|
189
189
|
cacheCreationInputTokens: 0,
|
|
190
190
|
},
|
|
191
191
|
},
|
|
192
|
-
}));
|
|
192
|
+
})]);
|
|
193
193
|
|
|
194
|
-
tracker.addTask('02', makeUsage({
|
|
194
|
+
tracker.addTask('02', [makeUsage({
|
|
195
195
|
inputTokens: 300_000,
|
|
196
196
|
outputTokens: 100_000,
|
|
197
197
|
modelUsage: {
|
|
@@ -202,7 +202,7 @@ describe('TokenTracker', () => {
|
|
|
202
202
|
cacheCreationInputTokens: 0,
|
|
203
203
|
},
|
|
204
204
|
},
|
|
205
|
-
}));
|
|
205
|
+
})]);
|
|
206
206
|
|
|
207
207
|
const totals = tracker.getTotals();
|
|
208
208
|
expect(totals.usage.inputTokens).toBe(800_000);
|
|
@@ -214,7 +214,7 @@ describe('TokenTracker', () => {
|
|
|
214
214
|
it('should accumulate costs across multiple tasks', () => {
|
|
215
215
|
const tracker = new TokenTracker(testPricing);
|
|
216
216
|
|
|
217
|
-
const entry1 = tracker.addTask('01', makeUsage({
|
|
217
|
+
const entry1 = tracker.addTask('01', [makeUsage({
|
|
218
218
|
inputTokens: 1_000_000,
|
|
219
219
|
outputTokens: 1_000_000,
|
|
220
220
|
modelUsage: {
|
|
@@ -225,9 +225,9 @@ describe('TokenTracker', () => {
|
|
|
225
225
|
cacheCreationInputTokens: 0,
|
|
226
226
|
},
|
|
227
227
|
},
|
|
228
|
-
}));
|
|
228
|
+
})]);
|
|
229
229
|
|
|
230
|
-
const entry2 = tracker.addTask('02', makeUsage({
|
|
230
|
+
const entry2 = tracker.addTask('02', [makeUsage({
|
|
231
231
|
inputTokens: 1_000_000,
|
|
232
232
|
outputTokens: 1_000_000,
|
|
233
233
|
modelUsage: {
|
|
@@ -238,7 +238,7 @@ describe('TokenTracker', () => {
|
|
|
238
238
|
cacheCreationInputTokens: 0,
|
|
239
239
|
},
|
|
240
240
|
},
|
|
241
|
-
}));
|
|
241
|
+
})]);
|
|
242
242
|
|
|
243
243
|
const totals = tracker.getTotals();
|
|
244
244
|
// Each task: $3 input + $15 output = $18
|
|
@@ -250,7 +250,7 @@ describe('TokenTracker', () => {
|
|
|
250
250
|
it('should accumulate multi-model usage across tasks', () => {
|
|
251
251
|
const tracker = new TokenTracker(testPricing);
|
|
252
252
|
|
|
253
|
-
tracker.addTask('01', makeUsage({
|
|
253
|
+
tracker.addTask('01', [makeUsage({
|
|
254
254
|
inputTokens: 1_000_000,
|
|
255
255
|
outputTokens: 500_000,
|
|
256
256
|
modelUsage: {
|
|
@@ -261,9 +261,9 @@ describe('TokenTracker', () => {
|
|
|
261
261
|
cacheCreationInputTokens: 0,
|
|
262
262
|
},
|
|
263
263
|
},
|
|
264
|
-
}));
|
|
264
|
+
})]);
|
|
265
265
|
|
|
266
|
-
tracker.addTask('02', makeUsage({
|
|
266
|
+
tracker.addTask('02', [makeUsage({
|
|
267
267
|
inputTokens: 500_000,
|
|
268
268
|
outputTokens: 200_000,
|
|
269
269
|
modelUsage: {
|
|
@@ -274,7 +274,7 @@ describe('TokenTracker', () => {
|
|
|
274
274
|
cacheCreationInputTokens: 0,
|
|
275
275
|
},
|
|
276
276
|
},
|
|
277
|
-
}));
|
|
277
|
+
})]);
|
|
278
278
|
|
|
279
279
|
const totals = tracker.getTotals();
|
|
280
280
|
expect(totals.usage.modelUsage['claude-opus-4-6']?.inputTokens).toBe(1_000_000);
|
|
@@ -292,8 +292,8 @@ describe('TokenTracker', () => {
|
|
|
292
292
|
|
|
293
293
|
it('should return per-task entries', () => {
|
|
294
294
|
const tracker = new TokenTracker(testPricing);
|
|
295
|
-
tracker.addTask('01', makeUsage({ inputTokens: 100 }));
|
|
296
|
-
tracker.addTask('02', makeUsage({ inputTokens: 200 }));
|
|
295
|
+
tracker.addTask('01', [makeUsage({ inputTokens: 100 })]);
|
|
296
|
+
tracker.addTask('02', [makeUsage({ inputTokens: 200 })]);
|
|
297
297
|
|
|
298
298
|
const entries = tracker.getEntries();
|
|
299
299
|
expect(entries).toHaveLength(2);
|
|
@@ -303,7 +303,7 @@ describe('TokenTracker', () => {
|
|
|
303
303
|
|
|
304
304
|
it('addTask returns the entry with cost', () => {
|
|
305
305
|
const tracker = new TokenTracker(testPricing);
|
|
306
|
-
const entry = tracker.addTask('01', makeUsage({
|
|
306
|
+
const entry = tracker.addTask('01', [makeUsage({
|
|
307
307
|
inputTokens: 1_000_000,
|
|
308
308
|
modelUsage: {
|
|
309
309
|
'claude-opus-4-6': {
|
|
@@ -313,12 +313,345 @@ describe('TokenTracker', () => {
|
|
|
313
313
|
cacheCreationInputTokens: 0,
|
|
314
314
|
},
|
|
315
315
|
},
|
|
316
|
-
}));
|
|
316
|
+
})]);
|
|
317
317
|
|
|
318
318
|
expect(entry.taskId).toBe('01');
|
|
319
319
|
expect(entry.cost.inputCost).toBeCloseTo(15);
|
|
320
320
|
expect(entry.cost.totalCost).toBeCloseTo(15);
|
|
321
321
|
});
|
|
322
|
+
|
|
323
|
+
it('should store attempts array in entry', () => {
|
|
324
|
+
const tracker = new TokenTracker(testPricing);
|
|
325
|
+
const usage = makeUsage({ inputTokens: 100 });
|
|
326
|
+
const entry = tracker.addTask('01', [usage]);
|
|
327
|
+
|
|
328
|
+
expect(entry.attempts).toHaveLength(1);
|
|
329
|
+
expect(entry.attempts[0]).toEqual(usage);
|
|
330
|
+
});
|
|
331
|
+
|
|
332
|
+
it('should accumulate multiple attempts for a single task', () => {
|
|
333
|
+
const tracker = new TokenTracker(testPricing);
|
|
334
|
+
const attempt1 = makeUsage({
|
|
335
|
+
inputTokens: 500_000,
|
|
336
|
+
outputTokens: 100_000,
|
|
337
|
+
modelUsage: {
|
|
338
|
+
'claude-opus-4-6': {
|
|
339
|
+
inputTokens: 500_000,
|
|
340
|
+
outputTokens: 100_000,
|
|
341
|
+
cacheReadInputTokens: 0,
|
|
342
|
+
cacheCreationInputTokens: 0,
|
|
343
|
+
},
|
|
344
|
+
},
|
|
345
|
+
});
|
|
346
|
+
const attempt2 = makeUsage({
|
|
347
|
+
inputTokens: 600_000,
|
|
348
|
+
outputTokens: 200_000,
|
|
349
|
+
modelUsage: {
|
|
350
|
+
'claude-opus-4-6': {
|
|
351
|
+
inputTokens: 600_000,
|
|
352
|
+
outputTokens: 200_000,
|
|
353
|
+
cacheReadInputTokens: 0,
|
|
354
|
+
cacheCreationInputTokens: 0,
|
|
355
|
+
},
|
|
356
|
+
},
|
|
357
|
+
});
|
|
358
|
+
|
|
359
|
+
const entry = tracker.addTask('01', [attempt1, attempt2]);
|
|
360
|
+
|
|
361
|
+
expect(entry.usage.inputTokens).toBe(1_100_000);
|
|
362
|
+
expect(entry.usage.outputTokens).toBe(300_000);
|
|
363
|
+
expect(entry.usage.modelUsage['claude-opus-4-6']?.inputTokens).toBe(1_100_000);
|
|
364
|
+
expect(entry.attempts).toHaveLength(2);
|
|
365
|
+
});
|
|
366
|
+
|
|
367
|
+
it('should correctly accumulate multi-attempt costs', () => {
|
|
368
|
+
const tracker = new TokenTracker(testPricing);
|
|
369
|
+
const attempt1 = makeUsage({
|
|
370
|
+
inputTokens: 1_000_000,
|
|
371
|
+
modelUsage: {
|
|
372
|
+
'claude-sonnet-4-5': {
|
|
373
|
+
inputTokens: 1_000_000,
|
|
374
|
+
outputTokens: 0,
|
|
375
|
+
cacheReadInputTokens: 0,
|
|
376
|
+
cacheCreationInputTokens: 0,
|
|
377
|
+
},
|
|
378
|
+
},
|
|
379
|
+
});
|
|
380
|
+
const attempt2 = makeUsage({
|
|
381
|
+
inputTokens: 1_000_000,
|
|
382
|
+
modelUsage: {
|
|
383
|
+
'claude-sonnet-4-5': {
|
|
384
|
+
inputTokens: 1_000_000,
|
|
385
|
+
outputTokens: 0,
|
|
386
|
+
cacheReadInputTokens: 0,
|
|
387
|
+
cacheCreationInputTokens: 0,
|
|
388
|
+
},
|
|
389
|
+
},
|
|
390
|
+
});
|
|
391
|
+
|
|
392
|
+
const entry = tracker.addTask('01', [attempt1, attempt2]);
|
|
393
|
+
|
|
394
|
+
// 2M tokens * $3/MTok = $6
|
|
395
|
+
expect(entry.cost.inputCost).toBeCloseTo(6);
|
|
396
|
+
expect(entry.cost.totalCost).toBeCloseTo(6);
|
|
397
|
+
});
|
|
398
|
+
});
|
|
399
|
+
|
|
400
|
+
describe('accumulateUsage', () => {
|
|
401
|
+
it('should return empty usage for empty array', () => {
|
|
402
|
+
const result = accumulateUsage([]);
|
|
403
|
+
expect(result.inputTokens).toBe(0);
|
|
404
|
+
expect(result.outputTokens).toBe(0);
|
|
405
|
+
expect(result.cacheReadInputTokens).toBe(0);
|
|
406
|
+
expect(result.cacheCreationInputTokens).toBe(0);
|
|
407
|
+
expect(Object.keys(result.modelUsage)).toHaveLength(0);
|
|
408
|
+
});
|
|
409
|
+
|
|
410
|
+
it('should return same usage for single-element array', () => {
|
|
411
|
+
const usage = makeUsage({
|
|
412
|
+
inputTokens: 100,
|
|
413
|
+
outputTokens: 200,
|
|
414
|
+
cacheReadInputTokens: 50,
|
|
415
|
+
cacheCreationInputTokens: 25,
|
|
416
|
+
modelUsage: {
|
|
417
|
+
'claude-opus-4-6': {
|
|
418
|
+
inputTokens: 100,
|
|
419
|
+
outputTokens: 200,
|
|
420
|
+
cacheReadInputTokens: 50,
|
|
421
|
+
cacheCreationInputTokens: 25,
|
|
422
|
+
},
|
|
423
|
+
},
|
|
424
|
+
});
|
|
425
|
+
|
|
426
|
+
const result = accumulateUsage([usage]);
|
|
427
|
+
expect(result.inputTokens).toBe(100);
|
|
428
|
+
expect(result.outputTokens).toBe(200);
|
|
429
|
+
expect(result.cacheReadInputTokens).toBe(50);
|
|
430
|
+
expect(result.cacheCreationInputTokens).toBe(25);
|
|
431
|
+
expect(result.modelUsage['claude-opus-4-6']?.inputTokens).toBe(100);
|
|
432
|
+
});
|
|
433
|
+
|
|
434
|
+
it('should sum all token fields across attempts', () => {
|
|
435
|
+
const attempt1 = makeUsage({
|
|
436
|
+
inputTokens: 100,
|
|
437
|
+
outputTokens: 50,
|
|
438
|
+
cacheReadInputTokens: 10,
|
|
439
|
+
cacheCreationInputTokens: 5,
|
|
440
|
+
});
|
|
441
|
+
const attempt2 = makeUsage({
|
|
442
|
+
inputTokens: 200,
|
|
443
|
+
outputTokens: 100,
|
|
444
|
+
cacheReadInputTokens: 20,
|
|
445
|
+
cacheCreationInputTokens: 10,
|
|
446
|
+
});
|
|
447
|
+
|
|
448
|
+
const result = accumulateUsage([attempt1, attempt2]);
|
|
449
|
+
expect(result.inputTokens).toBe(300);
|
|
450
|
+
expect(result.outputTokens).toBe(150);
|
|
451
|
+
expect(result.cacheReadInputTokens).toBe(30);
|
|
452
|
+
expect(result.cacheCreationInputTokens).toBe(15);
|
|
453
|
+
});
|
|
454
|
+
|
|
455
|
+
it('should merge modelUsage for same model across attempts', () => {
|
|
456
|
+
const attempt1 = makeUsage({
|
|
457
|
+
modelUsage: {
|
|
458
|
+
'claude-opus-4-6': {
|
|
459
|
+
inputTokens: 100,
|
|
460
|
+
outputTokens: 50,
|
|
461
|
+
cacheReadInputTokens: 10,
|
|
462
|
+
cacheCreationInputTokens: 5,
|
|
463
|
+
},
|
|
464
|
+
},
|
|
465
|
+
});
|
|
466
|
+
const attempt2 = makeUsage({
|
|
467
|
+
modelUsage: {
|
|
468
|
+
'claude-opus-4-6': {
|
|
469
|
+
inputTokens: 200,
|
|
470
|
+
outputTokens: 100,
|
|
471
|
+
cacheReadInputTokens: 20,
|
|
472
|
+
cacheCreationInputTokens: 10,
|
|
473
|
+
},
|
|
474
|
+
},
|
|
475
|
+
});
|
|
476
|
+
|
|
477
|
+
const result = accumulateUsage([attempt1, attempt2]);
|
|
478
|
+
expect(result.modelUsage['claude-opus-4-6']?.inputTokens).toBe(300);
|
|
479
|
+
expect(result.modelUsage['claude-opus-4-6']?.outputTokens).toBe(150);
|
|
480
|
+
expect(result.modelUsage['claude-opus-4-6']?.cacheReadInputTokens).toBe(30);
|
|
481
|
+
expect(result.modelUsage['claude-opus-4-6']?.cacheCreationInputTokens).toBe(15);
|
|
482
|
+
});
|
|
483
|
+
|
|
484
|
+
it('should handle different models across attempts', () => {
|
|
485
|
+
const attempt1 = makeUsage({
|
|
486
|
+
inputTokens: 100,
|
|
487
|
+
outputTokens: 50,
|
|
488
|
+
modelUsage: {
|
|
489
|
+
'claude-opus-4-6': {
|
|
490
|
+
inputTokens: 100,
|
|
491
|
+
outputTokens: 50,
|
|
492
|
+
cacheReadInputTokens: 0,
|
|
493
|
+
cacheCreationInputTokens: 0,
|
|
494
|
+
},
|
|
495
|
+
},
|
|
496
|
+
});
|
|
497
|
+
const attempt2 = makeUsage({
|
|
498
|
+
inputTokens: 200,
|
|
499
|
+
outputTokens: 100,
|
|
500
|
+
modelUsage: {
|
|
501
|
+
'claude-sonnet-4-5': {
|
|
502
|
+
inputTokens: 200,
|
|
503
|
+
outputTokens: 100,
|
|
504
|
+
cacheReadInputTokens: 0,
|
|
505
|
+
cacheCreationInputTokens: 0,
|
|
506
|
+
},
|
|
507
|
+
},
|
|
508
|
+
});
|
|
509
|
+
|
|
510
|
+
const result = accumulateUsage([attempt1, attempt2]);
|
|
511
|
+
expect(result.inputTokens).toBe(300);
|
|
512
|
+
expect(result.outputTokens).toBe(150);
|
|
513
|
+
expect(result.modelUsage['claude-opus-4-6']?.inputTokens).toBe(100);
|
|
514
|
+
expect(result.modelUsage['claude-sonnet-4-5']?.inputTokens).toBe(200);
|
|
515
|
+
expect(Object.keys(result.modelUsage)).toHaveLength(2);
|
|
516
|
+
});
|
|
517
|
+
|
|
518
|
+
it('should handle mixed model usage across attempts', () => {
|
|
519
|
+
const attempt1 = makeUsage({
|
|
520
|
+
inputTokens: 300,
|
|
521
|
+
outputTokens: 150,
|
|
522
|
+
modelUsage: {
|
|
523
|
+
'claude-opus-4-6': {
|
|
524
|
+
inputTokens: 200,
|
|
525
|
+
outputTokens: 100,
|
|
526
|
+
cacheReadInputTokens: 0,
|
|
527
|
+
cacheCreationInputTokens: 0,
|
|
528
|
+
},
|
|
529
|
+
'claude-haiku-4-5': {
|
|
530
|
+
inputTokens: 100,
|
|
531
|
+
outputTokens: 50,
|
|
532
|
+
cacheReadInputTokens: 0,
|
|
533
|
+
cacheCreationInputTokens: 0,
|
|
534
|
+
},
|
|
535
|
+
},
|
|
536
|
+
});
|
|
537
|
+
const attempt2 = makeUsage({
|
|
538
|
+
inputTokens: 400,
|
|
539
|
+
outputTokens: 200,
|
|
540
|
+
modelUsage: {
|
|
541
|
+
'claude-opus-4-6': {
|
|
542
|
+
inputTokens: 100,
|
|
543
|
+
outputTokens: 50,
|
|
544
|
+
cacheReadInputTokens: 0,
|
|
545
|
+
cacheCreationInputTokens: 0,
|
|
546
|
+
},
|
|
547
|
+
'claude-sonnet-4-5': {
|
|
548
|
+
inputTokens: 300,
|
|
549
|
+
outputTokens: 150,
|
|
550
|
+
cacheReadInputTokens: 0,
|
|
551
|
+
cacheCreationInputTokens: 0,
|
|
552
|
+
},
|
|
553
|
+
},
|
|
554
|
+
});
|
|
555
|
+
|
|
556
|
+
const result = accumulateUsage([attempt1, attempt2]);
|
|
557
|
+
expect(result.inputTokens).toBe(700);
|
|
558
|
+
expect(result.outputTokens).toBe(350);
|
|
559
|
+
// Opus: 200 + 100 = 300
|
|
560
|
+
expect(result.modelUsage['claude-opus-4-6']?.inputTokens).toBe(300);
|
|
561
|
+
// Haiku: only from attempt1
|
|
562
|
+
expect(result.modelUsage['claude-haiku-4-5']?.inputTokens).toBe(100);
|
|
563
|
+
// Sonnet: only from attempt2
|
|
564
|
+
expect(result.modelUsage['claude-sonnet-4-5']?.inputTokens).toBe(300);
|
|
565
|
+
});
|
|
566
|
+
|
|
567
|
+
it('should not mutate input objects', () => {
|
|
568
|
+
const attempt1 = makeUsage({
|
|
569
|
+
inputTokens: 100,
|
|
570
|
+
modelUsage: {
|
|
571
|
+
'claude-opus-4-6': {
|
|
572
|
+
inputTokens: 100,
|
|
573
|
+
outputTokens: 0,
|
|
574
|
+
cacheReadInputTokens: 0,
|
|
575
|
+
cacheCreationInputTokens: 0,
|
|
576
|
+
},
|
|
577
|
+
},
|
|
578
|
+
});
|
|
579
|
+
const attempt2 = makeUsage({
|
|
580
|
+
inputTokens: 200,
|
|
581
|
+
modelUsage: {
|
|
582
|
+
'claude-opus-4-6': {
|
|
583
|
+
inputTokens: 200,
|
|
584
|
+
outputTokens: 0,
|
|
585
|
+
cacheReadInputTokens: 0,
|
|
586
|
+
cacheCreationInputTokens: 0,
|
|
587
|
+
},
|
|
588
|
+
},
|
|
589
|
+
});
|
|
590
|
+
|
|
591
|
+
accumulateUsage([attempt1, attempt2]);
|
|
592
|
+
|
|
593
|
+
expect(attempt1.inputTokens).toBe(100);
|
|
594
|
+
expect(attempt1.modelUsage['claude-opus-4-6']?.inputTokens).toBe(100);
|
|
595
|
+
expect(attempt2.inputTokens).toBe(200);
|
|
596
|
+
});
|
|
597
|
+
});
|
|
598
|
+
|
|
599
|
+
describe('multi-attempt cost calculation', () => {
|
|
600
|
+
it('should calculate correct cost when retry uses different model', () => {
|
|
601
|
+
const tracker = new TokenTracker(testPricing);
|
|
602
|
+
// Attempt 1: Opus, Attempt 2: Sonnet (fallback)
|
|
603
|
+
const attempt1 = makeUsage({
|
|
604
|
+
inputTokens: 1_000_000,
|
|
605
|
+
outputTokens: 500_000,
|
|
606
|
+
modelUsage: {
|
|
607
|
+
'claude-opus-4-6': {
|
|
608
|
+
inputTokens: 1_000_000,
|
|
609
|
+
outputTokens: 500_000,
|
|
610
|
+
cacheReadInputTokens: 0,
|
|
611
|
+
cacheCreationInputTokens: 0,
|
|
612
|
+
},
|
|
613
|
+
},
|
|
614
|
+
});
|
|
615
|
+
const attempt2 = makeUsage({
|
|
616
|
+
inputTokens: 1_000_000,
|
|
617
|
+
outputTokens: 1_000_000,
|
|
618
|
+
modelUsage: {
|
|
619
|
+
'claude-sonnet-4-5': {
|
|
620
|
+
inputTokens: 1_000_000,
|
|
621
|
+
outputTokens: 1_000_000,
|
|
622
|
+
cacheReadInputTokens: 0,
|
|
623
|
+
cacheCreationInputTokens: 0,
|
|
624
|
+
},
|
|
625
|
+
},
|
|
626
|
+
});
|
|
627
|
+
|
|
628
|
+
const entry = tracker.addTask('01', [attempt1, attempt2]);
|
|
629
|
+
|
|
630
|
+
// Opus: 1M*$15 + 0.5M*$75 = $15 + $37.5 = $52.5
|
|
631
|
+
// Sonnet: 1M*$3 + 1M*$15 = $3 + $15 = $18
|
|
632
|
+
// Total: $52.5 + $18 = $70.5
|
|
633
|
+
expect(entry.cost.inputCost).toBeCloseTo(18); // 15 + 3
|
|
634
|
+
expect(entry.cost.outputCost).toBeCloseTo(52.5); // 37.5 + 15
|
|
635
|
+
expect(entry.cost.totalCost).toBeCloseTo(70.5);
|
|
636
|
+
});
|
|
637
|
+
|
|
638
|
+
it('should include all attempt usage in grand totals', () => {
|
|
639
|
+
const tracker = new TokenTracker(testPricing);
|
|
640
|
+
|
|
641
|
+
// Task 1: 2 attempts
|
|
642
|
+
tracker.addTask('01', [
|
|
643
|
+
makeUsage({ inputTokens: 500_000 }),
|
|
644
|
+
makeUsage({ inputTokens: 500_000 }),
|
|
645
|
+
]);
|
|
646
|
+
|
|
647
|
+
// Task 2: 1 attempt
|
|
648
|
+
tracker.addTask('02', [
|
|
649
|
+
makeUsage({ inputTokens: 1_000_000 }),
|
|
650
|
+
]);
|
|
651
|
+
|
|
652
|
+
const totals = tracker.getTotals();
|
|
653
|
+
expect(totals.usage.inputTokens).toBe(2_000_000);
|
|
654
|
+
});
|
|
322
655
|
});
|
|
323
656
|
|
|
324
657
|
describe('custom pricing', () => {
|