adaptive-memory-multi-model-router 1.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (95) hide show
  1. package/README.md +114 -0
  2. package/demo/research-demo.js +266 -0
  3. package/dist/cache/prefixCache.d.ts +114 -0
  4. package/dist/cache/prefixCache.d.ts.map +1 -0
  5. package/dist/cache/prefixCache.js +285 -0
  6. package/dist/cache/prefixCache.js.map +1 -0
  7. package/dist/cache/responseCache.d.ts +58 -0
  8. package/dist/cache/responseCache.d.ts.map +1 -0
  9. package/dist/cache/responseCache.js +153 -0
  10. package/dist/cache/responseCache.js.map +1 -0
  11. package/dist/cli.js +59 -0
  12. package/dist/cost/costTracker.d.ts +95 -0
  13. package/dist/cost/costTracker.d.ts.map +1 -0
  14. package/dist/cost/costTracker.js +240 -0
  15. package/dist/cost/costTracker.js.map +1 -0
  16. package/dist/index.d.ts +723 -0
  17. package/dist/index.d.ts.map +1 -0
  18. package/dist/index.js +239 -0
  19. package/dist/index.js.map +1 -0
  20. package/dist/memory/episodicMemory.d.ts +82 -0
  21. package/dist/memory/episodicMemory.d.ts.map +1 -0
  22. package/dist/memory/episodicMemory.js +145 -0
  23. package/dist/memory/episodicMemory.js.map +1 -0
  24. package/dist/orchestration/haloOrchestrator.d.ts +102 -0
  25. package/dist/orchestration/haloOrchestrator.d.ts.map +1 -0
  26. package/dist/orchestration/haloOrchestrator.js +207 -0
  27. package/dist/orchestration/haloOrchestrator.js.map +1 -0
  28. package/dist/orchestration/mctsWorkflow.d.ts +85 -0
  29. package/dist/orchestration/mctsWorkflow.d.ts.map +1 -0
  30. package/dist/orchestration/mctsWorkflow.js +210 -0
  31. package/dist/orchestration/mctsWorkflow.js.map +1 -0
  32. package/dist/providers/localProvider.d.ts +102 -0
  33. package/dist/providers/localProvider.d.ts.map +1 -0
  34. package/dist/providers/localProvider.js +338 -0
  35. package/dist/providers/localProvider.js.map +1 -0
  36. package/dist/providers/registry.d.ts +55 -0
  37. package/dist/providers/registry.d.ts.map +1 -0
  38. package/dist/providers/registry.js +138 -0
  39. package/dist/providers/registry.js.map +1 -0
  40. package/dist/routing/advancedRouter.d.ts +68 -0
  41. package/dist/routing/advancedRouter.d.ts.map +1 -0
  42. package/dist/routing/advancedRouter.js +332 -0
  43. package/dist/routing/advancedRouter.js.map +1 -0
  44. package/dist/tools/tmlpdTools.d.ts +101 -0
  45. package/dist/tools/tmlpdTools.d.ts.map +1 -0
  46. package/dist/tools/tmlpdTools.js +368 -0
  47. package/dist/tools/tmlpdTools.js.map +1 -0
  48. package/dist/utils/batchProcessor.d.ts +96 -0
  49. package/dist/utils/batchProcessor.d.ts.map +1 -0
  50. package/dist/utils/batchProcessor.js +170 -0
  51. package/dist/utils/batchProcessor.js.map +1 -0
  52. package/dist/utils/compression.d.ts +61 -0
  53. package/dist/utils/compression.d.ts.map +1 -0
  54. package/dist/utils/compression.js +281 -0
  55. package/dist/utils/compression.js.map +1 -0
  56. package/dist/utils/reliability.d.ts +74 -0
  57. package/dist/utils/reliability.d.ts.map +1 -0
  58. package/dist/utils/reliability.js +177 -0
  59. package/dist/utils/reliability.js.map +1 -0
  60. package/dist/utils/speculativeDecoding.d.ts +117 -0
  61. package/dist/utils/speculativeDecoding.d.ts.map +1 -0
  62. package/dist/utils/speculativeDecoding.js +246 -0
  63. package/dist/utils/speculativeDecoding.js.map +1 -0
  64. package/dist/utils/tokenUtils.d.ts +50 -0
  65. package/dist/utils/tokenUtils.d.ts.map +1 -0
  66. package/dist/utils/tokenUtils.js +124 -0
  67. package/dist/utils/tokenUtils.js.map +1 -0
  68. package/examples/QUICKSTART.md +183 -0
  69. package/notebooks/quickstart.ipynb +157 -0
  70. package/package.json +83 -0
  71. package/python/examples.py +53 -0
  72. package/python/integrations.py +330 -0
  73. package/python/setup.py +28 -0
  74. package/python/tmlpd.py +369 -0
  75. package/qna/REDDIT_GAP_ANALYSIS.md +299 -0
  76. package/qna/TMLPD_QNA.md +751 -0
  77. package/rust/tmlpd.h +268 -0
  78. package/skill/SKILL.md +238 -0
  79. package/src/cache/prefixCache.ts +365 -0
  80. package/src/cache/responseCache.ts +147 -0
  81. package/src/cost/costTracker.ts +302 -0
  82. package/src/index.ts +224 -0
  83. package/src/memory/episodicMemory.ts +185 -0
  84. package/src/orchestration/haloOrchestrator.ts +266 -0
  85. package/src/orchestration/mctsWorkflow.ts +262 -0
  86. package/src/providers/localProvider.ts +406 -0
  87. package/src/providers/registry.ts +164 -0
  88. package/src/routing/advancedRouter.ts +406 -0
  89. package/src/tools/tmlpdTools.ts +433 -0
  90. package/src/utils/batchProcessor.ts +232 -0
  91. package/src/utils/compression.ts +325 -0
  92. package/src/utils/reliability.ts +221 -0
  93. package/src/utils/speculativeDecoding.ts +344 -0
  94. package/src/utils/tokenUtils.ts +145 -0
  95. package/tsconfig.json +18 -0
@@ -0,0 +1,325 @@
1
+ /**
2
+ * TMLPD Context Compression Utilities
3
+ *
4
+ * Strategies for reducing context window usage:
5
+ * - Smart truncation
6
+ * - Message summarization
7
+ * - ISON-style encoding (inspired by Reddit ISON format)
8
+ * - Context window management
9
+ */
10
+
11
/**
 * One entry of a chat-style conversation as consumed by the truncation
 * helpers in this module.
 */
export interface Message {
  /** Who authored the message. */
  role: "system" | "user" | "assistant";

  /** Text body; this is what the token estimators measure. */
  content: string;

  /** Optional name attached to the message. */
  name?: string;

  /** Optional list of tool calls; the element shape is not constrained here. */
  tool_calls?: any[];

  /** Optional tool-call identifier associated with the message. */
  tool_call_id?: string;
}
18
+
19
/** Strategy names accepted by the `strategy` parameter of `truncateMessages`. */
export type CompressionStrategy =
  | "smart"
  | "first"
  | "last"
  | "isentropy";
20
+
21
/**
 * ISON (Intelligence-Sparse Object Notation)
 *
 * A lossy text-shortening scheme that reduces token count by:
 * - Dropping lowercase articles ("the", "a", "an") and "please"
 * - Abbreviating common words and phrases
 * - Collapsing whitespace and stretched-out letters
 *
 * Example: "please send the report to me and thank you"
 *        → "send report 2 me & thx"
 */

/**
 * Ordered [pattern, replacement] rules. `isonEncode` applies them one after
 * another, so a rule sees the output of every rule listed before it.
 */
const ISON_REPLACEMENTS: Array<[RegExp, string]> = [
  // Articles are removed outright (lowercase occurrences only).
  [/\bthe\b/g, ""],
  [/\ba\b/g, ""],
  [/\ban\b/g, ""],

  // Common word and phrase abbreviations.
  [/\bwith\b/g, "w/"],
  [/\bwithout\b/g, "w/o"],
  [/\band\b/g, "&"],
  [/\bor\b/g, "|"],
  [/\bfor\b/g, "4"],
  [/\bto\b/g, "2"],
  [/\binto\b/g, "2"],
  [/\bfrom\b/g, "fr"],
  [/\bplease\b/gi, ""],
  [/\bthank you\b/gi, "thx"],
  [/\byou are\b/gi, "u r"],
  [/\byou can\b/gi, "u c"],
  [/\bcan you\b/gi, "c?"],
  [/\bhow do\b/gi, "how 2"],
  [/\bwhat is\b/gi, "wat"],
  [/\bwhat are\b/gi, "wat"],

  // Whitespace normalization (also cleans up gaps left by removed words).
  [/\s+/g, " "],
  [/^\s+|\s+$/g, ""],

  // Collapse stretched-out letters ("sooooo" → "soo"). Restricted to letters:
  // matching any word character would also shorten digit runs and silently
  // turn a number such as 1000 into 100.
  [/([A-Za-z])\1{2,}/g, "$1$1"],

  // Shorten common technical terms.
  [/\binformation\b/gi, "info"],
  [/\bprocessing\b/gi, "proc"],
  [/\bdevelopment\b/gi, "dev"],
  [/\bapplication\b/gi, "app"],
  [/\bconfiguration\b/gi, "config"],
  [/\brepresentation\b/gi, "repr"],
  [/\bunderstanding\b/gi, "unders"],
  [/\brecommendation\b/gi, "rec"],
];
74
+
75
/**
 * Ordered [pattern, replacement] rules used by `isonDecode` to expand ISON
 * abbreviations again. Order matters: longer abbreviations must be expanded
 * before any shorter abbreviation they contain.
 */
const ISON_UNREPLACEMENTS: Array<[RegExp, string]> = [
  // "w/o" has to run before "w/"; otherwise "w/" consumes its prefix and
  // "w/o" is decoded as "with o".
  [/w\/o\b/g, "without "],
  [/w\//g, "with "],
  // "how 2" has to run before the bare "2" rule, which would otherwise turn
  // it into "how to" and make this rule unreachable.
  [/how 2\b/gi, "how do"],
  [/&/g, " and "],
  [/\b4\b/g, " for "],
  [/\b2\b/g, " to "],
  [/\bfr\b/g, "from "],
  [/\bthx\b/gi, "thank you"],
  [/\bu r\b/gi, "you are"],
  [/\bu c\b/gi, "you can"],
  // No trailing \b: "?" is not a word character, so "\?\b" only matched when
  // a letter or digit followed immediately and missed "c? " and a final "c?".
  [/\bc\?/g, "can you"],
  [/\bwat\b/g, "what is"],
];
89
+
90
/** Outcome of `compressText`: token estimates before and after encoding. */
export interface CompressionResult {
  /** Estimated token count of the input text. */
  original_tokens: number;

  /** Estimated token count of the encoded text. */
  compressed_tokens: number;

  /** `compressed_tokens` divided by `original_tokens`; lower means smaller output. */
  ratio: number;

  /** The ISON-encoded text. */
  compressed_text: string;
}
96
+
97
/**
 * Shorten `text` with the ISON rule table.
 *
 * Every rule in `ISON_REPLACEMENTS` is applied in table order, then any
 * remaining whitespace runs are collapsed to one space and the ends trimmed.
 *
 * @param text - Text to encode.
 * @returns The encoded text.
 */
export function isonEncode(text: string): string {
  const abbreviated = ISON_REPLACEMENTS.reduce(
    (acc, [pattern, replacement]) => acc.replace(pattern, replacement),
    text
  );

  // Rules that delete words can leave gaps behind; tidy them up last.
  return abbreviated.replace(/\s+/g, " ").trim();
}
113
+
114
/**
 * Expand ISON abbreviations back into plain words.
 *
 * Decoding is best-effort: the encoder deletes some words (articles,
 * "please") and maps several phrases onto one abbreviation, so the original
 * text cannot always be reconstructed.
 *
 * @param text - ISON-encoded text.
 * @returns The text with every rule in `ISON_UNREPLACEMENTS` applied in table
 *   order, runs of spaces collapsed and the ends trimmed.
 */
export function isonDecode(text: string): string {
  let result = text;

  // Apply un-replacements
  for (const [pattern, replacement] of ISON_UNREPLACEMENTS) {
    result = result.replace(pattern, replacement);
  }

  // Several expansions carry padding spaces, which would otherwise produce
  // output such as "salt  and  pepper". Only spaces are collapsed, so any
  // line breaks in the input are kept.
  return result.replace(/ {2,}/g, " ").trim();
}
127
+
128
/**
 * Compress text using ISON encoding and report the estimated saving.
 *
 * @param text - Text to compress.
 * @returns Token estimates before and after encoding, their ratio and the
 *   encoded text. When the input has no tokens at all the ratio is reported
 *   as 1 (nothing gained, nothing lost) instead of the `NaN` that `0 / 0`
 *   would produce.
 */
export function compressText(text: string): CompressionResult {
  const original_tokens = estimateTokens(text);
  const compressed_text = isonEncode(text);
  const compressed_tokens = estimateTokens(compressed_text);

  const ratio = original_tokens === 0 ? 1 : compressed_tokens / original_tokens;

  return {
    original_tokens,
    compressed_tokens,
    ratio,
    compressed_text,
  };
}
143
+
144
/**
 * Estimate the token count of a string from its whitespace-separated word
 * count (1.3 tokens per word, rounded up). This is a rough heuristic, not a
 * real tokenizer.
 */
function estimateTokens(text: string): number {
  const words = text.trim().split(/\s+/).filter(w => w.length > 0);
  return Math.ceil(words.length * 1.3);
}

/** Flat per-message allowance for role/format overhead. */
const MESSAGE_OVERHEAD_TOKENS = 4;

/** Number of trailing conversation slots the "smart" strategy treats as recent. */
const RECENT_MESSAGE_WINDOW = 3;

/** Return a message's content as text, tolerating non-string content at runtime. */
function messageText(msg: Message): string {
  const raw: unknown = msg.content;
  if (typeof raw === "string") return raw;
  // JSON.stringify yields undefined for undefined input; fall back to "".
  return JSON.stringify(raw) ?? "";
}

/** Estimated cost of one message: its content plus the fixed overhead. */
function messageTokens(msg: Message): number {
  return estimateTokens(messageText(msg)) + MESSAGE_OVERHEAD_TOKENS;
}

/**
 * Copy of `msg` whose content is cut down so the whole message costs at most
 * `budget` tokens, or `undefined` when not even one word fits.
 */
function shrinkMessage(msg: Message, budget: number): Message | undefined {
  const content = truncateToTokenBudget(messageText(msg), budget - MESSAGE_OVERHEAD_TOKENS);
  return content.length > 0 ? { ...msg, content } : undefined;
}

/** "first" strategy: keep the longest prefix of the conversation that fits. */
function keepLeadingMessages(messages: Message[], max_tokens: number): Message[] {
  const kept: Message[] = [];
  let used = 0;

  for (const msg of messages) {
    const cost = messageTokens(msg);
    if (used + cost <= max_tokens) {
      kept.push(msg);
      used += cost;
      continue;
    }
    // A leading system message is too important to drop: keep a shortened copy.
    if (kept.length === 0 && msg.role === "system") {
      const shortened = shrinkMessage(msg, max_tokens);
      if (shortened) kept.push(shortened);
    }
    break;
  }

  return kept;
}

/** "last" strategy: keep the longest suffix of the conversation that fits. */
function keepTrailingMessages(messages: Message[], max_tokens: number): Message[] {
  const keptNewestFirst: Message[] = [];
  let used = 0;

  for (let i = messages.length - 1; i >= 0; i--) {
    const msg = messages[i];
    const cost = messageTokens(msg);
    if (used + cost <= max_tokens) {
      keptNewestFirst.push(msg);
      used += cost;
      continue;
    }
    // Try to keep a shortened user message, but only if what remains is
    // long enough to be useful.
    if (msg.role === "user") {
      const shortened = shrinkMessage(msg, max_tokens - used);
      if (shortened && shortened.content.length > 20) {
        keptNewestFirst.push(shortened);
      }
    }
    // Stop at the first message that does not fit so the result stays a
    // contiguous tail of the conversation.
    break;
  }

  return keptNewestFirst.reverse();
}

/**
 * "smart" strategy: system messages first, then as many of the most recent
 * messages as fit, with whatever budget is left (at most a quarter of the
 * total) spent on a truncated digest of the messages in between.
 */
function keepSystemAndRecent(messages: Message[], max_tokens: number): Message[] {
  const recentStart = messages.length - RECENT_MESSAGE_WINDOW;
  const systemMessages: Message[] = [];
  const middleMessages: Message[] = [];
  const recentMessages: Message[] = [];

  messages.forEach((msg, index) => {
    if (msg.role === "system") {
      systemMessages.push(msg);
    } else if (index >= recentStart) {
      recentMessages.push(msg);
    } else {
      middleMessages.push(msg);
    }
  });

  let used = 0;

  // 1. System messages, shortening the first one that does not fit.
  const keptSystem: Message[] = [];
  for (const msg of systemMessages) {
    const cost = messageTokens(msg);
    if (used + cost <= max_tokens) {
      keptSystem.push(msg);
      used += cost;
      continue;
    }
    const shortened = shrinkMessage(msg, max_tokens - used);
    if (shortened) {
      keptSystem.push(shortened);
      used += messageTokens(shortened);
    }
    break;
  }

  // 2. Recent messages, newest first so the latest turn wins the budget.
  const keptRecentNewestFirst: Message[] = [];
  for (let i = recentMessages.length - 1; i >= 0; i--) {
    const msg = recentMessages[i];
    const cost = messageTokens(msg);
    if (used + cost <= max_tokens) {
      keptRecentNewestFirst.push(msg);
      used += cost;
      continue;
    }
    // If even the newest message is too big, keep a shortened copy rather
    // than returning a conversation without its latest turn.
    if (keptRecentNewestFirst.length === 0) {
      const shortened = shrinkMessage(msg, max_tokens - used);
      if (shortened) {
        keptRecentNewestFirst.push(shortened);
        used += messageTokens(shortened);
      }
    }
    break;
  }

  // 3. Digest of the middle of the conversation, if any budget remains.
  const result: Message[] = [...keptSystem];
  if (middleMessages.length > 0) {
    const summaryBudget =
      Math.min(Math.floor(max_tokens / 4), max_tokens - used) - MESSAGE_OVERHEAD_TOKENS;
    const middleContent = middleMessages.map(messageText).join("\n");
    const summary = truncateToTokenBudget(
      `[Previous ${middleMessages.length} messages]: ${middleContent}`,
      summaryBudget
    );
    if (summary.length > 0) {
      result.push({ role: "assistant", content: summary });
    }
  }

  result.push(...keptRecentNewestFirst.reverse());
  return result;
}

/**
 * Truncate messages to fit within token budget.
 *
 * Token counts are estimates: `estimateTokens(content)` plus a fixed
 * per-message overhead. If the conversation already fits, the input array is
 * returned as-is (same reference); otherwise a new array is returned whose
 * estimated cost does not exceed `max_tokens`.
 *
 * @param messages - Conversation messages
 * @param max_tokens - Maximum tokens allowed
 * @param strategy - "smart" (preserve system + recent), "first" (keep start),
 *   "last" (keep end). Any other value, including "isentropy", is handled
 *   like "smart" rather than discarding the whole conversation; no ISON
 *   encoding is applied by this function.
 * @returns The messages to send. A message that had to be shortened is
 *   returned as a copy whose content ends in "..."; the "smart" strategy may
 *   add one synthetic assistant message summarising dropped history.
 */
export function truncateMessages(
  messages: Message[],
  max_tokens: number,
  strategy: CompressionStrategy = "smart"
): Message[] {
  if (!messages || messages.length === 0) return [];

  const totalTokens = messages.reduce((sum, m) => sum + messageTokens(m), 0);
  if (totalTokens <= max_tokens) {
    return messages; // Already fits
  }

  switch (strategy) {
    case "first":
      return keepLeadingMessages(messages, max_tokens);
    case "last":
      return keepTrailingMessages(messages, max_tokens);
    default:
      return keepSystemAndRecent(messages, max_tokens);
  }
}

/**
 * Truncate a single string to fit within token budget.
 *
 * Uses the same estimate as the rest of the module, so
 * `estimateTokens(result) <= max_tokens` always holds for the returned text.
 *
 * @param text - Text to shorten.
 * @param max_tokens - Maximum estimated tokens for the result.
 * @returns `text` unchanged when it already fits; otherwise its longest
 *   fitting prefix of whole words, joined by single spaces and followed by
 *   "..."; or "" when not even one word fits.
 */
export function truncateToTokenBudget(text: string, max_tokens: number): string {
  if (estimateTokens(text) <= max_tokens) {
    return text;
  }

  const words = text.trim().split(/\s+/).filter(w => w.length > 0);

  // Binary search for the largest word count whose estimate fits. The
  // estimate never decreases as words are added, so the search is valid.
  let fits = 0;
  let upper = words.length;
  while (fits < upper) {
    const probe = Math.ceil((fits + upper) / 2);
    if (estimateTokens(words.slice(0, probe).join(" ")) <= max_tokens) {
      fits = probe;
    } else {
      upper = probe - 1;
    }
  }

  if (fits === 0) {
    return "";
  }

  // The ellipsis is glued to the last word, so it adds no word to the estimate.
  return words.slice(0, fits).join(" ") + "...";
}
305
+
306
/**
 * Report what fraction of a conversation fits into a token budget.
 *
 * @param messages - Conversation messages.
 * @param max_tokens - Token budget.
 * @returns `max_tokens` divided by the estimated conversation size (content
 *   estimate plus 4 tokens per message), capped at 1.
 */
export function calculateCompressionRatio(messages: Message[], max_tokens: number): number {
  let totalTokens = 0;

  for (const message of messages) {
    const text =
      typeof message.content === 'string' ? message.content : JSON.stringify(message.content);
    totalTokens += estimateTokens(text) + 4;
  }

  const fraction = max_tokens / totalTokens;
  return Math.min(1, fraction);
}
317
+
318
/** Bundle of this module's public helpers, exposed as the default export. */
const compressionUtils = {
  isonEncode,
  isonDecode,
  compressText,
  truncateMessages,
  truncateToTokenBudget,
  calculateCompressionRatio,
};

export default compressionUtils;
@@ -0,0 +1,221 @@
1
+ /**
2
+ * TMLPD Reliability Engine
3
+ *
4
+ * Circuit breaker, retry with jitter, and enhanced cooldown logic.
5
+ * Designed to handle flaky API calls gracefully.
6
+ */
7
+
8
/** Tunables for `withRetry` and `calculateRetryDelay`. */
export interface RetryConfig {
  /** Upper bound on how many times `withRetry` runs its loop. */
  max_attempts: number;

  /** Delay before the first retry, in milliseconds; doubled for each later attempt. */
  base_delay_ms: number;

  /** Cap applied to the exponential delay, in milliseconds. */
  max_delay_ms: number;

  /** 0-1, percentage of delay to randomize. */
  jitter: number;

  /** Status codes for which a failed call is retried. */
  retryable_status_codes: number[];
}
15
+
16
/** Tunables for `CircuitBreaker`. */
export interface CircuitBreakerConfig {
  /** Number of recorded failures at which a closed circuit opens. */
  failure_threshold: number;

  /** Time an open circuit waits after its last failure before going half-open, in milliseconds. */
  recovery_timeout_ms: number;

  /** Number of successes a half-open circuit needs before it closes again. */
  half_open_max_calls: number;
}
21
+
22
/** Snapshot of a `CircuitBreaker`, as returned by `getState()`. */
export interface CircuitState {
  /** Current mode of the circuit. */
  status: "closed" | "open" | "half_open";

  /** Failures recorded since the counter was last reset. */
  failure_count: number;

  /** `Date.now()` timestamp of the most recent recorded failure, or null if none. */
  last_failure_time: number | null;

  /** `Date.now()` timestamp of the most recent recorded success, or null if none. */
  last_success_time: number | null;

  /** Successes recorded in a row while the circuit is half-open. */
  consecutive_successes: number;
}
29
+
30
/** Retry settings used when a caller supplies none (or only some) of them. */
export const DEFAULT_RETRY_CONFIG: RetryConfig = {
  max_attempts: 3,
  base_delay_ms: 500,
  max_delay_ms: 30000,
  jitter: 0.3,
  retryable_status_codes: [
    408,
    429,
    500,
    502,
    503,
    504,
  ],
};
37
+
38
/** Circuit breaker settings used when a caller supplies none (or only some) of them. */
export const DEFAULT_CIRCUIT_BREAKER_CONFIG: CircuitBreakerConfig = {
  // Failures needed to open the circuit.
  failure_threshold: 5,
  // One minute before an open circuit is probed again.
  recovery_timeout_ms: 60000,
  // Successes needed in half-open state to close the circuit.
  half_open_max_calls: 3,
};
43
+
44
/**
 * Calculate delay with exponential backoff and jitter.
 *
 * The base delay doubles with every attempt and is capped at
 * `config.max_delay_ms`. A random offset of up to `config.jitter` times the
 * capped delay is then added or subtracted, and the result is clamped so it
 * is never negative and never exceeds `config.max_delay_ms`.
 *
 * @param attempt - 1-based attempt number (1 yields the base delay).
 * @param config - Retry settings; defaults to `DEFAULT_RETRY_CONFIG`.
 * @returns Delay in whole milliseconds, within `[0, config.max_delay_ms]`.
 */
export function calculateRetryDelay(
  attempt: number,
  config: RetryConfig = DEFAULT_RETRY_CONFIG
): number {
  // Exponential backoff, capped at the configured maximum.
  const exponential_delay = config.base_delay_ms * Math.pow(2, attempt - 1);
  const capped_delay = Math.min(exponential_delay, config.max_delay_ms);

  // Symmetric jitter: a uniform offset in [-jitter_range, +jitter_range].
  const jitter_range = capped_delay * config.jitter;
  const jitter = (Math.random() * 2 - 1) * jitter_range;

  // Re-apply the bounds after jitter; without this, positive jitter pushes
  // the delay past max_delay_ms and a jitter above 1 can make it negative.
  const bounded_delay = Math.min(config.max_delay_ms, Math.max(0, capped_delay + jitter));

  return Math.round(bounded_delay);
}
63
+
64
/**
 * Decide whether a failed call is worth retrying.
 *
 * @param statusCode - Status code of the failure, or null when there is none.
 * @param config - Retry settings; defaults to `DEFAULT_RETRY_CONFIG`.
 * @returns true when there is no status code (treated as a network error) or
 *   when the code is listed in `config.retryable_status_codes`.
 */
export function isRetryableStatus(statusCode: number | null, config: RetryConfig = DEFAULT_RETRY_CONFIG): boolean {
  const isNetworkError = statusCode === null;
  return isNetworkError || config.retryable_status_codes.includes(statusCode);
}
71
+
72
/**
 * Circuit Breaker implementation.
 *
 * States:
 * - "closed": calls are allowed; failures are counted and any success
 *   resets the count, so only consecutive failures open the circuit.
 * - "open": calls are refused until `recovery_timeout_ms` has passed since
 *   the last recorded failure.
 * - "half_open": trial calls are allowed; `half_open_max_calls` successes in
 *   a row close the circuit, a single failure re-opens it.
 *
 * Callers are expected to ask `canExecute()` before a call and report the
 * outcome with `recordSuccess()` or `recordFailure()`.
 */
export class CircuitBreaker {
  private config: CircuitBreakerConfig;
  private state: CircuitState;
  private half_open_calls = 0;

  /**
   * @param config - Overrides merged over `DEFAULT_CIRCUIT_BREAKER_CONFIG`.
   */
  constructor(config: Partial<CircuitBreakerConfig> = {}) {
    this.config = { ...DEFAULT_CIRCUIT_BREAKER_CONFIG, ...config };
    this.state = {
      status: "closed",
      failure_count: 0,
      last_failure_time: null,
      last_success_time: null,
      consecutive_successes: 0,
    };
  }

  /**
   * Check if circuit allows requests.
   *
   * Not a pure query: an open circuit whose recovery timeout has elapsed is
   * moved to half-open by this call.
   */
  canExecute(): boolean {
    if (this.state.status === "closed") return true;

    if (this.state.status === "open") {
      const lastFailure = this.state.last_failure_time;
      // Compare against null explicitly: a timestamp of 0 is a valid time
      // (e.g. under a mocked clock) and must not block recovery forever.
      const cooledDown =
        lastFailure !== null && Date.now() - lastFailure >= this.config.recovery_timeout_ms;

      if (!cooledDown) return false;

      this.state.status = "half_open";
      this.half_open_calls = 0;
      return true;
    }

    // half_open
    return this.half_open_calls < this.config.half_open_max_calls;
  }

  /**
   * Record a successful execution.
   */
  recordSuccess(): void {
    this.state.last_success_time = Date.now();
    this.half_open_calls++;

    if (this.state.status !== "half_open") {
      this.state.failure_count = 0;
      return;
    }

    this.state.consecutive_successes++;
    if (this.state.consecutive_successes >= this.config.half_open_max_calls) {
      // Circuit recovered
      this.state.status = "closed";
      this.state.failure_count = 0;
      this.state.consecutive_successes = 0;
    }
  }

  /**
   * Record a failed execution.
   */
  recordFailure(): void {
    this.state.last_failure_time = Date.now();
    this.state.failure_count++;
    this.state.consecutive_successes = 0;

    // A failed trial call re-opens the circuit immediately; otherwise it
    // opens once the failure threshold is reached.
    const trialFailed = this.state.status === "half_open";
    if (trialFailed || this.state.failure_count >= this.config.failure_threshold) {
      this.state.status = "open";
    }
  }

  /**
   * Get current circuit state (a shallow copy, safe for the caller to modify).
   */
  getState(): CircuitState {
    return { ...this.state };
  }

  /**
   * Force reset circuit to its initial closed state.
   */
  reset(): void {
    this.state = {
      status: "closed",
      failure_count: 0,
      last_failure_time: null,
      last_success_time: null,
      consecutive_successes: 0,
    };
    this.half_open_calls = 0;
  }
}
168
+
169
/**
 * Pull an HTTP-style status code out of an arbitrary thrown value.
 *
 * Looks at `statusCode`, `response.statusCode`, `status` and
 * `response.status`, in that order, and returns the first non-zero numeric
 * value (numeric strings are accepted). Returns null when the value is not
 * an object or carries no usable code.
 */
function extractStatusCode(error: unknown): number | null {
  if (typeof error !== "object" || error === null) return null;

  const source = error as {
    statusCode?: unknown;
    status?: unknown;
    response?: { statusCode?: unknown; status?: unknown } | null;
  };
  const candidates = [
    source.statusCode,
    source.response?.statusCode,
    source.status,
    source.response?.status,
  ];

  for (const candidate of candidates) {
    const code = typeof candidate === "string" ? Number(candidate) : candidate;
    if (typeof code === "number" && Number.isFinite(code) && code !== 0) {
      return code;
    }
  }
  return null;
}

/**
 * Enhanced retry wrapper with circuit breaker integration.
 *
 * Calls `fn` up to `max_attempts` times, sleeping for
 * `calculateRetryDelay(...)` between attempts. The function never rejects:
 * the outcome is always reported through the returned object.
 *
 * - A failure whose status code is not retryable ends the loop immediately
 *   and is not reported to the circuit breaker.
 * - A failure with no status code is treated as a network error and retried.
 * - If the circuit breaker refuses a call, the function returns at once with
 *   `circuit_tripped: true` and an "Circuit breaker is open" error. The
 *   refusal is not recorded as a failure, because doing so would keep
 *   postponing the breaker's recovery, and no backoff sleep is spent on it.
 *
 * @param fn - Operation to run.
 * @param config - Overrides merged over `DEFAULT_RETRY_CONFIG`.
 * @param circuitBreaker - Optional breaker consulted before every attempt
 *   and informed of every success and retryable failure.
 * @returns `result` on success or `error` on failure, `attempts` (number of
 *   times `fn` was actually invoked) and whether the breaker refused a call.
 */
export async function withRetry<T>(
  fn: () => Promise<T>,
  config: Partial<RetryConfig> = {},
  circuitBreaker?: CircuitBreaker
): Promise<{ result: T | null; error: Error | null; attempts: number; circuit_tripped: boolean }> {
  const retryConfig = { ...DEFAULT_RETRY_CONFIG, ...config };
  let lastError: Error | null = null;
  let attempts = 0;

  for (let i = 0; i < retryConfig.max_attempts; i++) {
    // Fail fast while the circuit is open instead of retrying into it.
    if (circuitBreaker && !circuitBreaker.canExecute()) {
      return {
        result: null,
        error: new Error("Circuit breaker is open"),
        attempts,
        circuit_tripped: true,
      };
    }

    attempts++;

    try {
      const result = await fn();
      circuitBreaker?.recordSuccess();
      return { result, error: null, attempts, circuit_tripped: false };
    } catch (error) {
      lastError = error instanceof Error ? error : new Error(String(error));

      // Check if should retry
      const statusCode = extractStatusCode(error);
      if (!isRetryableStatus(statusCode, retryConfig)) {
        return { result: null, error: lastError, attempts, circuit_tripped: false };
      }

      circuitBreaker?.recordFailure();

      // Don't wait after last attempt
      if (i < retryConfig.max_attempts - 1) {
        const delay = calculateRetryDelay(i + 1, retryConfig);
        await new Promise((resolve) => setTimeout(resolve, delay));
      }
    }
  }

  return { result: null, error: lastError, attempts, circuit_tripped: false };
}