autotel 4.1.0 → 4.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (154) hide show
  1. package/package.json +1 -2
  2. package/src/attribute-redacting-processor.test.ts +0 -763
  3. package/src/attribute-redacting-processor.ts +0 -621
  4. package/src/attributes/attachers.ts +0 -161
  5. package/src/attributes/builders.ts +0 -529
  6. package/src/attributes/domains.ts +0 -42
  7. package/src/attributes/index.ts +0 -81
  8. package/src/attributes/registry.ts +0 -323
  9. package/src/attributes/types.ts +0 -211
  10. package/src/attributes/utils.ts +0 -64
  11. package/src/attributes/validators.ts +0 -266
  12. package/src/attributes.test.ts +0 -292
  13. package/src/auto.ts +0 -67
  14. package/src/autotel-logger.test.ts +0 -548
  15. package/src/autotel-logger.ts +0 -364
  16. package/src/baggage-span-processor.test.ts +0 -202
  17. package/src/baggage-span-processor.ts +0 -100
  18. package/src/business-baggage.test.ts +0 -500
  19. package/src/business-baggage.ts +0 -669
  20. package/src/circuit-breaker.test.ts +0 -341
  21. package/src/circuit-breaker.ts +0 -184
  22. package/src/config.test.ts +0 -94
  23. package/src/config.ts +0 -172
  24. package/src/correlated-events.test.ts +0 -151
  25. package/src/correlated-events.ts +0 -47
  26. package/src/correlation-id.test.ts +0 -163
  27. package/src/correlation-id.ts +0 -206
  28. package/src/db.test.ts +0 -252
  29. package/src/db.ts +0 -447
  30. package/src/decorators.test.ts +0 -153
  31. package/src/decorators.ts +0 -188
  32. package/src/define-event.test.ts +0 -41
  33. package/src/define-event.ts +0 -58
  34. package/src/devtools.ts +0 -60
  35. package/src/drain-pipeline.test.ts +0 -68
  36. package/src/drain-pipeline.ts +0 -199
  37. package/src/drain-toolkit.test.ts +0 -113
  38. package/src/drain-toolkit.ts +0 -129
  39. package/src/enricher-toolkit.test.ts +0 -67
  40. package/src/enricher-toolkit.ts +0 -79
  41. package/src/enrichers.test.ts +0 -150
  42. package/src/enrichers.ts +0 -145
  43. package/src/env-config.test.ts +0 -323
  44. package/src/env-config.ts +0 -309
  45. package/src/error-catalog.test.ts +0 -133
  46. package/src/error-catalog.ts +0 -262
  47. package/src/event-queue.test.ts +0 -864
  48. package/src/event-queue.ts +0 -699
  49. package/src/event-subscriber.ts +0 -262
  50. package/src/event-testing.ts +0 -197
  51. package/src/event.test.ts +0 -1104
  52. package/src/event.ts +0 -988
  53. package/src/events-config.ts +0 -235
  54. package/src/exporters.ts +0 -165
  55. package/src/filtering-span-processor.test.ts +0 -281
  56. package/src/filtering-span-processor.ts +0 -111
  57. package/src/flatten-attributes.test.ts +0 -76
  58. package/src/flatten-attributes.ts +0 -80
  59. package/src/functional.strict-types.typecheck.ts +0 -53
  60. package/src/functional.test.ts +0 -1464
  61. package/src/functional.ts +0 -2539
  62. package/src/functional.types.test.ts +0 -135
  63. package/src/hook.mjs +0 -15
  64. package/src/http.test.ts +0 -485
  65. package/src/http.ts +0 -424
  66. package/src/index.ts +0 -433
  67. package/src/init-auto-redactor.test.ts +0 -53
  68. package/src/init-redactor.test.ts +0 -8
  69. package/src/init.customization.test.ts +0 -665
  70. package/src/init.integrations.test.ts +0 -399
  71. package/src/init.openllmetry.test.ts +0 -194
  72. package/src/init.protocol.test.ts +0 -215
  73. package/src/init.ts +0 -2439
  74. package/src/instrumentation.test.ts +0 -108
  75. package/src/instrumentation.ts +0 -319
  76. package/src/logger.test.ts +0 -125
  77. package/src/logger.ts +0 -341
  78. package/src/messaging-adapters.test.ts +0 -595
  79. package/src/messaging-adapters.ts +0 -583
  80. package/src/messaging-testing.test.ts +0 -573
  81. package/src/messaging-testing.ts +0 -935
  82. package/src/messaging.test.ts +0 -1646
  83. package/src/messaging.ts +0 -2245
  84. package/src/metric-helpers.ts +0 -47
  85. package/src/metric-testing.ts +0 -197
  86. package/src/metric.ts +0 -446
  87. package/src/metrics.test.ts +0 -241
  88. package/src/node-require.ts +0 -123
  89. package/src/operation-context.ts +0 -93
  90. package/src/parse-error.test.ts +0 -73
  91. package/src/parse-error.ts +0 -112
  92. package/src/posthog-logs.test.ts +0 -115
  93. package/src/posthog-logs.ts +0 -77
  94. package/src/pretty-console-exporter.test.ts +0 -545
  95. package/src/pretty-console-exporter.ts +0 -413
  96. package/src/pretty-log-formatter.test.ts +0 -123
  97. package/src/pretty-log-formatter.ts +0 -210
  98. package/src/processors/canonical-log-line-processor.test.ts +0 -523
  99. package/src/processors/canonical-log-line-processor.ts +0 -396
  100. package/src/processors.ts +0 -152
  101. package/src/rate-limiter.test.ts +0 -199
  102. package/src/rate-limiter.ts +0 -98
  103. package/src/redact-values.test.ts +0 -90
  104. package/src/redact-values.ts +0 -34
  105. package/src/register.ts +0 -37
  106. package/src/request-logger.test.ts +0 -545
  107. package/src/request-logger.ts +0 -342
  108. package/src/sampling.test.ts +0 -1060
  109. package/src/sampling.ts +0 -737
  110. package/src/security-schema.test.ts +0 -45
  111. package/src/security-schema.ts +0 -107
  112. package/src/semantic-conventions.ts +0 -15
  113. package/src/semantic-helpers.test.ts +0 -226
  114. package/src/semantic-helpers.ts +0 -438
  115. package/src/shutdown.test.ts +0 -364
  116. package/src/shutdown.ts +0 -246
  117. package/src/span-name-normalizer.test.ts +0 -377
  118. package/src/span-name-normalizer.ts +0 -213
  119. package/src/stable-hash.ts +0 -27
  120. package/src/structured-error.test.ts +0 -191
  121. package/src/structured-error.ts +0 -157
  122. package/src/stub.integration.test.ts +0 -361
  123. package/src/tail-sampling-processor.test.ts +0 -230
  124. package/src/tail-sampling-processor.ts +0 -55
  125. package/src/test-span-collector.test.ts +0 -234
  126. package/src/test-span-collector.ts +0 -150
  127. package/src/testing.ts +0 -705
  128. package/src/trace-context.test.ts +0 -73
  129. package/src/trace-context.ts +0 -567
  130. package/src/trace-helpers.new.test.ts +0 -278
  131. package/src/trace-helpers.test.ts +0 -290
  132. package/src/trace-helpers.ts +0 -710
  133. package/src/trace-hybrid.test.ts +0 -42
  134. package/src/trace-hybrid.ts +0 -37
  135. package/src/tracer-provider.test.ts +0 -183
  136. package/src/tracer-provider.ts +0 -266
  137. package/src/track.test.ts +0 -154
  138. package/src/track.ts +0 -216
  139. package/src/validate.test.ts +0 -287
  140. package/src/validate.ts +0 -307
  141. package/src/validation-attributes.ts +0 -43
  142. package/src/validation.test.ts +0 -330
  143. package/src/validation.ts +0 -246
  144. package/src/variable-name-inference.test.ts +0 -178
  145. package/src/variable-name-inference.ts +0 -242
  146. package/src/webhook.test.ts +0 -649
  147. package/src/webhook.ts +0 -637
  148. package/src/workflow-distributed.test.ts +0 -786
  149. package/src/workflow-distributed.ts +0 -916
  150. package/src/workflow.async-safety.integration.test.ts +0 -345
  151. package/src/workflow.test.ts +0 -647
  152. package/src/workflow.ts +0 -810
  153. package/src/yaml-config.test.ts +0 -373
  154. package/src/yaml-config.ts +0 -351
@@ -1,699 +0,0 @@
1
- /**
2
- * Events event queue with batching, backpressure, retry logic, rate limiting, and OTel metrics
3
- *
4
- * Exposes delivery pipeline metrics for observability:
5
- * - autotel.event_delivery.queue.size - Current queue size
6
- * - autotel.event_delivery.queue.oldest_age_ms - Age of oldest event in queue
7
- * - autotel.event_delivery.queue.delivered - Successfully delivered events
8
- * - autotel.event_delivery.queue.failed - Failed event deliveries
9
- * - autotel.event_delivery.queue.dropped - Dropped events with reason
10
- * - autotel.event_delivery.queue.latency_ms - Delivery latency histogram
11
- * - autotel.event_delivery.subscriber.health - Subscriber health (1=healthy, 0=unhealthy)
12
- */
13
-
14
- import type {
15
- Counter,
16
- Histogram,
17
- ObservableGauge,
18
- Attributes,
19
- } from '@opentelemetry/api';
20
- import type { ObservableResult } from '@opentelemetry/api';
21
- import type {
22
- EventSubscriber,
23
- EventAttributes,
24
- AutotelEventContext,
25
- EventSchemaMetadata,
26
- } from './event-subscriber';
27
- import { getLogger } from './init';
28
- import { getConfig as getRuntimeConfig } from './config';
29
- import { TokenBucketRateLimiter, type RateLimiterConfig } from './rate-limiter';
30
- import { getOrCreateCorrelationId } from './correlation-id';
31
-
32
- export interface EventData {
33
- name: string;
34
- attributes?: EventAttributes;
35
- timestamp: number;
36
- /** Internal: correlation ID for debug breadcrumbs */
37
- _correlationId?: string;
38
- /** Internal: trace ID for debug breadcrumbs */
39
- _traceId?: string;
40
- /** Autotel context for trace correlation (passed to subscribers) */
41
- autotel?: AutotelEventContext;
42
- /** Optional schema metadata for contract-aware subscribers. */
43
- schema?: EventSchemaMetadata;
44
- }
45
-
46
- /**
47
- * Drop reasons for event delivery queue metrics
48
- * LOW CARDINALITY: Only these 4 values allowed in metric labels
49
- */
50
- export type EventDropReason =
51
- | 'rate_limit'
52
- | 'circuit_open'
53
- | 'payload_invalid'
54
- | 'shutdown';
55
-
56
- export interface QueueConfig {
57
- maxSize: number; // Max events in queue (default: 50,000)
58
- batchSize: number; // Events per batch (default: 100)
59
- flushInterval: number; // Flush interval in ms (default: 10,000)
60
- maxRetries: number; // Max retry attempts (default: 3)
61
- rateLimit?: RateLimiterConfig; // Optional rate limiting (default: 100 events/sec)
62
- }
63
-
64
- const DEFAULT_CONFIG: QueueConfig = {
65
- maxSize: 50_000,
66
- batchSize: 100,
67
- flushInterval: 10_000,
68
- maxRetries: 3,
69
- rateLimit: {
70
- maxEventsPerSecond: 100,
71
- burstCapacity: 200,
72
- },
73
- };
74
-
75
- /**
76
- * Metrics for event delivery queue observability
77
- *
78
- * All metrics use low-cardinality labels only:
79
- * - subscriber: stable identifier (e.g., 'posthog', 'mixpanel')
80
- * - reason: one of EventDropReason values
81
- */
82
- interface EventQueueMetrics {
83
- /** Current queue size (observable gauge) */
84
- queueSize: ObservableGauge;
85
- /** Age of oldest event in queue in ms (observable gauge) */
86
- oldestAge: ObservableGauge;
87
- /** Successfully delivered events (counter) */
88
- delivered: Counter;
89
- /** Failed event deliveries after all retries (counter) */
90
- failed: Counter;
91
- /** Dropped events (counter with reason label) */
92
- dropped: Counter;
93
- /** Event delivery latency histogram in ms */
94
- latency: Histogram;
95
- /** Subscriber health: 1=healthy, 0=unhealthy (observable gauge) */
96
- subscriberHealth: ObservableGauge;
97
- }
98
-
99
- /**
100
- * Get subscriber name for metrics (stable, low-cardinality)
101
- *
102
- * Priority:
103
- * 1. Explicit config: subscriber.name
104
- * 2. Class static property (if available)
105
- * 3. Fallback: lowercase class name without "Subscriber" suffix
106
- */
107
- function getSubscriberName(subscriber: EventSubscriber): string {
108
- // Use explicit name if provided
109
- if (subscriber.name) {
110
- return subscriber.name.toLowerCase();
111
- }
112
-
113
- // Fallback: derive from class name
114
- const className = subscriber.constructor?.name || 'unknown';
115
- return className.replace(/Subscriber$/i, '').toLowerCase();
116
- }
117
-
118
- /**
119
- * Events queue with batching and backpressure
120
- *
121
- * Features:
122
- * - Batches events for efficient sending
123
- * - Bounded queue with drop-oldest policy (prod) or blocking (dev)
124
- * - Exponential backoff retry
125
- * - Rate limiting to prevent overwhelming subscribers
126
- * - Graceful flush on shutdown
127
- */
128
- export class EventQueue {
129
- private queue: EventData[] = [];
130
- private flushTimer: NodeJS.Timeout | null = null;
131
- private readonly config: QueueConfig;
132
- private readonly subscribers: EventSubscriber[];
133
- private readonly rateLimiter: TokenBucketRateLimiter | null;
134
- private flushPromise: Promise<void> | null = null;
135
- private isShuttingDown = false;
136
-
137
- // Metrics
138
- private metrics: EventQueueMetrics | null = null;
139
-
140
- // Observable callback cleanup functions
141
- private observableCleanups: Array<() => void> = [];
142
-
143
- // Subscriber health tracking (for observable gauges)
144
- private subscriberHealthy: Map<string, boolean> = new Map();
145
-
146
- constructor(subscribers: EventSubscriber[], config?: Partial<QueueConfig>) {
147
- this.subscribers = subscribers;
148
- this.config = { ...DEFAULT_CONFIG, ...config };
149
-
150
- // Initialize rate limiter if configured
151
- this.rateLimiter = this.config.rateLimit
152
- ? new TokenBucketRateLimiter(this.config.rateLimit)
153
- : null;
154
-
155
- // Initialize subscriber health tracking
156
- for (const subscriber of subscribers) {
157
- const name = getSubscriberName(subscriber);
158
- this.subscriberHealthy.set(name, true);
159
- }
160
-
161
- // Initialize metrics
162
- this.initMetrics();
163
- }
164
-
165
- /**
166
- * Initialize OTel metrics for queue observability
167
- */
168
- private initMetrics(): void {
169
- const runtimeConfig = getRuntimeConfig();
170
- const meter = runtimeConfig.meter;
171
-
172
- // Queue size gauge - observe current queue length
173
- const queueSize = meter.createObservableGauge(
174
- 'autotel.event_delivery.queue.size',
175
- {
176
- description: 'Current number of events in the delivery queue',
177
- unit: 'count',
178
- },
179
- );
180
- const queueSizeCallback = (observableResult: ObservableResult) => {
181
- observableResult.observe(this.queue.length);
182
- };
183
- queueSize.addCallback(queueSizeCallback);
184
- this.observableCleanups.push(() =>
185
- queueSize.removeCallback(queueSizeCallback),
186
- );
187
-
188
- // Oldest event age gauge - observe wait time of oldest event
189
- const oldestAge = meter.createObservableGauge(
190
- 'autotel.event_delivery.queue.oldest_age_ms',
191
- {
192
- description: 'Age of the oldest event in the queue in milliseconds',
193
- unit: 'ms',
194
- },
195
- );
196
- const oldestAgeCallback = (observableResult: ObservableResult) => {
197
- if (this.queue.length > 0) {
198
- const oldest = this.queue[0]!;
199
- const ageMs = Date.now() - oldest.timestamp;
200
- observableResult.observe(ageMs);
201
- } else {
202
- observableResult.observe(0);
203
- }
204
- };
205
- oldestAge.addCallback(oldestAgeCallback);
206
- this.observableCleanups.push(() =>
207
- oldestAge.removeCallback(oldestAgeCallback),
208
- );
209
-
210
- // Delivered counter
211
- const delivered = meter.createCounter(
212
- 'autotel.event_delivery.queue.delivered',
213
- {
214
- description: 'Number of events successfully delivered to subscribers',
215
- unit: 'count',
216
- },
217
- );
218
-
219
- // Failed counter
220
- const failed = meter.createCounter('autotel.event_delivery.queue.failed', {
221
- description:
222
- 'Number of events that failed delivery after all retry attempts',
223
- unit: 'count',
224
- });
225
-
226
- // Dropped counter (with reason label)
227
- const dropped = meter.createCounter(
228
- 'autotel.event_delivery.queue.dropped',
229
- {
230
- description: 'Number of events dropped from the queue',
231
- unit: 'count',
232
- },
233
- );
234
-
235
- // Latency histogram
236
- const latency = meter.createHistogram(
237
- 'autotel.event_delivery.queue.latency_ms',
238
- {
239
- description: 'Event delivery latency from enqueue to successful send',
240
- unit: 'ms',
241
- },
242
- );
243
-
244
- // Subscriber health gauge
245
- const subscriberHealth = meter.createObservableGauge(
246
- 'autotel.event_delivery.subscriber.health',
247
- {
248
- description: 'Subscriber health status (1=healthy, 0=unhealthy)',
249
- unit: '1',
250
- },
251
- );
252
- const subscriberHealthCallback = (observableResult: ObservableResult) => {
253
- for (const [subscriberName, isHealthy] of this.subscriberHealthy) {
254
- observableResult.observe(isHealthy ? 1 : 0, {
255
- subscriber: subscriberName,
256
- });
257
- }
258
- };
259
- subscriberHealth.addCallback(subscriberHealthCallback);
260
- this.observableCleanups.push(() =>
261
- subscriberHealth.removeCallback(subscriberHealthCallback),
262
- );
263
-
264
- this.metrics = {
265
- queueSize,
266
- oldestAge,
267
- delivered,
268
- failed,
269
- dropped,
270
- latency,
271
- subscriberHealth,
272
- };
273
- }
274
-
275
- /**
276
- * Record a dropped event with reason and emit debug breadcrumb
277
- */
278
- private recordDropped(
279
- reason: EventDropReason,
280
- event?: EventData,
281
- subscriberName?: string,
282
- ): void {
283
- // Increment metric
284
- const attrs: Attributes = { reason };
285
- if (subscriberName) {
286
- attrs.subscriber = subscriberName;
287
- }
288
- this.metrics?.dropped.add(1, attrs);
289
-
290
- // Debug breadcrumb log (rate-limited via existing logger)
291
- const logLevel = reason === 'payload_invalid' ? 'error' : 'warn';
292
- const logger = getLogger();
293
-
294
- if (logLevel === 'error') {
295
- logger.error(
296
- {
297
- eventName: event?.name,
298
- subscriber: subscriberName,
299
- reason,
300
- correlationId: event?._correlationId,
301
- traceId: event?._traceId,
302
- },
303
- `[autotel] Event dropped: ${reason}`,
304
- );
305
- } else {
306
- logger.warn(
307
- {
308
- eventName: event?.name,
309
- subscriber: subscriberName,
310
- reason,
311
- correlationId: event?._correlationId,
312
- traceId: event?._traceId,
313
- },
314
- `[autotel] Event dropped: ${reason}`,
315
- );
316
- }
317
- }
318
-
319
- /**
320
- * Record permanent delivery failure (after all retries exhausted)
321
- * Increments failed counter and logs error
322
- */
323
- private recordFailed(
324
- event: EventData,
325
- subscriberName: string,
326
- error?: Error,
327
- ): void {
328
- this.metrics?.failed.add(1, { subscriber: subscriberName });
329
-
330
- // Mark subscriber as unhealthy
331
- this.subscriberHealthy.set(subscriberName, false);
332
-
333
- // Debug breadcrumb log
334
- getLogger().error(
335
- {
336
- eventName: event.name,
337
- subscriber: subscriberName,
338
- correlationId: event._correlationId,
339
- traceId: event._traceId,
340
- err: error,
341
- },
342
- `[autotel] Event delivery failed after all retries`,
343
- );
344
- }
345
-
346
- /**
347
- * Mark subscriber as unhealthy on transient failure (without incrementing failed counter)
348
- * Used during retry attempts - only recordFailed should increment the counter
349
- */
350
- private markSubscriberUnhealthy(subscriberName: string): void {
351
- this.subscriberHealthy.set(subscriberName, false);
352
- }
353
-
354
- /**
355
- * Record successful delivery
356
- */
357
- private recordDelivered(
358
- event: EventData,
359
- subscriberName: string,
360
- startTime: number,
361
- ): void {
362
- const latencyMs = Date.now() - startTime;
363
-
364
- this.metrics?.delivered.add(1, { subscriber: subscriberName });
365
- this.metrics?.latency.record(latencyMs, { subscriber: subscriberName });
366
-
367
- // Mark subscriber as healthy
368
- this.subscriberHealthy.set(subscriberName, true);
369
- }
370
-
371
- /**
372
- * Enqueue an event for sending
373
- *
374
- * Backpressure policy:
375
- * - Drops oldest event and logs warning if queue is full (same behavior in all environments)
376
- */
377
- enqueue(event: EventData): void {
378
- // Reject events during shutdown
379
- if (this.isShuttingDown) {
380
- this.recordDropped('shutdown', event);
381
- return;
382
- }
383
-
384
- // Check queue size
385
- if (this.queue.length >= this.config.maxSize) {
386
- // Drop oldest event and log warning (same behavior in all environments)
387
- const droppedEvent = this.queue.shift();
388
- this.recordDropped('rate_limit', droppedEvent);
389
- getLogger().warn(
390
- {
391
- droppedEvent: droppedEvent?.name,
392
- },
393
- `[autotel] Events queue full (${this.config.maxSize} events). ` +
394
- 'Dropping oldest event. Events are being produced faster than they can be sent. ' +
395
- 'Check your subscribers or reduce tracking frequency.',
396
- );
397
- }
398
-
399
- // Enrich event with correlation context for debug breadcrumbs
400
- const enrichedEvent: EventData = {
401
- ...event,
402
- _correlationId: event._correlationId || getOrCreateCorrelationId(),
403
- };
404
-
405
- this.queue.push(enrichedEvent);
406
- this.scheduleBatchFlush();
407
- }
408
-
409
- /**
410
- * Schedule a batch flush if not already scheduled
411
- */
412
- private scheduleBatchFlush(): void {
413
- if (this.flushTimer || this.flushPromise) return;
414
-
415
- this.flushTimer = setTimeout(() => {
416
- this.flushTimer = null;
417
- void this.flushBatch();
418
- }, this.config.flushInterval);
419
- }
420
-
421
- /**
422
- * Flush a batch of events
423
- * Uses promise-based concurrency control to prevent race conditions
424
- */
425
- private async flushBatch(): Promise<void> {
426
- if (this.queue.length === 0) return;
427
-
428
- // If already flushing, wait for existing flush
429
- if (this.flushPromise) {
430
- await this.flushPromise;
431
- return;
432
- }
433
-
434
- this.flushPromise = this.doFlushBatch();
435
-
436
- try {
437
- await this.flushPromise;
438
- } finally {
439
- this.flushPromise = null;
440
-
441
- // Schedule next flush if more events
442
- if (this.queue.length > 0) {
443
- this.scheduleBatchFlush();
444
- }
445
- }
446
- }
447
-
448
- /**
449
- * Internal flush implementation
450
- */
451
- private async doFlushBatch(): Promise<void> {
452
- const batch = this.queue.splice(0, this.config.batchSize);
453
- await this.sendWithRetry(batch, this.config.maxRetries);
454
- }
455
-
456
- /**
457
- * Send events with exponential backoff retry
458
- * Tracks per-event, per-subscriber failures so failed counter reflects actual failed deliveries.
459
- * On retry, only failed (event, subscriber) pairs are re-sent to avoid double-counting delivered.
460
- */
461
- private async sendWithRetry(
462
- events: EventData[],
463
- retriesLeft: number,
464
- subscribersByEventIndex?: Map<number, Set<string>>,
465
- ): Promise<void> {
466
- const failedDeliveries = await this.sendToSubscribers(
467
- events,
468
- subscribersByEventIndex,
469
- );
470
-
471
- if (failedDeliveries.length > 0) {
472
- if (retriesLeft > 0) {
473
- // Retry only events that had at least one failure, and only to subscribers that failed (avoid re-sending to healthy subscribers and double-counting delivered)
474
- const failedEventIndices = new Set(
475
- failedDeliveries.map((f) => f.eventIndex),
476
- );
477
- const failedEventIndicesOrdered = [...failedEventIndices].sort(
478
- (a, b) => a - b,
479
- );
480
- const eventsToRetry = failedEventIndicesOrdered.map(
481
- (i) => events[i],
482
- ) as EventData[];
483
- const failedSubscribersByRetryIndex = new Map<number, Set<string>>();
484
- for (let j = 0; j < failedEventIndicesOrdered.length; j++) {
485
- const origIndex = failedEventIndicesOrdered[j];
486
- const set = new Set<string>();
487
- for (const { eventIndex, subscriberName } of failedDeliveries) {
488
- if (eventIndex === origIndex) set.add(subscriberName);
489
- }
490
- failedSubscribersByRetryIndex.set(j, set);
491
- }
492
- const delay = Math.pow(2, this.config.maxRetries - retriesLeft) * 1000;
493
- await new Promise((resolve) => setTimeout(resolve, delay));
494
- return this.sendWithRetry(
495
- eventsToRetry,
496
- retriesLeft - 1,
497
- failedSubscribersByRetryIndex,
498
- );
499
- } else {
500
- // Give up after max retries - record one failure per (event, subscriber) pair
501
- for (const { eventIndex, subscriberName, error } of failedDeliveries) {
502
- const event = events[eventIndex];
503
- if (event) this.recordFailed(event, subscriberName, error);
504
- }
505
-
506
- const failedSubscriberNames = [
507
- ...new Set(failedDeliveries.map((f) => f.subscriberName)),
508
- ];
509
- getLogger().error(
510
- {
511
- failedSubscribers: failedSubscriberNames,
512
- retriesAttempted: this.config.maxRetries,
513
- },
514
- '[autotel] Failed to send events after retries',
515
- );
516
- }
517
- }
518
- }
519
-
520
- /**
521
- * Send events to configured subscribers with rate limiting and metrics.
522
- * When subscribersByEventIndex is provided (retry path), only those subscribers are tried per event.
523
- * Returns per-event, per-subscriber failures (empty if all succeeded).
524
- */
525
- private async sendToSubscribers(
526
- events: EventData[],
527
- subscribersByEventIndex?: Map<number, Set<string>>,
528
- ): Promise<
529
- Array<{ eventIndex: number; subscriberName: string; error?: Error }>
530
- > {
531
- const failedDeliveries: Array<{
532
- eventIndex: number;
533
- subscriberName: string;
534
- error?: Error;
535
- }> = [];
536
-
537
- const sendOne = async (event: EventData, eventIndex: number) => {
538
- // On retry, only try subscribers that failed for this event (never re-send to healthy subscribers)
539
- const subscriberNames = subscribersByEventIndex?.get(eventIndex);
540
- const failures = await this.sendEventToSubscribers(
541
- event,
542
- subscriberNames ?? undefined,
543
- );
544
- for (const failure of failures) {
545
- failedDeliveries.push({
546
- eventIndex,
547
- subscriberName: failure.subscriberName,
548
- error: failure.error,
549
- });
550
- }
551
- };
552
-
553
- if (!this.rateLimiter) {
554
- for (let i = 0; i < events.length; i++) {
555
- const event = events[i];
556
- if (event) await sendOne(event, i);
557
- }
558
- return failedDeliveries;
559
- }
560
-
561
- for (let i = 0; i < events.length; i++) {
562
- await this.rateLimiter.waitForToken();
563
- const event = events[i];
564
- if (event) await sendOne(event, i);
565
- }
566
-
567
- return failedDeliveries;
568
- }
569
-
570
- /**
571
- * Send a single event to subscribers.
572
- * - When subscriberNames is undefined (initial attempt): send to all subscribers.
573
- * - When subscriberNames is provided (retry): send only to those subscribers (never re-send to healthy ones).
574
- * Returns list of subscribers that failed (empty if all succeeded).
575
- */
576
- private async sendEventToSubscribers(
577
- event: EventData,
578
- subscriberNames?: Set<string>,
579
- ): Promise<Array<{ subscriberName: string; error?: Error }>> {
580
- const startTime = event.timestamp;
581
- const failures: Array<{ subscriberName: string; error?: Error }> = [];
582
-
583
- const subscribersToTry =
584
- subscriberNames === undefined
585
- ? this.subscribers
586
- : this.subscribers.filter((s) =>
587
- subscriberNames.has(getSubscriberName(s)),
588
- );
589
-
590
- const results = await Promise.allSettled(
591
- subscribersToTry.map(async (subscriber) => {
592
- const subscriberName = getSubscriberName(subscriber);
593
-
594
- try {
595
- await subscriber.trackEvent(event.name, event.attributes, {
596
- autotel: event.autotel,
597
- schema: event.schema,
598
- });
599
- this.recordDelivered(event, subscriberName, startTime);
600
- return { subscriberName, success: true };
601
- } catch (error) {
602
- this.markSubscriberUnhealthy(subscriberName);
603
- return {
604
- subscriberName,
605
- success: false,
606
- error: error instanceof Error ? error : undefined,
607
- };
608
- }
609
- }),
610
- );
611
-
612
- for (const result of results) {
613
- if (result.status === 'fulfilled' && !result.value.success) {
614
- failures.push({
615
- subscriberName: result.value.subscriberName,
616
- error: result.value.error,
617
- });
618
- }
619
- }
620
-
621
- return failures;
622
- }
623
-
624
- /**
625
- * Flush all remaining events. Queue remains usable after flush (e.g. for
626
- * auto-flush at root span end). Use shutdown() when tearing down the queue.
627
- */
628
- async flush(): Promise<void> {
629
- // Cancel any pending timer
630
- if (this.flushTimer) {
631
- clearTimeout(this.flushTimer);
632
- this.flushTimer = null;
633
- }
634
-
635
- // Wait for any in-progress flush to complete
636
- if (this.flushPromise) {
637
- await this.flushPromise;
638
- }
639
-
640
- // Flush all remaining batches
641
- while (this.queue.length > 0) {
642
- await this.doFlushBatch();
643
- }
644
- }
645
-
646
- /**
647
- * Flush remaining events and permanently disable the queue (reject new events).
648
- * Use for process/SDK shutdown; use flush() for periodic or span-end drain.
649
- */
650
- async shutdown(): Promise<void> {
651
- this.isShuttingDown = true;
652
- await this.flush();
653
- }
654
-
655
- /**
656
- * Cleanup observable metric callbacks to prevent memory leaks
657
- * Call this when destroying the EventQueue instance
658
- */
659
- cleanup(): void {
660
- // Remove all observable callbacks
661
- for (const cleanupFn of this.observableCleanups) {
662
- try {
663
- cleanupFn();
664
- } catch {
665
- // Ignore cleanup errors
666
- }
667
- }
668
- this.observableCleanups = [];
669
- }
670
-
671
- /**
672
- * Get queue size (for testing/debugging)
673
- */
674
- size(): number {
675
- return this.queue.length;
676
- }
677
-
678
- /**
679
- * Get subscriber health status (for testing/debugging)
680
- */
681
- getSubscriberHealth(): Map<string, boolean> {
682
- return new Map(this.subscriberHealthy);
683
- }
684
-
685
- /**
686
- * Check if a specific subscriber is healthy
687
- */
688
- isSubscriberHealthy(subscriberName: string): boolean {
689
- return this.subscriberHealthy.get(subscriberName.toLowerCase()) ?? true;
690
- }
691
-
692
- /**
693
- * Manually mark a subscriber as healthy or unhealthy
694
- * (used for circuit breaker integration)
695
- */
696
- setSubscriberHealth(subscriberName: string, healthy: boolean): void {
697
- this.subscriberHealthy.set(subscriberName.toLowerCase(), healthy);
698
- }
699
- }