@agent-relay/wrapper 2.0.12 → 2.0.14

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -20,7 +20,7 @@ import { spawn, ChildProcess } from 'node:child_process';
20
20
  import { createConnection, Socket } from 'node:net';
21
21
  import { createHash } from 'node:crypto';
22
22
  import { join, dirname } from 'node:path';
23
- import { existsSync, unlinkSync, mkdirSync, symlinkSync, lstatSync, rmSync, watch, readdirSync } from 'node:fs';
23
+ import { existsSync, unlinkSync, mkdirSync, symlinkSync, lstatSync, rmSync, watch, readdirSync, readlinkSync, writeFileSync, appendFileSync } from 'node:fs';
24
24
  import type { FSWatcher } from 'node:fs';
25
25
  import { getProjectPaths } from '@agent-relay/config/project-namespace';
26
26
  import { getAgentOutboxTemplate } from '@agent-relay/config/relay-file-writer';
@@ -31,7 +31,8 @@ const __filename = fileURLToPath(import.meta.url);
31
31
  const __dirname = dirname(__filename);
32
32
  import { BaseWrapper, type BaseWrapperConfig } from './base-wrapper.js';
33
33
  import { parseSummaryWithDetails, parseSessionEndFromOutput } from './parser.js';
34
- import type { SendPayload, SendMeta } from '@agent-relay/protocol/types';
34
+ import type { SendPayload, SendMeta, Envelope } from '@agent-relay/protocol/types';
35
+ import type { ChannelMessagePayload } from '@agent-relay/protocol/channels';
35
36
  import { findRelayPtyBinary as findRelayPtyBinaryUtil } from '@agent-relay/utils/relay-pty-path';
36
37
  import {
37
38
  type QueuedMessage,
@@ -80,7 +81,17 @@ interface ShutdownRequest {
80
81
  type: 'shutdown';
81
82
  }
82
83
 
83
- type RelayPtyRequest = InjectRequest | StatusRequest | ShutdownRequest;
84
+ /**
85
+ * Send just Enter key (for stuck input recovery)
86
+ * Used when message was written to PTY but Enter wasn't processed
87
+ */
88
+ interface SendEnterRequest {
89
+ type: 'send_enter';
90
+ /** Message ID this is for (for tracking) */
91
+ id: string;
92
+ }
93
+
94
+ type RelayPtyRequest = InjectRequest | StatusRequest | ShutdownRequest | SendEnterRequest;
84
95
 
85
96
  /**
86
97
  * Response types received from relay-pty socket
@@ -116,12 +127,26 @@ interface ShutdownAckResponse {
116
127
  type: 'shutdown_ack';
117
128
  }
118
129
 
130
+ /**
131
+ * Response for SendEnter request (stuck input recovery)
132
+ */
133
+ interface SendEnterResultResponse {
134
+ type: 'send_enter_result';
135
+ /** Message ID this is for */
136
+ id: string;
137
+ /** Whether Enter was sent successfully */
138
+ success: boolean;
139
+ /** Unix timestamp in milliseconds */
140
+ timestamp: number;
141
+ }
142
+
119
143
  type RelayPtyResponse =
120
144
  | InjectResultResponse
121
145
  | StatusResponse
122
146
  | BackpressureResponse
123
147
  | ErrorResponse
124
- | ShutdownAckResponse;
148
+ | ShutdownAckResponse
149
+ | SendEnterResultResponse;
125
150
 
126
151
  /**
127
152
  * Configuration for RelayPtyOrchestrator
@@ -196,6 +221,16 @@ export class RelayPtyOrchestrator extends BaseWrapper {
196
221
  retryCount: number; // Track retry attempts
197
222
  originalBody: string; // Original injection content for retries
198
223
  }> = new Map();
224
+ // Pending SendEnter requests (for stuck input recovery)
225
+ private pendingSendEnter: Map<string, {
226
+ resolve: (verified: boolean) => void;
227
+ timeout: NodeJS.Timeout;
228
+ from: string;
229
+ shortId: string;
230
+ retryCount: number;
231
+ originalBody: string;
232
+ originalResolve: (success: boolean) => void; // Original injection promise resolver
233
+ }> = new Map();
199
234
  private backpressureActive = false;
200
235
  private readyForMessages = false;
201
236
 
@@ -330,18 +365,38 @@ export class RelayPtyOrchestrator extends BaseWrapper {
330
365
 
331
366
  /**
332
367
  * Debug log - only outputs when debug is enabled
368
+ * Writes to log file to avoid polluting TUI output
333
369
  */
334
370
  private log(message: string): void {
335
371
  if (this.config.debug) {
336
- console.log(`[relay-pty-orchestrator:${this.config.name}] ${message}`);
372
+ const logLine = `${new Date().toISOString()} [relay-pty-orchestrator:${this.config.name}] ${message}\n`;
373
+ try {
374
+ const logDir = dirname(this._logPath);
375
+ if (!existsSync(logDir)) {
376
+ mkdirSync(logDir, { recursive: true });
377
+ }
378
+ appendFileSync(this._logPath, logLine);
379
+ } catch {
380
+ // Best-effort logging: file write failures are deliberately ignored here (e.g. during init before _logPath is set); nothing is written to stderr
381
+ }
337
382
  }
338
383
  }
339
384
 
340
385
  /**
341
386
  * Error log - always outputs (errors are important)
387
+ * Writes to log file to avoid polluting TUI output
342
388
  */
343
389
  private logError(message: string): void {
344
- console.error(`[relay-pty-orchestrator:${this.config.name}] ERROR: ${message}`);
390
+ const logLine = `${new Date().toISOString()} [relay-pty-orchestrator:${this.config.name}] ERROR: ${message}\n`;
391
+ try {
392
+ const logDir = dirname(this._logPath);
393
+ if (!existsSync(logDir)) {
394
+ mkdirSync(logDir, { recursive: true });
395
+ }
396
+ appendFileSync(this._logPath, logLine);
397
+ } catch {
398
+ // Best-effort logging: file write failures are deliberately ignored here (e.g. during init before _logPath is set); nothing is written to stderr
399
+ }
345
400
  }
346
401
 
347
402
  /**
@@ -407,20 +462,78 @@ export class RelayPtyOrchestrator extends BaseWrapper {
407
462
  if (!existsSync(linkParent)) {
408
463
  mkdirSync(linkParent, { recursive: true });
409
464
  }
410
- if (existsSync(linkPath)) {
465
+
466
+ // Remove existing path if it exists (file, symlink, or directory)
467
+ // Use lstatSync instead of existsSync to detect broken symlinks
468
+ // (existsSync returns false for broken symlinks, but the symlink itself still exists)
469
+ let pathExists = false;
470
+ try {
471
+ lstatSync(linkPath);
472
+ pathExists = true;
473
+ } catch {
474
+ // Path doesn't exist at all - proceed to create symlink
475
+ }
476
+
477
+ if (pathExists) {
411
478
  try {
412
479
  const stats = lstatSync(linkPath);
413
- if (stats.isSymbolicLink() || stats.isFile()) {
480
+ if (stats.isSymbolicLink()) {
481
+ // Handle both valid and broken symlinks
482
+ try {
483
+ const currentTarget = readlinkSync(linkPath);
484
+ if (currentTarget === targetPath) {
485
+ // Symlink already points to correct target, no need to recreate
486
+ this.log(` Symlink already exists and is correct: ${linkPath} -> ${targetPath}`);
487
+ return;
488
+ }
489
+ } catch {
490
+ // Broken symlink (target doesn't exist) - remove it
491
+ this.log(` Removing broken symlink: ${linkPath}`);
492
+ }
493
+ unlinkSync(linkPath);
494
+ } else if (stats.isFile()) {
414
495
  unlinkSync(linkPath);
415
496
  } else if (stats.isDirectory()) {
497
+ // Force remove directory - this is critical for fixing existing directories
416
498
  rmSync(linkPath, { recursive: true, force: true });
499
+ // Verify removal succeeded using lstatSync to catch broken symlinks
500
+ try {
501
+ lstatSync(linkPath);
502
+ throw new Error(`Failed to remove existing directory: ${linkPath}`);
503
+ } catch (err: any) {
504
+ if (err.code !== 'ENOENT') {
505
+ throw err; // Re-throw if it's not a "doesn't exist" error
506
+ }
507
+ // Path successfully removed
508
+ }
417
509
  }
418
- } catch {
419
- // Ignore cleanup errors
510
+ } catch (err: any) {
511
+ // Log cleanup errors instead of silently ignoring them
512
+ this.logError(` Failed to clean up existing path ${linkPath}: ${err.message}`);
513
+ throw err; // Re-throw to prevent symlink creation on failed cleanup
514
+ }
515
+ }
516
+
517
+ // Create the symlink
518
+ try {
519
+ symlinkSync(targetPath, linkPath);
520
+ // Verify symlink was created correctly
521
+ if (!existsSync(linkPath)) {
522
+ throw new Error(`Symlink creation failed: ${linkPath}`);
420
523
  }
524
+ const verifyStats = lstatSync(linkPath);
525
+ if (!verifyStats.isSymbolicLink()) {
526
+ throw new Error(`Created path is not a symlink: ${linkPath}`);
527
+ }
528
+ const verifyTarget = readlinkSync(linkPath);
529
+ if (verifyTarget !== targetPath) {
530
+ throw new Error(`Symlink points to wrong target: expected ${targetPath}, got ${verifyTarget}`);
531
+ }
532
+ this.log(` Created symlink: ${linkPath} -> ${targetPath}`);
533
+ } catch (err: any) {
534
+ this.logError(` Failed to create symlink ${linkPath} -> ${targetPath}: ${err.message}`);
535
+ throw err;
421
536
  }
422
- symlinkSync(targetPath, linkPath);
423
- this.log(` Created symlink: ${linkPath} -> ${targetPath}`);
424
537
  };
425
538
 
426
539
  // In workspace mode, create symlinks so agents can use canonical path
@@ -445,6 +558,26 @@ export class RelayPtyOrchestrator extends BaseWrapper {
445
558
  this.logError(` Failed to set up outbox: ${err.message}`);
446
559
  }
447
560
 
561
+ // Write MCP identity file so MCP servers can discover their agent name
562
+ // This is needed because Claude Code may not pass through env vars to MCP server processes
563
+ try {
564
+ const projectPaths = getProjectPaths(this.config.cwd);
565
+ const identityDir = join(projectPaths.dataDir);
566
+ if (!existsSync(identityDir)) {
567
+ mkdirSync(identityDir, { recursive: true });
568
+ }
569
+ // Write a per-process identity file keyed by this process's PID (intended to match the PPID an MCP server sees, so it can find its parent's identity - TODO confirm)
570
+ const identityPath = join(identityDir, `mcp-identity-${process.pid}`);
571
+ writeFileSync(identityPath, this.config.name, 'utf-8');
572
+ this.log(` Wrote MCP identity file: ${identityPath}`);
573
+
574
+ // Also write a simple identity file (for single-agent scenarios)
575
+ const simpleIdentityPath = join(identityDir, 'mcp-identity');
576
+ writeFileSync(simpleIdentityPath, this.config.name, 'utf-8');
577
+ } catch (err: any) {
578
+ this.logError(` Failed to write MCP identity file: ${err.message}`);
579
+ }
580
+
448
581
  // Find relay-pty binary
449
582
  const binaryPath = this.findRelayPtyBinary();
450
583
  if (!binaryPath) {
@@ -494,6 +627,12 @@ export class RelayPtyOrchestrator extends BaseWrapper {
494
627
  this.stopProtocolMonitor();
495
628
  this.stopPeriodicReminder();
496
629
 
630
+ // Clear socket reconnect timer
631
+ if (this.socketReconnectTimer) {
632
+ clearTimeout(this.socketReconnectTimer);
633
+ this.socketReconnectTimer = undefined;
634
+ }
635
+
497
636
  // Unregister from memory monitor
498
637
  this.memoryMonitor.unregister(this.config.name);
499
638
  if (this.memoryAlertHandler) {
@@ -625,6 +764,7 @@ export class RelayPtyOrchestrator extends BaseWrapper {
625
764
  ...process.env,
626
765
  ...this.config.env,
627
766
  AGENT_RELAY_NAME: this.config.name,
767
+ RELAY_AGENT_NAME: this.config.name, // MCP server uses this env var
628
768
  AGENT_RELAY_OUTBOX: this._canonicalOutboxPath, // Agents use this for outbox path
629
769
  TERM: 'xterm-256color',
630
770
  },
@@ -1098,6 +1238,16 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1098
1238
  */
1099
1239
  private attemptSocketConnection(timeout: number): Promise<void> {
1100
1240
  return new Promise((resolve, reject) => {
1241
+ // Clean up any existing socket before creating new one
1242
+ // This prevents orphaned sockets with stale event handlers
1243
+ if (this.socket) {
1244
+ // Remove all listeners to prevent the old socket's 'close' event
1245
+ // from triggering another reconnect cycle
1246
+ this.socket.removeAllListeners();
1247
+ this.socket.destroy();
1248
+ this.socket = undefined;
1249
+ }
1250
+
1101
1251
  const timer = setTimeout(() => {
1102
1252
  reject(new Error('Socket connection timeout'));
1103
1253
  }, timeout);
@@ -1114,9 +1264,19 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1114
1264
  reject(err);
1115
1265
  });
1116
1266
 
1267
+ // Handle 'end' event - server closed its write side (half-close)
1268
+ this.socket.on('end', () => {
1269
+ this.socketConnected = false;
1270
+ this.log(` Socket received end (server closed write side)`);
1271
+ });
1272
+
1117
1273
  this.socket.on('close', () => {
1118
1274
  this.socketConnected = false;
1119
1275
  this.log(` Socket closed`);
1276
+ // Auto-reconnect if not intentionally stopped
1277
+ if (this.running && !this.isGracefulStop) {
1278
+ this.scheduleSocketReconnect();
1279
+ }
1120
1280
  });
1121
1281
 
1122
1282
  // Handle incoming data (responses)
@@ -1155,6 +1315,64 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1155
1315
  this.pendingInjections.clear();
1156
1316
  }
1157
1317
 
1318
+ /** Timer for socket reconnection */
1319
+ private socketReconnectTimer?: NodeJS.Timeout;
1320
+ /** Current reconnection attempt count */
1321
+ private socketReconnectAttempt = 0;
1322
+
1323
+ /**
1324
+ * Schedule a socket reconnection attempt with exponential backoff
1325
+ */
1326
+ private scheduleSocketReconnect(): void {
1327
+ const maxAttempts = this.config.socketReconnectAttempts ?? 3;
1328
+
1329
+ // Clear any existing timer
1330
+ if (this.socketReconnectTimer) {
1331
+ clearTimeout(this.socketReconnectTimer);
1332
+ this.socketReconnectTimer = undefined;
1333
+ }
1334
+
1335
+ if (this.socketReconnectAttempt >= maxAttempts) {
1336
+ this.logError(` Socket reconnect failed after ${maxAttempts} attempts`);
1337
+ // Reset counter for future reconnects (processMessageQueue can trigger new cycle)
1338
+ this.socketReconnectAttempt = 0;
1339
+ // Note: socketReconnectTimer is already undefined, allowing processMessageQueue
1340
+ // to trigger a new reconnection cycle when new messages arrive
1341
+ return;
1342
+ }
1343
+
1344
+ this.socketReconnectAttempt++;
1345
+ const delay = Math.min(1000 * Math.pow(2, this.socketReconnectAttempt - 1), 10000); // Max 10s
1346
+
1347
+ this.log(` Scheduling socket reconnect in ${delay}ms (attempt ${this.socketReconnectAttempt}/${maxAttempts})`);
1348
+
1349
+ this.socketReconnectTimer = setTimeout(async () => {
1350
+ // Clear timer reference now that callback is executing
1351
+ this.socketReconnectTimer = undefined;
1352
+
1353
+ if (!this.running || this.isGracefulStop) {
1354
+ return;
1355
+ }
1356
+
1357
+ try {
1358
+ const timeout = this.config.socketConnectTimeoutMs ?? 5000;
1359
+ await this.attemptSocketConnection(timeout);
1360
+ this.log(` Socket reconnected successfully`);
1361
+ this.socketReconnectAttempt = 0; // Reset on success
1362
+
1363
+ // Process any queued messages that were waiting
1364
+ if (this.messageQueue.length > 0 && !this.isInjecting) {
1365
+ this.log(` Processing ${this.messageQueue.length} queued messages after reconnect`);
1366
+ this.processMessageQueue();
1367
+ }
1368
+ } catch (err: any) {
1369
+ this.logError(` Socket reconnect attempt ${this.socketReconnectAttempt} failed: ${err.message}`);
1370
+ // Schedule another attempt
1371
+ this.scheduleSocketReconnect();
1372
+ }
1373
+ }, delay);
1374
+ }
1375
+
1158
1376
  /**
1159
1377
  * Send a request to the socket and optionally wait for response
1160
1378
  */
@@ -1208,6 +1426,13 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1208
1426
  case 'shutdown_ack':
1209
1427
  this.log(` Shutdown acknowledged`);
1210
1428
  break;
1429
+
1430
+ case 'send_enter_result':
1431
+ // Handle SendEnter result (stuck input recovery)
1432
+ this.handleSendEnterResult(response).catch((err: Error) => {
1433
+ this.logError(` Error handling send_enter result: ${err.message}`);
1434
+ });
1435
+ break;
1211
1436
  }
1212
1437
  } catch (err: any) {
1213
1438
  this.logError(` Failed to parse socket response: ${err.message}`);
@@ -1298,7 +1523,6 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1298
1523
 
1299
1524
  // Check if we should retry
1300
1525
  if (pending.retryCount < INJECTION_CONSTANTS.MAX_RETRIES - 1) {
1301
- this.log(` Retrying injection (attempt ${pending.retryCount + 2}/${INJECTION_CONSTANTS.MAX_RETRIES})`);
1302
1526
  clearTimeout(pending.timeout);
1303
1527
  this.pendingInjections.delete(response.id);
1304
1528
 
@@ -1324,40 +1548,56 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1324
1548
  return;
1325
1549
  }
1326
1550
 
1327
- // Re-inject by sending another socket request
1328
- // The original promise will be resolved when this retry completes
1329
- // Prepend [RETRY] to help agent notice this is a retry
1330
- const retryBody = pending.originalBody.startsWith('[RETRY]')
1331
- ? pending.originalBody
1332
- : `[RETRY] ${pending.originalBody}`;
1333
- const retryRequest: InjectRequest = {
1334
- type: 'inject',
1335
- id: response.id,
1336
- from: pending.from,
1337
- body: retryBody,
1338
- priority: 1, // Higher priority for retries
1339
- };
1340
-
1341
- // Create new pending entry with incremented retry count
1342
- const newTimeout = setTimeout(() => {
1343
- this.logError(` Retry timeout for ${pending.shortId}`);
1344
- this.pendingInjections.delete(response.id);
1345
- pending.resolve(false);
1346
- }, 30000);
1347
-
1348
- this.pendingInjections.set(response.id, {
1349
- ...pending,
1350
- timeout: newTimeout,
1351
- retryCount: pending.retryCount + 1,
1352
- originalBody: retryBody, // Use retry body for subsequent retries
1353
- });
1551
+ // On first retry attempt (retryCount === 0), try SendEnter first
1552
+ // This handles the case where message content was written but Enter wasn't processed
1553
+ if (pending.retryCount === 0) {
1554
+ this.log(` Trying SendEnter first for ${pending.shortId} (stuck input recovery)`);
1555
+
1556
+ // Send just the Enter key
1557
+ const sendEnterRequest: SendEnterRequest = {
1558
+ type: 'send_enter',
1559
+ id: response.id,
1560
+ };
1561
+
1562
+ // Track this SendEnter request for verification
1563
+ const sendEnterTimeout = setTimeout(() => {
1564
+ this.logError(` SendEnter timeout for ${pending.shortId}`);
1565
+ this.pendingSendEnter.delete(response.id);
1566
+ // Fall back to full retry after SendEnter timeout
1567
+ this.doFullRetry(response.id, pending);
1568
+ }, 5000); // 5 second timeout for SendEnter
1569
+
1570
+ this.pendingSendEnter.set(response.id, {
1571
+ resolve: (verified: boolean) => {
1572
+ if (verified) {
1573
+ // SendEnter worked!
1574
+ this.injectionMetrics.successWithRetry++;
1575
+ this.injectionMetrics.total++;
1576
+ pending.resolve(true);
1577
+ } else {
1578
+ // SendEnter didn't work, do full retry
1579
+ this.doFullRetry(response.id, pending);
1580
+ }
1581
+ },
1582
+ timeout: sendEnterTimeout,
1583
+ from: pending.from,
1584
+ shortId: pending.shortId,
1585
+ retryCount: pending.retryCount,
1586
+ originalBody: pending.originalBody,
1587
+ originalResolve: pending.resolve,
1588
+ });
1354
1589
 
1355
- this.sendSocketRequest(retryRequest).catch((err) => {
1356
- this.logError(` Retry request failed: ${err.message}`);
1357
- clearTimeout(newTimeout);
1358
- this.pendingInjections.delete(response.id);
1359
- pending.resolve(false);
1360
- });
1590
+ this.sendSocketRequest(sendEnterRequest).catch((err) => {
1591
+ this.logError(` SendEnter request failed: ${err.message}`);
1592
+ clearTimeout(sendEnterTimeout);
1593
+ this.pendingSendEnter.delete(response.id);
1594
+ // Fall back to full retry
1595
+ this.doFullRetry(response.id, pending);
1596
+ });
1597
+ } else {
1598
+ // On subsequent retries (retryCount > 0), do full retry directly
1599
+ this.doFullRetry(response.id, pending);
1600
+ }
1361
1601
  } else {
1362
1602
  // Max retries exceeded
1363
1603
  this.logError(` Message ${pending.shortId} failed after ${INJECTION_CONSTANTS.MAX_RETRIES} attempts - NOT found in output`);
@@ -1389,6 +1629,102 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1389
1629
  // queued/injecting are intermediate states - wait for final status
1390
1630
  }
1391
1631
 
1632
+ /**
1633
+ * Handle SendEnter result (stuck input recovery)
1634
+ * Called when relay-pty responds to a SendEnter request
1635
+ */
1636
+ private async handleSendEnterResult(response: SendEnterResultResponse): Promise<void> {
1637
+ this.log(` handleSendEnterResult: id=${response.id.substring(0, 8)} success=${response.success}`);
1638
+
1639
+ const pendingEnter = this.pendingSendEnter.get(response.id);
1640
+ if (!pendingEnter) {
1641
+ this.log(` No pending SendEnter found for ${response.id.substring(0, 8)}`);
1642
+ return;
1643
+ }
1644
+
1645
+ clearTimeout(pendingEnter.timeout);
1646
+ this.pendingSendEnter.delete(response.id);
1647
+
1648
+ if (!response.success) {
1649
+ this.log(` SendEnter failed for ${pendingEnter.shortId}, will try full retry`);
1650
+ pendingEnter.resolve(false);
1651
+ return;
1652
+ }
1653
+
1654
+ // SendEnter succeeded - wait and verify
1655
+ this.log(` SendEnter sent for ${pendingEnter.shortId}, waiting to verify...`);
1656
+ await sleep(150); // Give time for Enter to be processed
1657
+
1658
+ // Verify the message appeared in output
1659
+ const verified = await verifyInjection(
1660
+ pendingEnter.shortId,
1661
+ pendingEnter.from,
1662
+ async () => this.getCleanOutput()
1663
+ );
1664
+
1665
+ if (verified) {
1666
+ this.log(` Message ${pendingEnter.shortId} verified after SendEnter ✓`);
1667
+ pendingEnter.resolve(true);
1668
+ } else {
1669
+ this.log(` Message ${pendingEnter.shortId} still not verified after SendEnter, will try full retry`);
1670
+ pendingEnter.resolve(false);
1671
+ }
1672
+ }
1673
+
1674
+ /**
1675
+ * Do a full retry with message content (used when SendEnter fails or for subsequent retries)
1676
+ */
1677
+ private doFullRetry(
1678
+ messageId: string,
1679
+ pending: {
1680
+ resolve: (success: boolean) => void;
1681
+ reject: (error: Error) => void;
1682
+ from: string;
1683
+ shortId: string;
1684
+ retryCount: number;
1685
+ originalBody: string;
1686
+ }
1687
+ ): void {
1688
+ this.log(` Doing full retry for ${pending.shortId} (attempt ${pending.retryCount + 2}/${INJECTION_CONSTANTS.MAX_RETRIES})`);
1689
+
1690
+ // Re-inject by sending another socket request
1691
+ // Prepend [RETRY] to help agent notice this is a retry
1692
+ const retryBody = pending.originalBody.startsWith('[RETRY]')
1693
+ ? pending.originalBody
1694
+ : `[RETRY] ${pending.originalBody}`;
1695
+ const retryRequest: InjectRequest = {
1696
+ type: 'inject',
1697
+ id: messageId,
1698
+ from: pending.from,
1699
+ body: retryBody,
1700
+ priority: 1, // Higher priority for retries
1701
+ };
1702
+
1703
+ // Create new pending entry with incremented retry count
1704
+ const newTimeout = setTimeout(() => {
1705
+ this.logError(` Retry timeout for ${pending.shortId}`);
1706
+ this.pendingInjections.delete(messageId);
1707
+ pending.resolve(false);
1708
+ }, 30000);
1709
+
1710
+ this.pendingInjections.set(messageId, {
1711
+ resolve: pending.resolve,
1712
+ reject: pending.reject,
1713
+ timeout: newTimeout,
1714
+ from: pending.from,
1715
+ shortId: pending.shortId,
1716
+ retryCount: pending.retryCount + 1,
1717
+ originalBody: retryBody,
1718
+ });
1719
+
1720
+ this.sendSocketRequest(retryRequest).catch((err) => {
1721
+ this.logError(` Full retry request failed: ${err.message}`);
1722
+ clearTimeout(newTimeout);
1723
+ this.pendingInjections.delete(messageId);
1724
+ pending.resolve(false);
1725
+ });
1726
+ }
1727
+
1392
1728
  /**
1393
1729
  * Handle backpressure notification
1394
1730
  */
@@ -1474,14 +1810,46 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1474
1810
  * Process queued messages
1475
1811
  */
1476
1812
  private async processMessageQueue(): Promise<void> {
1477
- if (!this.readyForMessages || this.backpressureActive || this.isInjecting) {
1478
- return;
1813
+ // Debug: Log blocking conditions when queue has messages
1814
+ if (this.messageQueue.length > 0) {
1815
+ if (!this.readyForMessages) {
1816
+ this.log(` Queue blocked: readyForMessages=false (queue=${this.messageQueue.length})`);
1817
+ return;
1818
+ }
1819
+ if (this.backpressureActive) {
1820
+ this.log(` Queue blocked: backpressure active (queue=${this.messageQueue.length})`);
1821
+ return;
1822
+ }
1823
+ if (this.isInjecting) {
1824
+ // Already injecting - the finally block will process next message
1825
+ // But add a safety timeout in case injection gets stuck
1826
+ const elapsed = this.injectionStartTime > 0 ? Date.now() - this.injectionStartTime : 0;
1827
+ if (elapsed > 35000) {
1828
+ this.logError(` Injection stuck for ${elapsed}ms, forcing reset`);
1829
+ this.isInjecting = false;
1830
+ this.injectionStartTime = 0;
1831
+ }
1832
+ return;
1833
+ }
1479
1834
  }
1480
1835
 
1481
1836
  if (this.messageQueue.length === 0) {
1482
1837
  return;
1483
1838
  }
1484
1839
 
1840
+ // Proactively reconnect socket if disconnected and we have messages to send
1841
+ if (!this.socketConnected && !this.socketReconnectTimer) {
1842
+ this.log(` Socket disconnected, triggering reconnect before processing queue`);
1843
+ this.scheduleSocketReconnect();
1844
+ return; // Wait for reconnection to complete
1845
+ }
1846
+
1847
+ if (!this.socketConnected) {
1848
+ // Reconnection in progress, wait for it
1849
+ this.log(` Queue waiting: socket reconnecting (queue=${this.messageQueue.length})`);
1850
+ return;
1851
+ }
1852
+
1485
1853
  // Check if agent is in editor mode - delay injection if so
1486
1854
  const idleResult = this.idleDetector.checkIdle();
1487
1855
  if (idleResult.inEditorMode) {
@@ -1550,6 +1918,24 @@ export class RelayPtyOrchestrator extends BaseWrapper {
1550
1918
  this.processMessageQueue();
1551
1919
  }
1552
1920
 
1921
+ /**
1922
+ * Override handleIncomingChannelMessage to trigger queue processing.
1923
+ * Without this override, channel messages would be queued but processMessageQueue()
1924
+ * would never be called, causing messages to get stuck until the queue monitor runs.
1925
+ */
1926
+ protected override handleIncomingChannelMessage(
1927
+ from: string,
1928
+ channel: string,
1929
+ body: string,
1930
+ envelope: Envelope<ChannelMessagePayload>
1931
+ ): void {
1932
+ this.log(` === CHANNEL MESSAGE RECEIVED: ${envelope.id.substring(0, 8)} from ${from} on ${channel} ===`);
1933
+ this.log(` Body preview: ${body?.substring(0, 100) ?? '(no body)'}...`);
1934
+ super.handleIncomingChannelMessage(from, channel, body, envelope);
1935
+ this.log(` Queue length after add: ${this.messageQueue.length}`);
1936
+ this.processMessageQueue();
1937
+ }
1938
+
1553
1939
  // =========================================================================
1554
1940
  // Queue monitor - Detect and process stuck messages
1555
1941
  // =========================================================================
@@ -2230,6 +2616,10 @@ Then output: \`->relay-file:spawn\`
2230
2616
  */
2231
2617
  async kill(): Promise<void> {
2232
2618
  this.isGracefulStop = true; // Mark as intentional to prevent crash broadcast
2619
+ if (this.socketReconnectTimer) {
2620
+ clearTimeout(this.socketReconnectTimer);
2621
+ this.socketReconnectTimer = undefined;
2622
+ }
2233
2623
  if (this.relayPtyProcess && !this.relayPtyProcess.killed) {
2234
2624
  this.relayPtyProcess.kill('SIGKILL');
2235
2625
  }