channel-worker 2.5.3 → 2.5.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1340,24 +1340,78 @@ class CommandPoller {
1340
1340
  // Pause on the Renderers tab; profile should stay closed until Resume.
1341
1341
  const isPaused = (r) => r && r.health_state === 'paused'
1342
1342
  && (!r.pause_until || new Date(r.pause_until).getTime() > Date.now());
1343
- const stillOffline = renderers.filter(r => !runningRenderers.includes(r) && !isPaused(r));
1343
+ let stillOffline = renderers.filter(r => !runningRenderers.includes(r) && !isPaused(r));
1344
1344
  const pausedCount = renderers.filter(isPaused).length;
1345
1345
  console.log(`[scene-dispatch] running=${runningRenderers.length} cap=${parallelLimit} (flowkit=${flowkitQ} dom=${domQ}) offline=${stillOffline.length} paused=${pausedCount} queue=${queueCount} names=[${runningRenderers.map(r=>r.name)}]`);
1346
1346
 
1347
- // Launch policy: keep ALL non-paused owned renderers ONLINE whenever
1348
- // there's any queue work — they take turns claiming via the API's
1349
- // per-worker concurrency cap (Worker.parallel_limit). The cap limits
1350
- // CONCURRENT CLAIMS, not the number of profiles kept open: e.g. with
1351
- // parallel_limit=1 + 2 renderers veo01/veo02, both browsers stay open
1352
- // and alternate scene claims. Operator pauses a specific renderer if
1353
- // they want it closed (e.g. while solving captcha).
1347
+ // ROUND-ROBIN ROTATION — when a running renderer just finished its
1348
+ // scene (no in-flight cmd) AND there's at least one OFFLINE sibling
1349
+ // AND queue has more work, close the just-finished one so the next
1350
+ // cycle launches the sibling. Result: scenes alternate veo03 →
1351
+ // veo04 → veo03 → veo04 instead of one renderer claiming
1352
+ // everything. Required for shared-Google-account safety: keeping a
1353
+ // browser idle on Flow page keeps refreshing tokens / pinging
1354
+ // telemetry → Veo flags "2 concurrent sessions per account" → captcha.
1355
+ // Closing it = 0 idle sessions, only 1 active at a time.
1356
+ if (queueCount > 0 && stillOffline.length > 0 && runningRenderers.length > 0) {
1357
+ const stoppedNames = [];
1358
+ for (const r of [...runningRenderers]) {
1359
+ // Skip externally-launched profiles (user opened manually via NST UI)
1360
+ // — we don't own their lifecycle.
1361
+ if (!this._profileLastActivity[r.nst_profile_id]) continue;
1362
+ try {
1363
+ const c = await this.api.rendererHasCommands(r.nst_profile_id);
1364
+ if (c > 0) continue; // busy → keep alive
1365
+ console.log(`[scene-dispatch] Round-robin: closing idle ${r.name} to rotate to sibling`);
1366
+ await this.nst.stopProfile(r.nst_profile_id);
1367
+ delete this._profileLastActivity[r.nst_profile_id];
1368
+ if (r.name) delete this._profileLastActivity[r.name.toLowerCase()];
1369
+ const idx = runningRenderers.indexOf(r);
1370
+ if (idx >= 0) runningRenderers.splice(idx, 1);
1371
+ stoppedNames.push(r.name);
1372
+ // The now-closed renderer becomes a fresh offline candidate for
1373
+ // future cycles (won't relaunch immediately — sibling goes first
1374
+ // because its last_command_assigned_at is older).
1375
+ stillOffline.push(r);
1376
+ } catch (e) {
1377
+ console.warn(`[scene-dispatch] Round-robin close failed for ${r.name}: ${e.message}`);
1378
+ }
1379
+ }
1380
+ if (stoppedNames.length) {
1381
+ console.log(`[scene-dispatch] Round-robin closed: [${stoppedNames.join(',')}] — next launch picks sibling`);
1382
+ }
1383
+ }
1384
+
1385
+ // Sort offline by last_command_assigned_at ASC (most idle first) so
1386
+ // the launcher picks the round-robin partner, not the one that just
1387
+ // finished. API populates last_command_assigned_at on every claim,
1388
+ // so this naturally implements turn-taking across siblings.
1389
+ stillOffline = stillOffline.slice().sort((a, b) => {
1390
+ const ta = a.last_command_assigned_at ? new Date(a.last_command_assigned_at).getTime() : 0;
1391
+ const tb = b.last_command_assigned_at ? new Date(b.last_command_assigned_at).getTime() : 0;
1392
+ return ta - tb;
1393
+ });
1394
+
1395
+ // Launch policy: STRICT parallel_limit cap on physical launches.
1396
+ // With pc2.parallel_limit=1 + 2 renderers (veo03/veo04 share same Veo
1397
+ // Google account), only ONE of them is launched at any time. The
1398
+ // second stays closed until the first finishes / is paused / cap is
1399
+ // bumped. This prevents Google flagging "2 concurrent sessions on
1400
+ // same account" → captcha.
1354
1401
  //
1355
- // Old "Close excess profiles" + parallelLimit-bounded launch logic was
1356
- // removed — they conflated "concurrent claims cap" with "max launched"
1357
- // and forced one of the renderers to sit unlaunched when cap < count.
1358
- const eligibleToLaunch = queueCount > 0 ? stillOffline : [];
1359
- for (const toLaunch of eligibleToLaunch) {
1360
- console.log(`[scene-dispatch] Launching ${toLaunch.name} (queue=${queueCount} running=${runningRenderers.length})`);
1402
+ // Earlier iteration tried "launch all, cap only claims" — that left
1403
+ // both browsers open, both pinging Flow (token refresh, telemetry),
1404
+ // and Veo's per-account session monitor counted them as 2 active
1405
+ // sessions → tripped captcha on the supposedly-idle one.
1406
+ const needNew = Math.max(0, queueCount);
1407
+ const neededLaunches = Math.min(
1408
+ parallelLimit - runningRenderers.length,
1409
+ stillOffline.length,
1410
+ needNew,
1411
+ );
1412
+ for (let li = 0; li < Math.max(0, neededLaunches); li++) {
1413
+ const toLaunch = stillOffline[li];
1414
+ console.log(`[scene-dispatch] Launching ${toLaunch.name} (${runningRenderers.length + li + 1}/${parallelLimit})`);
1361
1415
  try {
1362
1416
  await this._launchRendererProfile(toLaunch);
1363
1417
  runningRenderers.push(toLaunch);
@@ -1388,6 +1442,35 @@ class CommandPoller {
1388
1442
  }
1389
1443
  }
1390
1444
 
1445
+ // Close EXCESS running profiles when count > parallel_limit. Happens
1446
+ // when operator drops the cap (e.g. 2→1 to throttle captcha) — the
1447
+ // already-launched 2nd profile should retire so it doesn't keep
1448
+ // refreshing tokens against the shared Google account. Only close
1449
+ // if it has no in-flight command (let work finish first).
1450
+ if (runningRenderers.length > parallelLimit) {
1451
+ const excess = runningRenderers.length - parallelLimit;
1452
+ const idleRunning = [];
1453
+ for (const r of runningRenderers) {
1454
+ if (!this._profileLastActivity[r.nst_profile_id]) continue;
1455
+ try {
1456
+ const c = await this.api.rendererHasCommands(r.nst_profile_id);
1457
+ if (c === 0) idleRunning.push(r);
1458
+ } catch {}
1459
+ }
1460
+ for (const r of idleRunning.slice(0, excess)) {
1461
+ console.log(`[scene-dispatch] Closing excess ${r.name} (cap=${parallelLimit})`);
1462
+ try {
1463
+ await this.nst.stopProfile(r.nst_profile_id);
1464
+ delete this._profileLastActivity[r.nst_profile_id];
1465
+ if (r.name) delete this._profileLastActivity[r.name.toLowerCase()];
1466
+ const idx = runningRenderers.indexOf(r);
1467
+ if (idx >= 0) runningRenderers.splice(idx, 1);
1468
+ } catch (e) {
1469
+ console.warn(`[scene-dispatch] Failed to close excess ${r.name}: ${e.message}`);
1470
+ }
1471
+ }
1472
+ }
1473
+
1391
1474
  if (runningRenderers.length === 0) {
1392
1475
  this._dispatching = false;
1393
1476
  return;
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "channel-worker",
3
- "version": "2.5.3",
3
+ "version": "2.5.5",
4
4
  "description": "Channel Manager worker daemon — runs on remote machines to execute video pipeline jobs",
5
5
  "main": "lib/daemon.js",
6
6
  "bin": {