open-agents-ai 0.185.40 → 0.185.42

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2)
  1. package/dist/index.js +18 -4
  2. package/package.json +1 -1
package/dist/index.js CHANGED
@@ -41395,7 +41395,7 @@ function execAsync(cmd, opts = {}) {
41395
41395
  function selectWeightTier(vramGB) {
41396
41396
  if (vramGB >= 48)
41397
41397
  return "original";
41398
- if (vramGB >= 16)
41398
+ if (vramGB >= 24)
41399
41399
  return "nf4-distilled";
41400
41400
  return "nf4";
41401
41401
  }
@@ -41499,13 +41499,20 @@ function isPersonaPlexInstalled() {
41499
41499
  return existsSync37(join54(PERSONAPLEX_DIR, "model_ready"));
41500
41500
  }
41501
41501
  function getWeightTier() {
41502
+ const detected = detectPersonaPlexCapability();
41502
41503
  const tierFile = join54(PERSONAPLEX_DIR, "weight_tier");
41503
41504
  if (existsSync37(tierFile)) {
41504
41505
  const saved = readFileSync28(tierFile, "utf8").trim();
41505
- if (saved in WEIGHT_REPOS)
41506
+ if (saved in WEIGHT_REPOS) {
41507
+ const vram = detected.vramGB;
41508
+ if (saved === "nf4-distilled" && vram < 24) {
41509
+ writeFileSync16(tierFile, "nf4");
41510
+ return "nf4";
41511
+ }
41506
41512
  return saved;
41513
+ }
41507
41514
  }
41508
- return detectPersonaPlexCapability().weightTier;
41515
+ return detected.weightTier;
41509
41516
  }
41510
41517
  function getWeightRepoInfo(tier) {
41511
41518
  return WEIGHT_REPOS[tier];
@@ -41937,7 +41944,12 @@ print('Converted')
41937
41944
  } catch {
41938
41945
  log("Ollama not detected \u2014 running PersonaPlex standalone (no hybrid)");
41939
41946
  }
41940
- log(`Starting PersonaPlex daemon (${tier} tier${hybridEnabled ? ", hybrid" : ""})...`);
41947
+ const caps = detectPersonaPlexCapability();
41948
+ const needsOffload = caps.vramGB > 0 && caps.vramGB < 24;
41949
+ if (needsOffload) {
41950
+ log(`GPU has ${caps.vramGB.toFixed(0)}GB VRAM \u2014 enabling CPU offload (model needs ~19GB)`);
41951
+ }
41952
+ log(`Starting PersonaPlex daemon (${tier} tier${hybridEnabled ? ", hybrid" : ""}${needsOffload ? ", cpu-offload" : ""})...`);
41941
41953
  const serverArgs = [
41942
41954
  "-m",
41943
41955
  "moshi.server",
@@ -41953,6 +41965,8 @@ print('Converted')
41953
41965
  ];
41954
41966
  if (hybridEnabled)
41955
41967
  serverArgs.push("--hybrid");
41968
+ if (needsOffload)
41969
+ serverArgs.push("--cpu-offload");
41956
41970
  const serverEnv = { ...process.env };
41957
41971
  if (hybridEnabled) {
41958
41972
  serverEnv["HYBRID_ENABLED"] = "1";
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "open-agents-ai",
3
- "version": "0.185.40",
3
+ "version": "0.185.42",
4
4
  "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
5
5
  "type": "module",
6
6
  "main": "./dist/index.js",