open-agents-ai 0.185.40 → 0.185.41

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2)
  1. package/dist/index.js +9 -2
  2. package/package.json +1 -1
package/dist/index.js CHANGED
@@ -41395,7 +41395,7 @@ function execAsync(cmd, opts = {}) {
41395
41395
  function selectWeightTier(vramGB) {
41396
41396
  if (vramGB >= 48)
41397
41397
  return "original";
41398
- if (vramGB >= 16)
41398
+ if (vramGB >= 24)
41399
41399
  return "nf4-distilled";
41400
41400
  return "nf4";
41401
41401
  }
@@ -41937,7 +41937,12 @@ print('Converted')
41937
41937
  } catch {
41938
41938
  log("Ollama not detected \u2014 running PersonaPlex standalone (no hybrid)");
41939
41939
  }
41940
- log(`Starting PersonaPlex daemon (${tier} tier${hybridEnabled ? ", hybrid" : ""})...`);
41940
+ const caps = detectPersonaPlexCapability();
41941
+ const needsOffload = caps.vramGB > 0 && caps.vramGB < 24;
41942
+ if (needsOffload) {
41943
+ log(`GPU has ${caps.vramGB.toFixed(0)}GB VRAM \u2014 enabling CPU offload (model needs ~19GB)`);
41944
+ }
41945
+ log(`Starting PersonaPlex daemon (${tier} tier${hybridEnabled ? ", hybrid" : ""}${needsOffload ? ", cpu-offload" : ""})...`);
41941
41946
  const serverArgs = [
41942
41947
  "-m",
41943
41948
  "moshi.server",
@@ -41953,6 +41958,8 @@ print('Converted')
41953
41958
  ];
41954
41959
  if (hybridEnabled)
41955
41960
  serverArgs.push("--hybrid");
41961
+ if (needsOffload)
41962
+ serverArgs.push("--cpu-offload");
41956
41963
  const serverEnv = { ...process.env };
41957
41964
  if (hybridEnabled) {
41958
41965
  serverEnv["HYBRID_ENABLED"] = "1";
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "open-agents-ai",
3
- "version": "0.185.40",
3
+ "version": "0.185.41",
4
4
  "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
5
5
  "type": "module",
6
6
  "main": "./dist/index.js",