npm - omnius - Versions diffs - 1.0.105 → 1.0.106 - Mend

omnius 1.0.105 → 1.0.106

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3)

package/dist/index.js CHANGED

@@ -578020,10 +578020,43 @@ async function needsTextToolMode(modelName, backendUrl2) {
   const hasTools = await checkToolSupport(modelName, backendUrl2);
   return !hasTools;
 }
+function parseNvidiaSmi(stdout) {
+  let total = 0;
+  let free = 0;
+  let name10 = "";
+  const lines = stdout.trim().split("\n").filter(Boolean);
+  for (const line of lines) {
+    const parts = line.split(",").map((s2) => s2.trim());
+    const totMB = parseInt(parts[0] ?? "0", 10);
+    const freeMB = parseInt(parts[1] ?? "0", 10);
+    if (!isNaN(totMB)) total += totMB / 1024;
+    if (!isNaN(freeMB)) free += freeMB / 1024;
+    if (!name10 && parts[2]) name10 = parts[2];
+  }
+  return { total, free, name: name10 };
+}
+function parseRocmSmi(stdout) {
+  let total = 0;
+  let used = 0;
+  let name10 = "";
+  const lines = stdout.trim().split("\n").filter(Boolean);
+  for (const line of lines) {
+    if (line.toLowerCase().startsWith("device") || line.startsWith("=")) continue;
+    const parts = line.split(",").map((s2) => s2.trim());
+    if (parts.length < 3) continue;
+    const usedBytes = parseInt(parts[1] ?? "0", 10);
+    const totBytes = parseInt(parts[2] ?? "0", 10);
+    if (!isNaN(usedBytes)) used += usedBytes / 1024 ** 3;
+    if (!isNaN(totBytes)) total += totBytes / 1024 ** 3;
+    if (!name10 && parts[0]) name10 = parts[0];
+  }
+  return { total, free: Math.max(0, total - used), name: name10 ? `AMD ${name10}` : "AMD GPU" };
+}
 function detectSystemSpecs() {
   let totalRamGB = 0;
   let availableRamGB = 0;
   let gpuVramGB = 0;
+  let availableVramGB = 0;
   let gpuName = "";
   try {
     const memInfo = execSync50("free -b 2>/dev/null || sysctl -n hw.memsize 2>/dev/null", {
@@ -578047,24 +578080,33 @@ function detectSystemSpecs() {
   }
   try {
     const nvidiaSmi = execSync50(
-      "nvidia-smi --query-gpu=memory.total,name --format=csv,noheader,nounits 2>/dev/null",
+      "nvidia-smi --query-gpu=memory.total,memory.free,name --format=csv,noheader,nounits 2>/dev/null",
       { encoding: "utf8", timeout: 5e3 }
     );
-    const lines = nvidiaSmi.trim().split("\n");
-    if (lines.length > 0) {
-      for (const line of lines) {
-        const parts = line.split(",").map((s2) => s2.trim());
-        const vramMB = parseInt(parts[0] ?? "0", 10);
-        if (!isNaN(vramMB)) gpuVramGB += vramMB / 1024;
-        if (!gpuName && parts[1]) gpuName = parts[1];
-      }
-    }
+    const r2 = parseNvidiaSmi(nvidiaSmi);
+    gpuVramGB += r2.total;
+    availableVramGB += r2.free;
+    if (!gpuName && r2.name) gpuName = r2.name;
   } catch {
   }
+  if (gpuVramGB === 0) {
+    try {
+      const rocmSmi = execSync50(
+        "rocm-smi --showmeminfo vram --csv 2>/dev/null",
+        { encoding: "utf8", timeout: 5e3 }
+      );
+      const r2 = parseRocmSmi(rocmSmi);
+      gpuVramGB += r2.total;
+      availableVramGB += r2.free;
+      if (!gpuName && r2.name) gpuName = r2.name;
+    } catch {
+    }
+  }
   return {
     totalRamGB: Math.round(totalRamGB * 10) / 10,
     availableRamGB: Math.round(availableRamGB * 10) / 10,
     gpuVramGB: Math.round(gpuVramGB * 10) / 10,
+    availableVramGB: Math.round(availableVramGB * 10) / 10,
     gpuName
   };
 }
@@ -578072,6 +578114,7 @@ async function detectSystemSpecsAsync() {
   let totalRamGB = 0;
   let availableRamGB = 0;
   let gpuVramGB = 0;
+  let availableVramGB = 0;
   let gpuName = "";
   try {
     const { stdout: memInfo } = await execAsync2(
@@ -578095,24 +578138,33 @@ async function detectSystemSpecsAsync() {
   }
   try {
     const { stdout: nvidiaSmi } = await execAsync2(
-      "nvidia-smi --query-gpu=memory.total,name --format=csv,noheader,nounits 2>/dev/null",
+      "nvidia-smi --query-gpu=memory.total,memory.free,name --format=csv,noheader,nounits 2>/dev/null",
       { timeout: 5e3 }
     );
-    const lines = nvidiaSmi.trim().split("\n");
-    if (lines.length > 0) {
-      for (const line of lines) {
-        const parts = line.split(",").map((s2) => s2.trim());
-        const vramMB = parseInt(parts[0] ?? "0", 10);
-        if (!isNaN(vramMB)) gpuVramGB += vramMB / 1024;
-        if (!gpuName && parts[1]) gpuName = parts[1];
-      }
-    }
+    const r2 = parseNvidiaSmi(nvidiaSmi);
+    gpuVramGB += r2.total;
+    availableVramGB += r2.free;
+    if (!gpuName && r2.name) gpuName = r2.name;
   } catch {
   }
+  if (gpuVramGB === 0) {
+    try {
+      const { stdout: rocmSmi } = await execAsync2(
+        "rocm-smi --showmeminfo vram --csv 2>/dev/null",
+        { timeout: 5e3 }
+      );
+      const r2 = parseRocmSmi(rocmSmi);
+      gpuVramGB += r2.total;
+      availableVramGB += r2.free;
+      if (!gpuName && r2.name) gpuName = r2.name;
+    } catch {
+    }
+  }
   return {
     totalRamGB: Math.round(totalRamGB * 10) / 10,
     availableRamGB: Math.round(availableRamGB * 10) / 10,
     gpuVramGB: Math.round(gpuVramGB * 10) / 10,
+    availableVramGB: Math.round(availableVramGB * 10) / 10,
     gpuName
   };
 }
@@ -578129,7 +578181,8 @@ function recommendModel(specs) {
 }
 function calculateContextWindow(specs, modelSizeGB2, kvBytesPerToken, archMax) {
   const ramBudget = specs.availableRamGB > 0 ? specs.availableRamGB : specs.totalRamGB;
-  const totalAvail = Math.max(specs.gpuVramGB, ramBudget);
+  const vramBudget = specs.availableVramGB > 0 ? specs.availableVramGB : specs.gpuVramGB;
+  const totalAvail = Math.max(vramBudget, ramBudget);
   const remaining = Math.max(0, totalAvail - modelSizeGB2);
   const usableGB = remaining * 0.85;
   let numCtx;

package/npm-shrinkwrap.json CHANGED

@@ -1,12 +1,12 @@
 {
   "name": "omnius",
-  "version": "1.0.105",
+  "version": "1.0.106",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "omnius",
-      "version": "1.0.105",
+      "version": "1.0.106",
       "bundleDependencies": [
         "image-to-ascii"
       ],

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "omnius",
-  "version": "1.0.105",
+  "version": "1.0.106",
   "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
   "type": "module",
   "main": "./dist/index.js",