npm - omnius - Versions diffs - 1.0.198 → 1.0.199 - Mend

omnius 1.0.198 → 1.0.199

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

package/dist/index.js +220 -18
package/docs/rest/QUICKREF.md +2 -2
package/docs/rest/auth-and-scopes.md +1 -1
package/docs/rest/endpoints/run.md +2 -2
package/docs/rest/endpoints/tools.md +5 -5
package/npm-shrinkwrap.json +2 -2
package/package.json +1 -1

package/dist/index.js CHANGED Viewed

@@ -260097,6 +260097,31 @@ function approxImageDownloadBytes(preset) {
   }
   return gigabytesToBytes(4);
 }
+function imagePresetDependencyModels(preset, selectedModel) {
+  const models = [
+    selectedModel,
+    preset?.diffusersBaseModel,
+    preset?.textEncoderModel,
+    ...preset?.loraAdapters?.map((adapter) => adapter.repoId) ?? []
+  ].filter((value2) => Boolean(value2 && value2.trim()));
+  return [...new Set(models)];
+}
+function diffusersRunnerModelArgs(model) {
+  const preset = getImageGenerationPreset(model);
+  const runnerModel = preset?.diffusersBaseModel ?? model;
+  const argv = ["--model", runnerModel];
+  if (runnerModel !== model)
+    argv.push("--display-model", model);
+  if (preset?.textEncoderModel) {
+    argv.push("--text-encoder", preset.textEncoderModel);
+    if (preset.textEncoderTarget)
+      argv.push("--text-encoder-target", preset.textEncoderTarget);
+  }
+  for (const adapter of preset?.loraAdapters ?? []) {
+    argv.push("--lora", JSON.stringify(adapter));
+  }
+  return argv;
+}
 async function ensureImageGenerationCacheDirs(repoRoot) {
   const env2 = imageGenerationPythonEnv(repoRoot);
   await Promise.all([
@@ -260228,7 +260253,7 @@ function parseRunnerJson(stdout) {
   }
   return null;
 }
-var DEFAULT_DIFFUSERS_IMAGE_MODEL, DEFAULT_OLLAMA_IMAGE_MODEL, LEGACY_SDXL_TURBO_MODEL, SANA_1_5_1_6B_MODEL, SANA_1_5_4_8B_MODEL, SANA_1_6B_MULTILING_MODEL, SANA_1_6B_2K_MODEL, SANA_1_6B_4K_MODEL, SANA_SPRINT_0_6B_MODEL, SECONDARY_FLUX_DEV_MODEL, SECONDARY_FLUX_DEV_MIRROR_MODEL, SECONDARY_FLUX_DEV_COMFY_MODEL, SECONDARY_FLUX_FILL_MODEL, SECONDARY_FLUX_FILL_FP8_MODEL, SECONDARY_FLUX2_MODEL, OFFICIAL_BFL_ORG, IMAGE_GENERATION_MODEL_REPLACEMENTS, DIFFUSERS_PYTHON_PACKAGES, SDCPP_PYTHON_PACKAGES, IMAGE_GENERATION_MODEL_PRESETS, IMAGE_GENERATION_QUALITY_LADDER, OLLAMA_IMAGE_MODELS, DIFFUSERS_RUNNER, SDCPP_RUNNER, ImageGenerateTool;
+var DEFAULT_DIFFUSERS_IMAGE_MODEL, DEFAULT_OLLAMA_IMAGE_MODEL, LEGACY_SDXL_TURBO_MODEL, SANA_1_5_1_6B_MODEL, SANA_1_5_4_8B_MODEL, SANA_1_6B_MULTILING_MODEL, SANA_1_6B_2K_MODEL, SANA_1_6B_4K_MODEL, SANA_SPRINT_0_6B_MODEL, SECONDARY_FLUX_DEV_MODEL, SECONDARY_FLUX_DEV_MIRROR_MODEL, SECONDARY_FLUX_DEV_COMFY_MODEL, SECONDARY_FLUX_FILL_MODEL, SECONDARY_FLUX_FILL_FP8_MODEL, SECONDARY_FLUX2_MODEL, OFFICIAL_FLUX1_DEV_MODEL, OFFICIAL_FLUX2_KLEIN_9B_MODEL, PONPOKE_FLUX2_UNCENSORED_TEXT_ENCODER_MODEL, LUSTLY_FLUX_UNCENSORED_LORA_MODEL, KENERATE_FLUX_UNCENSORED_LORA_MODEL, OFFICIAL_BFL_ORG, IMAGE_GENERATION_MODEL_REPLACEMENTS, DIFFUSERS_PYTHON_PACKAGES, SDCPP_PYTHON_PACKAGES, IMAGE_GENERATION_MODEL_PRESETS, IMAGE_GENERATION_QUALITY_LADDER, OLLAMA_IMAGE_MODELS, DIFFUSERS_RUNNER, SDCPP_RUNNER, ImageGenerateTool;
 var init_image_generate = __esm({
   "packages/execution/dist/tools/image-generate.js"() {
     "use strict";
@@ -260252,6 +260277,11 @@ var init_image_generate = __esm({
     SECONDARY_FLUX_FILL_MODEL = "diffusers/FLUX.1-Fill-dev-nf4";
     SECONDARY_FLUX_FILL_FP8_MODEL = "boricuapab/flux1-fill-dev-fp8";
     SECONDARY_FLUX2_MODEL = "x/flux2-klein";
+    OFFICIAL_FLUX1_DEV_MODEL = "black-forest-labs/FLUX.1-dev";
+    OFFICIAL_FLUX2_KLEIN_9B_MODEL = "black-forest-labs/FLUX.2-klein-9B";
+    PONPOKE_FLUX2_UNCENSORED_TEXT_ENCODER_MODEL = "ponpoke/flux2-klein-9b-uncensored-text-encoder";
+    LUSTLY_FLUX_UNCENSORED_LORA_MODEL = "lustlyai/Flux_Lustly.ai_Uncensored_nsfw_v1";
+    KENERATE_FLUX_UNCENSORED_LORA_MODEL = "kenerateai/Flux-uncensored";
     OFFICIAL_BFL_ORG = "black-forest-labs";
     IMAGE_GENERATION_MODEL_REPLACEMENTS = /* @__PURE__ */ new Map([
       [officialBflModel("FLUX.1-dev"), SECONDARY_FLUX_DEV_MODEL],
@@ -260274,6 +260304,7 @@ var init_image_generate = __esm({
       "transformers",
       "accelerate",
       "safetensors",
+      "peft",
       "pillow",
       "sentencepiece",
       "protobuf"
@@ -260387,6 +260418,76 @@ var init_image_generate = __esm({
         fallbackFor: [SECONDARY_FLUX_FILL_MODEL],
         note: "Traceable FP8 fallback for FLUX.1 Fill dev from the research package."
       },
+      {
+        id: PONPOKE_FLUX2_UNCENSORED_TEXT_ENCODER_MODEL,
+        label: "FLUX.2 Klein 9B uncensored text encoder",
+        backend: "diffusers",
+        install: 'python3 .omnius/image-gen/diffusers_text2image.py --model black-forest-labs/FLUX.2-klein-9B --text-encoder ponpoke/flux2-klein-9b-uncensored-text-encoder --steps 4 --guidance 1 --width 1024 --height 1024 --prompt "..." --output .omnius/images/out.png',
+        category: "Adult-capable FLUX adapter",
+        sizeClass: "FLUX.2 Klein 9B text-encoder override",
+        quality: "Uncensored FLUX.2 Klein text-encoder override; uses the official FLUX.2 Klein 9B base pipeline and replaces the prompt encoder when the installed Diffusers stack supports that component layout.",
+        minVramGB: 24,
+        recommendedVramGB: 32,
+        deployment: "Diffusers Flux2KleinPipeline over black-forest-labs/FLUX.2-klein-9B with a replacement text encoder. Requires Hugging Face access/license acceptance for the BFL base and the text-encoder repo.",
+        steps: 4,
+        guidance: 1,
+        width: 1024,
+        height: 1024,
+        diffusersBaseModel: OFFICIAL_FLUX2_KLEIN_9B_MODEL,
+        textEncoderModel: PONPOKE_FLUX2_UNCENSORED_TEXT_ENCODER_MODEL,
+        textEncoderTarget: "auto",
+        approxDownloadGB: 36,
+        note: "Adapter-style preset: loads the gated FLUX.2 Klein 9B base and swaps in the ponpoke text encoder. Not in the automatic fallback ladder."
+      },
+      {
+        id: LUSTLY_FLUX_UNCENSORED_LORA_MODEL,
+        label: "Flux Lustly uncensored LoRA",
+        backend: "diffusers",
+        install: `python3 .omnius/image-gen/diffusers_text2image.py --model black-forest-labs/FLUX.1-dev --lora '{"repoId":"lustlyai/Flux_Lustly.ai_Uncensored_nsfw_v1","weightName":"flux_lustly-ai_v1.safetensors","adapterName":"v1","adapterWeight":1}' --steps 20 --guidance 4 --width 768 --height 768 --prompt "..." --output .omnius/images/out.png`,
+        category: "Adult-capable FLUX adapter",
+        sizeClass: "FLUX.1-dev LoRA adapter",
+        quality: "Adult-capable FLUX.1-dev LoRA tested by its publisher on full FLUX dev and schnell. Listed as an explicit opt-in model, not part of automatic fallback.",
+        minVramGB: 16,
+        recommendedVramGB: 24,
+        deployment: "Diffusers LoRA over black-forest-labs/FLUX.1-dev. Requires Hugging Face access/license acceptance for the gated BFL base model and the adapter terms.",
+        steps: 20,
+        guidance: 4,
+        width: 768,
+        height: 768,
+        diffusersBaseModel: OFFICIAL_FLUX1_DEV_MODEL,
+        loraAdapters: [{
+          repoId: LUSTLY_FLUX_UNCENSORED_LORA_MODEL,
+          weightName: "flux_lustly-ai_v1.safetensors",
+          adapterName: "v1",
+          adapterWeight: 1
+        }],
+        approxDownloadGB: 24,
+        note: "Adapter-style preset: loads FLUX.1-dev then applies the Lustly LoRA. Explicit selection only."
+      },
+      {
+        id: KENERATE_FLUX_UNCENSORED_LORA_MODEL,
+        label: "Kenerate Flux uncensored LoRA",
+        backend: "diffusers",
+        install: `python3 .omnius/image-gen/diffusers_text2image.py --model black-forest-labs/FLUX.1-dev --lora '{"repoId":"kenerateai/Flux-uncensored","adapterName":"kenerate","adapterWeight":1}' --steps 20 --guidance 3.5 --width 1024 --height 1024 --prompt "..." --output .omnius/images/out.png`,
+        category: "Adult-capable FLUX adapter",
+        sizeClass: "FLUX.1-dev LoRA adapter",
+        quality: "Community FLUX.1-dev LoRA. Hugging Face currently marks the model card as removed, so availability may fail at download time; kept as a selectable explicit model because the repo still advertises a Diffusers LoRA load path.",
+        minVramGB: 16,
+        recommendedVramGB: 24,
+        deployment: "Diffusers LoRA over black-forest-labs/FLUX.1-dev. Requires Hugging Face access/license acceptance for the gated BFL base model; adapter availability may vary.",
+        steps: 20,
+        guidance: 3.5,
+        width: 1024,
+        height: 1024,
+        diffusersBaseModel: OFFICIAL_FLUX1_DEV_MODEL,
+        loraAdapters: [{
+          repoId: KENERATE_FLUX_UNCENSORED_LORA_MODEL,
+          adapterName: "kenerate",
+          adapterWeight: 1
+        }],
+        approxDownloadGB: 24,
+        note: "Adapter-style preset: loads FLUX.1-dev then applies the Kenerate LoRA. The upstream card says the LoRA has been removed, so failures should be surfaced directly."
+      },
       {
         id: "stabilityai/stable-diffusion-3.5-large",
         label: "Stable Diffusion 3.5 Large",
@@ -260723,6 +260824,13 @@ def _device():
 def _pipeline_class(model):
     lowered = model.lower()
+    if "flux.2" in lowered or "flux2" in lowered or "flux-2" in lowered:
+        try:
+            from diffusers import Flux2KleinPipeline
+            return Flux2KleinPipeline
+        except Exception:
+            from diffusers import DiffusionPipeline
+            return DiffusionPipeline
     if "flux" in lowered:
         from diffusers import FluxPipeline
         return FluxPipeline
@@ -260749,13 +260857,85 @@ def _pipeline_class(model):
 def _large_model(model):
     lowered = model.lower()
     return any(token in lowered for token in [
-        "flux.1", "flux.2", "stable-diffusion-3.5", "hunyuan", "janus",
+        "flux.1", "flux.2", "flux2", "stable-diffusion-3.5", "hunyuan", "janus",
         "sana1.5_4.8b", "sana_1600m_2kpx", "sana_1600m_4kpx",
     ])
+def _parse_lora_specs(raw_specs):
+    specs = []
+    for raw in raw_specs or []:
+        if not raw:
+            continue
+        try:
+            parsed = json.loads(raw)
+            if isinstance(parsed, str):
+                parsed = {"repoId": parsed}
+            if isinstance(parsed, dict) and parsed.get("repoId"):
+                specs.append(parsed)
+        except Exception as exc:
+            raise ValueError(f"Invalid --lora JSON {raw!r}: {exc}")
+    return specs
+def _load_lora_adapters(pipe, specs):
+    adapter_names = []
+    adapter_weights = []
+    for index, spec in enumerate(specs):
+        repo_id = str(spec.get("repoId") or "").strip()
+        if not repo_id:
+            continue
+        kwargs = {}
+        weight_name = str(spec.get("weightName") or "").strip()
+        adapter_name = str(spec.get("adapterName") or f"adapter_{index}").strip()
+        if weight_name:
+            kwargs["weight_name"] = weight_name
+        if adapter_name:
+            kwargs["adapter_name"] = adapter_name
+        _progress("load", f"loading LoRA adapter {repo_id}")
+        pipe.load_lora_weights(repo_id, **kwargs)
+        if adapter_name:
+            adapter_names.append(adapter_name)
+            adapter_weights.append(float(spec.get("adapterWeight", 1.0)))
+    if adapter_names and hasattr(pipe, "set_adapters"):
+        _progress("load", f"activating {len(adapter_names)} LoRA adapter(s)")
+        pipe.set_adapters(adapter_names, adapter_weights=adapter_weights)
+def _target_text_encoder_attrs(pipe, target, repo_id):
+    explicit = str(target or "").strip()
+    if explicit and explicit != "auto":
+        return [explicit]
+    lowered = repo_id.lower()
+    preferred = ["text_encoder_3", "text_encoder_2", "text_encoder"] if ("qwen" in lowered or "flux2" in lowered or "klein" in lowered) else ["text_encoder", "text_encoder_2", "text_encoder_3"]
+    return [name for name in preferred if hasattr(pipe, name)]
+def _tokenizer_attr_for_text_encoder(attr):
+    if attr == "text_encoder":
+        return "tokenizer"
+    if attr.startswith("text_encoder_"):
+        return "tokenizer_" + attr.split("_")[-1]
+    return "tokenizer"
+def _replace_text_encoder(pipe, repo_id, target, dtype):
+    """Swap one text-encoder component of pipe for the model at repo_id.
+    Does nothing when repo_id is empty. The slot used is the first name
+    returned by _target_text_encoder_attrs; the matching tokenizer attribute
+    is replaced as well when the pipeline has one.
+    Raises ValueError when no candidate slot is returned.
+    """
+    if not repo_id:
+        return
+    # Imported after the guard, so this function only touches transformers
+    # when an override was actually requested.
+    from transformers import AutoModel, AutoTokenizer
+    attrs = _target_text_encoder_attrs(pipe, target, repo_id)
+    if not attrs:
+        raise ValueError(f"Pipeline has no text_encoder component compatible with text encoder override {repo_id}")
+    # Only the first (most preferred) candidate slot is replaced.
+    attr = attrs[0]
+    tokenizer_attr = _tokenizer_attr_for_text_encoder(attr)
+    _progress("load", f"loading replacement text encoder {repo_id} into {attr}")
+    # NOTE(review): trust_remote_code=True presumably lets the repo ship custom
+    # loading code that runs locally; confirm that is acceptable for repo ids
+    # that arrive from the command line.
+    tokenizer = AutoTokenizer.from_pretrained(repo_id, trust_remote_code=True)
+    text_encoder = AutoModel.from_pretrained(repo_id, torch_dtype=dtype, trust_remote_code=True)
+    # NOTE(review): the new encoder is not moved to a device here; confirm the
+    # caller places the pipeline on its device after this call.
+    setattr(pipe, attr, text_encoder)
+    if hasattr(pipe, tokenizer_attr):
+        setattr(pipe, tokenizer_attr, tokenizer)
+    else:
+        # Keep going with the pipeline's existing tokenizer attributes and
+        # report that only the encoder was swapped.
+        _progress("load", f"pipeline has no {tokenizer_attr}; replaced {attr} only")
 def main():
     parser = argparse.ArgumentParser()
     parser.add_argument("--model", required=True)
+    parser.add_argument("--display-model", default="")
     parser.add_argument("--prompt", required=True)
     parser.add_argument("--output", required=True)
     parser.add_argument("--width", type=int, default=512)
@@ -260765,6 +260945,9 @@ def main():
     parser.add_argument("--seed", type=int, default=None)
     parser.add_argument("--device", default="auto")
     parser.add_argument("--variant", default="")
+    parser.add_argument("--lora", action="append", default=[])
+    parser.add_argument("--text-encoder", default="")
+    parser.add_argument("--text-encoder-target", default="auto")
     parser.add_argument("--prewarm", action="store_true")
     args = parser.parse_args()
@@ -260793,12 +260976,19 @@ def main():
         pipe = pipeline_cls.from_pretrained(args.model, **kwargs)
     _progress("load", f"model loaded on {device}")
+    if args.text_encoder:
+        _replace_text_encoder(pipe, args.text_encoder, args.text_encoder_target, dtype)
     if "sana" in lowered_model and hasattr(pipe, "text_encoder") and pipe.text_encoder is not None:
         try:
             pipe.text_encoder.to(torch.bfloat16)
         except Exception:
             pass
+    lora_specs = _parse_lora_specs(args.lora)
+    if lora_specs:
+        _load_lora_adapters(pipe, lora_specs)
     if hasattr(pipe, "enable_attention_slicing"):
         try:
             pipe.enable_attention_slicing()
@@ -260817,7 +261007,10 @@ def main():
         print(json.dumps({
             "ok": True,
             "path": "",
-            "model": args.model,
+            "model": args.display_model or args.model,
+            "base_model": args.model,
+            "lora_adapters": [spec.get("repoId") for spec in lora_specs],
+            "text_encoder": args.text_encoder or None,
             "backend": "diffusers",
             "device": device,
             "prewarm": True,
@@ -260853,7 +261046,10 @@ def main():
     print(json.dumps({
         "ok": True,
         "path": str(out),
-        "model": args.model,
+        "model": args.display_model or args.model,
+        "base_model": args.model,
+        "lora_adapters": [spec.get("repoId") for spec in lora_specs],
+        "text_encoder": args.text_encoder or None,
         "backend": "diffusers",
         "device": device,
         "seconds": round(time.perf_counter() - t0, 3),
@@ -260913,7 +261109,7 @@ if __name__ == "__main__":
 `;
     ImageGenerateTool = class {
       name = "generate_image";
-      description = `Generate an image from a text prompt using a local image-generation backend. Supports Ollama image models (x/flux2-klein), Python Diffusers models (Sana 1.5 1.6B default, Sana 1.5 4.8B, Sana multilingual/2K/4K, FLUX.1 dev, SD3.5 Large, SDXL Turbo, Tiny-SD, LCM, Sana Sprint), and stable-diffusion.cpp local checkpoints/GGUF. When fallback is enabled, auto generation tries ranked high-quality candidates first (Sana 1.5 above FLUX so we avoid HF gating), including community FLUX mirrors, and then falls back to smaller models if setup, download, or generation fails. Aspect ratio and resolution are model-controllable: pass aspect_ratio (e.g. "16:9", "9:16", "4:3", "3:4", "1:1", "21:9", "2:3", "3:2") to derive width/height around the selected model's preferred base resolution, or pass explicit width/height (in pixels, both rounded to a multiple of 8) when a specific size is required. A preliminary prompt-expansion stage rewrites the user's prompt into a richer, model-tuned version before generation when an LLM expander is wired; pass expand_prompt=false to skip. Saves a PNG under .omnius/images and returns the file path.`;
+      description = `Generate an image from a text prompt using a local image-generation backend. Supports Ollama image models (x/flux2-klein), Python Diffusers models (Sana 1.5 1.6B default, Sana 1.5 4.8B, Sana multilingual/2K/4K, FLUX.1 dev, FLUX adapter/LoRA presets, SD3.5 Large, SDXL Turbo, Tiny-SD, LCM, Sana Sprint), and stable-diffusion.cpp local checkpoints/GGUF. When fallback is enabled, auto generation tries ranked high-quality candidates first (Sana 1.5 above FLUX so we avoid HF gating), including community FLUX mirrors, and then falls back to smaller models if setup, download, or generation fails. Aspect ratio and resolution are model-controllable: pass aspect_ratio (e.g. "16:9", "9:16", "4:3", "3:4", "1:1", "21:9", "2:3", "3:2") to derive width/height around the selected model's preferred base resolution, or pass explicit width/height (in pixels, both rounded to a multiple of 8) when a specific size is required. A preliminary prompt-expansion stage rewrites the user's prompt into a richer, model-tuned version before generation when an LLM expander is wired; pass expand_prompt=false to skip. Saves a PNG under .omnius/images and returns the file path.`;
       parameters = {
         type: "object",
         properties: {
@@ -261407,7 +261603,7 @@ ${errText.slice(0, 1200)}`,
         try {
           const space = ensureDiskSpaceForDownload({
             approxDownloadBytes: approxBytes,
-            keepRepos: [args.model]
+            keepRepos: imagePresetDependencyModels(preset, args.model)
           });
           if (space.evicted.length > 0) {
             this.emitProgress({
@@ -261442,8 +261638,7 @@ ${errText.slice(0, 1200)}`,
         }
         const result = await runProcess2(python.command, [
           runner,
-          "--model",
-          args.model,
+          ...diffusersRunnerModelArgs(args.model),
           "--prompt",
           "omnius prewarm",
           "--output",
@@ -261617,8 +261812,7 @@ ${errText.slice(0, 800)}`,
         }
         const argv = [
           runner,
-          "--model",
-          args.model,
+          ...diffusersRunnerModelArgs(args.model),
           "--prompt",
           args.prompt,
           "--output",
@@ -261639,7 +261833,7 @@ ${errText.slice(0, 800)}`,
         try {
           const space = ensureDiskSpaceForDownload({
             approxDownloadBytes: approxBytes,
-            keepRepos: [args.model]
+            keepRepos: imagePresetDependencyModels(preset, args.model)
           });
           if (space.evicted.length > 0) {
             this.emitProgress({
@@ -534733,6 +534927,7 @@ __export(dist_exports, {
   imageGenerationDir: () => imageGenerationDir,
   imageGenerationModelPresets: () => imageGenerationModelPresets,
   imageGenerationSetupPlan: () => imageGenerationSetupPlan,
+  imagePresetDependencyModels: () => imagePresetDependencyModels,
   inferAudioGenerationBackend: () => inferAudioGenerationBackend,
   inferImageGenerationBackend: () => inferImageGenerationBackend,
   inferMediaBackend: () => inferMediaBackend,
@@ -586916,9 +587111,9 @@ var init_profiles = __esm({
         encrypted: false,
         created: "2026-03-31T00:00:00Z"
       },
-      "cygnus-regi-tracking": {
-        name: "cygnus-regi-tracking",
-        description: "REGI bookkeeping only — todos, working notes, and completion markers. No filesystem, search, shell, network, or model-generation tools.",
+      "bookkeeping-tracking": {
+        name: "bookkeeping-tracking",
+        description: "Bookkeeping only — todos, working notes, and completion markers. No filesystem, search, shell, network, or model-generation tools.",
         tools: {
           allow: ["todo_write", "todo_read", "working_notes", "task_complete"],
           deny: [
@@ -616212,7 +616407,13 @@ function ollamaModelDiskStats(model, sizes) {
 }
 function imageModelDiskStats(ctx3, preset, ollamaSizes) {
   if (preset.backend === "ollama") return ollamaModelDiskStats(preset.id, ollamaSizes);
-  if (preset.backend === "diffusers") return cachedModelDiskStats(imageGenerationDir(ctx3.repoRoot), preset.id);
+  if (preset.backend === "diffusers") {
+    const root = imageGenerationDir(ctx3.repoRoot);
+    const parts = imagePresetDependencyModels(preset, preset.id).map((model) => cachedModelDiskStats(root, model));
+    const paths = [...new Set(parts.flatMap((part) => part.paths))];
+    const bytes = parts.reduce((sum, part) => sum + part.bytes, 0);
+    return { downloaded: paths.length > 0, bytes, paths };
+  }
   return { downloaded: false, bytes: 0, paths: [] };
 }
 function audioModelDiskStats(ctx3, preset) {
@@ -616238,7 +616439,8 @@ async function deleteImageModelWeights(ctx3, preset) {
   if (preset.backend === "ollama") {
     messages2.push(await deleteOllamaWeights(ctx3, preset.id));
   } else if (preset.backend === "diffusers") {
-    const removed = removeCachedModelPaths(imageGenerationDir(ctx3.repoRoot), preset.id);
+    const root = imageGenerationDir(ctx3.repoRoot);
+    const removed = imagePresetDependencyModels(preset, preset.id).flatMap((model) => removeCachedModelPaths(root, model));
     messages2.push(removed.length > 0 ? `Deleted ${removed.length} cached image model path(s) for ${preset.id}.` : `No cached image weights found for ${preset.id}.`);
   } else {
     messages2.push("stable-diffusion.cpp uses explicit local checkpoint paths; remove the chosen checkpoint file directly if needed.");
@@ -616261,7 +616463,7 @@ async function showImageModelsMenu(ctx3, hasLocal) {
   };
   const items = [
     { key: "setup:ollama", label: "Setup Ollama", detail: "Pull x/z-image-turbo or x/flux2-klein" },
-    { key: "setup:diffusers", label: "Setup Diffusers", detail: "Auto-installs SDXL Turbo under .omnius/image-gen/.venv" },
+    { key: "setup:diffusers", label: "Setup Diffusers", detail: "Auto-installs the shared image runtime and selected Diffusers model" },
     { key: "setup:sdcpp", label: "Setup stable-diffusion.cpp", detail: "CPU/GGUF/checkpoint route" },
     { key: "hdr:models", label: selectColors.dim("─── Models ───") },
     ...imageGenerationModelPresets().map(buildModelItem)
@@ -667079,7 +667281,7 @@ function handleHelp(req2, res) {
         override: "Operators can override per-tool classification via OMNIUS_TOOL_OVERRIDES env var (JSON map of name → partial security info).",
         filters: "GET /v1/tools supports ?category=, ?scope=, ?risk=, ?off_device=true|false (Q9). E.g. /v1/tools?scope=read&off_device=true returns the safe-to-expose set.",
         profiles: "Tool profiles are enforced before tool exposure and again at execution. Resolution order: preset, working_directory/.omnius/profiles, ~/.omnius/profiles. Missing named profiles fail closed.",
-        bookkeeping: "For deterministic tracking, direct-call todo_write, todo_read, working_notes, and task_complete with profile:'cygnus-regi-tracking' and a stable session_id. Do not use /v1/run for bookkeeping-only mutations."
+        bookkeeping: "For deterministic tracking, direct-call todo_write, todo_read, working_notes, and task_complete with profile:'bookkeeping-tracking' and a stable session_id. Do not use /v1/run for bookkeeping-only mutations."
       },
       runtime_keys: {
         "GET /v1/keys": "List runtime keys (admin scope). Secrets masked.",

package/docs/rest/QUICKREF.md CHANGED Viewed

@@ -110,8 +110,8 @@ Deterministic bookkeeping without an agent run:
 ```bash
 curl -s -X POST http://127.0.0.1:11435/v1/tools/todo_write/call \
   -H 'content-type: application/json' \
-  -H 'x-omnius-session-id: regi-turn-123' \
-  -d '{"profile":"cygnus-regi-tracking","args":{"todos":[{"content":"Create NC report","status":"in_progress"}]}}'
+  -H 'x-omnius-session-id: tracking-turn-123' \
+  -d '{"profile":"bookkeeping-tracking","args":{"todos":[{"content":"Create report","status":"in_progress"}]}}'
 ```
 ## Voice TTS

package/docs/rest/auth-and-scopes.md CHANGED Viewed

@@ -88,7 +88,7 @@ Mint body:
 Tool calls are additionally gated by each tool's security metadata. Scope alone is not the only control.
-Runtime keys may bind a tool profile. A run-scope key with profile `cygnus-regi-tracking` can update todos and notes but cannot expose or execute filesystem/search/shell tools.
+Runtime keys may bind a tool profile. A run-scope key with profile `bookkeeping-tracking` can update todos and notes but cannot expose or execute filesystem/search/shell tools.
 ## Request Header

package/docs/rest/endpoints/run.md CHANGED Viewed

@@ -47,8 +47,8 @@ For bookkeeping integrations, prefer direct calls instead of `/v1/run`:
 ```bash
 curl -s -X POST "$OMNIUS/v1/tools/todo_write/call" \
   -H 'content-type: application/json' \
-  -H 'x-omnius-session-id: regi-turn-123' \
-  -d '{"profile":"cygnus-regi-tracking","args":{"todos":[{"content":"Create NC report","status":"in_progress"}]}}'
+  -H 'x-omnius-session-id: tracking-turn-123' \
+  -d '{"profile":"bookkeeping-tracking","args":{"todos":[{"content":"Create report","status":"in_progress"}]}}'
 ```
 ## Abort

package/docs/rest/endpoints/tools.md CHANGED Viewed

@@ -39,7 +39,7 @@ Filters include:
 ?scope=read|run|admin
 ?risk=low|medium|high|critical
 ?limit=200&offset=0
-?profile=cygnus-regi-tracking
+?profile=bookkeeping-tracking
 ```
 Profiles can also be selected with `X-Tool-Profile`. Named profiles resolve in this order: built-in preset, `{working_dir}/.omnius/profiles/{name}.json`, then `~/.omnius/profiles/{name}.json`. Missing profiles fail closed.
@@ -50,10 +50,10 @@ Profiles can also be selected with `X-Tool-Profile`. Named profiles resolve in t
 ```json
 {
-  "session_id": "regi-turn-123",
+  "session_id": "tracking-turn-123",
   "args": {},
   "working_dir": "/path/to/repo",
-  "profile": "cygnus-regi-tracking"
+  "profile": "bookkeeping-tracking"
 }
 ```
@@ -66,8 +66,8 @@ Bookkeeping tools are direct-callable and do not require a model run:
 ```bash
 curl -s -X POST "$OMNIUS/v1/tools/todo_write/call" \
   -H 'content-type: application/json' \
-  -H 'x-omnius-session-id: regi-turn-123' \
-  -d '{"profile":"cygnus-regi-tracking","args":{"todos":[{"content":"Create NC report","status":"in_progress"}]}}'
+  -H 'x-omnius-session-id: tracking-turn-123' \
+  -d '{"profile":"bookkeeping-tracking","args":{"todos":[{"content":"Create report","status":"in_progress"}]}}'
 ```
 Use `todo_write`, `todo_read`, `working_notes`, and `task_complete` this way for deterministic tracking. `task_complete` on this endpoint is only a bookkeeping boundary; `/v1/runs/{id}` remains the canonical run terminal state.

package/npm-shrinkwrap.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "omnius",
-  "version": "1.0.198",
+  "version": "1.0.199",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "omnius",
-      "version": "1.0.198",
+      "version": "1.0.199",
       "bundleDependencies": [
         "image-to-ascii"
       ],

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "omnius",
-  "version": "1.0.198",
+  "version": "1.0.199",
   "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
   "type": "module",
   "main": "./dist/index.js",