npm - @simulatte/doppler - Versions diffs - 0.1.6 → 0.1.8 - Mend

@simulatte/doppler 0.1.6 → 0.1.8

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (355)

package/CHANGELOG.md +145 -0
package/README.md +16 -23
package/package.json +30 -32
package/src/adapters/adapter-registry.js +12 -1
package/src/adapters/lora-loader.js +23 -6
package/src/bridge/extension-client.d.ts +5 -0
package/src/bridge/extension-client.js +40 -0
package/src/bridge/index.d.ts +2 -1
package/src/bridge/index.js +6 -4
package/src/browser/browser-converter.js +31 -1
package/src/browser/file-picker.js +6 -0
package/src/browser/safetensors-parser-browser.js +84 -1
package/src/browser/shard-io-browser.js +2 -2
package/src/browser/tensor-source-download.js +8 -2
package/src/browser/tensor-source-http.d.ts +1 -0
package/src/browser/tensor-source-http.js +5 -1
package/src/client/doppler-api.browser.js +20 -4
package/src/client/doppler-api.js +19 -3
package/src/client/doppler-provider/generation.js +12 -0
package/src/client/doppler-provider/model-manager.d.ts +10 -0
package/src/client/doppler-provider/model-manager.js +91 -19
package/src/client/doppler-provider/source-runtime.d.ts +2 -1
package/src/client/doppler-provider/source-runtime.js +132 -13
package/src/client/doppler-registry.json +5 -20
package/src/config/backward-registry-loader.js +17 -2
package/src/config/execution-v0-contract-check.js +113 -15
package/src/config/kernel-path-contract-check.js +57 -29
package/src/config/kernel-path-loader.d.ts +5 -0
package/src/config/kernel-path-loader.js +18 -36
package/src/config/kernels/kernel-ref-digests.js +1 -1
package/src/config/kernels/registry.js +14 -1
package/src/config/kernels/registry.json +81 -5
package/src/config/loader.d.ts +1 -1
package/src/config/loader.js +15 -2
package/src/config/merge-contract-check.js +66 -4
package/src/config/merge-helpers.js +128 -7
package/src/config/merge.d.ts +1 -0
package/src/config/merge.js +10 -0
package/src/config/param-validator.js +47 -2
package/src/config/presets/kernel-paths/{gemma2-q4k-dequant-f32a.json → gemma2-q4k-dequant-f32a-nosubgroups.json} +3 -3
package/src/config/presets/kernel-paths/gemma3-f16-fused-f32a-online-streamingprefill.json +223 -0
package/src/config/presets/kernel-paths/{gemma3-q4k-dequant-f32a.json → gemma3-q4k-dequant-f32a-nosubgroups.json} +3 -3
package/src/config/presets/kernel-paths/gemma3-q4k-dequant-f32w-f32a-online.json +56 -0
package/src/config/presets/kernel-paths/lfm2-q4k-dequant-f32a-nosubgroups.json +61 -0
package/src/config/presets/kernel-paths/registry.json +43 -8
package/src/config/presets/models/gemma2.json +3 -2
package/src/config/presets/models/gemma3.json +2 -0
package/src/config/presets/models/qwen3.json +4 -3
package/src/config/presets/models/qwen3_5.json +16 -0
package/src/config/presets/runtime/experiments/bench/gemma3-bench-q4k.json +1 -1
package/src/config/presets/runtime/experiments/debug/gemma3-debug-q4k.json +1 -1
package/src/config/presets/runtime/experiments/verify/gemma3-verify.json +1 -1
package/src/config/presets/runtime/kernels/dequant-f16-q4k.json +6 -13
package/src/config/presets/runtime/kernels/dequant-f32-q4k.json +6 -13
package/src/config/presets/runtime/kernels/embeddinggemma-q4k-dequant-f32a.json +37 -0
package/src/config/presets/runtime/kernels/fused-q4k.json +6 -13
package/src/config/presets/runtime/kernels/gemma2-q4k-dequant-f16a.json +33 -0
package/src/config/presets/runtime/kernels/gemma2-q4k-dequant-f32a-nosubgroups.json +33 -0
package/src/config/presets/runtime/kernels/gemma2-q4k-fused-f32a.json +33 -0
package/src/config/presets/runtime/kernels/safe-q4k.json +6 -13
package/src/config/presets/runtime/model/qwen3-5-layer-probe.json +52 -0
package/src/config/presets/runtime/model/qwen3-5-linear-attn-debug.json +90 -0
package/src/config/presets/runtime/platform/metal-apple-q4k.json +1 -1
package/src/config/runtime.js +6 -1
package/src/config/schema/conversion.schema.d.ts +1 -0
package/src/config/schema/debug.schema.d.ts +5 -0
package/src/config/schema/doppler.schema.js +16 -21
package/src/config/schema/inference-defaults.schema.js +3 -3
package/src/config/schema/kernel-path.schema.d.ts +5 -1
package/src/config/schema/kernel-thresholds.schema.js +12 -4
package/src/config/schema/manifest.schema.d.ts +3 -2
package/src/config/schema/manifest.schema.js +17 -4
package/src/config/schema/storage.schema.js +1 -1
package/src/config/training-defaults.js +30 -22
package/src/converter/conversion-plan.js +104 -11
package/src/converter/core.d.ts +7 -0
package/src/converter/core.js +16 -9
package/src/converter/execution-v0-manifest.js +4 -1
package/src/converter/index.d.ts +1 -0
package/src/converter/index.js +1 -0
package/src/converter/manifest-inference.js +50 -29
package/src/converter/parsers/diffusion.js +0 -3
package/src/converter/parsers/transformer.js +4 -0
package/src/converter/quantization-info.js +40 -16
package/src/converter/quantizer.js +19 -12
package/src/converter/rope-config.js +8 -6
package/src/converter/shard-packer.d.ts +1 -1
package/src/converter/shard-packer.js +4 -1
package/src/converter/tokenizer-utils.d.ts +1 -0
package/src/converter/tokenizer-utils.js +4 -1
package/src/debug/config.js +123 -11
package/src/debug/reference/hf_qwen35_linear_attn_debug.py +268 -0
package/src/debug/signals.js +7 -1
package/src/debug/tensor.d.ts +2 -0
package/src/debug/tensor.js +13 -2
package/src/distribution/p2p-control-plane.js +52 -12
package/src/distribution/p2p-observability.js +43 -7
package/src/distribution/p2p-webrtc-browser.js +20 -0
package/src/distribution/shard-delivery.js +83 -27
package/src/formats/gguf/types.js +33 -16
package/src/formats/rdrr/groups.d.ts +12 -4
package/src/formats/rdrr/groups.js +3 -6
package/src/formats/rdrr/parsing.d.ts +4 -0
package/src/formats/rdrr/parsing.js +53 -3
package/src/formats/rdrr/types.d.ts +2 -1
package/src/gpu/command-recorder.js +86 -61
package/src/gpu/device.d.ts +1 -0
package/src/gpu/device.js +73 -19
package/src/gpu/kernel-tuner/benchmarks.js +326 -316
package/src/gpu/kernel-tuner/cache.js +71 -4
package/src/gpu/kernel-tuner/tuner.js +22 -4
package/src/gpu/kernels/attention.js +15 -34
package/src/gpu/kernels/backward/adam.js +62 -58
package/src/gpu/kernels/backward/attention_backward.js +257 -169
package/src/gpu/kernels/backward/conv2d_backward.js +14 -1
package/src/gpu/kernels/cast.js +191 -149
package/src/gpu/kernels/check-stop.js +33 -44
package/src/gpu/kernels/conv2d.js +27 -17
package/src/gpu/kernels/cross_entropy_loss.js +21 -15
package/src/gpu/kernels/depthwise_conv2d.js +36 -26
package/src/gpu/kernels/dequant.js +178 -126
package/src/gpu/kernels/energy.d.ts +3 -21
package/src/gpu/kernels/energy.js +111 -88
package/src/gpu/kernels/feature-check.js +1 -1
package/src/gpu/kernels/fused_ffn.js +84 -65
package/src/gpu/kernels/fused_matmul_residual.js +56 -33
package/src/gpu/kernels/fused_matmul_rmsnorm.js +62 -45
package/src/gpu/kernels/gather.js +33 -15
package/src/gpu/kernels/gelu.js +19 -11
package/src/gpu/kernels/grouped_pointwise_conv2d.js +33 -23
package/src/gpu/kernels/groupnorm.js +34 -23
package/src/gpu/kernels/index.d.ts +8 -0
package/src/gpu/kernels/index.js +6 -0
package/src/gpu/kernels/kv-quantize.js +5 -2
package/src/gpu/kernels/layernorm.js +35 -19
package/src/gpu/kernels/logit-merge.js +5 -3
package/src/gpu/kernels/matmul-selection.js +47 -4
package/src/gpu/kernels/matmul.d.ts +2 -0
package/src/gpu/kernels/matmul.js +59 -40
package/src/gpu/kernels/modulate.js +23 -15
package/src/gpu/kernels/moe.js +221 -175
package/src/gpu/kernels/pixel_shuffle.js +22 -14
package/src/gpu/kernels/relu.js +18 -10
package/src/gpu/kernels/repeat_channels.js +25 -17
package/src/gpu/kernels/residual.js +37 -27
package/src/gpu/kernels/rmsnorm.js +66 -43
package/src/gpu/kernels/rope.js +3 -0
package/src/gpu/kernels/sample.js +27 -38
package/src/gpu/kernels/sana_linear_attention.js +18 -10
package/src/gpu/kernels/scale.js +18 -11
package/src/gpu/kernels/shader-cache.js +4 -2
package/src/gpu/kernels/silu.js +120 -72
package/src/gpu/kernels/softmax.js +44 -25
package/src/gpu/kernels/split_qg.d.ts +50 -0
package/src/gpu/kernels/split_qg.js +46 -0
package/src/gpu/kernels/split_qg.wgsl +58 -0
package/src/gpu/kernels/split_qg_f16.wgsl +62 -0
package/src/gpu/kernels/split_qkv.js +23 -13
package/src/gpu/kernels/transpose.js +18 -10
package/src/gpu/kernels/transpose.wgsl +5 -3
package/src/gpu/kernels/upsample2d.js +21 -13
package/src/gpu/kernels/utils.js +20 -13
package/src/gpu/partitioned-buffer-pool.js +10 -2
package/src/gpu/perf-guards.js +2 -9
package/src/gpu/profiler.js +27 -22
package/src/gpu/readback-utils.d.ts +16 -0
package/src/gpu/readback-utils.js +41 -0
package/src/gpu/submit-tracker.js +13 -0
package/src/gpu/uniform-cache.d.ts +1 -0
package/src/gpu/uniform-cache.js +30 -9
package/src/gpu/weight-buffer.d.ts +1 -1
package/src/gpu/weight-buffer.js +1 -1
package/src/hotswap/intent-bundle.js +6 -0
package/src/hotswap/manifest.d.ts +10 -1
package/src/hotswap/manifest.js +12 -2
package/src/hotswap/runtime.js +30 -8
package/src/index-browser.d.ts +44 -0
package/src/index-browser.js +14 -0
package/src/inference/browser-harness-contract-helpers.d.ts +5 -0
package/src/inference/browser-harness-contract-helpers.js +28 -0
package/src/inference/browser-harness-diffusion-energy-suites.d.ts +2 -0
package/src/inference/browser-harness-diffusion-energy-suites.js +269 -0
package/src/inference/browser-harness-model-helpers.d.ts +16 -0
package/src/inference/browser-harness-model-helpers.js +217 -0
package/src/inference/browser-harness-report-helpers.d.ts +7 -0
package/src/inference/browser-harness-report-helpers.js +42 -0
package/src/inference/browser-harness-runtime-helpers.d.ts +61 -0
package/src/inference/browser-harness-runtime-helpers.js +415 -0
package/src/inference/browser-harness-suite-helpers.d.ts +28 -0
package/src/inference/browser-harness-suite-helpers.js +268 -0
package/src/inference/browser-harness-text-helpers.d.ts +27 -0
package/src/inference/browser-harness-text-helpers.js +788 -0
package/src/inference/browser-harness.d.ts +8 -0
package/src/inference/browser-harness.js +149 -1996
package/src/inference/kv-cache/base.js +140 -94
package/src/inference/kv-cache/tiered.js +5 -3
package/src/inference/moe-router.js +88 -56
package/src/inference/multi-model-network.js +5 -3
package/src/inference/network-evolution.d.ts +11 -2
package/src/inference/network-evolution.js +20 -21
package/src/inference/pipelines/context.d.ts +3 -0
package/src/inference/pipelines/context.js +142 -2
package/src/inference/pipelines/diffusion/helpers.js +10 -2
package/src/inference/pipelines/diffusion/pipeline.js +2 -1
package/src/inference/pipelines/diffusion/sd3-transformer.js +10 -10
package/src/inference/pipelines/diffusion/text-encoder-gpu.js +8 -2
package/src/inference/pipelines/diffusion/vae.js +3 -7
package/src/inference/pipelines/energy/pipeline.js +27 -21
package/src/inference/pipelines/energy/quintel.d.ts +5 -0
package/src/inference/pipelines/energy/quintel.js +11 -0
package/src/inference/pipelines/energy-head/row-head-pipeline.js +17 -13
package/src/inference/pipelines/structured/json-head-pipeline.js +26 -11
package/src/inference/pipelines/text/attention/output-projection.d.ts +12 -0
package/src/inference/pipelines/text/attention/output-projection.js +8 -0
package/src/inference/pipelines/text/attention/projections.d.ts +10 -1
package/src/inference/pipelines/text/attention/projections.js +192 -112
package/src/inference/pipelines/text/attention/record.js +77 -14
package/src/inference/pipelines/text/attention/run.js +112 -14
package/src/inference/pipelines/text/config.js +17 -4
package/src/inference/pipelines/text/embed.js +2 -8
package/src/inference/pipelines/text/execution-plan.js +46 -23
package/src/inference/pipelines/text/execution-v0-contract-helpers.d.ts +59 -0
package/src/inference/pipelines/text/execution-v0-contract-helpers.js +937 -0
package/src/inference/pipelines/text/execution-v0-runtime-builders.d.ts +15 -0
package/src/inference/pipelines/text/execution-v0-runtime-builders.js +279 -0
package/src/inference/pipelines/text/execution-v0.js +62 -1013
package/src/inference/pipelines/text/generator-runtime.js +5 -0
package/src/inference/pipelines/text/generator-steps.d.ts +52 -0
package/src/inference/pipelines/text/generator-steps.js +340 -221
package/src/inference/pipelines/text/generator.js +56 -40
package/src/inference/pipelines/text/init.d.ts +13 -0
package/src/inference/pipelines/text/init.js +94 -25
package/src/inference/pipelines/text/kernel-path-auto-select.js +2 -0
package/src/inference/pipelines/text/kernel-trace.d.ts +2 -0
package/src/inference/pipelines/text/kernel-trace.js +6 -0
package/src/inference/pipelines/text/layer.js +4 -9
package/src/inference/pipelines/text/linear-attention.d.ts +15 -0
package/src/inference/pipelines/text/linear-attention.js +113 -9
package/src/inference/pipelines/text/logits/gpu.js +12 -7
package/src/inference/pipelines/text/logits/index.d.ts +6 -1
package/src/inference/pipelines/text/logits/index.js +13 -12
package/src/inference/pipelines/text/logits/utils.d.ts +7 -0
package/src/inference/pipelines/text/logits/utils.js +9 -0
package/src/inference/pipelines/text/lora-apply.js +50 -32
package/src/inference/pipelines/text/model-load.js +282 -104
package/src/inference/pipelines/text/moe-cache.js +5 -4
package/src/inference/pipelines/text/moe-cpu-gptoss.js +74 -69
package/src/inference/pipelines/text/moe-cpu.js +42 -38
package/src/inference/pipelines/text/moe-gpu.js +110 -86
package/src/inference/pipelines/text/ops.js +90 -90
package/src/inference/pipelines/text/probes.js +9 -9
package/src/inference/pipelines/text/sampling.js +52 -6
package/src/inference/pipelines/text/weights.js +17 -7
package/src/inference/pipelines/text.js +13 -1
package/src/inference/speculative.d.ts +2 -2
package/src/inference/speculative.js +4 -18
package/src/inference/test-harness.d.ts +1 -1
package/src/inference/test-harness.js +17 -7
package/src/inference/tokenizer.d.ts +0 -5
package/src/inference/tokenizer.js +4 -23
package/src/inference/tokenizers/bpe.js +9 -0
package/src/inference/tokenizers/bundled.js +20 -0
package/src/inference/tokenizers/sentencepiece.js +12 -0
package/src/loader/doppler-loader.js +38 -22
package/src/loader/dtype-utils.js +3 -44
package/src/loader/embedding-loader.js +7 -3
package/src/loader/experts/expert-cache.js +13 -6
package/src/loader/experts/expert-loader.js +10 -6
package/src/loader/final-weights-loader.js +10 -4
package/src/loader/layer-loader.js +2 -1
package/src/loader/loader-state.js +2 -2
package/src/loader/memory-monitor.js +8 -0
package/src/loader/multi-model-loader.d.ts +14 -0
package/src/loader/multi-model-loader.js +70 -24
package/src/loader/shard-cache.js +84 -14
package/src/loader/shard-resolver.js +25 -3
package/src/loader/tensors/tensor-loader.js +214 -144
package/src/loader/tensors/tensor-reader.js +76 -19
package/src/loader/weight-downcast.js +1 -1
package/src/memory/buffer-pool.d.ts +9 -1
package/src/memory/buffer-pool.js +109 -44
package/src/memory/unified-detect.js +1 -1
package/src/rules/inference/dtype.rules.json +5 -0
package/src/rules/inference/kernel-path.rules.json +24 -8
package/src/rules/kernels/split-qg.rules.json +6 -0
package/src/rules/rule-registry.js +27 -1
package/src/storage/backends/opfs-store.js +68 -24
package/src/storage/downloader.js +365 -83
package/src/storage/index.d.ts +3 -0
package/src/storage/index.js +3 -0
package/src/storage/preflight.d.ts +2 -2
package/src/storage/preflight.js +24 -2
package/src/storage/quickstart-downloader.js +11 -5
package/src/storage/registry.js +10 -4
package/src/storage/reports.js +1 -1
package/src/storage/shard-manager.d.ts +15 -1
package/src/storage/shard-manager.js +55 -6
package/src/storage/source-artifact-store.d.ts +52 -0
package/src/storage/source-artifact-store.js +234 -0
package/src/tooling/command-api-constants.d.ts +9 -0
package/src/tooling/command-api-constants.js +9 -0
package/src/tooling/command-api-family-normalizers.d.ts +9 -0
package/src/tooling/command-api-family-normalizers.js +343 -0
package/src/tooling/command-api-helpers.d.ts +25 -0
package/src/tooling/command-api-helpers.js +262 -0
package/src/tooling/command-api.js +16 -602
package/src/tooling/command-envelope.js +4 -1
package/src/tooling/command-runner-shared.js +52 -18
package/src/tooling/conversion-config-materializer.js +3 -5
package/src/tooling/lean-execution-contract.js +150 -3
package/src/tooling/node-browser-command-runner.js +161 -271
package/src/tooling/node-command-runner.js +29 -3
package/src/tooling/node-converter.js +30 -1
package/src/tooling/node-source-runtime.d.ts +1 -1
package/src/tooling/node-source-runtime.js +120 -3
package/src/tooling/node-webgpu.js +24 -21
package/src/tooling/opfs-cache.js +21 -4
package/src/tooling/runtime-input-composition.d.ts +38 -0
package/src/tooling/runtime-input-composition.js +86 -0
package/src/tooling/source-runtime-bundle.d.ts +40 -5
package/src/tooling/source-runtime-bundle.js +261 -34
package/src/tooling/source-runtime-materializer.d.ts +6 -0
package/src/tooling/source-runtime-materializer.js +93 -0
package/src/training/attention-backward.js +32 -17
package/src/training/autograd.js +80 -52
package/src/training/checkpoint-watch.d.ts +2 -1
package/src/training/checkpoint-watch.js +39 -6
package/src/training/checkpoint.js +40 -11
package/src/training/clip.js +2 -1
package/src/training/datasets/token-batch.js +20 -8
package/src/training/distillation/checkpoint-watch.js +1 -0
package/src/training/distillation/student-fixture.d.ts +22 -0
package/src/training/distillation/student-fixture.js +846 -0
package/src/training/distillation/suite-data.d.ts +45 -0
package/src/training/distillation/suite-data.js +189 -0
package/src/training/lora-pipeline.js +4 -7
package/src/training/lora.js +26 -12
package/src/training/loss.js +5 -6
package/src/training/objectives/cross_entropy.js +2 -5
package/src/training/objectives/distill_kd.js +4 -8
package/src/training/objectives/distill_triplet.js +4 -8
package/src/training/objectives/ul_stage2_base.js +4 -8
package/src/training/operator-command.js +2 -0
package/src/training/optimizer.js +19 -7
package/src/training/runner.js +2 -1
package/src/training/suite.js +18 -978
package/src/training/tensor-factory.d.ts +9 -0
package/src/training/tensor-factory.js +13 -0
package/src/training/trainer.js +3 -5
package/src/training/ul_dataset.js +3 -5
package/src/training/workloads.js +70 -79
package/src/types/model.d.ts +5 -0
package/src/version.js +1 -1
package/tools/convert-safetensors-node.js +22 -16
package/tools/doppler-cli.js +50 -26

package/src/training/tensor-factory.d.ts ADDED Viewed

@@ -0,0 +1,9 @@
+import type { Tensor, TensorDType } from '../gpu/tensor.js';
+export declare function createUploadedTensor(
+  data: ArrayBufferView,
+  dtype: TensorDType,
+  shape: number[],
+  label: string,
+  usage?: number | undefined
+): Tensor;

package/src/training/tensor-factory.js ADDED Viewed

@@ -0,0 +1,13 @@
+import { acquireBuffer, releaseBuffer, uploadData } from '../memory/buffer-pool.js';
+import { createTensor } from '../gpu/tensor.js';
+export function createUploadedTensor(data, dtype, shape, label, usage = undefined) {
+  const buffer = acquireBuffer(data.byteLength, usage, label);
+  try {
+    uploadData(buffer, data);
+    return createTensor(buffer, dtype, [...shape], label);
+  } catch (error) {
+    releaseBuffer(buffer);
+    throw error;
+  }
+}

package/src/training/trainer.js CHANGED Viewed

@@ -1,17 +1,15 @@
 import { AutogradTape } from './autograd.js';
 import { loadBackwardRegistry } from '../config/backward-registry-loader.js';
 import { runScale } from '../gpu/kernels/index.js';
-import { acquireBuffer, uploadData, releaseBuffer } from '../memory/buffer-pool.js';
-import { createTensor } from '../gpu/tensor.js';
+import { releaseBuffer } from '../memory/buffer-pool.js';
 import { createCrossEntropyObjective } from './objectives/cross_entropy.js';
+import { createUploadedTensor } from './tensor-factory.js';
 function createLossGradient(loss, lossScale) {
   const lossElements = loss.shape.reduce((acc, value) => acc * value, 1);
   const gradData = new Float32Array(lossElements);
   gradData.fill(lossScale);
-  const gradBuf = acquireBuffer(gradData.byteLength, undefined, 'loss_grad_output');
-  uploadData(gradBuf, gradData);
-  return createTensor(gradBuf, 'f32', [...loss.shape], 'loss_grad_output');
+  return createUploadedTensor(gradData, 'f32', loss.shape, 'loss_grad_output');
 }
 function normalizeLossResult(value) {

package/src/training/ul_dataset.js CHANGED Viewed

@@ -1,6 +1,6 @@
-import { acquireBuffer, uploadData, readBuffer, releaseBuffer } from '../memory/buffer-pool.js';
-import { createTensor } from '../gpu/tensor.js';
+import { readBuffer, releaseBuffer } from '../memory/buffer-pool.js';
 import { resolveUlScheduledLambda } from './ul_schedule.js';
+import { createUploadedTensor } from './tensor-factory.js';
 function xorshift32(value) {
   let x = value >>> 0;
@@ -79,9 +79,7 @@ export async function buildNoisyLatentsFromInputTensor(inputTensor, ulConfig, op
     noisy[i] = alpha * inputData[i] + sigma * n;
   }
-  const noisyBuffer = acquireBuffer(noisy.byteLength, undefined, 'ul_noisy_latents');
-  uploadData(noisyBuffer, noisy);
-  const noisyTensor = createTensor(noisyBuffer, 'f32', [...inputTensor.shape], 'ul_noisy_latents');
+  const noisyTensor = createUploadedTensor(noisy, 'f32', inputTensor.shape, 'ul_noisy_latents');
   const cleanStats = summarizeArray(inputData);
   const noiseStats = summarizeArray(noise);
   const noisyStats = summarizeArray(noisy);

package/src/training/workloads.js CHANGED Viewed

@@ -4,6 +4,11 @@ import { resolve } from 'node:path';
 import { isPlainObject } from '../utils/plain-object.js';
 import { sha256Hex } from '../utils/sha256.js';
 import { VALID_LORA_TARGET_MODULES } from '../config/schema/adapter.schema.js';
+import {
+  DEFAULT_TRAINING_GRADIENT_CONFIG,
+  DEFAULT_TRAINING_OPTIMIZER_CONFIG,
+  DEFAULT_TRAINING_PRECISION_CONFIG,
+} from '../config/schema/training.schema.js';
 export const TRAINING_WORKLOAD_SCHEMA_VERSION = 1;
 export const TRAINING_WORKLOAD_KINDS = Object.freeze(['lora', 'distill', 'ul']);
@@ -140,64 +145,57 @@ function inferLegacyKind(payload, contextLabel) {
   if (explicitKind) return explicitKind;
   const workloadKind = typeof payload?.workloadKind === 'string' ? payload.workloadKind.trim() : '';
   if (workloadKind) return workloadKind;
-  const id = String(payload?.id || '').trim();
-  if (id.startsWith('distill-')) return 'distill';
-  if (id.startsWith('lora-')) return 'lora';
-  if (id.startsWith('ul-') || id.startsWith('ul_training') || id.startsWith('ul-training')) {
+  const trainingTests = Array.isArray(payload?.trainingTests)
+    ? payload.trainingTests.map((entry) => String(entry))
+    : null;
+  const hasLegacyUlShape = trainingTests
+    && trainingTests.length > 0
+    && trainingTests.every((entry) => entry === 'ul-stage1' || entry === 'ul-stage2')
+    && Number.isInteger(Number(payload?.trainingBenchSteps));
+  if (hasLegacyUlShape) {
     return 'ul';
   }
-  if (Array.isArray(payload?.trainingTests) && payload.trainingTests.every((entry) => LEGACY_DISTILL_TEST_IDS.includes(String(entry)))) {
-    return 'distill';
-  }
   throw new Error(`${contextLabel}.kind is required.`);
 }
 function normalizeScheduler(value, label) {
-  const scheduler = asObject(value, label, { optional: true }) || {};
+  const scheduler = asObject(value, label);
   return {
-    enabled: scheduler.enabled === true,
-    type: asNonEmptyString(scheduler.type ?? 'constant', `${label}.type`),
-    warmupSteps: asNonNegativeInteger(
-      scheduler.warmupSteps ?? 0,
-      `${label}.warmupSteps`,
-      { optional: true }
-    ) ?? 0,
-    stepSize: asPositiveInteger(scheduler.stepSize ?? 1, `${label}.stepSize`, { optional: true }) ?? 1,
-    gamma: asFiniteNumber(scheduler.gamma ?? 1, `${label}.gamma`, { optional: true }) ?? 1,
-    totalSteps: asPositiveInteger(scheduler.totalSteps ?? 1, `${label}.totalSteps`, { optional: true }) ?? 1,
-    minLr: asFiniteNumber(scheduler.minLr ?? 0, `${label}.minLr`, { optional: true }) ?? 0,
+    enabled: asBoolean(scheduler.enabled, `${label}.enabled`),
+    type: asNonEmptyString(scheduler.type, `${label}.type`),
+    warmupSteps: asNonNegativeInteger(scheduler.warmupSteps, `${label}.warmupSteps`),
+    stepSize: asPositiveInteger(scheduler.stepSize, `${label}.stepSize`),
+    gamma: asFiniteNumber(scheduler.gamma, `${label}.gamma`),
+    totalSteps: asPositiveInteger(scheduler.totalSteps, `${label}.totalSteps`),
+    minLr: asFiniteNumber(scheduler.minLr, `${label}.minLr`),
   };
 }
 function normalizeTrainingConfig(value, label) {
   const training = asObject(value, label);
   const optimizer = asObject(training.optimizer, `${label}.optimizer`);
-  const precision = isPlainObject(training.precision)
-    ? training.precision
-    : { activations: training.precision ?? 'f16' };
-  const gradientClipping = isPlainObject(training.gradientClipping)
-    ? training.gradientClipping
-    : { maxNorm: training.gradientClipping ?? 1 };
+  const precision = asObject(training.precision, `${label}.precision`);
+  const gradientClipping = asObject(training.gradientClipping, `${label}.gradientClipping`);
   return {
     optimizer: {
-      type: asNonEmptyString(optimizer.type ?? 'adam', `${label}.optimizer.type`),
+      type: asNonEmptyString(optimizer.type, `${label}.optimizer.type`),
       lr: asFiniteNumber(optimizer.lr, `${label}.optimizer.lr`),
-      beta1: asFiniteNumber(optimizer.beta1 ?? 0.9, `${label}.optimizer.beta1`, { optional: true }) ?? 0.9,
-      beta2: asFiniteNumber(optimizer.beta2 ?? 0.999, `${label}.optimizer.beta2`, { optional: true }) ?? 0.999,
-      eps: asFiniteNumber(optimizer.eps ?? 1e-8, `${label}.optimizer.eps`, { optional: true }) ?? 1e-8,
-      weightDecay: asFiniteNumber(optimizer.weightDecay ?? 0, `${label}.optimizer.weightDecay`, { optional: true }) ?? 0,
+      beta1: asFiniteNumber(optimizer.beta1, `${label}.optimizer.beta1`),
+      beta2: asFiniteNumber(optimizer.beta2, `${label}.optimizer.beta2`),
+      eps: asFiniteNumber(optimizer.eps, `${label}.optimizer.eps`),
+      weightDecay: asFiniteNumber(optimizer.weightDecay, `${label}.optimizer.weightDecay`),
       scheduler: normalizeScheduler(optimizer.scheduler, `${label}.optimizer.scheduler`),
     },
     batchSize: asPositiveInteger(training.batchSize, `${label}.batchSize`),
-    accumSteps: asPositiveInteger(training.accumSteps ?? 1, `${label}.accumSteps`, { optional: true }) ?? 1,
+    accumSteps: asPositiveInteger(training.accumSteps, `${label}.accumSteps`),
     steps: asPositiveInteger(training.steps, `${label}.steps`),
     precision: {
-      activations: asNonEmptyString(precision.activations ?? 'f16', `${label}.precision.activations`),
-      gradients: asNonEmptyString(precision.gradients ?? 'f32', `${label}.precision.gradients`),
-      loraParams: asNonEmptyString(precision.loraParams ?? 'f32', `${label}.precision.loraParams`),
+      activations: asNonEmptyString(precision.activations, `${label}.precision.activations`),
+      gradients: asNonEmptyString(precision.gradients, `${label}.precision.gradients`),
+      loraParams: asNonEmptyString(precision.loraParams, `${label}.precision.loraParams`),
     },
     gradientClipping: {
-      maxNorm: asFiniteNumber(gradientClipping.maxNorm ?? 1, `${label}.gradientClipping.maxNorm`, { optional: true }) ?? 1,
+      maxNorm: asFiniteNumber(gradientClipping.maxNorm, `${label}.gradientClipping.maxNorm`),
     },
   };
 }
@@ -215,7 +213,7 @@ function normalizeEvalDatasets(value, label) {
       id: asNonEmptyString(dataset.id, `${label}[${index}].id`),
       datasetPath: asNonEmptyString(dataset.datasetPath ?? dataset.path, `${label}[${index}].datasetPath`),
       evalKind: asEnum(
-        dataset.evalKind ?? dataset.kind ?? 'text_generation',
+        dataset.evalKind ?? dataset.kind,
         `${label}[${index}].evalKind`,
         TRAINING_EVAL_KINDS
       ),
@@ -230,11 +228,7 @@ function normalizeEvalDatasets(value, label) {
             `${label}[${index}].decodePolicy.maxTokens`,
             { optional: true }
           ),
-          stopOnEos: asBoolean(
-            decodePolicy.stopOnEos ?? true,
-            `${label}[${index}].decodePolicy.stopOnEos`,
-            { optional: true }
-          ) ?? true,
+          stopOnEos: asBoolean(decodePolicy.stopOnEos, `${label}[${index}].decodePolicy.stopOnEos`),
         }
         : null,
       scoreboardColumns: asStringArray(
@@ -267,11 +261,11 @@ function normalizeStagePlan(value, label) {
   return value.map((entry, index) => {
     const stage = asObject(entry, `${label}[${index}]`);
     const selectionMetric = asNonEmptyString(
-      stage.selectionMetric ?? stage.metric ?? 'bleu',
+      stage.selectionMetric ?? stage.metric,
       `${label}[${index}].selectionMetric`
     );
     const selectionGoal = asEnum(
-      stage.selectionGoal ?? stage.goal ?? 'max',
+      stage.selectionGoal ?? stage.goal,
       `${label}[${index}].selectionGoal`,
       TRAINING_SELECTION_GOALS
     );
@@ -281,15 +275,12 @@ function normalizeStagePlan(value, label) {
       objective: asNonEmptyString(stage.objective, `${label}[${index}].objective`),
       steps: asPositiveInteger(stage.steps, `${label}[${index}].steps`),
       checkpointEvery: asPositiveInteger(
-        stage.checkpointEvery ?? stage.steps,
+        stage.checkpointEvery,
         `${label}[${index}].checkpointEvery`
       ),
       selectionMetric,
       selectionGoal,
-      evalSchedule: asNonEmptyString(
-        stage.evalSchedule ?? 'on_checkpoint',
-        `${label}[${index}].evalSchedule`
-      ),
+      evalSchedule: asNonEmptyString(stage.evalSchedule, `${label}[${index}].evalSchedule`),
     };
   });
 }
@@ -306,29 +297,29 @@ function normalizeLoraConfig(value, label) {
     }
   }
   return {
-    datasetFormat: asNonEmptyString(lora.datasetFormat ?? 'prompt_completion_jsonl', `${label}.datasetFormat`),
-    taskType: asNonEmptyString(lora.taskType ?? 'text_generation', `${label}.taskType`),
+    datasetFormat: asNonEmptyString(lora.datasetFormat, `${label}.datasetFormat`),
+    taskType: asNonEmptyString(lora.taskType, `${label}.taskType`),
     adapter: {
       rank: asPositiveInteger(adapter.rank, `${label}.adapter.rank`),
       alpha: asFiniteNumber(adapter.alpha, `${label}.adapter.alpha`),
-      dropout: asFiniteNumber(adapter.dropout ?? 0, `${label}.adapter.dropout`, { optional: true }) ?? 0,
+      dropout: asFiniteNumber(adapter.dropout, `${label}.adapter.dropout`),
       targetModules,
     },
     freeze: normalizeFreezeConfig(lora.freeze, `${label}.freeze`),
     export: exportConfig
       ? {
-        enabled: exportConfig.enabled !== false,
-        atCheckpoints: exportConfig.atCheckpoints === true,
-        select: asNonEmptyString(exportConfig.select ?? 'best', `${label}.export.select`),
+        enabled: asBoolean(exportConfig.enabled, `${label}.export.enabled`),
+        atCheckpoints: asBoolean(exportConfig.atCheckpoints, `${label}.export.atCheckpoints`),
+        select: asNonEmptyString(exportConfig.select, `${label}.export.select`),
         id: asNonEmptyString(exportConfig.id, `${label}.export.id`, { optional: true }),
         name: asNonEmptyString(exportConfig.name, `${label}.export.name`, { optional: true }),
-        format: asNonEmptyString(exportConfig.format ?? 'manifest_json', `${label}.export.format`),
+        format: asNonEmptyString(exportConfig.format, `${label}.export.format`),
       }
       : null,
     activation: activation
       ? {
-        enabled: activation.enabled === true,
-        autoActivate: activation.autoActivate === true,
+        enabled: asBoolean(activation.enabled, `${label}.activation.enabled`),
+        autoActivate: asBoolean(activation.autoActivate, `${label}.activation.autoActivate`),
         smokePrompt: asNonEmptyString(activation.smokePrompt, `${label}.activation.smokePrompt`, { optional: true }),
       }
       : null,
@@ -339,27 +330,21 @@ function normalizeDistillConfig(value, label) {
   const distill = asObject(value, label);
   return {
     stagePlan: normalizeStagePlan(distill.stagePlan, `${label}.stagePlan`),
-    studentGraphMode: asNonEmptyString(
-      distill.studentGraphMode ?? 'transformer_full',
-      `${label}.studentGraphMode`
-    ),
-    temperature: asFiniteNumber(distill.temperature ?? 1, `${label}.temperature`, { optional: true }) ?? 1,
-    alphaKd: asFiniteNumber(distill.alphaKd ?? 1, `${label}.alphaKd`, { optional: true }) ?? 1,
-    alphaCe: asFiniteNumber(distill.alphaCe ?? 0, `${label}.alphaCe`, { optional: true }) ?? 0,
-    tripletMargin: asFiniteNumber(distill.tripletMargin ?? 0.2, `${label}.tripletMargin`, { optional: true }) ?? 0.2,
+    studentGraphMode: asNonEmptyString(distill.studentGraphMode, `${label}.studentGraphMode`),
+    temperature: asFiniteNumber(distill.temperature, `${label}.temperature`),
+    alphaKd: asFiniteNumber(distill.alphaKd, `${label}.alphaKd`),
+    alphaCe: asFiniteNumber(distill.alphaCe, `${label}.alphaCe`),
+    tripletMargin: asFiniteNumber(distill.tripletMargin, `${label}.tripletMargin`),
     sourceLangs: asStringArray(distill.sourceLangs, `${label}.sourceLangs`, { optional: true, allowEmpty: true }),
     targetLangs: asStringArray(distill.targetLangs, `${label}.targetLangs`, { optional: true, allowEmpty: true }),
     pairAllowlist: asStringArray(distill.pairAllowlist, `${label}.pairAllowlist`, { optional: true, allowEmpty: true }),
-    strictPairContract: asBoolean(
-      distill.strictPairContract ?? false,
-      `${label}.strictPairContract`,
-      { optional: true }
-    ) ?? false,
+    strictPairContract: asBoolean(distill.strictPairContract, `${label}.strictPairContract`),
     subsetSpec: asObject(distill.subsetSpec, `${label}.subsetSpec`, { optional: true }),
   };
 }
 function normalizeLegacyUlPayload(payload, contextLabel) {
+  const optimizerOverrides = isPlainObject(payload.training?.optimizer) ? payload.training.optimizer : {};
   return {
     schemaVersion: asPositiveInteger(payload.schemaVersion, `${contextLabel}.schemaVersion`),
     kind: 'ul',
@@ -393,19 +378,25 @@ function normalizeLegacyUlPayload(payload, contextLabel) {
       TRAINING_WORKLOAD_SURFACE_SUPPORT
     ),
     training: normalizeTrainingConfig({
-      optimizer: payload.training?.optimizer ?? {
-        type: 'adam',
-        lr: 2e-4,
+      optimizer: {
+        ...DEFAULT_TRAINING_OPTIMIZER_CONFIG,
+        ...optimizerOverrides,
+        scheduler: {
+          ...DEFAULT_TRAINING_OPTIMIZER_CONFIG.scheduler,
+          ...(isPlainObject(optimizerOverrides.scheduler) ? optimizerOverrides.scheduler : {}),
+        },
       },
       batchSize: payload.training?.batchSize ?? 1,
-      accumSteps: payload.training?.accumSteps ?? 1,
+      accumSteps: payload.training?.accumSteps ?? DEFAULT_TRAINING_GRADIENT_CONFIG.accumSteps,
       steps: payload.training?.steps ?? payload.trainingBenchSteps ?? 1,
-      precision: payload.training?.precision ?? {
-        activations: 'f16',
-        gradients: 'f32',
-        loraParams: 'f32',
+      precision: {
+        ...DEFAULT_TRAINING_PRECISION_CONFIG,
+        ...(payload.training?.precision ?? {}),
+      },
+      gradientClipping: {
+        maxNorm: payload.training?.gradientClipping?.maxNorm
+          ?? DEFAULT_TRAINING_GRADIENT_CONFIG.maxNorm,
       },
-      gradientClipping: payload.training?.gradientClipping ?? { maxNorm: 1 },
     }, `${contextLabel}.training`),
     pipeline: {
       legacyWorkloadType: 'ul',

package/src/types/model.d.ts CHANGED Viewed

@@ -9,7 +9,11 @@ export type ModelArchitecture =
   | 'gemma'
   | 'gemma2'
   | 'gemma3'
+  | 'embeddinggemma'
   | 'functiongemma'
+  | 'janus_text'
+  | 'lfm2'
+  | 'modernbert'
   | 'qwen2'
   | 'qwen3'
   | 'phi3'
@@ -19,6 +23,7 @@ export type ModelArchitecture =
   | 'deepseek'
   | 'mamba'
   | 'kimi_k2'
+  | 'translategemma'
   | 'transformer';
 /** Attention type variants */

package/src/version.js CHANGED Viewed

@@ -1,2 +1,2 @@
-export const DOPPLER_VERSION = '0.1.6';
+export const DOPPLER_VERSION = '0.1.7';
 export const DOPPLER_PROVIDER_VERSION = DOPPLER_VERSION;

package/tools/convert-safetensors-node.js CHANGED Viewed

@@ -14,42 +14,43 @@ function parseArgs(argv) {
   const positional = [];
   for (let i = 0; i < argv.length; i += 1) {
     const arg = argv[i];
-    if (arg === '--output-dir') {
-      out.outputDir = argv[i + 1] ?? null;
+    const nextValue = () => {
+      const value = argv[i + 1];
+      if (value == null || String(value).startsWith('--')) {
+        throw new Error(`Missing value for ${arg}.`);
+      }
       i += 1;
+      return value;
+    };
+    if (arg === '--output-dir') {
+      out.outputDir = nextValue();
       continue;
     }
     if (arg === '--config') {
-      out.configPath = argv[i + 1] ?? null;
-      i += 1;
+      out.configPath = nextValue();
       continue;
     }
     if (arg === '--converter-config') {
       throw new Error('--converter-config has been removed. Use --config <path.json>.');
     }
     if (arg === '--workers') {
-      execution.workers = argv[i + 1] ?? null;
-      i += 1;
+      execution.workers = nextValue();
       continue;
     }
     if (arg === '--worker-policy') {
-      execution.workerCountPolicy = argv[i + 1] ?? null;
-      i += 1;
+      execution.workerCountPolicy = nextValue();
       continue;
     }
     if (arg === '--row-chunk-rows') {
-      execution.rowChunkRows = argv[i + 1] ?? null;
-      i += 1;
+      execution.rowChunkRows = nextValue();
       continue;
     }
     if (arg === '--row-chunk-min-tensor-bytes') {
-      execution.rowChunkMinTensorBytes = argv[i + 1] ?? null;
-      i += 1;
+      execution.rowChunkMinTensorBytes = nextValue();
       continue;
     }
     if (arg === '--max-in-flight-jobs') {
-      execution.maxInFlightJobs = argv[i + 1] ?? null;
-      i += 1;
+      execution.maxInFlightJobs = nextValue();
       continue;
     }
     if (arg === '--use-gpu-cast') {
@@ -57,12 +58,17 @@ function parseArgs(argv) {
       continue;
     }
     if (arg === '--gpu-cast-min-tensor-bytes') {
-      execution.gpuCastMinTensorBytes = argv[i + 1] ?? null;
-      i += 1;
+      execution.gpuCastMinTensorBytes = nextValue();
       continue;
     }
+    if (arg.startsWith('--')) {
+      throw new Error(`Unknown flag: ${arg}`);
+    }
     positional.push(arg);
   }
+  if (positional.length > 1) {
+    throw new Error(`Unexpected positional arguments: ${positional.slice(1).join(', ')}`);
+  }
   out.inputDir = positional[0] ?? null;
   out.execution = Object.keys(execution).length > 0 ? execution : null;
   return out;

package/tools/doppler-cli.js CHANGED Viewed

@@ -1,5 +1,6 @@
 #!/usr/bin/env node
+import { existsSync } from 'node:fs';
 import fs from 'node:fs/promises';
 import path from 'node:path';
 import { fileURLToPath, pathToFileURL } from 'node:url';
@@ -13,7 +14,8 @@ import { createToolingErrorEnvelope } from '../src/tooling/command-envelope.js';
 const NODE_WEBGPU_INCOMPLETE_MESSAGE = 'node command: WebGPU runtime is incomplete in Node';
 const CLI_POLICY_PATH = fileURLToPath(new URL('./configs/cli/doppler-cli-policy.json', import.meta.url));
-const DEFAULT_EXTERNAL_MODELS_ROOT = process.env.DOPPLER_EXTERNAL_MODELS_ROOT || '/media/x/models';
+const DEFAULT_EXTERNAL_MODELS_ROOT = process.env.DOPPLER_EXTERNAL_MODELS_ROOT
+  || (existsSync('/Volumes/models') ? '/Volumes/models' : '/media/x/models');
 const DEFAULT_EXTERNAL_RDRR_ROOT = path.join(DEFAULT_EXTERNAL_MODELS_ROOT, 'rdrr');
 const DEFAULT_CLI_POLICY = {
   defaults: {
@@ -22,8 +24,6 @@ const DEFAULT_CLI_POLICY = {
       allowed: ['auto', 'node', 'browser'],
     },
     bench: {
-      modelId: 'gemma-3-270m-it-wf16-ef16-hf16',
-      surface: 'browser',
       cacheMode: 'warm',
     },
     cacheMode: null,
@@ -82,7 +82,7 @@ function usage() {
     '    - run: CLI-only run controls (surface, browser options, and bench save/compare/manifest settings).',
     '',
     'Example:',
-    '  doppler verify --config \'{"request":{"suite":"inference","modelId":"gemma-3-270m-it-wf16-ef16-hf16"}}\' --json',
+    '  doppler verify --config \'{"request":{"suite":"inference","modelId":"gemma-3-270m-it-f16-af32"}}\' --json',
   ].join('\n');
 }
@@ -439,10 +439,6 @@ export async function resolveBrowserModelUrl(request, browserOptions = {}) {
   const staticRootDir = resolveStaticRootDir(browserOptions);
   const externalModel = await resolveExternalModelDirectory(resolveRdrrRoot(browserOptions), modelId);
   const candidates = [
-    {
-    modelUrl: `/models/curated/${encodedModelId}`,
-    manifestPath: path.join(staticRootDir, 'models', 'curated', modelId, 'manifest.json'),
-    },
     {
     modelUrl: `/models/local/${encodedModelId}`,
     manifestPath: path.join(staticRootDir, 'models', 'local', modelId, 'manifest.json'),
@@ -528,6 +524,9 @@ function parseSurface(value, command, policy = DEFAULT_CLI_POLICY) {
   if (command === 'convert' && normalized === 'browser') {
     throw new Error('convert is not supported on browser relay. Use --surface node or --surface auto.');
   }
+  if ((command === 'lora' || command === 'distill') && normalized === 'browser') {
+    throw new Error(`${command} is not supported on browser relay. Use --surface node or --surface auto.`);
+  }
   return normalized;
 }
@@ -587,13 +586,10 @@ function resolveBenchRunOptions(runConfig, policy = DEFAULT_CLI_POLICY) {
 function resolveSurfaceForCommand(command, parsed, runConfig, policy = DEFAULT_CLI_POLICY) {
   const fromCli = asStringOrNull(parsed.flags.surface);
   const fromRun = asStringOrNull(runConfig?.surface);
-  const fromPolicy = command === 'bench'
-    ? asStringOrNull(policy?.defaults?.bench?.surface)
-    : null;
-  return parseSurface(fromCli ?? fromRun ?? fromPolicy, command, policy);
+  return parseSurface(fromCli ?? fromRun ?? null, command, policy);
 }
-async function buildRequest(parsed, policy = DEFAULT_CLI_POLICY) {
+export async function buildRequest(parsed, policy = DEFAULT_CLI_POLICY) {
   const command = parsed.command;
   if (!command || !TOOLING_COMMANDS.includes(command)) {
     throw new Error(`Unsupported command "${command || ''}"`);
@@ -612,21 +608,15 @@ async function buildRequest(parsed, policy = DEFAULT_CLI_POLICY) {
   }
   requestInput.command = command;
-  if (command === 'bench' && !asStringOrNull(requestInput.modelId) && !asStringOrNull(requestInput.modelUrl)) {
-    const benchDefaultModelId = asStringOrNull(policy?.defaults?.bench?.modelId);
-    if (benchDefaultModelId) {
-      requestInput.modelId = benchDefaultModelId;
-    }
-  }
   applyRuntimeFlagOverride(requestInput, runtimeOverride);
   const surfaceFromCli = asStringOrNull(parsed.flags.surface) !== null;
+  const surface = resolveSurfaceForCommand(command, parsed, envelope.run, policy);
   return {
     request: normalizeToolingCommandRequest(requestInput),
     runConfig: envelope.run,
-    surface: resolveSurfaceForCommand(command, parsed, envelope.run, policy),
+    surface,
     surfaceFromCli,
     benchRunOptions: resolveBenchRunOptions(envelope.run, policy),
   };
@@ -723,6 +713,32 @@ function isTrainingCommandFlow(request) {
   return request.command === 'bench' && request.workloadType === 'training';
 }
+function resolveErrorSurface(error, fallbackSurface = null) {
+  return (
+    asStringOrNull(fallbackSurface)
+    || asStringOrNull(error?.surface)
+    || asStringOrNull(error?.details?.surface)
+    || null
+  );
+}
+export function createCliToolingErrorEnvelope(error, context = {}) {
+  return createToolingErrorEnvelope(error, {
+    surface: resolveErrorSurface(error, context.surface),
+    request: context.request ?? null,
+  });
+}
+export function finalizeCliCommandResponse(response, request) {
+  if (!isPlainObject(response) || !Object.prototype.hasOwnProperty.call(response, 'request')) {
+    return response;
+  }
+  return {
+    ...response,
+    request,
+  };
+}
 async function runCommandOnSurface(request, surface, runConfig, jsonOutput) {
   if (surface === 'node') {
     const nodeRequest = await resolveNodeModelUrl(request);
@@ -732,7 +748,8 @@ async function runCommandOnSurface(request, surface, runConfig, jsonOutput) {
         console.error(`[surface] node resolved modelUrl=${nodeRequest.modelUrl}`);
       }
     }
-    return runNodeCommand(nodeRequest, buildNodeRunOptions(jsonOutput));
+    const response = await runNodeCommand(nodeRequest, buildNodeRunOptions(jsonOutput));
+    return finalizeCliCommandResponse(response, request);
   }
   const browserOptions = buildBrowserRunOptions(runConfig, jsonOutput, request);
@@ -746,7 +763,8 @@ async function runCommandOnSurface(request, surface, runConfig, jsonOutput) {
     }
   }
-  return runBrowserCommandInNode(browserRequest, browserOptions);
+  const response = await runBrowserCommandInNode(browserRequest, browserOptions);
+  return finalizeCliCommandResponse(response, request);
 }
 async function runWithAutoSurface(request, runConfig, jsonOutput, policy = DEFAULT_CLI_POLICY) {
@@ -763,9 +781,12 @@ async function runWithAutoSurface(request, runConfig, jsonOutput, policy = DEFAU
     }
     if (isTrainingCommandFlow(request)) {
       const downgradeError = new Error(
-        'Training command auto-surface downgrade is blocked. Re-run with --surface node after fixing Node WebGPU support, or explicitly choose --surface browser.'
+        (request.command === 'lora' || request.command === 'distill')
+          ? 'Training command auto-surface downgrade is blocked. Re-run with --surface node after fixing Node WebGPU support.'
+          : 'Training command auto-surface downgrade is blocked. Re-run with --surface node after fixing Node WebGPU support, or explicitly choose --surface browser.'
       );
       downgradeError.code = 'training_surface_downgrade_blocked';
+      downgradeError.surface = 'node';
       downgradeError.command = request.command;
       downgradeError.suite = request.suite;
       downgradeError.workloadType = request.workloadType || null;
@@ -1021,7 +1042,7 @@ async function runManifestSweep(manifest, commandContext, jsonOutput, policy = D
       results.push({
         label,
         response: null,
-        error: createToolingErrorEnvelope(error, {
+        error: createCliToolingErrorEnvelope(error, {
           surface: surface === 'auto' ? null : surface,
           request,
         }),
@@ -1241,6 +1262,9 @@ function printMetricsSummary(result) {
       `prefill=${formatNumber(metrics.prefillTokensPerSec)} ` +
       `decode=${formatNumber(metrics.decodeTokensPerSec)}`
     );
+    if (typeof result.output === 'string' && result.output.length > 0) {
+      console.log(`[output] ${quoteOneLine(result.output)}`);
+    }
     printExecutionContractSummary(result);
     printExecutionV0GraphSummary(metrics.executionV0GraphContractArtifact);
     return;
@@ -1404,7 +1428,7 @@ async function main() {
     printMetricsSummary(response.result);
   } catch (error) {
     if (jsonOutputRequested) {
-      console.log(JSON.stringify(createToolingErrorEnvelope(error, errorContext), null, 2));
+      console.log(JSON.stringify(createCliToolingErrorEnvelope(error, errorContext), null, 2));
       process.exitCode = 1;
       return;
     }