npm - @simulatte/doppler - Versions diffs - 0.1.4 → 0.1.6 - Mend

@simulatte/doppler 0.1.4 → 0.1.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (199)

package/README.md +26 -10
package/package.json +30 -6
package/src/client/doppler-api.browser.d.ts +1 -0
package/src/client/doppler-api.browser.js +288 -0
package/src/client/doppler-api.js +1 -1
package/src/client/doppler-provider/types.js +1 -1
package/src/config/execution-contract-check.d.ts +33 -0
package/src/config/execution-contract-check.js +72 -0
package/src/config/execution-v0-contract-check.d.ts +94 -0
package/src/config/execution-v0-contract-check.js +251 -0
package/src/config/execution-v0-graph-contract-check.d.ts +20 -0
package/src/config/execution-v0-graph-contract-check.js +64 -0
package/src/config/kernel-path-contract-check.d.ts +76 -0
package/src/config/kernel-path-contract-check.js +479 -0
package/src/config/kernel-path-loader.d.ts +16 -0
package/src/config/kernel-path-loader.js +54 -0
package/src/config/kernels/kernel-ref-digests.js +39 -27
package/src/config/kernels/registry.json +598 -2
package/src/config/loader.js +81 -48
package/src/config/merge-contract-check.d.ts +16 -0
package/src/config/merge-contract-check.js +321 -0
package/src/config/merge-helpers.d.ts +58 -0
package/src/config/merge-helpers.js +54 -0
package/src/config/merge.js +21 -6
package/src/config/presets/models/janus-text.json +2 -0
package/src/config/presets/models/qwen3.json +9 -2
package/src/config/presets/models/transformer.json +5 -0
package/src/config/quantization-contract-check.d.ts +12 -0
package/src/config/quantization-contract-check.js +91 -0
package/src/config/required-inference-fields-contract-check.d.ts +24 -0
package/src/config/required-inference-fields-contract-check.js +237 -0
package/src/config/schema/browser-suite-metrics.schema.d.ts +17 -0
package/src/config/schema/browser-suite-metrics.schema.js +46 -0
package/src/config/schema/conversion-report.schema.d.ts +40 -0
package/src/config/schema/conversion-report.schema.js +108 -0
package/src/config/schema/doppler.schema.js +12 -18
package/src/config/schema/index.d.ts +22 -0
package/src/config/schema/index.js +18 -0
package/src/config/schema/inference-defaults.schema.js +3 -0
package/src/config/schema/inference.schema.d.ts +9 -0
package/src/config/schema/kernel-path.schema.d.ts +6 -0
package/src/config/schema/manifest.schema.d.ts +6 -0
package/src/config/schema/manifest.schema.js +3 -0
package/src/converter/core.d.ts +10 -0
package/src/converter/core.js +27 -2
package/src/converter/parsers/diffusion.js +63 -3
package/src/converter/rope-config.js +42 -0
package/src/gpu/device.js +58 -0
package/src/gpu/kernels/attention.js +98 -0
package/src/gpu/kernels/bias_add.wgsl +8 -6
package/src/gpu/kernels/bias_add_f16.wgsl +8 -5
package/src/gpu/kernels/conv2d.js +1 -1
package/src/gpu/kernels/conv2d.wgsl +7 -8
package/src/gpu/kernels/conv2d_f16.wgsl +7 -8
package/src/gpu/kernels/depthwise_conv2d.d.ts +29 -0
package/src/gpu/kernels/depthwise_conv2d.js +99 -0
package/src/gpu/kernels/depthwise_conv2d.wgsl +55 -0
package/src/gpu/kernels/depthwise_conv2d_f16.wgsl +59 -0
package/src/gpu/kernels/grouped_pointwise_conv2d.d.ts +27 -0
package/src/gpu/kernels/grouped_pointwise_conv2d.js +93 -0
package/src/gpu/kernels/grouped_pointwise_conv2d.wgsl +44 -0
package/src/gpu/kernels/grouped_pointwise_conv2d_f16.wgsl +48 -0
package/src/gpu/kernels/index.d.ts +30 -0
package/src/gpu/kernels/index.js +25 -0
package/src/gpu/kernels/matmul.js +25 -0
package/src/gpu/kernels/pixel_shuffle.js +1 -1
package/src/gpu/kernels/pixel_shuffle.wgsl +4 -5
package/src/gpu/kernels/pixel_shuffle_f16.wgsl +4 -5
package/src/gpu/kernels/relu.d.ts +18 -0
package/src/gpu/kernels/relu.js +58 -0
package/src/gpu/kernels/relu.wgsl +22 -0
package/src/gpu/kernels/relu_f16.wgsl +24 -0
package/src/gpu/kernels/repeat_channels.d.ts +21 -0
package/src/gpu/kernels/repeat_channels.js +60 -0
package/src/gpu/kernels/repeat_channels.wgsl +28 -0
package/src/gpu/kernels/repeat_channels_f16.wgsl +30 -0
package/src/gpu/kernels/residual.js +44 -8
package/src/gpu/kernels/residual.wgsl +6 -3
package/src/gpu/kernels/residual_f16.wgsl +2 -1
package/src/gpu/kernels/residual_f16_vec4.wgsl +2 -1
package/src/gpu/kernels/residual_vec4.wgsl +2 -1
package/src/gpu/kernels/rmsnorm.js +58 -6
package/src/gpu/kernels/rmsnorm.wgsl +14 -6
package/src/gpu/kernels/rmsnorm_f16.wgsl +10 -2
package/src/gpu/kernels/rope.d.ts +2 -0
package/src/gpu/kernels/rope.js +11 -1
package/src/gpu/kernels/rope.wgsl +56 -40
package/src/gpu/kernels/sana_linear_attention.d.ts +27 -0
package/src/gpu/kernels/sana_linear_attention.js +121 -0
package/src/gpu/kernels/sana_linear_attention_apply.wgsl +43 -0
package/src/gpu/kernels/sana_linear_attention_apply_f16.wgsl +46 -0
package/src/gpu/kernels/sana_linear_attention_summary.wgsl +51 -0
package/src/gpu/kernels/sana_linear_attention_summary_f16.wgsl +53 -0
package/src/gpu/kernels/silu.d.ts +1 -0
package/src/gpu/kernels/silu.js +32 -14
package/src/gpu/kernels/silu.wgsl +19 -9
package/src/gpu/kernels/silu_f16.wgsl +19 -9
package/src/gpu/kernels/transpose.js +15 -2
package/src/gpu/kernels/transpose.wgsl +5 -6
package/src/gpu/kernels/upsample2d.js +2 -1
package/src/gpu/kernels/upsample2d.wgsl +6 -9
package/src/gpu/kernels/upsample2d_f16.wgsl +6 -9
package/src/gpu/kernels/utils.js +16 -1
package/src/index-browser.d.ts +1 -1
package/src/index-browser.js +2 -2
package/src/index.js +1 -1
package/src/inference/browser-harness.js +109 -23
package/src/inference/pipelines/diffusion/init.js +14 -0
package/src/inference/pipelines/diffusion/pipeline.js +215 -77
package/src/inference/pipelines/diffusion/sana-transformer.d.ts +53 -0
package/src/inference/pipelines/diffusion/sana-transformer.js +738 -0
package/src/inference/pipelines/diffusion/scheduler.d.ts +17 -1
package/src/inference/pipelines/diffusion/scheduler.js +91 -3
package/src/inference/pipelines/diffusion/text-encoder-gpu.d.ts +11 -4
package/src/inference/pipelines/diffusion/text-encoder-gpu.js +282 -0
package/src/inference/pipelines/diffusion/text-encoder.js +18 -1
package/src/inference/pipelines/diffusion/types.d.ts +4 -0
package/src/inference/pipelines/diffusion/vae.js +782 -78
package/src/inference/pipelines/text/attention/record.js +11 -2
package/src/inference/pipelines/text/attention/run.js +11 -2
package/src/inference/pipelines/text/chat-format.js +25 -1
package/src/inference/pipelines/text/config.d.ts +9 -0
package/src/inference/pipelines/text/config.js +69 -2
package/src/inference/pipelines/text/execution-plan.js +23 -31
package/src/inference/pipelines/text/execution-v0.js +43 -95
package/src/inference/pipelines/text/ffn/standard.js +3 -0
package/src/inference/pipelines/text/init.d.ts +4 -0
package/src/inference/pipelines/text/init.js +56 -9
package/src/inference/pipelines/text/layer.js +11 -0
package/src/inference/pipelines/text.js +4 -0
package/src/inference/tokenizers/bundled.js +156 -33
package/src/rules/execution-rules-contract-check.d.ts +17 -0
package/src/rules/execution-rules-contract-check.js +245 -0
package/src/rules/kernels/depthwise-conv2d.rules.json +6 -0
package/src/rules/kernels/grouped-pointwise-conv2d.rules.json +6 -0
package/src/rules/kernels/relu.rules.json +6 -0
package/src/rules/kernels/repeat-channels.rules.json +6 -0
package/src/rules/kernels/sana-linear-attention.rules.json +6 -0
package/src/rules/layer-pattern-contract-check.d.ts +17 -0
package/src/rules/layer-pattern-contract-check.js +231 -0
package/src/rules/rule-registry.d.ts +28 -0
package/src/rules/rule-registry.js +38 -0
package/src/rules/tooling/command-runtime.rules.json +18 -0
package/src/tooling/command-api.d.ts +27 -1
package/src/tooling/command-api.js +142 -3
package/src/tooling/conversion-config-materializer.d.ts +24 -0
package/src/tooling/conversion-config-materializer.js +99 -0
package/src/tooling/lean-execution-contract-runner.d.ts +43 -0
package/src/tooling/lean-execution-contract-runner.js +158 -0
package/src/tooling/node-browser-command-runner.d.ts +4 -0
package/src/tooling/node-browser-command-runner.js +58 -3
package/src/tooling/node-command-runner.js +15 -0
package/src/tooling/node-convert.d.ts +10 -0
package/src/tooling/node-converter.js +59 -0
package/src/tooling/node-webgpu.js +11 -89
package/src/training/checkpoint-watch.d.ts +7 -0
package/src/training/checkpoint-watch.js +106 -0
package/src/training/checkpoint.d.ts +6 -1
package/src/training/checkpoint.js +12 -2
package/src/training/distillation/artifacts.d.ts +71 -0
package/src/training/distillation/artifacts.js +132 -0
package/src/training/distillation/checkpoint-watch.d.ts +10 -0
package/src/training/distillation/checkpoint-watch.js +57 -0
package/src/training/distillation/dataset.d.ts +59 -0
package/src/training/distillation/dataset.js +337 -0
package/src/training/distillation/eval.d.ts +34 -0
package/src/training/distillation/eval.js +310 -0
package/src/training/distillation/index.d.ts +29 -0
package/src/training/distillation/index.js +29 -0
package/src/training/distillation/runtime.d.ts +20 -0
package/src/training/distillation/runtime.js +121 -0
package/src/training/distillation/scoreboard.d.ts +6 -0
package/src/training/distillation/scoreboard.js +8 -0
package/src/training/distillation/stage-a.d.ts +45 -0
package/src/training/distillation/stage-a.js +338 -0
package/src/training/distillation/stage-b.d.ts +24 -0
package/src/training/distillation/stage-b.js +20 -0
package/src/training/index.d.ts +10 -0
package/src/training/index.js +10 -0
package/src/training/lora-pipeline.d.ts +40 -0
package/src/training/lora-pipeline.js +796 -0
package/src/training/operator-artifacts.d.ts +62 -0
package/src/training/operator-artifacts.js +140 -0
package/src/training/operator-command.d.ts +5 -0
package/src/training/operator-command.js +453 -0
package/src/training/operator-eval.d.ts +48 -0
package/src/training/operator-eval.js +230 -0
package/src/training/operator-scoreboard.d.ts +5 -0
package/src/training/operator-scoreboard.js +44 -0
package/src/training/runner.d.ts +52 -0
package/src/training/runner.js +29 -4
package/src/training/suite.d.ts +112 -0
package/src/training/suite.js +9 -9
package/src/training/workloads.d.ts +164 -0
package/src/training/workloads.js +539 -0
package/src/version.d.ts +2 -0
package/src/version.js +2 -0
package/tools/convert-safetensors-node.js +47 -0
package/tools/doppler-cli.js +252 -41

package/README.md CHANGED Viewed

@@ -22,7 +22,7 @@ for await (const token of model.generate('Hello, world')) {
 }
 ```
-Registry IDs resolve to hosted RDRR artifacts from `Clocksmith/rdrr` by default. Tokens stream from a native `AsyncGenerator`. See [more examples](#more-examples) below or the full [API contract](docs/doppler-api-contract.md).
+Registry IDs resolve to hosted RDRR artifacts from `Clocksmith/rdrr` by default. Tokens stream from a native `AsyncGenerator`. See [more examples](#more-examples) below or the canonical [Root API guide](https://github.com/clocksmith/doppler/blob/main/docs/api/root.md).
 ## Why Doppler
@@ -36,11 +36,11 @@ Registry IDs resolve to hosted RDRR artifacts from `Clocksmith/rdrr` by default.
 ## Evidence
-![Phase-latency comparison on one workload across models](benchmarks/vendors/results/compare_1b_multi-workload_favorable_phases.svg)
+![Phase-latency comparison on one workload across models](https://raw.githubusercontent.com/clocksmith/doppler/main/benchmarks/vendors/results/compare_1b_multi-workload_favorable_phases.svg)
 Snapshot artifacts:
-- [g3-1b-p064-d064-t0-k1.compare.json](benchmarks/vendors/fixtures/g3-1b-p064-d064-t0-k1.compare.json)
-- [lfm2-5-1-2b-p064-d064-t0-k1.compare.json](benchmarks/vendors/fixtures/lfm2-5-1-2b-p064-d064-t0-k1.compare.json)
+- [g3-1b-p064-d064-t0-k1.compare.json](https://github.com/clocksmith/doppler/blob/main/benchmarks/vendors/fixtures/g3-1b-p064-d064-t0-k1.compare.json)
+- [lfm2-5-1-2b-p064-d064-t0-k1.compare.json](https://github.com/clocksmith/doppler/blob/main/benchmarks/vendors/fixtures/lfm2-5-1-2b-p064-d064-t0-k1.compare.json)
 ## Under the hood
@@ -67,7 +67,7 @@ const reply = await model.chatText([
 ]);
 // LoRA hot-swap
-await model.loadLoRA('oneshift-twoshift-redshift-blueshift');
+await model.loadLoRA('https://example.com/adapters/oneshift-twoshift-redshift-blueshift/manifest.json');
 // Convenience shorthand (caches model automatically)
 for await (const token of doppler('Hello', { model: 'gemma3-270m' })) {
@@ -77,14 +77,30 @@ for await (const token of doppler('Hello', { model: 'gemma3-270m' })) {
 ## Documentation
-- Docs index (canonical navigation): [docs/INDEX.md](docs/INDEX.md)
-- First-run workflow: [docs/getting-started.md](docs/getting-started.md)
-- Runtime config contract: [docs/config.md](docs/config.md)
-- Architecture: [docs/architecture.md](docs/architecture.md)
+- Docs index (canonical navigation): [docs/INDEX.md](https://github.com/clocksmith/doppler/blob/main/docs/INDEX.md)
+- First-run workflow: [docs/getting-started.md](https://github.com/clocksmith/doppler/blob/main/docs/getting-started.md)
+- Runtime config contract: [docs/config.md](https://github.com/clocksmith/doppler/blob/main/docs/config.md)
+- Architecture: [docs/architecture.md](https://github.com/clocksmith/doppler/blob/main/docs/architecture.md)
+- Generated model support table: [docs/model-support-matrix.md](https://github.com/clocksmith/doppler/blob/main/docs/model-support-matrix.md)
+## Current model support
+Verified right now:
+- `gemma-3-270m-it-wq4k-ef16-hf16`
+- `gemma-3-1b-it-wq4k-ef16-hf16`
+- `google-embeddinggemma-300m-wq4k-ef16`
+- `translategemma-4b-it-wq4k-ef16-hf16`
+Known failing right now:
+- `qwen-3-5-0-8b-wq4k-ef16-hf16-f16`
+- `qwen-3-5-2b-wq4k-ef16-hf16-f16`
+For the generated status table, including `loads but unverified` and `everything else`, see [docs/model-support-matrix.md](https://github.com/clocksmith/doppler/blob/main/docs/model-support-matrix.md).
 ## Environment requirements
-- WebGPU-capable browser runtime is required.
+- WebGPU is required.
+- Supported runtimes: WebGPU-capable browsers, or Node with a WebGPU provider.
 - Chrome / Edge 113+ supported.
 - Firefox support varies (typically behind a flag).
 - Safari support is evolving.

package/package.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "@simulatte/doppler",
-  "version": "0.1.4",
+  "version": "0.1.6",
   "description": "Browser-native WebGPU inference engine for local intent and inference loops",
   "main": "src/index.js",
   "types": "src/index.d.ts",
   "type": "module",
   "bin": {
-    "doppler": "./tools/doppler-cli.js"
+    "doppler": "tools/doppler-cli.js"
   },
   "scripts": {
     "cli": "node tools/doppler-cli.js",
@@ -16,6 +16,16 @@
     "bench": "node tools/doppler-cli.js bench",
     "lean:check": "./lean/check.sh",
     "lean:execution-contract": "node tools/lean-execution-contract.js",
+    "lean:execution-contract:sweep": "node tools/lean-execution-contract-sweep.js",
+    "lean:execution-contract:configs": "node tools/lean-execution-contract-config-sweep.js",
+    "ci:lean:execution-contract": "node tools/lean-execution-contract-sweep.js --root models",
+    "ci:lean:execution-contract:configs": "node tools/lean-execution-contract-config-sweep.js --config-root tools/configs/conversion --manifest-root models --require-manifest-match",
+    "contracts:check": "node tools/check-contract-artifacts.js",
+    "contracts:summary": "node tools/check-contract-artifacts.js --json",
+    "contracts:check:lean": "node tools/check-contract-artifacts.js --with-lean",
+    "contracts:summary:lean": "node tools/check-contract-artifacts.js --json --with-lean",
+    "ci:contracts:check": "node tools/check-contract-artifacts.js --with-lean --lean-require-manifest-match",
+    "reports:convert:summary": "node tools/summarize-conversion-reports.js",
     "bench:chart": "node ./benchmarks/vendors/compare-chart.js",
     "bench:chart:readme": "node ./benchmarks/vendors/compare-chart.js --preset readme-evidence",
     "bench:architecture:chart": "node ./benchmarks/vendors/generate-architecture-overview-svg.js",
@@ -41,6 +51,8 @@
     "agents:freshness:strict": "node tools/verify-agent-freshness.js --strict",
     "conflicts:check": "node tools/check-merge-markers.js",
     "imports:check:browser": "node tools/check-browser-import-graph.js",
+    "api:docs:sync": "node tools/sync-api-docs.js",
+    "api:docs:check": "node tools/sync-api-docs.js --check",
     "verify:model": "node tools/doppler-cli.js verify",
     "onboarding:check": "node tools/onboarding-tooling.js check",
     "onboarding:check:strict": "node tools/onboarding-tooling.js check --strict",
@@ -53,8 +65,11 @@
     "verify": "node tools/run-registry-verify.js",
     "registry:sync:scripts": "node tools/sync-registry-scripts.js",
     "registry:sync:scripts:check": "node tools/sync-registry-scripts.js --check",
+    "registry:hf:check": "node tools/check-hf-registry.js",
+    "registry:publish:hf": "node tools/publish-hf-registry-model.js",
     "support:matrix:sync": "node tools/sync-model-support-matrix.js",
     "support:matrix:check": "node tools/sync-model-support-matrix.js --check",
+    "ci:catalog:check": "npm run registry:sync:scripts:check && npm run support:matrix:check && npm run registry:hf:check",
     "external:rdrr:index": "node tools/sync-external-rdrr-index.js",
     "external:rdrr:index:check": "node tools/sync-external-rdrr-index.js --check",
     "verify:embeddinggemma-300m": "node tools/run-registry-verify.js embeddinggemma-300m",
@@ -65,6 +80,7 @@
     "verify:google-embeddinggemma-300m": "node tools/run-registry-verify.js google-embeddinggemma-300m",
     "verify:google-embeddinggemma-300m-wq4k-ef16": "node tools/run-registry-verify.js google-embeddinggemma-300m-wq4k-ef16",
     "verify:google-gemma-3-270m-it": "node tools/run-registry-verify.js google-gemma-3-270m-it",
+    "verify:google-translategemma-4b-it": "node tools/run-registry-verify.js google-translategemma-4b-it",
     "verify:qwen-3-5-0-8b": "node tools/run-registry-verify.js qwen-3-5-0-8b",
     "verify:qwen-3-5-0-8b-wq4k-ef16-hf16-f16": "node tools/run-registry-verify.js qwen-3-5-0-8b-wq4k-ef16-hf16-f16",
     "verify:qwen-3-5-2b": "node tools/run-registry-verify.js qwen-3-5-2b",
@@ -72,7 +88,10 @@
     "verify:qwen-qwen3.5-0.8b": "node tools/run-registry-verify.js qwen-qwen3.5-0.8b",
     "verify:qwen-qwen3.5-2b": "node tools/run-registry-verify.js qwen-qwen3.5-2b",
     "verify:qwen3-0.8b": "node tools/run-registry-verify.js qwen3-0.8b",
-    "verify:qwen3-2b": "node tools/run-registry-verify.js qwen3-2b"
+    "verify:qwen3-2b": "node tools/run-registry-verify.js qwen3-2b",
+    "verify:translategemma": "node tools/run-registry-verify.js translategemma",
+    "verify:translategemma-4b": "node tools/run-registry-verify.js translategemma-4b",
+    "verify:translategemma-4b-it-wq4k-ef16-hf16": "node tools/run-registry-verify.js translategemma-4b-it-wq4k-ef16-hf16"
   },
   "exports": {
     ".": {
@@ -102,12 +121,11 @@
     "./energy": {
       "types": "./src/energy/index.d.ts",
       "import": "./src/energy/index.js"
-    },
-    "./*": "./src/*"
+    }
   },
   "repository": {
     "type": "git",
-    "url": "https://github.com/clocksmith/doppler.git"
+    "url": "git+https://github.com/clocksmith/doppler.git"
   },
   "homepage": "https://github.com/clocksmith/doppler",
   "keywords": [
@@ -124,6 +142,9 @@
     "url": "https://github.com/clocksmith/doppler/issues"
   },
   "license": "Apache-2.0",
+  "publishConfig": {
+    "access": "public"
+  },
   "files": [
     "src",
     "src/gpu/kernels/*.wgsl",
@@ -140,5 +161,8 @@
     "jest": "^30.2.0",
     "onnxruntime-web": "^1.24.1",
     "playwright": "^1.58.2"
+  },
+  "optionalDependencies": {
+    "@simulatte/webgpu": "0.1.x"
   }
 }

package/src/client/doppler-api.browser.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export * from './doppler-api.d.ts';

package/src/client/doppler-api.browser.js ADDED Viewed

@@ -0,0 +1,288 @@
+import { loadLoRAFromManifest, loadLoRAFromUrl } from '../adapters/lora-loader.js';
+import { log } from '../debug/index.js';
+import { getManifestUrl, parseManifest } from '../formats/rdrr/index.js';
+import { createPipeline } from '../generation/index.js';
+import { getKernelCapabilities } from '../gpu/device.js';
+import { formatChatMessages } from '../inference/pipelines/text/chat-format.js';
+import { buildQuickstartModelBaseUrl, listQuickstartModels, resolveQuickstartModel } from './doppler-registry.js';
+const convenienceModelCache = new Map();
+const inFlightLoadCache = new Map();
+function emitLoadProgress(callback, phase, percent, message) {
+  if (typeof callback !== 'function') return;
+  callback({ phase, percent, message });
+}
+async function ensureWebGPUAvailable() {
+  if (typeof globalThis.navigator !== 'undefined' && globalThis.navigator?.gpu) {
+    return;
+  }
+  throw new Error('WebGPU is unavailable. Run in a WebGPU-capable browser.');
+}
+export function createDefaultNodeLoadProgressLogger() {
+  return (event) => {
+    const message = typeof event?.message === 'string' ? event.message.trim() : '';
+    if (!message) return;
+    log.info('doppler', message);
+  };
+}
+export function resolveLoadProgressHandlers(options = {}) {
+  const onProgress = typeof options?.onProgress === 'function' ? options.onProgress : null;
+  if (onProgress) {
+    return {
+      userProgress: onProgress,
+      pipelineProgress: onProgress,
+    };
+  }
+  return {
+    userProgress: null,
+    pipelineProgress: null,
+  };
+}
+async function fetchManifestFromBaseUrl(baseUrl) {
+  const response = await fetch(getManifestUrl(baseUrl));
+  if (!response.ok) {
+    throw new Error(`Failed to fetch manifest from ${baseUrl}: ${response.status}`);
+  }
+  return parseManifest(await response.text());
+}
+async function resolveModelSource(model) {
+  if (typeof model === 'string') {
+    const entry = await resolveQuickstartModel(model);
+    return {
+      modelId: entry.modelId,
+      baseUrl: buildQuickstartModelBaseUrl(entry),
+      manifest: null,
+    };
+  }
+  if (model && typeof model === 'object' && typeof model.url === 'string' && model.url.trim().length > 0) {
+    return {
+      modelId: model.url.trim(),
+      baseUrl: model.url.trim(),
+      manifest: null,
+    };
+  }
+  if (model && typeof model === 'object' && model.manifest && typeof model.manifest === 'object') {
+    const manifest = model.manifest;
+    const modelId = typeof manifest.modelId === 'string' && manifest.modelId.length > 0
+      ? manifest.modelId
+      : 'manifest';
+    return {
+      modelId,
+      baseUrl: typeof model.baseUrl === 'string' && model.baseUrl.length > 0 ? model.baseUrl : null,
+      manifest,
+    };
+  }
+  throw new Error('doppler.load expects a quickstart registry id, { url }, or { manifest, baseUrl? }.');
+}
+function countTokens(pipeline, text) {
+  if (!text || typeof text !== 'string') return 0;
+  try {
+    return pipeline?.tokenizer?.encode(text)?.length ?? 0;
+  } catch {
+    return 0;
+  }
+}
+function resolveChatPromptForUsage(pipeline, messages) {
+  const templateType = pipeline?.manifest?.inference?.chatTemplate?.enabled === false
+    ? null
+    : (pipeline?.manifest?.inference?.chatTemplate?.type ?? null);
+  try {
+    return formatChatMessages(messages, templateType);
+  } catch {
+    return messages.map((message) => String(message?.content ?? '')).join('\n');
+  }
+}
+async function collectText(iterable) {
+  let output = '';
+  for await (const token of iterable) {
+    output += token;
+  }
+  return output;
+}
+function createModelHandle(pipeline, resolved) {
+  return {
+    generate(prompt, options = {}) {
+      return pipeline.generate(prompt, options);
+    },
+    async generateText(prompt, options = {}) {
+      return collectText(pipeline.generate(prompt, options));
+    },
+    chat(messages, options = {}) {
+      return pipeline.generate(messages, options);
+    },
+    async chatText(messages, options = {}) {
+      const content = await collectText(pipeline.generate(messages, options));
+      const promptText = resolveChatPromptForUsage(pipeline, messages);
+      const promptTokens = countTokens(pipeline, promptText);
+      const completionTokens = countTokens(pipeline, content);
+      return {
+        content,
+        usage: {
+          promptTokens,
+          completionTokens,
+          totalTokens: promptTokens + completionTokens,
+        },
+      };
+    },
+    async loadLoRA(adapter) {
+      const lora = typeof adapter === 'string'
+        ? await loadLoRAFromUrl(adapter)
+        : await loadLoRAFromManifest(adapter);
+      pipeline.setLoRAAdapter(lora);
+    },
+    async unloadLoRA() {
+      pipeline.setLoRAAdapter(null);
+    },
+    async unload() {
+      await pipeline.unload();
+    },
+    get activeLoRA() {
+      return pipeline.getActiveLoRA()?.name ?? null;
+    },
+    get loaded() {
+      return pipeline.isLoaded === true;
+    },
+    get modelId() {
+      return resolved.modelId;
+    },
+    get manifest() {
+      return pipeline.manifest;
+    },
+    get deviceInfo() {
+      return getKernelCapabilities()?.adapterInfo ?? null;
+    },
+    advanced: {
+      prefillKV(prompt, options = {}) {
+        return pipeline.prefillKVOnly(prompt, options);
+      },
+      generateWithPrefixKV(prefix, prompt, options = {}) {
+        return pipeline.generateWithPrefixKV(prefix, prompt, options);
+      },
+    },
+  };
+}
+export async function load(model, options = {}) {
+  const { userProgress, pipelineProgress } = resolveLoadProgressHandlers(options);
+  emitLoadProgress(userProgress, 'resolve', 5, 'Resolving model');
+  const resolved = await resolveModelSource(model);
+  await ensureWebGPUAvailable();
+  emitLoadProgress(userProgress, 'manifest', 15, 'Fetching manifest');
+  const manifest = resolved.manifest ?? await fetchManifestFromBaseUrl(resolved.baseUrl);
+  emitLoadProgress(userProgress, 'load', 25, 'Loading weights');
+  const pipeline = await createPipeline(manifest, {
+    baseUrl: resolved.baseUrl ?? undefined,
+    runtimeConfig: options.runtimeConfig,
+    onProgress: pipelineProgress
+      ? (progress) => emitLoadProgress(
+        pipelineProgress,
+        'load',
+        Math.max(25, Math.min(99, Math.round(progress.percent))),
+        progress.message || 'Loading weights'
+      )
+      : undefined,
+  });
+  emitLoadProgress(userProgress, 'ready', 100, 'Model ready');
+  return createModelHandle(pipeline, resolved);
+}
+async function getCachedModel(model, options = {}) {
+  const resolved = await resolveModelSource(model);
+  const cacheKey = resolved.modelId;
+  const cached = convenienceModelCache.get(cacheKey);
+  if (cached?.loaded) {
+    return cached;
+  }
+  if (cached && !cached.loaded) {
+    convenienceModelCache.delete(cacheKey);
+  }
+  if (!inFlightLoadCache.has(cacheKey)) {
+    inFlightLoadCache.set(cacheKey, load(model, options).then((instance) => {
+      convenienceModelCache.set(cacheKey, instance);
+      inFlightLoadCache.delete(cacheKey);
+      return instance;
+    }).catch((error) => {
+      inFlightLoadCache.delete(cacheKey);
+      throw error;
+    }));
+  }
+  return inFlightLoadCache.get(cacheKey);
+}
+async function* dopplerGenerate(prompt, options = {}) {
+  if (!options || typeof options !== 'object' || options.model == null) {
+    throw new Error('doppler() requires options.model.');
+  }
+  if (options.runtimeConfig !== undefined || options.runtimePreset !== undefined) {
+    throw new Error('doppler() does not accept load-affecting options. Use doppler.load(model, options) instead.');
+  }
+  const model = await getCachedModel(options.model, { onProgress: options.onProgress });
+  yield* model.generate(prompt, options);
+}
+export function doppler(prompt, options) {
+  return dopplerGenerate(prompt, options);
+}
+doppler.load = load;
+doppler.text = async function text(prompt, options = {}) {
+  if (!options || typeof options !== 'object' || options.model == null) {
+    throw new Error('doppler.text() requires options.model.');
+  }
+  const model = await getCachedModel(options.model, { onProgress: options.onProgress });
+  return model.generateText(prompt, options);
+};
+doppler.chat = function chat(messages, options = {}) {
+  if (!options || typeof options !== 'object' || options.model == null) {
+    throw new Error('doppler.chat() requires options.model.');
+  }
+  return (async function* run() {
+    const model = await getCachedModel(options.model, { onProgress: options.onProgress });
+    yield* model.chat(messages, options);
+  }());
+};
+doppler.chatText = async function chatText(messages, options = {}) {
+  if (!options || typeof options !== 'object' || options.model == null) {
+    throw new Error('doppler.chatText() requires options.model.');
+  }
+  const model = await getCachedModel(options.model, { onProgress: options.onProgress });
+  return model.chatText(messages, options);
+};
+doppler.evict = async function evict(model) {
+  const resolved = await resolveModelSource(model);
+  const cacheKey = resolved.modelId;
+  const cached = convenienceModelCache.get(cacheKey);
+  if (!cached) return false;
+  await cached.unload();
+  convenienceModelCache.delete(cacheKey);
+  return true;
+};
+doppler.evictAll = async function evictAll() {
+  const cachedModels = Array.from(convenienceModelCache.values());
+  convenienceModelCache.clear();
+  await Promise.allSettled(cachedModels.map((model) => model.unload()));
+};
+doppler.listModels = async function listModels() {
+  const models = await listQuickstartModels();
+  return models.map((entry) => entry.aliases[0] || entry.modelId);
+};

package/src/client/doppler-api.js CHANGED Viewed

@@ -4,7 +4,6 @@ import { getManifestUrl, parseManifest } from '../formats/rdrr/index.js';
 import { createPipeline } from '../generation/index.js';
 import { getKernelCapabilities } from '../gpu/device.js';
 import { formatChatMessages } from '../inference/pipelines/text/chat-format.js';
-import { bootstrapNodeWebGPU } from '../tooling/node-webgpu.js';
 import { buildQuickstartModelBaseUrl, listQuickstartModels, resolveQuickstartModel } from './doppler-registry.js';
 const convenienceModelCache = new Map();
@@ -21,6 +20,7 @@ async function ensureWebGPUAvailable() {
     return;
   }
   if (isNodeRuntime()) {
+    const { bootstrapNodeWebGPU } = await import('../tooling/node-webgpu.js');
     const result = await bootstrapNodeWebGPU();
     if (result.ok && globalThis.navigator?.gpu) {
       return;

package/src/client/doppler-provider/types.js CHANGED Viewed

@@ -1,4 +1,4 @@
-export const DOPPLER_PROVIDER_VERSION = '0.1.0';
+export { DOPPLER_PROVIDER_VERSION } from '../../version.js';
 export const DopplerCapabilities = {
   available: false,

package/src/config/execution-contract-check.d.ts CHANGED Viewed

@@ -1,3 +1,10 @@
+import type {
+  ExecutionV0ContractArtifact,
+} from './execution-v0-contract-check.js';
+import type {
+  ExecutionV0GraphContractArtifact,
+} from './execution-v0-graph-contract-check.js';
 export interface ExecutionContractStepFacts {
   id: string;
   phase: 'prefill' | 'decode' | 'both';
@@ -34,6 +41,28 @@ export interface ManifestExecutionContractValidationResult extends ExecutionCont
   facts: ExecutionContractFacts;
 }
+export interface ExecutionContractArtifact {
+  schemaVersion: 1;
+  source: 'doppler';
+  ok: boolean;
+  checks: ExecutionContractCheckResult[];
+  errors: string[];
+  session: ExecutionContractSessionFacts | null;
+  steps: {
+    total: number;
+    attention: number;
+    attentionPhases: {
+      prefill: number;
+      decode: number;
+      both: number;
+    };
+  } | null;
+  executionV0?: {
+    kernelProfiles: ExecutionV0ContractArtifact | null;
+    graph: ExecutionV0GraphContractArtifact | null;
+  };
+}
 export declare function sanitizeLeanModuleName(value: unknown): string;
 export declare function extractExecutionContractFacts(
@@ -47,3 +76,7 @@ export declare function validateExecutionContractFacts(
 export declare function validateManifestExecutionContract(
   manifest: Record<string, unknown>
 ): ManifestExecutionContractValidationResult;
+export declare function buildExecutionContractArtifact(
+  manifest: Record<string, unknown>
+): ExecutionContractArtifact | null;

package/src/config/execution-contract-check.js CHANGED Viewed

@@ -1,4 +1,7 @@
 import { DEFAULT_BATCHING_DEFAULTS, DEFAULT_GENERATION_CONFIG } from './schema/inference-defaults.schema.js';
+import { buildExecutionV0ContractArtifact } from './execution-v0-contract-check.js';
+import { buildExecutionV0GraphContractArtifact } from './execution-v0-graph-contract-check.js';
+import { EXECUTION_V0_SCHEMA_ID } from './schema/execution-v0.schema.js';
 import { DEFAULT_KVCACHE_CONFIG } from './schema/kvcache.schema.js';
 const KV_LAYOUTS = new Set(['contiguous', 'paged', 'tiered', 'bdpa']);
@@ -243,3 +246,72 @@ export function validateManifestExecutionContract(manifest) {
     facts,
   };
 }
+export function buildExecutionContractArtifact(manifest) {
+  if (!manifest || typeof manifest !== 'object') {
+    return null;
+  }
+  if (manifest.modelType === 'diffusion' || manifest.modelType === 'energy') {
+    return null;
+  }
+  if (!manifest.architecture || !manifest.inference || typeof manifest.inference !== 'object') {
+    return null;
+  }
+  try {
+    const evaluation = validateManifestExecutionContract(manifest);
+    const attentionPhaseCounts = { prefill: 0, decode: 0, both: 0 };
+    for (const step of evaluation.facts.steps) {
+      if (step.opClass !== 'attention') continue;
+      if (Object.prototype.hasOwnProperty.call(attentionPhaseCounts, step.phase)) {
+        attentionPhaseCounts[step.phase] += 1;
+      }
+    }
+    const executionV0 =
+      manifest?.inference?.schema === EXECUTION_V0_SCHEMA_ID
+        ? {
+            kernelProfiles: buildExecutionV0ContractArtifact(manifest.inference, {
+              modelId: evaluation.facts.modelId,
+            }),
+            graph: buildExecutionV0GraphContractArtifact({
+              modelId: evaluation.facts.modelId,
+              numLayers: manifest?.architecture?.numLayers,
+              manifestInference: manifest.inference,
+            }),
+          }
+        : null;
+    const nestedChecks = [];
+    const nestedErrors = [];
+    if (executionV0?.kernelProfiles) {
+      nestedChecks.push(...executionV0.kernelProfiles.checks);
+      nestedErrors.push(...executionV0.kernelProfiles.errors);
+    }
+    if (executionV0?.graph) {
+      nestedChecks.push(...executionV0.graph.checks);
+      nestedErrors.push(...executionV0.graph.errors);
+    }
+    return {
+      schemaVersion: 1,
+      source: 'doppler',
+      ok: evaluation.ok && nestedErrors.length === 0,
+      checks: [...evaluation.checks, ...nestedChecks],
+      errors: [...evaluation.errors, ...nestedErrors],
+      session: evaluation.facts.session,
+      steps: {
+        total: evaluation.facts.steps.length,
+        attention: attentionPhaseCounts.prefill + attentionPhaseCounts.decode + attentionPhaseCounts.both,
+        attentionPhases: attentionPhaseCounts,
+      },
+      ...(executionV0 ? { executionV0 } : {}),
+    };
+  } catch (error) {
+    return {
+      schemaVersion: 1,
+      source: 'doppler',
+      ok: false,
+      checks: [],
+      errors: [error instanceof Error ? error.message : String(error)],
+      session: null,
+      steps: null,
+    };
+  }
+}