npm - @simulatte/doppler - Versions diffs - 0.1.8 → 0.1.9 - Mend

@simulatte/doppler 0.1.8 → 0.1.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (116)

package/CHANGELOG.md +14 -1
package/README.md +25 -6
package/package.json +5 -3
package/src/client/doppler-api.browser.js +6 -0
package/src/client/doppler-api.d.ts +3 -0
package/src/client/doppler-api.js +11 -2
package/src/client/doppler-registry.js +3 -5
package/src/client/doppler-registry.json +16 -0
package/src/config/kernels/kernel-ref-digests.js +23 -21
package/src/config/kernels/moe/mixtral.paths.json +46 -0
package/src/config/loader.js +6 -0
package/src/config/platforms/loader.js +3 -1
package/src/config/presets/kernel-paths/gemma3-q4k-dequant-f32a-nosubgroups.json +16 -16
package/src/config/presets/kernel-paths/gemma3-q4k-dequant-f32a-online.json +8 -8
package/src/config/presets/kernel-paths/gemma3-q4k-dequant-f32a-small-attn.json +61 -0
package/src/config/presets/kernel-paths/registry.json +7 -0
package/src/config/presets/models/gemma3.json +2 -1
package/src/config/presets/models/gemma4.json +61 -0
package/src/config/presets/models/granite-docling.json +70 -0
package/src/config/presets/models/lfm2.json +6 -1
package/src/config/presets/models/qwen3_vl.json +40 -0
package/src/config/presets/runtime/experiments/bench/gemma3-bench-q4k.json +2 -1
package/src/config/presets/runtime/experiments/verify/lfm2-verify.json +46 -0
package/src/config/presets/runtime/experiments/verify/translategemma-verify.json +39 -0
package/src/config/presets/runtime/modes/trace-layers.json +1 -0
package/src/config/presets/runtime/tiers/gemma4-16gb.json +69 -0
package/src/config/presets/runtime/tiers/gemma4-24gb.json +66 -0
package/src/config/presets/runtime/tiers/gemma4-32gb.json +66 -0
package/src/config/runtime.js +3 -0
package/src/config/schema/debug.schema.d.ts +40 -0
package/src/config/schema/debug.schema.js +28 -0
package/src/config/schema/index.js +2 -0
package/src/config/schema/inference-defaults.schema.js +1 -1
package/src/config/schema/kernel-path.schema.d.ts +1 -0
package/src/config/schema/memory-limits.schema.js +2 -2
package/src/config/schema/storage.schema.js +1 -1
package/src/converter/conversion-plan.js +1 -1
package/src/converter/core.js +17 -8
package/src/converter/quantizer.d.ts +5 -0
package/src/converter/quantizer.js +15 -0
package/src/distribution/shard-delivery.js +34 -0
package/src/formats/rdrr/classification.js +32 -0
package/src/gpu/kernel-runtime.js +4 -2
package/src/gpu/kernels/attention.js +2 -1
package/src/gpu/kernels/dequant_f16_out.wgsl +4 -2
package/src/gpu/kernels/dequant_f16_out_vec4.wgsl +5 -2
package/src/gpu/kernels/dequant_shared.wgsl +4 -2
package/src/gpu/kernels/dequant_shared_vec4.wgsl +4 -2
package/src/gpu/kernels/dequant_subgroup.wgsl +6 -2
package/src/gpu/kernels/gated-short-conv.d.ts +63 -0
package/src/gpu/kernels/gated-short-conv.js +284 -0
package/src/gpu/kernels/linear-attention-core.js +37 -17
package/src/gpu/kernels/matmul-selection.js +1 -0
package/src/gpu/kernels/matmul.d.ts +3 -0
package/src/gpu/kernels/matmul.js +70 -1
package/src/gpu/kernels/matmul_gemv_subgroup.wgsl +77 -79
package/src/gpu/kernels/sample.js +1 -3
package/src/gpu/kernels/sample.wgsl +39 -9
package/src/gpu/kernels/sample_f16.wgsl +38 -8
package/src/gpu/kernels/shader-cache.js +9 -4
package/src/inference/kv-cache/base.js +3 -10
package/src/inference/pipelines/diffusion/pipeline.js +2 -1
package/src/inference/pipelines/diffusion/text-encoder-gpu.js +2 -1
package/src/inference/pipelines/text/attention/projections.d.ts +3 -0
package/src/inference/pipelines/text/attention/projections.js +13 -2
package/src/inference/pipelines/text/attention/record.js +1 -0
package/src/inference/pipelines/text/attention/run.js +9 -0
package/src/inference/pipelines/text/config.d.ts +1 -0
package/src/inference/pipelines/text/config.js +32 -4
package/src/inference/pipelines/text/embed.js +26 -7
package/src/inference/pipelines/text/execution-v0-runtime-builders.js +10 -3
package/src/inference/pipelines/text/execution-v0.js +12 -1
package/src/inference/pipelines/text/generator-helpers.js +1 -0
package/src/inference/pipelines/text/generator-runtime.js +14 -0
package/src/inference/pipelines/text/generator-steps.d.ts +9 -0
package/src/inference/pipelines/text/generator-steps.js +46 -29
package/src/inference/pipelines/text/generator.d.ts +5 -0
package/src/inference/pipelines/text/generator.js +320 -166
package/src/inference/pipelines/text/init.d.ts +2 -0
package/src/inference/pipelines/text/init.js +19 -5
package/src/inference/pipelines/text/layer.js +37 -8
package/src/inference/pipelines/text/moe-gpu.js +21 -3
package/src/inference/pipelines/text/moe-shape-validator.d.ts +9 -0
package/src/inference/pipelines/text/moe-shape-validator.js +31 -11
package/src/inference/pipelines/text/ops.js +123 -53
package/src/inference/pipelines/text/probes.js +1 -0
package/src/inference/pipelines/text/state.js +2 -0
package/src/inference/pipelines/text.d.ts +5 -0
package/src/inference/pipelines/text.js +59 -1
package/src/inference/pipelines/vision/encoder.js +386 -0
package/src/inference/pipelines/vision/image-preprocess.js +151 -0
package/src/inference/pipelines/vision/index.js +173 -0
package/src/inference/pipelines/vision/ops.js +78 -0
package/src/inference/pipelines/vision/patch-embed.js +151 -0
package/src/inference/test-harness.js +9 -7
package/src/loader/doppler-loader.d.ts +3 -0
package/src/loader/doppler-loader.js +20 -3
package/src/loader/experts/expert-cache.js +6 -2
package/src/loader/experts/expert-loader.js +6 -2
package/src/loader/layer-loader.js +42 -3
package/src/loader/manifest-config.js +3 -1
package/src/loader/tensors/tensor-loader.d.ts +3 -0
package/src/loader/tensors/tensor-loader.js +124 -3
package/src/rules/kernels/moe.rules.mixtral.json +75 -0
package/src/rules/kernels/softmax.rules.json +2 -0
package/src/rules/rule-registry.d.ts +1 -0
package/src/rules/rule-registry.js +2 -0
package/src/storage/quickstart-downloader.d.ts +3 -0
package/src/storage/quickstart-downloader.js +27 -30
package/src/tooling/node-converter.js +25 -7
package/src/tooling/node-source-runtime.js +29 -5
package/src/tooling/node-webgpu.js +24 -7
package/src/utils/hf-resolve-url.d.ts +16 -0
package/src/utils/hf-resolve-url.js +17 -0
package/src/version.js +1 -1
package/src/tooling/node-convert.d.ts +0 -54

package/src/rules/kernels/moe.rules.mixtral.json ADDED Viewed

@@ -0,0 +1,75 @@
+{
+  "vendorQuirkProfile": [
+    {
+      "match": {
+        "vendor": {
+          "contains": ["intel", "amd"]
+        }
+      },
+      "value": {
+        "preferVec4Dequant": false,
+        "dequantTileShape": "scalar",
+        "routerWorkgroupSize": 128,
+        "maxTokensPerExpertScale": 0.85
+      }
+    },
+    {
+      "match": {
+        "vendor": {
+          "contains": ["nvidia", "apple", "qualcomm"]
+        }
+      },
+      "value": {
+        "preferVec4Dequant": false,
+        "dequantTileShape": "scalar",
+        "routerWorkgroupSize": 256,
+        "maxTokensPerExpertScale": 1.0
+      }
+    },
+    {
+      "match": {},
+      "value": {
+        "preferVec4Dequant": false,
+        "dequantTileShape": "scalar",
+        "routerWorkgroupSize": 128,
+        "maxTokensPerExpertScale": 1.0
+      }
+    }
+  ],
+  "routerTopKVariant": [
+    {
+      "match": { "modelType": "mixtral", "hasF16": true, "hasSubgroups": true, "routerDtype": "f32" },
+      "value": "softmax_topk_f32_subgroup"
+    },
+    {
+      "match": { "modelType": "mixtral", "routerDtype": "f32" },
+      "value": "softmax_topk_f32"
+    },
+    {
+      "match": { "modelType": "mixtral" },
+      "value": "softmax_topk_f32"
+    }
+  ],
+  "dequantVariant": [
+    {
+      "match": { "modelType": "mixtral", "weightsDtype": "q4k", "hasF16": true, "hasSubgroups": true, "outputDtype": "f32" },
+      "value": "q4k_expert_dequant_f32_subgroup"
+    },
+    {
+      "match": { "modelType": "mixtral", "weightsDtype": "q4k", "outputDtype": "f16", "hasF16": true },
+      "value": "q4k_expert_dequant_f16"
+    },
+    {
+      "match": { "modelType": "mixtral", "weightsDtype": "q4k" },
+      "value": "q4k_expert_dequant_f32"
+    },
+    {
+      "match": { "modelType": "mixtral", "weightsDtype": "f16", "outputDtype": "f16", "hasF16": true },
+      "value": "f16_expert_passthrough"
+    },
+    {
+      "match": { "modelType": "mixtral" },
+      "value": "f16_expert_upcast_f32"
+    }
+  ]
+}

package/src/rules/kernels/softmax.rules.json CHANGED Viewed

@@ -16,6 +16,8 @@
       },
       "value": "gptoss_router_topk"
     },
+    { "match": { "modelType": "mixtral", "inputDtype": "f16", "weightsDtype": "f16" }, "value": "fused_f16_w16" },
+    { "match": { "modelType": "mixtral" }, "value": "fused" },
     { "match": { "inputDtype": "f16", "weightsDtype": "f16" }, "value": "fused_f16_w16" },
     { "match": { "inputDtype": "f16" }, "value": "fused_f16" },
     { "match": {}, "value": "fused" }

package/src/rules/rule-registry.d.ts CHANGED Viewed

@@ -20,6 +20,7 @@ type KernelRuleGroup =
   | 'matmul'
   | 'moe'
   | 'moeGptoss'
+  | 'moeMixtral'
   | 'residual'
   | 'rmsnorm'
   | 'rope'

package/src/rules/rule-registry.js CHANGED Viewed

@@ -38,6 +38,7 @@ const layernormRules = await loadJson('./kernels/layernorm.rules.json', import.m
 const matmulRules = await loadJson('./kernels/matmul.rules.json', import.meta.url, 'Failed to load rules');
 const kernelMoeRules = await loadJson('./kernels/moe.rules.json', import.meta.url, 'Failed to load rules');
 const kernelMoeGptOssRules = await loadJson('./kernels/moe.rules.gptoss.json', import.meta.url, 'Failed to load rules');
+const kernelMoeMixtralRules = await loadJson('./kernels/moe.rules.mixtral.json', import.meta.url, 'Failed to load rules');
 const modulateRules = await loadJson('./kernels/modulate.rules.json', import.meta.url, 'Failed to load rules');
 const pixelShuffleRules = await loadJson('./kernels/pixel_shuffle.rules.json', import.meta.url, 'Failed to load rules');
 const repeatChannelsRules = await loadJson('./kernels/repeat-channels.rules.json', import.meta.url, 'Failed to load rules');
@@ -113,6 +114,7 @@ const RULE_SETS = {
     matmul: matmulRules,
     moe: kernelMoeRules,
     moeGptoss: kernelMoeGptOssRules,
+    moeMixtral: kernelMoeMixtralRules,
     modulate: modulateRules,
     pixel_shuffle: pixelShuffleRules,
     repeatChannels: repeatChannelsRules,

package/src/storage/quickstart-downloader.d.ts CHANGED Viewed

@@ -13,6 +13,7 @@
 import type { DownloadProgress } from './downloader.js';
 import type { PreflightResult, ModelRequirements } from './preflight.js';
+import type { HfResolveConfig } from '../utils/hf-resolve-url.js';
 /**
  * Remote model configuration
@@ -24,6 +25,8 @@ export interface RemoteModelConfig {
   displayName: string;
   /** Base URL for shards (any static CDN) */
   baseUrl?: string | null;
+  /** Hosted Hugging Face source used when baseUrl is omitted */
+  hf?: HfResolveConfig | null;
   /** Model requirements for pre-flight checks */
   requirements: ModelRequirements;
 }

package/src/storage/quickstart-downloader.js CHANGED Viewed

@@ -7,6 +7,7 @@ import {
 } from './preflight.js';
 import { formatBytes } from './quota.js';
 import { getCdnBasePath } from './download-types.js';
+import { buildHfResolveBaseUrl, DEFAULT_HF_CDN_BASE_URL } from '../utils/hf-resolve-url.js';
 // ============================================================================
 // Model Registry
@@ -15,40 +16,14 @@ import { getCdnBasePath } from './download-types.js';
 let cdnBaseOverride = null;
-function getEffectiveCDNBaseUrl() {
-  const runtimeBase = getCdnBasePath();
-  const base = cdnBaseOverride ?? runtimeBase ?? '';
-  if (base) return base;
-  // Auto-detect: use same origin for Firebase Hosting or local dev
-  if (typeof globalThis.location !== 'undefined') {
-    const path = globalThis.location.pathname || '';
-    if (
-      path === '/d' ||
-      path.startsWith('/d/') ||
-      path === '/doppler' ||
-      path.startsWith('/doppler/') ||
-      path === '/dr' ||
-      path.startsWith('/dr/') ||
-      globalThis.location.host.includes('replo')
-    ) {
-      return `${globalThis.location.origin}/doppler/models`;
-    }
-    return `${globalThis.location.origin}/models`;
-  }
-  // Fallback for non-browser-global contexts
-  return '/models';
-}
 export function setCDNBaseUrl(url) {
-  cdnBaseOverride = url.replace(/\/$/, ''); // Remove trailing slash
+  const normalized = typeof url === 'string' ? url.trim().replace(/\/$/, '') : '';
+  cdnBaseOverride = normalized || null;
 }
 export function getCDNBaseUrl() {
-  return getEffectiveCDNBaseUrl();
+  return cdnBaseOverride ?? getCdnBasePath() ?? DEFAULT_HF_CDN_BASE_URL;
 }
@@ -57,12 +32,22 @@ export const QUICKSTART_MODELS = {
     modelId: 'gemma-3-270m-it-q4k-ehf16-af32',
     displayName: 'Gemma 3 270M IT (Q4K)',
     baseUrl: null,
+    hf: {
+      repoId: 'Clocksmith/rdrr',
+      revision: 'ca6f0dbdf3882d3893a65cf48f2bb6f1520df162',
+      path: 'models/gemma-3-270m-it-q4k-ehf16-af32',
+    },
     requirements: MODEL_REQUIREMENTS['gemma-3-270m-it-q4k-ehf16-af32'],
   },
   'google-embeddinggemma-300m-q4k-ehf16-af32': {
     modelId: 'google-embeddinggemma-300m-q4k-ehf16-af32',
     displayName: 'EmbeddingGemma 300M (Q4K)',
     baseUrl: null,
+    hf: {
+      repoId: 'Clocksmith/rdrr',
+      revision: '7e79c466d54455bd370c81685956ea9abae0fd30',
+      path: 'models/google-embeddinggemma-300m-q4k-ehf16-af32',
+    },
     requirements: MODEL_REQUIREMENTS['google-embeddinggemma-300m-q4k-ehf16-af32'],
   },
 };
@@ -82,6 +67,18 @@ export function registerQuickStartModel(config) {
   QUICKSTART_MODELS[config.modelId] = config;
 }
+function resolveQuickStartModelBaseUrl(config) {
+  if (typeof config?.baseUrl === 'string' && config.baseUrl.trim().length > 0) {
+    return config.baseUrl.trim().replace(/\/$/, '');
+  }
+  if (config?.hf) {
+    return buildHfResolveBaseUrl(config.hf, { cdnBasePath: getCDNBaseUrl() });
+  }
+  throw new Error(
+    `Quickstart model "${config?.modelId ?? 'unknown'}" is missing an explicit baseUrl or hosted Hugging Face source.`
+  );
+}
 // ============================================================================
 // Download Functions
 // ============================================================================
@@ -190,7 +187,7 @@ export async function downloadQuickStartModel(
       signal,
     };
-    const baseUrl = config.baseUrl ?? `${getEffectiveCDNBaseUrl()}/${config.modelId}`;
+    const baseUrl = resolveQuickStartModelBaseUrl(config);
     const success = await downloadModel(
       baseUrl,
       onProgress,

package/src/tooling/node-converter.js CHANGED Viewed

@@ -541,18 +541,24 @@ async function listRelativeFiles(rootDir, relDir = '', out = []) {
   return out;
 }
-async function clearExistingShardFiles(outputDir) {
+async function clearExistingConversionOutputs(outputDir) {
   let entries;
   try {
     entries = await fs.readdir(outputDir, { withFileTypes: true });
   } catch {
     return;
   }
-  const shardFiles = entries
-    .filter((entry) => entry.isFile() && /^shard_\d{5}\.bin$/i.test(entry.name))
+  const artifactFiles = entries
+    .filter((entry) => (
+      entry.isFile()
+      && (
+        /^shard_\d{5}\.bin$/i.test(entry.name)
+        || entry.name === 'manifest.json'
+      )
+    ))
     .map((entry) => path.join(outputDir, entry.name));
-  if (shardFiles.length === 0) return;
-  await Promise.all(shardFiles.map((filePath) => fs.unlink(filePath)));
+  if (artifactFiles.length === 0) return;
+  await Promise.all(artifactFiles.map((filePath) => fs.unlink(filePath)));
 }
 function createNodeConvertIO(outputDir, options) {
@@ -1153,7 +1159,7 @@ export async function convertSafetensorsDirectory(options) {
   const outputDir = resolveOutputDir(outputDirOverride, converterConfig, modelId);
   await fs.mkdir(outputDir, { recursive: true });
-  await clearExistingShardFiles(outputDir);
+  await clearExistingConversionOutputs(outputDir);
   const model = {
     name: path.basename(inputDir),
@@ -1180,6 +1186,15 @@ export async function convertSafetensorsDirectory(options) {
     computeHash,
     readRange: fileRangeReader.readRange,
   });
+  const deferredManifestState = {
+    manifest: null,
+  };
+  const convertIo = {
+    ...io,
+    async writeManifest(manifest) {
+      deferredManifestState.manifest = manifest;
+    },
+  };
   const manifestArchitecture = modelKind === 'diffusion' ? 'diffusion' : architecture;
   let workerPool = null;
   let workerTensorTransformer = null;
@@ -1244,7 +1259,7 @@ export async function convertSafetensorsDirectory(options) {
     }));
     const convertTimer = createStageTimer('Convert tensors');
-    result = await convertModel(model, io, {
+    result = await convertModel(model, convertIo, {
       modelId,
       modelType: resolvedModelType,
       quantization: targetQuantization,
@@ -1282,6 +1297,9 @@ export async function convertSafetensorsDirectory(options) {
   }
   normalizeTokenizerManifest(result.manifest);
+  if (!deferredManifestState.manifest) {
+    throw new Error('node convert: convert core did not produce a manifest.');
+  }
   await io.writeManifest(result.manifest);
   const report = buildConvertReport(result, {

package/src/tooling/node-source-runtime.js CHANGED Viewed

@@ -1,4 +1,6 @@
+import { createReadStream } from 'node:fs';
 import fs from 'node:fs/promises';
+import { createHash } from 'node:crypto';
 import path from 'node:path';
 import {
   HEADER_READ_SIZE,
@@ -16,7 +18,6 @@ import { parseTransformerModel } from '../converter/parsers/transformer.js';
 import { parseGGUFHeader } from '../formats/gguf/types.js';
 import { parseSafetensorsHeader } from '../formats/safetensors/types.js';
 import { log } from '../debug/index.js';
-import { computeHash } from '../storage/shard-manager.js';
 import {
   buildSourceRuntimeBundle,
   createSourceStorageContext,
@@ -137,7 +138,12 @@ async function readRange(filePath, offset, length) {
       return new ArrayBuffer(0);
     }
     const out = Buffer.allocUnsafe(end - start);
-    await handle.read(out, 0, out.length, start);
+    let pos = 0;
+    while (pos < out.length) {
+      const { bytesRead } = await handle.read(out, pos, out.length - pos, start + pos);
+      if (bytesRead === 0) break;
+      pos += bytesRead;
+    }
     return out.buffer.slice(out.byteOffset, out.byteOffset + out.byteLength);
   } finally {
     await handle.close();
@@ -449,18 +455,36 @@ async function addHashesToFileEntries(entries, hashAlgorithm) {
   for (const entry of Array.isArray(entries) ? entries : []) {
     const filePath = normalizePath(entry?.path);
     if (!filePath) continue;
-    const bytes = await readFileBytes(filePath, `source asset (${filePath})`);
+    const stats = await getPathStats(filePath, `source asset (${filePath})`);
     normalized.push({
       ...entry,
       path: filePath,
-      size: Number.isFinite(entry?.size) ? Math.max(0, Math.floor(Number(entry.size))) : bytes.byteLength,
-      hash: await computeHash(new Uint8Array(bytes), hashAlgorithm),
+      size: Number.isFinite(entry?.size) ? Math.max(0, Math.floor(Number(entry.size))) : Number(stats.size),
+      hash: await computeFileHash(filePath, hashAlgorithm),
       hashAlgorithm,
     });
   }
   return normalized;
 }
+async function computeFileHash(filePath, hashAlgorithm) {
+  return new Promise((resolve, reject) => {
+    const hash = createHash(hashAlgorithm);
+    const stream = createReadStream(filePath);
+    stream.on('data', (chunk) => {
+      hash.update(chunk);
+    });
+    stream.on('end', () => {
+      resolve(hash.digest('hex'));
+    });
+    stream.on('error', (error) => {
+      const message = error instanceof Error ? error.message : String(error);
+      reject(new Error(`Failed to stream source asset "${filePath}" for hashing: ${message}`));
+    });
+  });
+}
 export async function resolveNodeSourceRuntimeBundle(options = {}) {
   const inputPath = normalizePath(options.inputPath);
   if (!inputPath) {

package/src/tooling/node-webgpu.js CHANGED Viewed

@@ -51,7 +51,7 @@ function resolveCandidateModuleSpecifier(candidate) {
 }
 function resolveDefaultWebgpuModuleSpecifiers() {
-  return ['@simulatte/webgpu', 'webgpu'];
+  return ['webgpu', '@simulatte/webgpu'];
 }
 function resolveExplicitWebgpuModuleSpecifier() {
@@ -189,18 +189,35 @@ function resolveGpuFromModule(mod) {
     return fromModule;
   }
-  const factory = mod.create || mod.default?.create;
-  if (typeof factory === 'function') {
-    let created = null;
+  const tryCreateFactory = (factory) => {
+    if (typeof factory !== 'function') {
+      return null;
+    }
     try {
-      created = factory([]);
+      return factory([]);
     } catch {
       try {
-        created = factory();
+        return factory();
       } catch {
-        created = null;
+        return null;
       }
     }
+  };
+  const instanceFactory = mod.createInstance || mod.default?.createInstance;
+  const createdFromInstanceFactory = tryCreateFactory(instanceFactory);
+  if (createdFromInstanceFactory) {
+    if (typeof createdFromInstanceFactory.requestAdapter === 'function') {
+      return createdFromInstanceFactory;
+    }
+    if (createdFromInstanceFactory.gpu && typeof createdFromInstanceFactory.gpu.requestAdapter === 'function') {
+      return createdFromInstanceFactory.gpu;
+    }
+  }
+  const factory = mod.create || mod.default?.create;
+  if (typeof factory === 'function') {
+    const created = tryCreateFactory(factory);
     if (created) {
       if (typeof created.requestAdapter === 'function') {
         return created;

package/src/utils/hf-resolve-url.d.ts ADDED Viewed

@@ -0,0 +1,16 @@
+export interface HfResolveConfig {
+  repoId: string;
+  revision?: string | null;
+  path: string;
+}
+export interface HfResolveUrlOptions {
+  cdnBasePath?: string;
+}
+export declare const DEFAULT_HF_CDN_BASE_URL: string;
+export declare function buildHfResolveBaseUrl(
+  hfConfig: HfResolveConfig | null | undefined,
+  options?: HfResolveUrlOptions
+): string;

package/src/utils/hf-resolve-url.js ADDED Viewed

@@ -0,0 +1,17 @@
+export const DEFAULT_HF_CDN_BASE_URL = 'https://huggingface.co';
+export function buildHfResolveBaseUrl(hfConfig, options = {}) {
+  const repoId = typeof hfConfig?.repoId === 'string' ? hfConfig.repoId.trim() : '';
+  const repoPath = typeof hfConfig?.path === 'string' ? hfConfig.path.trim().replace(/^\/+/, '') : '';
+  if (!repoId || !repoPath) {
+    throw new Error('Hosted Hugging Face source requires repoId and path.');
+  }
+  const revision = typeof hfConfig?.revision === 'string' && hfConfig.revision.trim().length > 0
+    ? hfConfig.revision.trim()
+    : 'main';
+  const cdnBasePath = typeof options?.cdnBasePath === 'string' && options.cdnBasePath.trim().length > 0
+    ? options.cdnBasePath.trim()
+    : DEFAULT_HF_CDN_BASE_URL;
+  return `${cdnBasePath.replace(/\/$/, '')}/${repoId}/resolve/${revision}/${repoPath}`;
+}

package/src/version.js CHANGED Viewed

@@ -1,2 +1,2 @@
-export const DOPPLER_VERSION = '0.1.7';
+export const DOPPLER_VERSION = '0.1.9';
 export const DOPPLER_PROVIDER_VERSION = DOPPLER_VERSION;

package/src/tooling/node-convert.d.ts DELETED Viewed

@@ -1,54 +0,0 @@
-import type { ConverterConfigSchema } from '../config/schema/converter.schema.js';
-import type { ExecutionContractArtifact } from '../config/execution-contract-check.js';
-import type { ExecutionV0GraphContractArtifact } from '../config/execution-v0-graph-contract-check.js';
-import type { ManifestRequiredInferenceFieldsArtifact } from '../config/required-inference-fields-contract-check.js';
-import type { SavedReportInfo } from '../storage/reports.js';
-export interface NodeConvertProgress {
-  stage: string | null;
-  current: number | null;
-  total: number | null;
-  message: string | null;
-  tensorName?: string | null;
-  tensorBytesCurrent?: number | null;
-  tensorBytesTotal?: number | null;
-}
-export interface NodeConvertExecutionConfig {
-  workers?: number | null;
-  workerCountPolicy?: 'cap' | 'error' | null;
-  maxInFlightJobs?: number | null;
-  rowChunkRows?: number | null;
-  rowChunkMinTensorBytes?: number | null;
-  useGpuCast?: boolean | null;
-  gpuCastMinTensorBytes?: number | null;
-}
-export interface ConvertSafetensorsDirectoryOptions {
-  /** Directory with safetensors/diffusion assets, or a direct .gguf file path. */
-  inputDir: string;
-  outputDir?: string | null;
-  modelId?: string | null;
-  converterConfig?: Partial<ConverterConfigSchema> | null;
-  execution?: NodeConvertExecutionConfig | null;
-  onProgress?: (progress: NodeConvertProgress) => void;
-}
-export interface ConvertSafetensorsDirectoryResult {
-  manifest: Record<string, unknown>;
-  shardCount: number;
-  tensorCount: number;
-  executionContractArtifact: ExecutionContractArtifact | null;
-  executionV0GraphContractArtifact: ExecutionV0GraphContractArtifact | null;
-  layerPatternContractArtifact: Record<string, unknown> | null;
-  requiredInferenceFieldsArtifact: ManifestRequiredInferenceFieldsArtifact | null;
-  report: Record<string, unknown>;
-  reportInfo: SavedReportInfo;
-  presetId: string;
-  modelType: string;
-  outputDir: string;
-}
-export declare function convertSafetensorsDirectory(
-  options: ConvertSafetensorsDirectoryOptions
-): Promise<ConvertSafetensorsDirectoryResult>;