npm - @simulatte/doppler - Versions diffs - 0.1.4 → 0.1.5 - Mend

@simulatte/doppler 0.1.4 → 0.1.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (103)

package/README.md +4 -3
package/package.json +25 -4
package/src/client/doppler-api.browser.d.ts +1 -0
package/src/client/doppler-api.browser.js +288 -0
package/src/client/doppler-api.js +1 -1
package/src/client/doppler-provider/types.js +1 -1
package/src/config/execution-contract-check.d.ts +33 -0
package/src/config/execution-contract-check.js +72 -0
package/src/config/execution-v0-contract-check.d.ts +94 -0
package/src/config/execution-v0-contract-check.js +251 -0
package/src/config/execution-v0-graph-contract-check.d.ts +20 -0
package/src/config/execution-v0-graph-contract-check.js +64 -0
package/src/config/kernel-path-contract-check.d.ts +76 -0
package/src/config/kernel-path-contract-check.js +479 -0
package/src/config/kernel-path-loader.d.ts +16 -0
package/src/config/kernel-path-loader.js +54 -0
package/src/config/kernels/kernel-ref-digests.js +12 -0
package/src/config/kernels/registry.json +556 -0
package/src/config/loader.js +50 -46
package/src/config/merge-contract-check.d.ts +16 -0
package/src/config/merge-contract-check.js +321 -0
package/src/config/merge-helpers.d.ts +58 -0
package/src/config/merge-helpers.js +54 -0
package/src/config/merge.js +3 -6
package/src/config/presets/models/janus-text.json +2 -0
package/src/config/quantization-contract-check.d.ts +12 -0
package/src/config/quantization-contract-check.js +91 -0
package/src/config/required-inference-fields-contract-check.d.ts +24 -0
package/src/config/required-inference-fields-contract-check.js +231 -0
package/src/config/schema/browser-suite-metrics.schema.d.ts +17 -0
package/src/config/schema/browser-suite-metrics.schema.js +46 -0
package/src/config/schema/conversion-report.schema.d.ts +40 -0
package/src/config/schema/conversion-report.schema.js +108 -0
package/src/config/schema/doppler.schema.js +12 -18
package/src/config/schema/index.d.ts +22 -0
package/src/config/schema/index.js +18 -0
package/src/converter/core.d.ts +10 -0
package/src/converter/core.js +27 -2
package/src/converter/parsers/diffusion.js +63 -3
package/src/gpu/kernels/depthwise_conv2d.d.ts +29 -0
package/src/gpu/kernels/depthwise_conv2d.js +98 -0
package/src/gpu/kernels/depthwise_conv2d.wgsl +58 -0
package/src/gpu/kernels/depthwise_conv2d_f16.wgsl +62 -0
package/src/gpu/kernels/grouped_pointwise_conv2d.d.ts +27 -0
package/src/gpu/kernels/grouped_pointwise_conv2d.js +92 -0
package/src/gpu/kernels/grouped_pointwise_conv2d.wgsl +47 -0
package/src/gpu/kernels/grouped_pointwise_conv2d_f16.wgsl +51 -0
package/src/gpu/kernels/index.d.ts +30 -0
package/src/gpu/kernels/index.js +25 -0
package/src/gpu/kernels/relu.d.ts +18 -0
package/src/gpu/kernels/relu.js +45 -0
package/src/gpu/kernels/relu.wgsl +21 -0
package/src/gpu/kernels/relu_f16.wgsl +23 -0
package/src/gpu/kernels/repeat_channels.d.ts +21 -0
package/src/gpu/kernels/repeat_channels.js +60 -0
package/src/gpu/kernels/repeat_channels.wgsl +29 -0
package/src/gpu/kernels/repeat_channels_f16.wgsl +31 -0
package/src/gpu/kernels/sana_linear_attention.d.ts +27 -0
package/src/gpu/kernels/sana_linear_attention.js +122 -0
package/src/gpu/kernels/sana_linear_attention_apply.wgsl +44 -0
package/src/gpu/kernels/sana_linear_attention_apply_f16.wgsl +47 -0
package/src/gpu/kernels/sana_linear_attention_summary.wgsl +47 -0
package/src/gpu/kernels/sana_linear_attention_summary_f16.wgsl +49 -0
package/src/index-browser.d.ts +1 -1
package/src/index-browser.js +2 -2
package/src/index.js +1 -1
package/src/inference/browser-harness.js +62 -22
package/src/inference/pipelines/diffusion/init.js +14 -0
package/src/inference/pipelines/diffusion/pipeline.js +206 -77
package/src/inference/pipelines/diffusion/sana-transformer.d.ts +53 -0
package/src/inference/pipelines/diffusion/sana-transformer.js +738 -0
package/src/inference/pipelines/diffusion/scheduler.d.ts +17 -1
package/src/inference/pipelines/diffusion/scheduler.js +91 -3
package/src/inference/pipelines/diffusion/text-encoder-gpu.d.ts +6 -4
package/src/inference/pipelines/diffusion/text-encoder-gpu.js +270 -0
package/src/inference/pipelines/diffusion/text-encoder.js +18 -1
package/src/inference/pipelines/diffusion/types.d.ts +4 -0
package/src/inference/pipelines/diffusion/vae.js +782 -78
package/src/inference/pipelines/text/config.d.ts +5 -0
package/src/inference/pipelines/text/config.js +1 -1
package/src/inference/pipelines/text/execution-v0.js +14 -93
package/src/rules/execution-rules-contract-check.d.ts +17 -0
package/src/rules/execution-rules-contract-check.js +245 -0
package/src/rules/kernels/depthwise-conv2d.rules.json +6 -0
package/src/rules/kernels/grouped-pointwise-conv2d.rules.json +6 -0
package/src/rules/kernels/relu.rules.json +6 -0
package/src/rules/kernels/repeat-channels.rules.json +6 -0
package/src/rules/kernels/sana-linear-attention.rules.json +6 -0
package/src/rules/layer-pattern-contract-check.d.ts +17 -0
package/src/rules/layer-pattern-contract-check.js +231 -0
package/src/rules/rule-registry.d.ts +28 -0
package/src/rules/rule-registry.js +38 -0
package/src/tooling/conversion-config-materializer.d.ts +24 -0
package/src/tooling/conversion-config-materializer.js +99 -0
package/src/tooling/lean-execution-contract-runner.d.ts +43 -0
package/src/tooling/lean-execution-contract-runner.js +158 -0
package/src/tooling/node-convert.d.ts +10 -0
package/src/tooling/node-converter.js +59 -0
package/src/tooling/node-webgpu.js +9 -9
package/src/version.d.ts +2 -0
package/src/version.js +2 -0
package/tools/convert-safetensors-node.js +47 -0
package/tools/doppler-cli.js +115 -1

package/src/inference/pipelines/text/config.d.ts CHANGED Viewed

@@ -210,6 +210,11 @@ export interface ManifestWithInference {
  */
 export function hasManifestInference(manifest: Manifest): manifest is Manifest & { inference: ManifestInferenceSchema };
+export function validateRequiredInferenceFields(
+  inf: ManifestInferenceSchema,
+  modelId: string
+): void;
 /**
  * Convert MergedConfig to ParsedModelConfig.
  */

package/src/inference/pipelines/text/config.js CHANGED Viewed

@@ -129,7 +129,7 @@ export function hasManifestInference(manifest) {
 }
-function validateRequiredInferenceFields(inf, modelId) {
+export function validateRequiredInferenceFields(inf, modelId) {
   const errors = [];

package/src/inference/pipelines/text/execution-v0.js CHANGED Viewed

@@ -1,4 +1,12 @@
 import { mergeRuntimeValues } from '../../../config/runtime-merge.js';
+import {
+  buildExecutionV0KernelProfileKey,
+  indexExecutionV0KernelProfiles,
+  normalizeExecutionV0Dtype,
+  resolveExecutionV0KernelProfile,
+  resolveExecutionV0KVIO,
+  resolveExecutionV0Precision,
+} from '../../../config/execution-v0-contract-check.js';
 import {
   EXECUTION_V0_SCHEMA_ID,
   DEFAULT_EXECUTION_V0_POLICIES,
@@ -59,13 +67,9 @@ function cloneJson(value) {
   return JSON.parse(JSON.stringify(value));
 }
-function normalizeDtype(value, label) {
-  const normalized = String(value ?? '').trim().toLowerCase();
-  if (normalized !== 'f16' && normalized !== 'f32') {
-    throw new Error(`[ExecutionV0] ${label} must be "f16" or "f32"; got "${value}"`);
-  }
-  return normalized;
-}
+const normalizeDtype = normalizeExecutionV0Dtype;
+const resolvePrecision = resolveExecutionV0Precision;
+const resolveKVIO = resolveExecutionV0KVIO;
 function normalizePhase(value, label) {
   const normalized = String(value ?? '').trim().toLowerCase();
@@ -117,10 +121,7 @@ function stepHasLayer(step, layerIdx) {
   return step.layers.includes(layerIdx);
 }
-function buildKernelProfileKey(kernelRef) {
-  if (!kernelRef) return null;
-  return `${kernelRef.id}|${kernelRef.version}|${kernelRef.digest}`;
-}
+const buildKernelProfileKey = buildExecutionV0KernelProfileKey;
 function normalizeSlot(value, label) {
   if (typeof value !== 'string' || value.trim().length === 0) {
@@ -212,90 +213,10 @@ function hasDefinedPath(root, pathSegments) {
   return current !== undefined;
 }
-function indexKernelProfiles(sessionDefaults) {
-  const byKey = new Map();
-  const profiles = sessionDefaults?.compute?.kernelProfiles ?? [];
-  for (const profile of profiles) {
-    assertKernelRef(profile.kernelRef, 'sessionDefaults.compute.kernelProfiles[].kernelRef');
-    byKey.set(buildKernelProfileKey(profile.kernelRef), profile);
-  }
-  return byKey;
-}
+const indexKernelProfiles = indexExecutionV0KernelProfiles;
 function resolveProfile(profileIndex, step) {
-  const key = buildKernelProfileKey(step.kernelRef);
-  if (!key) return null;
-  return profileIndex.get(key) ?? null;
-}
-function resolvePrecision(step, profile, sessionDefaults) {
-  const defaults = sessionDefaults.compute.defaults;
-  const precision = {
-    inputDtype: step.precision?.inputDtype
-      ?? profile?.precision?.inputDtype
-      ?? null,
-    mathDtype: step.precision?.mathDtype
-      ?? profile?.precision?.mathDtype
-      ?? defaults.mathDtype,
-    accumDtype: step.precision?.accumDtype
-      ?? profile?.precision?.accumDtype
-      ?? defaults.accumDtype,
-    outputDtype: step.precision?.outputDtype
-      ?? profile?.precision?.outputDtype
-      ?? defaults.outputDtype,
-  };
-  const sources = {
-    inputDtype: step.precision?.inputDtype != null
-      ? 'manifest'
-      : profile?.precision?.inputDtype != null
-        ? 'kernelProfile'
-        : 'derived',
-    mathDtype: step.precision?.mathDtype != null
-      ? 'manifest'
-      : profile?.precision?.mathDtype != null
-        ? 'kernelProfile'
-        : 'sessionDefault',
-    accumDtype: step.precision?.accumDtype != null
-      ? 'manifest'
-      : profile?.precision?.accumDtype != null
-        ? 'kernelProfile'
-        : 'sessionDefault',
-    outputDtype: step.precision?.outputDtype != null
-      ? 'manifest'
-      : profile?.precision?.outputDtype != null
-        ? 'kernelProfile'
-        : 'sessionDefault',
-  };
-  return { precision, sources };
-}
-function resolveKVIO(step, profile, sessionDefaults) {
-  if (step.kvIO) {
-    return {
-      value: {
-        readDtype: normalizeDtype(step.kvIO.readDtype, `${step.id}.kvIO.readDtype`),
-        writeDtype: normalizeDtype(step.kvIO.writeDtype, `${step.id}.kvIO.writeDtype`),
-      },
-      source: 'manifest',
-    };
-  }
-  if (profile?.kvIO) {
-    return {
-      value: {
-        readDtype: normalizeDtype(profile.kvIO.readDtype, `${step.id}.profile.kvIO.readDtype`),
-        writeDtype: normalizeDtype(profile.kvIO.writeDtype, `${step.id}.profile.kvIO.writeDtype`),
-      },
-      source: 'kernelProfile',
-    };
-  }
-  const kvDtype = normalizeDtype(
-    sessionDefaults?.kvcache?.kvDtype ?? sessionDefaults.compute.defaults.activationDtype,
-    `${step.id}.sessionDefaults.kvcache.kvDtype`
-  );
-  return {
-    value: { readDtype: kvDtype, writeDtype: kvDtype },
-    source: 'sessionDefault',
-  };
+  return resolveExecutionV0KernelProfile(profileIndex, step);
 }
 function validateStepShape(step, index) {

package/src/rules/execution-rules-contract-check.d.ts ADDED Viewed

@@ -0,0 +1,17 @@
+export interface InferenceExecutionRulesContractArtifact { // Report object returned by buildInferenceExecutionRulesContractArtifact (declared below).
+  schemaVersion: 1; // literal type: always the number 1
+  source: 'doppler'; // literal type: always the string 'doppler'
+  ok: boolean; // the .js implementation sets this to `errors.length === 0`
+  checks: Array<{ id: string; ok: boolean }>; // one { id, ok } entry per check that was run
+  errors: string[]; // messages gathered from all checks; empty when ok is true
+  stats: {
+    decodeRecorderRules: number; // length of the decodeRecorderEnabled rule list, or 0 when it is not an array
+    batchDecodeRules: number; // length of the batchDecodeEnabled rule list, or 0 when it is not an array
+    decodeRecorderContexts: number; // number of contexts supplied to the decodeRecorderEnabled semantic check
+    batchDecodeContexts: number; // number of contexts supplied to the batchDecodeEnabled semantic check
+  };
+}
+export declare function buildInferenceExecutionRulesContractArtifact( // Builds the execution-rules contract report for one rule group.
+  ruleGroup: Record<string, unknown> | null | undefined // null/undefined are accepted; the implementation reads the group via optional chaining
+): InferenceExecutionRulesContractArtifact;

package/src/rules/execution-rules-contract-check.js ADDED Viewed

@@ -0,0 +1,245 @@
+import { selectByRules } from '../gpu/kernels/rule-matcher.js';
+function isPlainObject(value) { // Loose object test: true for any non-null, non-array value whose typeof is 'object'.
+  return value != null && typeof value === 'object' && !Array.isArray(value); // `!= null` also rejects undefined; there is no prototype check, so class instances pass too
+}
+function matchesExactObject(actual, expected) { // Exact structural match of two plain objects: same key set and matching values; returns a boolean.
+  if (!isPlainObject(actual) || !isPlainObject(expected)) { // either side null, an array, or a primitive: never a match
+    return false;
+  }
+  const actualKeys = Object.keys(actual).sort(); // sorted so the two key lists can be compared index by index
+  const expectedKeys = Object.keys(expected).sort();
+  if (actualKeys.length !== expectedKeys.length) { // one side has extra or missing keys
+    return false;
+  }
+  for (let i = 0; i < actualKeys.length; i += 1) {
+    if (actualKeys[i] !== expectedKeys[i]) { // same number of keys but a different key name
+      return false;
+    }
+  }
+  for (const key of expectedKeys) {
+    const expectedValue = expected[key];
+    const actualValue = actual[key];
+    if (isPlainObject(expectedValue)) { // nested objects are compared recursively with the same exact-match rules
+      if (!matchesExactObject(actualValue, expectedValue)) {
+        return false;
+      }
+      continue;
+    }
+    if (Array.isArray(expectedValue)) { // arrays: equal length and element-wise ===, so objects/arrays nested inside an array match only by reference
+      if (!Array.isArray(actualValue) || actualValue.length !== expectedValue.length) {
+        return false;
+      }
+      for (let i = 0; i < expectedValue.length; i += 1) {
+        if (actualValue[i] !== expectedValue[i]) {
+          return false;
+        }
+      }
+      continue;
+    }
+    if (actualValue !== expectedValue) { // all remaining values are compared with strict equality
+      return false;
+    }
+  }
+  return true;
+}
+function decodeRecorderSemantic(context) { // Reference predicate for decodeRecorderEnabled; passed to checkRuleSemantics as the expected result for each context.
+  return context.hasDevice === true // must be exactly true
+    && context.debug !== true // any value other than true (false, null, undefined) counts as "not set"
+    && context.disableCommandBatching !== true
+    && context.kvLayout !== 'bdpa_paged'; // every other layout value, including null, is accepted
+}
+function batchDecodeSemantic(context) { // Reference predicate for batchDecodeEnabled; passed to checkRuleSemantics as the expected result for each context.
+  return context.batchSize > 1 // a batch size of 1 never enables batch decode
+    && context.useGPU === true // the two positive flags must be exactly true
+    && context.gpuSamplingAvailable === true
+    && context.disableMultiTokenDecode !== true // the four blocking flags only block when exactly true
+    && context.disableCommandBatching !== true
+    && context.isBdpaPagedLayout !== true
+    && context.finitenessFallbackWindowOpen !== true;
+}
+function enumerateDecodeRecorderContexts() { // Builds every combination of the four decode-recorder inputs: 2 x 2 x 2 x 3 = 24 context objects.
+  const values = [true, false];
+  const kvLayouts = ['bdpa_paged', 'paged', null]; // the layout decodeRecorderSemantic rejects, a different layout string, and null
+  const contexts = [];
+  for (const hasDevice of values) {
+    for (const debug of values) {
+      for (const disableCommandBatching of values) {
+        for (const kvLayout of kvLayouts) {
+          contexts.push({
+            hasDevice,
+            debug,
+            disableCommandBatching,
+            kvLayout,
+          });
+        }
+      }
+    }
+  }
+  return contexts; // ordered with hasDevice varying slowest and kvLayout fastest
+}
+function enumerateBatchDecodeContexts() { // Builds every combination of the seven batch-decode inputs: 2 batch sizes x 2^6 flag settings = 128 context objects.
+  const values = [true, false];
+  const batchSizes = [1, 2]; // one value on each side of the `batchSize > 1` test in batchDecodeSemantic
+  const contexts = [];
+  for (const batchSize of batchSizes) {
+    for (const useGPU of values) {
+      for (const gpuSamplingAvailable of values) {
+        for (const disableMultiTokenDecode of values) {
+          for (const disableCommandBatching of values) {
+            for (const isBdpaPagedLayout of values) {
+              for (const finitenessFallbackWindowOpen of values) {
+                contexts.push({
+                  batchSize,
+                  useGPU,
+                  gpuSamplingAvailable,
+                  disableMultiTokenDecode,
+                  disableCommandBatching,
+                  isBdpaPagedLayout,
+                  finitenessFallbackWindowOpen,
+                });
+              }
+            }
+          }
+        }
+      }
+    }
+  }
+  return contexts; // ordered with batchSize varying slowest and finitenessFallbackWindowOpen fastest
+}
+function checkRuleShape(rules, expectedFirstMatch, label) { // Verifies that `rules` is exactly [enabling rule, fallback rule]; returns { ok, errors }. `label` only appears in messages.
+  if (!Array.isArray(rules)) { // non-array input (including undefined): report and stop
+    return {
+      ok: false,
+      errors: [`[ExecutionRulesContract] ${label} must be an array.`],
+    };
+  }
+  if (rules.length !== 2) { // wrong rule count: report and stop without inspecting the rules
+    return {
+      ok: false,
+      errors: [`[ExecutionRulesContract] ${label} must contain exactly 2 rules; got ${rules.length}.`],
+    };
+  }
+  const [firstRule, secondRule] = rules;
+  const errors = []; // both rules are checked, so this can hold up to two messages
+  if (!matchesExactObject(firstRule?.match, expectedFirstMatch) || firstRule?.value !== true) { // first rule: exact expected match object and the value true
+    errors.push(`[ExecutionRulesContract] ${label} first rule drifted from the expected enabling predicate.`);
+  }
+  if (!matchesExactObject(secondRule?.match, {}) || secondRule?.value !== false) { // second rule: empty match object and the value false
+    errors.push(`[ExecutionRulesContract] ${label} fallback rule must be { match: {}, value: false }.`);
+  }
+  return {
+    ok: errors.length === 0,
+    errors,
+  };
+}
+function checkRuleSemantics(rules, contexts, expectedValue, label) { // Compares selectByRules(rules, context) with expectedValue(context) for each context; returns { ok, errors, sampledContexts }.
+  const errors = [];
+  for (const context of contexts) {
+    const actual = selectByRules(rules, context); // result produced by the rule table
+    const expected = expectedValue(context); // result produced by the reference predicate
+    if (actual !== expected) {
+      errors.push(
+        `[ExecutionRulesContract] ${label} mismatched context ${JSON.stringify(context)}: ` +
+        `expected ${JSON.stringify(expected)}, got ${JSON.stringify(actual)}.`
+      );
+      break; // stop at the first mismatch, so at most one error is reported per call
+    }
+  }
+  return {
+    ok: errors.length === 0,
+    errors,
+    sampledContexts: contexts.length, // total number of contexts supplied, even when the loop stopped early
+  };
+}
+export function buildInferenceExecutionRulesContractArtifact(ruleGroup) { // Runs a shape check and a semantic check on each of the two rule lists and returns one report object.
+  const errors = []; // messages from all four checks, in the order the checks run
+  const checks = []; // one { id, ok } entry per check
+  const decodeRules = ruleGroup?.decodeRecorderEnabled; // optional chaining: a null/undefined ruleGroup yields undefined here
+  const batchRules = ruleGroup?.batchDecodeEnabled;
+  const decodeShape = checkRuleShape(
+    decodeRules,
+    { // match object the first decodeRecorderEnabled rule must equal exactly
+      hasDevice: true,
+      debug: false,
+      disableCommandBatching: false,
+      kvLayout: { neq: 'bdpa_paged' },
+    },
+    'decodeRecorderEnabled'
+  );
+  errors.push(...decodeShape.errors);
+  checks.push({
+    id: 'inference.execution.decodeRecorderEnabled.shape',
+    ok: decodeShape.ok,
+  });
+  const decodeSemantics = Array.isArray(decodeRules) // selectByRules is only reached when the rules are an array; otherwise the fixed failure result below is used
+    ? checkRuleSemantics(
+      decodeRules,
+      enumerateDecodeRecorderContexts(),
+      decodeRecorderSemantic,
+      'decodeRecorderEnabled'
+    )
+    : { ok: false, errors: ['[ExecutionRulesContract] decodeRecorderEnabled is unavailable for semantic check.'], sampledContexts: 0 };
+  errors.push(...decodeSemantics.errors);
+  checks.push({
+    id: 'inference.execution.decodeRecorderEnabled.semantics',
+    ok: decodeSemantics.ok,
+  });
+  const batchShape = checkRuleShape(
+    batchRules,
+    { // match object the first batchDecodeEnabled rule must equal exactly
+      batchSize: { gt: 1 },
+      useGPU: true,
+      gpuSamplingAvailable: true,
+      disableMultiTokenDecode: false,
+      disableCommandBatching: false,
+      isBdpaPagedLayout: false,
+      finitenessFallbackWindowOpen: false,
+    },
+    'batchDecodeEnabled'
+  );
+  errors.push(...batchShape.errors);
+  checks.push({
+    id: 'inference.execution.batchDecodeEnabled.shape',
+    ok: batchShape.ok,
+  });
+  const batchSemantics = Array.isArray(batchRules) // same guard as for the decode rules above
+    ? checkRuleSemantics(
+      batchRules,
+      enumerateBatchDecodeContexts(),
+      batchDecodeSemantic,
+      'batchDecodeEnabled'
+    )
+    : { ok: false, errors: ['[ExecutionRulesContract] batchDecodeEnabled is unavailable for semantic check.'], sampledContexts: 0 };
+  errors.push(...batchSemantics.errors);
+  checks.push({
+    id: 'inference.execution.batchDecodeEnabled.semantics',
+    ok: batchSemantics.ok,
+  });
+  return {
+    schemaVersion: 1,
+    source: 'doppler',
+    ok: errors.length === 0, // passes only when none of the four checks added an error
+    checks,
+    errors,
+    stats: {
+      decodeRecorderRules: Array.isArray(decodeRules) ? decodeRules.length : 0, // rule counts fall back to 0 for non-array input
+      batchDecodeRules: Array.isArray(batchRules) ? batchRules.length : 0,
+      decodeRecorderContexts: decodeSemantics.sampledContexts, // 0 when the semantic check was not run
+      batchDecodeContexts: batchSemantics.sampledContexts,
+    },
+  };
+}

package/src/rules/kernels/depthwise-conv2d.rules.json ADDED Viewed

@@ -0,0 +1,6 @@
+{
+  "variant": [
+    { "match": { "isF16": true }, "value": "default_f16" },
+    { "match": {}, "value": "default" }
+  ]
+}

package/src/rules/kernels/grouped-pointwise-conv2d.rules.json ADDED Viewed

@@ -0,0 +1,6 @@
+{
+  "variant": [
+    { "match": { "isF16": true }, "value": "default_f16" },
+    { "match": {}, "value": "default" }
+  ]
+}

package/src/rules/kernels/relu.rules.json ADDED Viewed

@@ -0,0 +1,6 @@
+{
+  "variant": [
+    { "match": { "dtype": "f16" }, "value": "default_f16" },
+    { "match": {}, "value": "default" }
+  ]
+}

package/src/rules/kernels/repeat-channels.rules.json ADDED Viewed

@@ -0,0 +1,6 @@
+{
+  "variant": [
+    { "match": { "dtype": "f16" }, "value": "default_f16" },
+    { "match": {}, "value": "default" }
+  ]
+}

package/src/rules/kernels/sana-linear-attention.rules.json ADDED Viewed

@@ -0,0 +1,6 @@
+{
+  "variant": [
+    { "match": { "isF16": true }, "value": "default_f16" },
+    { "match": {}, "value": "default" }
+  ]
+}

package/src/rules/layer-pattern-contract-check.d.ts ADDED Viewed

@@ -0,0 +1,17 @@
+export interface LayerPatternContractArtifact { // Report object returned by buildLayerPatternContractArtifact (declared below).
+  schemaVersion: 1; // literal type: always the number 1
+  source: 'doppler'; // literal type: always the string 'doppler'
+  ok: boolean; // NOTE(review): presumably true when errors is empty; the implementation is not shown here, confirm
+  checks: Array<{ id: string; ok: boolean }>; // list of { id, ok } entries, one per check
+  errors: string[];
+  stats: { // NOTE(review): exact counter semantics live in layer-pattern-contract-check.js, which is not shown here, confirm
+    patternKindRules: number;
+    layerTypeRules: number;
+    patternKindContexts: number;
+    layerTypeContexts: number;
+  };
+}
+export declare function buildLayerPatternContractArtifact( // Builds the layer-pattern contract report for one rule group.
+  ruleGroup: Record<string, unknown> | null | undefined // the signature accepts null and undefined as well as a keyed object
+): LayerPatternContractArtifact;