npm - @open-mercato/ai-assistant - Versions diffs - 0.6.1-develop.3246.1.dbef9d7392 → 0.6.1-develop.3256.1.fe3dec2464 - Mend

@open-mercato/ai-assistant 0.6.1-develop.3246.1.dbef9d7392 → 0.6.1-develop.3256.1.fe3dec2464

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (133) hide show

package/src/modules/ai_assistant/lib/model-factory.ts CHANGED Viewed

@@ -10,13 +10,16 @@
  *
  *   1. `callerOverride` (non-empty string) — highest precedence, e.g. the
  *      `modelOverride` field on `runAiAgentText`/`runAiAgentObject`.
+ *      Accepts a slash-qualified `<provider>/<model>` shorthand (Phase 1).
  *   2. Env variable `OM_AI_<MODULE>_MODEL` (uppercased `moduleId`) when
  *      `moduleId` is provided. Example:
  *      `OM_AI_INBOX_OPS_MODEL=claude-haiku-4-5`,
  *      `OM_AI_CATALOG_MODEL=gpt-4o-mini`. The legacy
  *      `<MODULE>_AI_MODEL` form (e.g. `INBOX_OPS_AI_MODEL`) is read as a
  *      backward-compatibility fallback when the canonical name is unset.
+ *      Accepts a slash-qualified shorthand (Phase 1).
  *   3. `agentDefaultModel` — typically `AiAgentDefinition.defaultModel`.
+ *      Accepts a slash-qualified `<provider>/<model>` shorthand (Phase 1).
  *   4. Global env `OM_AI_MODEL` (canonical) with `OPENCODE_MODEL` kept as
  *      a backward-compatibility fallback. Accepts either a plain model id
  *      (`gpt-5-mini`) or a slash-qualified id (`openai/gpt-5-mini`).
@@ -26,15 +29,23 @@
  *   5. The configured provider's own default model id
  *      (`provider.defaultModel`).
  *
- * Resolution walks the `llmProviderRegistry`'s `resolveFirstConfigured()`
- * output. The walk's `order` argument is seeded from (in priority order):
+ * Every model-axis source is parsed through {@link parseSlashShorthand}.
+ * Resolution walks the chain top-down and takes the first non-null hint as
+ * the registry-walk seed:
  *
- *   1. The slash-qualified provider hint extracted from `OM_AI_MODEL` —
- *      consumes the provider axis for this resolution.
- *   2. `OM_AI_PROVIDER` (canonical) with `OPENCODE_PROVIDER` as a
- *      backward-compatibility fallback — names a registered provider id;
- *      falls through transparently when the named provider is
- *      registered-but-unconfigured.
+ *   Provider-axis seed order (highest priority first):
+ *   1. Slash-prefix from `callerOverride` (Phase 1).
+ *   2. `providerOverride` — request-time provider override (Phase 1).
+ *   3. Slash-prefix from `OM_AI_<MODULE>_MODEL` (legacy `<MODULE>_AI_MODEL`) (Phase 1).
+ *   4. `OM_AI_<MODULE>_PROVIDER` env (legacy `<MODULE>_AI_PROVIDER`) (Phase 1).
+ *   5. Slash-prefix from `agentDefaultModel` (Phase 1).
+ *   6. `agentDefaultProvider` — `AiAgentDefinition.defaultProvider` (Phase 1).
+ *   7. Slash-prefix from `OM_AI_MODEL` (legacy `OPENCODE_MODEL`) (Phase 0).
+ *   8. `OM_AI_PROVIDER` (legacy `OPENCODE_PROVIDER`) (Phase 0).
+ *
+ * The `OM_AI_*` env knobs are canonical; the legacy `OPENCODE_PROVIDER` /
+ * `OPENCODE_MODEL` envs stay bound to the OpenCode Code Mode stack and are
+ * also honored as backward-compatibility fallbacks here.
  *
  * The factory throws {@link AiModelFactoryError} when no provider is
  * configured — every current call site already expects the throw (see the
@@ -49,7 +60,15 @@
 import type { AwilixContainer } from 'awilix'
 import type { EnvLookup, LlmProvider } from '@open-mercato/shared/lib/ai/llm-provider'
 import { llmProviderRegistry } from '@open-mercato/shared/lib/ai/llm-provider-registry'
-import { resolveAiProviderIdFromEnv } from '@open-mercato/shared/lib/ai/opencode-provider'
+import {
+  intersectAllowlists,
+  canonicalProviderId,
+  isModelAllowedForProviderInEffective,
+  isProviderAllowedInEffective,
+  providerIdAliases,
+  type EffectiveAllowlist,
+  type TenantAllowlistSnapshot,
+} from './model-allowlist'
 /**
  * Minimal AI SDK LanguageModel shape — the factory exposes the protocol-
@@ -72,13 +91,26 @@ export interface AiModelFactoryInput {
    * the legacy `<MODULE>_AI_MODEL` form honored as a backward-compatibility
    * fallback. Example: `moduleId: 'inbox_ops'` → canonical env var
    * `OM_AI_INBOX_OPS_MODEL` (legacy `INBOX_OPS_AI_MODEL`).
+   *
+   * Also enables the `OM_AI_<MODULE>_PROVIDER` env axis (legacy
+   * `<MODULE>_AI_PROVIDER` honored as a backward-compatibility fallback).
    */
   moduleId?: string
   /**
    * Agent-level default, typically `AiAgentDefinition.defaultModel`. Used
    * when neither `callerOverride` nor the module env override is present.
+   * Accepts a slash-qualified `<provider>/<model>` shorthand (Phase 1).
    */
   agentDefaultModel?: string
+  /**
+   * Agent-level default provider, typically `AiAgentDefinition.defaultProvider`.
+   * Named provider id; falls through transparently when the named provider is
+   * registered-but-unconfigured. Sits between `OM_AI_<MODULE>_PROVIDER`
+   * and the global `OM_AI_PROVIDER` in the provider-axis seed list above.
+   *
+   * Phase 1 of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  agentDefaultProvider?: string
   /**
    * Per-call override (e.g. `runAiAgentText({ modelOverride })`). Wins over
    * every other source when it is a non-empty trimmed string. Empty strings
@@ -86,6 +118,84 @@ export interface AiModelFactoryInput {
    * callers MUST NOT need a separate "clear override" API.
    */
   callerOverride?: string
+  /**
+   * Request-time provider override — wins for the provider axis at the same
+   * priority as `callerOverride` for the model axis. A non-empty string
+   * that does not match any registered provider id is silently ignored and
+   * the factory falls through to the next provider source.
+   *
+   * Phase 1 of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  providerOverride?: string
+  /**
+   * Agent-level default base URL, typically `AiAgentDefinition.defaultBaseUrl`.
+   * Sits between the `<MODULE>_AI_BASE_URL` env var and the preset's own
+   * `baseURLEnvKeys` in the resolution chain.
+   *
+   * Phase 2 of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  agentDefaultBaseUrl?: string
+  /**
+   * Per-call base URL override that wins over every other source. Intended
+   * for programmatic callers only — the HTTP query-param baseUrl and the
+   * AI_RUNTIME_BASEURL_ALLOWLIST arrive in Phase 4a.
+   *
+   * Phase 2 of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  baseUrlOverride?: string
+  /**
+   * Per-tenant default loaded from `ai_agent_runtime_overrides` by the agent
+   * runtime (best-effort, fail-open). Sits at step 3 of the resolution chain
+   * between the caller/request override (step 1–2) and the module-env axis
+   * (step 4).
+   *
+   * Honored ONLY when `allowRuntimeModelOverride !== false` on the agent
+   * definition. The agent runtime is responsible for hydration — the factory
+   * does NOT load the row itself.
+   *
+   * Phase 4a of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  tenantOverride?: {
+    providerId?: string | null
+    modelId?: string | null
+    baseURL?: string | null
+  }
+  /**
+   * Per-request override forwarded from the HTTP dispatcher query params
+   * (`?provider=`, `?model=`, `?baseUrl=`). Sits at step 1 of the resolution
+   * chain — wins over everything else for that turn.
+   *
+   * Honored ONLY when `allowRuntimeModelOverride !== false` on the agent.
+   * The dispatcher validates all three values before setting this input.
+   *
+   * Phase 4a of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  requestOverride?: {
+    providerId?: string | null
+    modelId?: string | null
+    baseURL?: string | null
+  }
+  /**
+   * When false, steps 1 (requestOverride) and 3 (tenantOverride) of the
+   * resolution chain are skipped. Agents that pin a specific model for
+   * correctness reasons set `AiAgentDefinition.allowRuntimeModelOverride =
+   * false`. Default behavior (omitted) is permissive (= true).
+   *
+   * Phase 4a of spec `2026-04-27-ai-agents-provider-model-baseurl-overrides`.
+   */
+  allowRuntimeModelOverride?: boolean
+  /**
+   * Optional tenant allowlist snapshot (Phase 1780-6). When supplied, the
+   * factory clips the resolved (provider, model) to the intersection of the
+   * env allowlist (`OM_AI_AVAILABLE_*`) and this tenant allowlist. Pass `null`
+   * or omit to fall back to env-only enforcement.
+   *
+   * The settings PUT route validates writes against the env allowlist before
+   * persisting, so the snapshot here is trusted to be a subset of env. The
+   * factory still defends against drift (env tightened after write) by
+   * intersecting at resolution time.
+   */
+  tenantAllowlist?: TenantAllowlistSnapshot | null
 }
 /**
@@ -111,11 +221,32 @@ export interface AiModelResolution {
    *   `OPENCODE_MODEL` fallback supplied the model id.
    */
   source:
+    | 'request_override'
     | 'caller_override'
+    | 'tenant_override'
     | 'module_env'
     | 'agent_default'
     | 'env_default'
     | 'provider_default'
+    | 'allowlist_fallback'
+  /**
+   * Resolved base URL passed to the adapter (if any). Undefined when the
+   * adapter will use its built-in default. Included for observability and
+   * test assertions; never exposed over HTTP (Phase 4a adds the allowlist).
+   */
+  baseURL?: string
+  /**
+   * Populated when the env-driven OM_AI_AVAILABLE_PROVIDERS /
+   * OM_AI_AVAILABLE_MODELS_<PROVIDER> allowlist rejected the originally
+   * resolved (provider, model) and the factory fell back to a safe pair.
+   * Includes the rejected ids and a human-readable reason so the UI / logs
+   * can surface why the runtime did not honor the requested combination.
+   */
+  allowlistFallback?: {
+    originalProviderId: string
+    originalModelId: string
+    reason: string
+  }
 }
 /**
@@ -167,6 +298,14 @@ export interface AiModelFactoryRegistry {
    * behavior).
    */
   get?(id: string): LlmProvider | null
+  /**
+   * Optional registry enumeration used by the Phase 1780-6 allowlist
+   * intersection so the env model lists are pre-loaded for every provider
+   * (and not just the resolved one). Test doubles MAY omit this — the
+   * factory still defends correctly by also seeding the resolved provider's
+   * id directly into `intersectAllowlists(...)`.
+   */
+  list?(): readonly LlmProvider[]
 }
 /**
@@ -180,7 +319,7 @@ export interface CreateModelFactoryDependencies {
    * `order` argument to prefer the operator-selected provider.
    */
   registry?: AiModelFactoryRegistry
-  /** Env lookup for `<MODULE>_AI_MODEL` + provider credentials. */
+  /** Env lookup for `OM_AI_<MODULE>_MODEL` + provider credentials. */
   env?: EnvLookup
 }
@@ -196,15 +335,19 @@ function normalizeOverride(value: string | undefined): string | null {
  * `OPENCODE_PROVIDER` resolves to a known provider — in that case the
  * registry falls back to its default registration walk.
  */
-function readProviderOrderFromEnv(env: EnvLookup): readonly string[] | undefined {
-  const raw = normalizeOverride(env.OM_AI_PROVIDER) ?? normalizeOverride(env.OPENCODE_PROVIDER)
-  if (!raw) return undefined
-  // Reuse the shared resolver so unknown ids fall back through both keys.
-  // When the raw value is unknown the resolver returns the default; passing
-  // that through as an explicit hint is still safe because the registry
-  // only honors registered + configured providers.
-  const resolved = resolveAiProviderIdFromEnv(env)
-  return [resolved]
+function readGlobalProviderFromEnv(
+  env: EnvLookup,
+  registry: Pick<AiModelFactoryRegistry, 'get'>,
+): string | null {
+  const candidates = [normalizeOverride(env.OM_AI_PROVIDER), normalizeOverride(env.OPENCODE_PROVIDER)]
+  for (const candidate of candidates) {
+    if (!candidate) continue
+    if (!registry.get) return providerIdAliases(candidate)[0] ?? candidate
+    for (const alias of providerIdAliases(candidate)) {
+      if (registry.get(alias)) return alias
+    }
+  }
+  return null
 }
 /**
@@ -216,7 +359,7 @@ function readGlobalModelFromEnv(env: EnvLookup): string | null {
 }
 /** Canonical per-module model env. Example: `OM_AI_INBOX_OPS_MODEL`. */
-function moduleEnvVarName(moduleId: string): string {
+function moduleModelEnvVarName(moduleId: string): string {
   return `OM_AI_${moduleId.toUpperCase()}_MODEL`
 }
@@ -224,17 +367,53 @@ function moduleEnvVarName(moduleId: string): string {
  * Legacy per-module model env (pre-OM_AI_* rename). Example:
  * `INBOX_OPS_AI_MODEL`. Read as a backward-compatibility fallback only.
  */
-function legacyModuleEnvVarName(moduleId: string): string {
+function legacyModuleModelEnvVarName(moduleId: string): string {
   return `${moduleId.toUpperCase()}_AI_MODEL`
 }
-function readModuleEnvOverride(env: EnvLookup, moduleId: string): string | null {
+function readModuleModelEnvOverride(env: EnvLookup, moduleId: string): string | null {
+  return (
+    normalizeOverride(env[moduleModelEnvVarName(moduleId)]) ??
+    normalizeOverride(env[legacyModuleModelEnvVarName(moduleId)])
+  )
+}
+/** Canonical per-module provider env. Example: `OM_AI_INBOX_OPS_PROVIDER`. */
+function moduleProviderEnvVarName(moduleId: string): string {
+  return `OM_AI_${moduleId.toUpperCase()}_PROVIDER`
+}
+/**
+ * Legacy per-module provider env (pre-OM_AI_* rename). Example:
+ * `INBOX_OPS_AI_PROVIDER`. Read as a backward-compatibility fallback only.
+ */
+function legacyModuleProviderEnvVarName(moduleId: string): string {
+  return `${moduleId.toUpperCase()}_AI_PROVIDER`
+}
+function readModuleProviderEnvOverride(env: EnvLookup, moduleId: string): string | null {
   return (
-    normalizeOverride(env[moduleEnvVarName(moduleId)]) ??
-    normalizeOverride(env[legacyModuleEnvVarName(moduleId)])
+    normalizeOverride(env[moduleProviderEnvVarName(moduleId)]) ??
+    normalizeOverride(env[legacyModuleProviderEnvVarName(moduleId)])
   )
 }
+function normalizeProviderHint(
+  providerId: string | null,
+  registry: AiModelFactoryRegistry,
+): string | null {
+  if (!providerId) return null
+  const knownProviderIds = registry.list?.().map((provider) => provider.id) ?? []
+  if (knownProviderIds.length > 0) {
+    return canonicalProviderId(providerId, knownProviderIds)
+  }
+  return providerIdAliases(providerId)[0] ?? providerId
+}
+function moduleBaseUrlEnvVarName(moduleId: string): string {
+  return `${moduleId.toUpperCase()}_AI_BASE_URL`
+}
 /**
  * Splits a slash-qualified model token (e.g. `openai/gpt-5-mini`) into
  * `{ providerHint, modelId }` when the prefix matches a registered provider
@@ -280,20 +459,84 @@ export function createModelFactory(
   return {
     resolveModel(input: AiModelFactoryInput): AiModelResolution {
+      const hasModule = typeof input.moduleId === 'string' && input.moduleId.length > 0
+      // When allowRuntimeModelOverride is explicitly false, skip steps 1
+      // (requestOverride) and 3 (tenantOverride) — the agent pins a model.
+      const runtimeOverridesAllowed = input.allowRuntimeModelOverride !== false
+      // --- Step 1: requestOverride (HTTP query params) — gated by flag ---
+      const requestModelRaw = runtimeOverridesAllowed
+        ? normalizeOverride(input.requestOverride?.modelId ?? undefined)
+        : null
+      const requestProviderRaw = runtimeOverridesAllowed
+        ? normalizeOverride(input.requestOverride?.providerId ?? undefined)
+        : null
+      const requestBaseUrlRaw = runtimeOverridesAllowed
+        ? normalizeOverride(input.requestOverride?.baseURL ?? undefined)
+        : null
+      // --- Step 2: callerOverride (programmatic) ---
+      const callerRaw = normalizeOverride(input.callerOverride)
+      // --- Step 3: tenantOverride (DB row) — gated by flag ---
+      const tenantModelRaw = runtimeOverridesAllowed
+        ? normalizeOverride(input.tenantOverride?.modelId ?? undefined)
+        : null
+      const tenantProviderRaw = runtimeOverridesAllowed
+        ? normalizeOverride(input.tenantOverride?.providerId ?? undefined)
+        : null
+      const tenantBaseUrlRaw = runtimeOverridesAllowed
+        ? normalizeOverride(input.tenantOverride?.baseURL ?? undefined)
+        : null
+      // --- Steps 4+: env / agent / global ---
+      const moduleModelRaw = hasModule
+        ? readModuleModelEnvOverride(env, input.moduleId!)
+        : null
+      const agentModelRaw = normalizeOverride(input.agentDefaultModel)
       // OM_AI_MODEL is canonical; the legacy OPENCODE_MODEL is read as a
       // backward-compatibility fallback through readGlobalModelFromEnv.
-      const globalModelEnv = readGlobalModelFromEnv(env)
-      // Slash-qualified env-model values consume the provider axis at the
-      // env-default step. Phase 1 of the per-axis-overrides spec generalizes
-      // the parser to every model-axis source.
-      const globalModelParsed = globalModelEnv
-        ? parseSlashShorthand(globalModelEnv, registry)
+      const globalModelRaw = readGlobalModelFromEnv(env)
+      // Parse slash shorthand on every model-axis source.
+      const requestModelParsed = requestModelRaw ? parseSlashShorthand(requestModelRaw, registry) : null
+      const callerParsed = callerRaw ? parseSlashShorthand(callerRaw, registry) : null
+      const tenantModelParsed = tenantModelRaw ? parseSlashShorthand(tenantModelRaw, registry) : null
+      const moduleModelParsed = moduleModelRaw ? parseSlashShorthand(moduleModelRaw, registry) : null
+      const agentModelParsed = agentModelRaw ? parseSlashShorthand(agentModelRaw, registry) : null
+      const globalModelParsed = globalModelRaw ? parseSlashShorthand(globalModelRaw, registry) : null
+      // --- Provider-axis: walk from highest to lowest priority for the seed.
+      // A slash-qualified hint from a model source wins over a plain provider
+      // source at the same priority step. We walk top-down and take the first
+      // non-null hint.
+      const providerOverrideRaw = normalizeOverride(input.providerOverride)
+      const moduleProviderRaw = hasModule
+        ? readModuleProviderEnvOverride(env, input.moduleId!)
         : null
-      const slashProviderHint = globalModelParsed?.providerHint ?? null
-      const providerOrderFromEnv = readProviderOrderFromEnv(env)
-      const order = slashProviderHint
-        ? [slashProviderHint, ...(providerOrderFromEnv ?? [])]
-        : providerOrderFromEnv
+      const agentDefaultProviderRaw = normalizeOverride(input.agentDefaultProvider)
+      // OM_AI_PROVIDER is canonical; the legacy OPENCODE_PROVIDER is read as
+      // a backward-compatibility fallback through readGlobalProviderFromEnv.
+      const globalProviderRaw = readGlobalProviderFromEnv(env, registry)
+      // Walk the provider-axis seed list: slash hint beats plain provider at
+      // the same step. We keep only the first (highest-priority) non-null hint.
+      const providerHintCandidates: Array<string | null> = [
+        requestModelParsed?.providerHint ?? null,
+        normalizeProviderHint(requestProviderRaw, registry),
+        callerParsed?.providerHint ?? null,
+        normalizeProviderHint(providerOverrideRaw, registry),
+        tenantModelParsed?.providerHint ?? null,
+        normalizeProviderHint(tenantProviderRaw, registry),
+        moduleModelParsed?.providerHint ?? null,
+        normalizeProviderHint(moduleProviderRaw, registry),
+        agentModelParsed?.providerHint ?? null,
+        normalizeProviderHint(agentDefaultProviderRaw, registry),
+        globalModelParsed?.providerHint ?? null,
+        globalProviderRaw,
+      ]
+      const orderHint = providerHintCandidates.find((hint) => hint !== null) ?? null
+      const order = orderHint ? [orderHint] : undefined
       const provider = registry.resolveFirstConfigured({ env, order })
       if (!provider) {
@@ -310,43 +553,228 @@ export function createModelFactory(
         )
       }
-      const callerOverride = normalizeOverride(input.callerOverride)
-      const moduleEnvOverride =
-        input.moduleId && input.moduleId.length > 0
-          ? readModuleEnvOverride(env, input.moduleId)
-          : null
-      const agentDefault = normalizeOverride(input.agentDefaultModel)
-      // The slash parser already split the global model token; use the
-      // post-parse model id so `OM_AI_MODEL=openai/gpt-5-mini` resolves
-      // model `gpt-5-mini` against provider `openai`.
-      const envDefaultModel = globalModelParsed?.modelId ?? globalModelEnv
+      // --- Model-axis: use the post-parse model id from the winning source.
       let modelId: string
       let source: AiModelResolution['source']
-      if (callerOverride) {
-        modelId = callerOverride
+      if (requestModelParsed) {
+        modelId = requestModelParsed.modelId
+        source = 'request_override'
+      } else if (callerParsed) {
+        modelId = callerParsed.modelId
         source = 'caller_override'
-      } else if (moduleEnvOverride) {
-        modelId = moduleEnvOverride
+      } else if (tenantModelParsed) {
+        modelId = tenantModelParsed.modelId
+        source = 'tenant_override'
+      } else if (moduleModelParsed) {
+        modelId = moduleModelParsed.modelId
         source = 'module_env'
-      } else if (agentDefault) {
-        modelId = agentDefault
+      } else if (agentModelParsed) {
+        modelId = agentModelParsed.modelId
         source = 'agent_default'
-      } else if (envDefaultModel) {
-        modelId = envDefaultModel
+      } else if (globalModelParsed) {
+        modelId = globalModelParsed.modelId
         source = 'env_default'
       } else {
         modelId = provider.defaultModel
         source = 'provider_default'
       }
-      const model = provider.createModel({ modelId, apiKey })
+      // --- BaseURL-axis resolution (highest to lowest priority) ---
+      // 1. requestOverride.baseURL (HTTP dispatcher) — gated by allowRuntimeModelOverride
+      // 2. baseUrlOverride (programmatic caller)
+      // 3. tenantOverride.baseURL (DB row) — gated by allowRuntimeModelOverride
+      // 4. <MODULE>_AI_BASE_URL env
+      // 5. agentDefaultBaseUrl
+      // Steps 6-7 (preset env + preset default) are handled inside the adapter's
+      // createModel when no explicit baseURL is passed.
+      const resolvedBaseURL = requestBaseUrlRaw
+        ?? normalizeOverride(input.baseUrlOverride)
+        ?? tenantBaseUrlRaw
+        ?? (hasModule ? normalizeOverride(env[moduleBaseUrlEnvVarName(input.moduleId!)]) : null)
+        ?? normalizeOverride(input.agentDefaultBaseUrl)
+        ?? undefined
+      // --- Allowlist enforcement (Phase 1780-5 + 1780-6) -------------------
+      // OM_AI_AVAILABLE_PROVIDERS / OM_AI_AVAILABLE_MODELS_<PROVIDER> clip
+      // the resolution to an operator-approved set. The optional tenant
+      // allowlist snapshot narrows the env outer constraint further. If the
+      // resolved pair isn't allowed, fall back to a safe (provider, model)
+      // — never throw, so a stale tenant override or chat picker can't take
+      // the runtime down. The fallback is logged so the operator can see
+      // what happened.
+      const registryProviderIds = registry.list?.()?.map((p) => p.id) ?? []
+      const tenantProviderIds = input.tenantAllowlist
+        ? Object.keys(input.tenantAllowlist.allowedModelsByProvider ?? {})
+        : []
+      const knownProviderIds = Array.from(
+        new Set([provider.id, ...registryProviderIds, ...tenantProviderIds]),
+      )
+      const effectiveAllowlist = intersectAllowlists(
+        env,
+        knownProviderIds,
+        input.tenantAllowlist ?? null,
+      )
+      const allowlistResult = enforceAllowlist({
+        env,
+        registry,
+        resolved: { provider, modelId },
+        agentDefaultProvider: agentDefaultProviderRaw,
+        agentDefaultModel: agentModelParsed?.modelId ?? agentModelRaw,
+        effective: effectiveAllowlist,
+      })
+      const finalProvider = allowlistResult.provider
+      const finalModelId = allowlistResult.modelId
+      const finalSource = allowlistResult.fallback ? 'allowlist_fallback' : source
+      const finalApiKey = allowlistResult.fallback
+        ? finalProvider.resolveApiKey(env)
+        : apiKey
+      if (!finalApiKey) {
+        throw new AiModelFactoryError(
+          'api_key_missing',
+          `LLM provider "${finalProvider.id}" is advertised as configured but resolveApiKey() returned empty.`,
+        )
+      }
+      const model = finalProvider.createModel({
+        modelId: finalModelId,
+        apiKey: finalApiKey,
+        baseURL: resolvedBaseURL,
+      })
       return {
         model,
-        modelId,
-        providerId: provider.id,
-        source,
+        modelId: finalModelId,
+        providerId: finalProvider.id,
+        source: finalSource,
+        ...(resolvedBaseURL !== undefined ? { baseURL: resolvedBaseURL } : {}),
+        ...(allowlistResult.fallback
+          ? {
+              allowlistFallback: {
+                originalProviderId: provider.id,
+                originalModelId: modelId,
+                reason: allowlistResult.fallback,
+              },
+            }
+          : {}),
       }
     },
   }
 }
+interface EnforceAllowlistInput {
+  env: EnvLookup
+  registry: AiModelFactoryRegistry
+  resolved: { provider: LlmProvider; modelId: string }
+  agentDefaultProvider: string | null
+  agentDefaultModel: string | null
+  effective: EffectiveAllowlist
+}
+interface EnforceAllowlistResult {
+  provider: LlmProvider
+  modelId: string
+  /** Populated only when the resolved pair was rejected. */
+  fallback: string | null
+}
+/**
+ * Clips a resolved `(provider, model)` to what the effective allowlist
+ * permits (env intersected with optional tenant allowlist).
+ *
+ * Order of fallback when the resolved provider is not allowed:
+ *  1. The agent's `defaultProvider` (if allowed and configured).
+ *  2. The first allowed provider that is also configured in the registry.
+ *
+ * Order of fallback when the model is not allowed for the resolved provider:
+ *  1. The agent's `defaultModel` (if allowed for that provider).
+ *  2. The provider's `defaultModel` (if allowed).
+ *  3. The first model from the effective allowlist for that provider.
+ *
+ * Both fall-back paths emit a `console.warn` so the operator can see why the
+ * runtime did not honor the requested combination. The function never throws.
+ */
+function enforceAllowlist(input: EnforceAllowlistInput): EnforceAllowlistResult {
+  const { registry, resolved, agentDefaultProvider, agentDefaultModel, effective } = input
+  let provider = resolved.provider
+  let modelId = resolved.modelId
+  let fallback: string | null = null
+  if (effective.providers !== null && !isProviderAllowedInEffective(effective, provider.id)) {
+    const replacement = pickAllowedProvider({
+      registry,
+      agentDefaultProvider,
+      effective,
+    })
+    if (replacement) {
+      const source = effective.tenantOverridesActive
+        ? 'the effective allowlist (env ∩ tenant)'
+        : 'OM_AI_AVAILABLE_PROVIDERS'
+      fallback = `Provider "${provider.id}" is not in ${source}; using "${replacement.id}" instead.`
+      console.warn(`[AI Model Factory] ${fallback}`)
+      provider = replacement
+      modelId = pickAllowedModel({
+        provider,
+        preferred: agentDefaultModel,
+        effective,
+      })
+    }
+    // If no replacement is configured we keep the resolved provider — the
+    // throw at the api-key gate will surface the misconfiguration to the
+    // operator instead of silently masking it.
+  }
+  if (!isModelAllowedForProviderInEffective(effective, provider.id, modelId)) {
+    const replacementModel = pickAllowedModel({
+      provider,
+      preferred: agentDefaultModel,
+      effective,
+    })
+    if (replacementModel !== modelId) {
+      const source = effective.tenantOverridesActive
+        ? `the effective allowlist (env ∩ tenant) for "${provider.id}"`
+        : `OM_AI_AVAILABLE_MODELS_${provider.id.toUpperCase()}`
+      const reason = `Model "${modelId}" is not in ${source}; using "${replacementModel}" instead.`
+      console.warn(`[AI Model Factory] ${reason}`)
+      fallback = fallback ? `${fallback} ${reason}` : reason
+      modelId = replacementModel
+    }
+  }
+  return { provider, modelId, fallback }
+}
+function pickAllowedProvider(input: {
+  registry: AiModelFactoryRegistry
+  agentDefaultProvider: string | null
+  effective: EffectiveAllowlist
+}): LlmProvider | null {
+  const { registry, agentDefaultProvider, effective } = input
+  if (agentDefaultProvider) {
+    if (isProviderAllowedInEffective(effective, agentDefaultProvider)) {
+      const provider = registry.get?.(agentDefaultProvider)
+      if (provider && provider.isConfigured(process.env as EnvLookup)) return provider
+    }
+  }
+  const allowed = effective.providers
+  if (!allowed) return null
+  for (const id of allowed) {
+    const provider = registry.get?.(id)
+    if (provider && provider.isConfigured(process.env as EnvLookup)) return provider
+  }
+  return null
+}
+function pickAllowedModel(input: {
+  provider: LlmProvider
+  preferred: string | null
+  effective: EffectiveAllowlist
+}): string {
+  const { provider, preferred, effective } = input
+  const allowed = effective.modelsByProvider[provider.id]
+  if (allowed === undefined) {
+    return preferred && preferred.length > 0 ? preferred : provider.defaultModel
+  }
+  if (preferred && allowed.includes(preferred)) return preferred
+  if (allowed.includes(provider.defaultModel)) return provider.defaultModel
+  return allowed[0] ?? provider.defaultModel
+}