npm - @lota-sdk/core - Versions diffs - 0.4.10 → 0.4.11 - Mend

@lota-sdk/core 0.4.10 → 0.4.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (108)

package/package.json +2 -2
package/src/ai-gateway/ai-gateway.ts +149 -95
package/src/ai-gateway/index.ts +16 -1
package/src/config/agent-defaults.ts +4 -120
package/src/config/logger.ts +18 -34
package/src/config/thread-defaults.ts +1 -18
package/src/create-runtime.ts +90 -28
package/src/db/base.service.ts +30 -38
package/src/db/service.ts +489 -545
package/src/effect/index.ts +0 -2
package/src/effect/layers.ts +6 -13
package/src/embeddings/provider.ts +2 -7
package/src/index.ts +4 -5
package/src/queues/autonomous-job.queue.ts +159 -113
package/src/queues/context-compaction.queue.ts +39 -25
package/src/queues/delayed-node-promotion.queue.ts +56 -29
package/src/queues/document-processor.queue.ts +5 -3
package/src/queues/index.ts +1 -0
package/src/queues/memory-consolidation.queue.ts +79 -53
package/src/queues/organization-learning.queue.ts +63 -39
package/src/queues/plan-agent-heartbeat.queue.ts +104 -79
package/src/queues/plan-scheduler.queue.ts +100 -84
package/src/queues/post-chat-memory.queue.ts +55 -33
package/src/queues/queue-factory.ts +40 -41
package/src/queues/queues.service.ts +61 -0
package/src/queues/title-generation.queue.ts +42 -31
package/src/redis/org-memory-lock.ts +24 -9
package/src/redis/redis-lease-lock.ts +8 -1
package/src/runtime/agent-identity-overrides.ts +7 -3
package/src/runtime/agent-runtime-policy.ts +9 -4
package/src/runtime/agent-stream-helpers.ts +9 -4
package/src/runtime/context-compaction/context-compaction-runtime.ts +28 -32
package/src/runtime/context-compaction/context-compaction.ts +9 -7
package/src/runtime/domain-layer.ts +15 -4
package/src/runtime/execution-plan-visibility.ts +5 -2
package/src/runtime/graph-designer.ts +0 -22
package/src/runtime/index.ts +1 -0
package/src/runtime/indexed-repositories-policy.ts +2 -6
package/src/runtime/plugin-resolution.ts +29 -12
package/src/runtime/post-turn-side-effects.ts +139 -141
package/src/runtime/runtime-config.ts +0 -6
package/src/runtime/runtime-extensions.ts +0 -54
package/src/runtime/runtime-lifecycle.ts +4 -4
package/src/runtime/runtime-services.ts +122 -53
package/src/runtime/runtime-worker-registry.ts +113 -30
package/src/runtime/social-chat/social-chat-agent-runner.ts +6 -3
package/src/runtime/social-chat/social-chat-history.ts +3 -1
package/src/runtime/social-chat/social-chat.ts +35 -20
package/src/runtime/team-consultation/team-consultation-orchestrator.ts +6 -5
package/src/runtime/team-consultation/team-consultation-prompts.ts +11 -6
package/src/runtime/thread-chat-helpers.ts +18 -9
package/src/runtime/thread-turn-context.ts +7 -47
package/src/runtime/turn-lifecycle.ts +6 -14
package/src/services/agent-activity.service.ts +168 -175
package/src/services/agent-executor.service.ts +35 -16
package/src/services/attachment.service.ts +4 -70
package/src/services/autonomous-job.service.ts +53 -61
package/src/services/context-compaction.service.ts +7 -9
package/src/services/execution-plan/execution-plan-graph.ts +106 -115
package/src/services/execution-plan/execution-plan-schedule.ts +1 -15
package/src/services/execution-plan/execution-plan.service.ts +67 -50
package/src/services/global-orchestrator.service.ts +18 -7
package/src/services/graph-full-routing.ts +7 -6
package/src/services/memory/memory-conversation.ts +10 -5
package/src/services/memory/memory.service.ts +11 -8
package/src/services/ownership-dispatcher.service.ts +16 -5
package/src/services/plan/plan-agent-heartbeat.service.ts +29 -15
package/src/services/plan/plan-agent-query.service.ts +12 -8
package/src/services/plan/plan-completion-side-effects.ts +93 -101
package/src/services/plan/plan-cycle.service.ts +7 -45
package/src/services/plan/plan-deadline.service.ts +28 -17
package/src/services/plan/plan-event-delivery.service.ts +47 -40
package/src/services/plan/plan-executor-context.ts +2 -0
package/src/services/plan/plan-executor-graph.ts +366 -391
package/src/services/plan/plan-executor.service.ts +13 -91
package/src/services/plan/plan-scheduler.service.ts +62 -49
package/src/services/plan/plan-transaction-events.ts +1 -1
package/src/services/recent-activity-title.service.ts +6 -2
package/src/services/thread/thread-bootstrap.ts +11 -9
package/src/services/thread/thread-message.service.ts +6 -5
package/src/services/thread/thread-turn-execution.ts +86 -82
package/src/services/thread/thread-turn-preparation.service.ts +47 -24
package/src/services/thread/thread-turn-streaming.ts +20 -25
package/src/services/thread/thread-turn.ts +25 -44
package/src/services/thread/thread.service.ts +21 -6
package/src/system-agents/recent-activity-title-refiner.agent.ts +8 -5
package/src/system-agents/thread-router.agent.ts +23 -20
package/src/tools/execution-plan.tool.ts +8 -3
package/src/tools/fetch-webpage.tool.ts +10 -9
package/src/tools/firecrawl-client.ts +0 -15
package/src/tools/remember-memory.tool.ts +3 -6
package/src/tools/research-topic.tool.ts +12 -3
package/src/tools/search-web.tool.ts +10 -9
package/src/tools/search.tool.ts +4 -5
package/src/tools/team-think.tool.ts +139 -121
package/src/workers/bootstrap.ts +9 -10
package/src/workers/memory-consolidation.worker.ts +4 -1
package/src/workers/organization-learning.worker.ts +15 -2
package/src/workers/regular-chat-memory-digest.helpers.ts +3 -4
package/src/workers/regular-chat-memory-digest.runner.ts +21 -14
package/src/workers/skill-extraction.runner.ts +13 -15
package/src/workers/worker-utils.ts +6 -18
package/src/effect/awaitable-effect.ts +0 -96
package/src/effect/runtime-ref.ts +0 -25
package/src/effect/runtime.ts +0 -46
package/src/redis/runtime-connection.ts +0 -20
package/src/runtime/runtime-accessors.ts +0 -92
package/src/runtime/runtime-token.ts +0 -47

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@lota-sdk/core",
-  "version": "0.4.10",
+  "version": "0.4.11",
   "type": "module",
   "main": "./src/index.ts",
   "types": "./src/index.ts",
@@ -31,7 +31,7 @@
     "@ai-sdk/openai": "^3.0.53",
     "@chat-adapter/slack": "^4.26.0",
     "@chat-adapter/state-ioredis": "^4.26.0",
-    "@lota-sdk/shared": "0.4.10",
+    "@lota-sdk/shared": "0.4.11",
     "@mendable/firecrawl-js": "^4.18.3",
     "@surrealdb/node": "^3.0.3",
     "ai": "^6.0.167",

package/src/ai-gateway/ai-gateway.ts CHANGED Viewed

@@ -6,7 +6,6 @@ import { Cause, Clock, Context, Duration, Effect, ExecutionPlan, Fiber, Layer, S
 import { DEFAULT_AI_GATEWAY_URL } from '../config/constants'
 import { AiGenerationError, ConfigurationError } from '../effect/errors'
-import { resolveLotaService } from '../effect/runtime'
 import { RuntimeConfigServiceTag } from '../effect/services'
 import { getDirectOpenRouterProvider, normalizeDirectOpenRouterModelId } from '../openrouter/direct-provider'
 import { isRecord, readString } from '../utils/string'
@@ -24,6 +23,8 @@ type AiGatewayGeneratedContent = AiGatewayGenerateResult['content'][number]
 type AiGatewayStreamPart = AiGatewayStreamResult['stream'] extends ReadableStream<infer T> ? T : never
 type AiGatewayProviderOptions = NonNullable<AiGatewayCallOptions['providerOptions']>
 type AiGatewayAttemptResult<A> = { source: string; result: A }
+// eslint-disable-next-line @typescript-eslint/no-redundant-type-constituents
+type AiGatewayRunFork = <A, E>(effect: Effect.Effect<A, E, never>) => Fiber.Fiber<A, E | unknown>
 class AiGatewayGenerateAttempt extends Context.Service<
   AiGatewayGenerateAttempt,
@@ -271,12 +272,13 @@ function withAiGatewayResilience<A>(source: string, effect: Effect.Effect<A, AiG
 function withAiGatewayStreamIdleTimeout(
   stream: ReadableStream<AiGatewayStreamPart>,
   source: string,
+  runFork: AiGatewayRunFork,
   onFinalize?: () => void,
 ): ReadableStream<AiGatewayStreamPart> {
   let closed = false
   let reader: ReadableStreamDefaultReader<AiGatewayStreamPart> | null = null
-  let idleTimeoutFiber: ReturnType<typeof Effect.runFork> | null = null
-  let bodyPumpFiber: ReturnType<typeof Effect.runFork> | null = null
+  let idleTimeoutFiber: Fiber.Fiber<unknown, unknown> | null = null
+  let bodyPumpFiber: Fiber.Fiber<unknown, unknown> | null = null
   let finalized = false
   const finalize = () => {
@@ -285,9 +287,9 @@ function withAiGatewayStreamIdleTimeout(
     onFinalize?.()
   }
-  const interruptFiber = (fiber: ReturnType<typeof Effect.runFork> | null) => {
+  const interruptFiber = (fiber: Fiber.Fiber<unknown, unknown> | null) => {
     if (!fiber) return
-    void Effect.runFork(Fiber.interrupt(fiber))
+    void runFork(Fiber.interrupt(fiber))
   }
   const stopIdleTimeout = () => {
@@ -351,7 +353,7 @@ function withAiGatewayStreamIdleTimeout(
   const resetIdleTimeout = (controller: ReadableStreamDefaultController<AiGatewayStreamPart>) => {
     stopIdleTimeout()
-    idleTimeoutFiber = Effect.runFork(
+    idleTimeoutFiber = runFork(
       Effect.sleep(Duration.millis(AI_GATEWAY_STREAM_IDLE_TIMEOUT_MS)).pipe(
         Effect.flatMap(() =>
           Effect.gen(function* () {
@@ -417,7 +419,7 @@ function withAiGatewayStreamIdleTimeout(
     start(controller) {
       const streamReader = stream.getReader()
       reader = streamReader
-      bodyPumpFiber = Effect.runFork(pumpStreamEffect(streamReader, controller))
+      bodyPumpFiber = runFork(pumpStreamEffect(streamReader, controller))
     },
     cancel(reason) {
       closed = true
@@ -493,40 +495,22 @@ export const AiGatewayLive = Layer.effect(
 type AiGatewayRuntimeConfig = Context.Service.Shape<typeof RuntimeConfigServiceTag>
-let currentAiGateway: AiGatewayTag['Service'] | null = null
-let currentAiGatewayRuntimeConfig: AiGatewayRuntimeConfig | null = null
-export function configureAiGatewayRuntimeAccessors(params: {
-  aiGateway: AiGatewayTag['Service']
-  runtimeConfig: AiGatewayRuntimeConfig
-}): void {
-  currentAiGateway = params.aiGateway
-  currentAiGatewayRuntimeConfig = params.runtimeConfig
-}
-export function clearAiGatewayRuntimeAccessors(): void {
-  currentAiGateway = null
-  currentAiGatewayRuntimeConfig = null
-}
-function getAiGateway(): AiGatewayTag['Service'] {
-  return currentAiGateway ?? resolveLotaService(AiGatewayTag)
-}
-function getAiGatewayRuntimeConfig(): AiGatewayRuntimeConfig {
-  return currentAiGatewayRuntimeConfig ?? resolveLotaService(RuntimeConfigServiceTag)
-}
-function withAiGatewayConcurrency<A>(effect: Effect.Effect<A, AiGenerationError>): Effect.Effect<A, AiGenerationError> {
-  return getAiGateway().semaphore.withPermit(effect)
+function withAiGatewayConcurrency<A>(
+  effect: Effect.Effect<A, AiGenerationError>,
+): Effect.Effect<A, AiGenerationError, AiGatewayTag> {
+  return Effect.gen(function* () {
+    const gateway = yield* AiGatewayTag
+    return yield* gateway.semaphore.withPermit(effect)
+  })
 }
 function withAiGatewayStreamConcurrency(
   effect: Effect.Effect<AiGatewayAttemptResult<AiGatewayStreamResult>, AiGenerationError>,
-): Effect.Effect<AiGatewayAttemptResult<AiGatewayStreamResult>, AiGenerationError> {
+  runFork: AiGatewayRunFork,
+): Effect.Effect<AiGatewayAttemptResult<AiGatewayStreamResult>, AiGenerationError, AiGatewayTag> {
   return Effect.uninterruptibleMask((restore) =>
     Effect.gen(function* () {
-      const { semaphore } = getAiGateway()
+      const { semaphore } = yield* AiGatewayTag
       const currentContext = yield* Effect.context<never>()
       yield* semaphore.take(1)
@@ -551,7 +535,7 @@ function withAiGatewayStreamConcurrency(
         ...attempt,
         result: {
           ...attempt.result,
-          stream: withAiGatewayStreamIdleTimeout(attempt.result.stream, attempt.source, release),
+          stream: withAiGatewayStreamIdleTimeout(attempt.result.stream, attempt.source, runFork, release),
         },
       }
     }),
@@ -638,18 +622,20 @@ function isOpenRouterModel(modelId: string): boolean {
   return modelId.trim().toLowerCase().startsWith('openrouter/')
 }
-function hasDirectOpenRouterFallback(modelId: string): boolean {
-  const config = getAiGatewayRuntimeConfig()
+function hasDirectOpenRouterFallback(config: AiGatewayRuntimeConfig, modelId: string): boolean {
   return isOpenRouterModel(modelId) && Boolean(config.aiGateway.openRouterApiKey?.trim())
 }
-function getDirectOpenRouterChatModel(modelId: string): AiGatewayLanguageModel {
-  const config = getAiGatewayRuntimeConfig()
+function getDirectOpenRouterChatModel(config: AiGatewayRuntimeConfig, modelId: string): AiGatewayLanguageModel {
   return getDirectOpenRouterProvider(config.aiGateway.openRouterApiKey).chat(normalizeDirectOpenRouterModelId(modelId))
 }
-function shouldFallbackToDirectOpenRouter(modelId: string, error: AiGenerationError): boolean {
-  return hasDirectOpenRouterFallback(modelId) && isRetryableAiGatewayError(error)
+function shouldFallbackToDirectOpenRouter(
+  config: AiGatewayRuntimeConfig,
+  modelId: string,
+  error: AiGenerationError,
+): boolean {
+  return hasDirectOpenRouterFallback(config, modelId) && isRetryableAiGatewayError(error)
 }
 function attemptAiGatewayGenerate(
@@ -681,22 +667,25 @@ function attemptAiGatewayStream(
 }
 function attemptDirectOpenRouterGenerate(
+  config: AiGatewayRuntimeConfig,
   modelId: string,
   params: AiGatewayCallOptions,
 ): Effect.Effect<AiGatewayAttemptResult<AiGatewayGenerateResult>, AiGenerationError> {
-  const model = getDirectOpenRouterChatModel(modelId)
+  const model = getDirectOpenRouterChatModel(config, modelId)
   return attemptAiGatewayGenerate('openrouter.generate', () => model.doGenerate(params))
 }
 function attemptDirectOpenRouterStream(
+  config: AiGatewayRuntimeConfig,
   modelId: string,
   params: AiGatewayCallOptions,
 ): Effect.Effect<AiGatewayAttemptResult<AiGatewayStreamResult>, AiGenerationError> {
-  const model = getDirectOpenRouterChatModel(modelId)
+  const model = getDirectOpenRouterChatModel(config, modelId)
   return attemptAiGatewayStream('openrouter.stream', () => model.doStream(params))
 }
 function executeGenerateAttemptPlan(
+  config: AiGatewayRuntimeConfig,
   modelId: string,
   params: AiGatewayCallOptions,
   doGenerate: () => PromiseLike<AiGatewayGenerateResult>,
@@ -709,7 +698,7 @@ function executeGenerateAttemptPlan(
     return yield* attempt.execute
   })
-  if (!hasDirectOpenRouterFallback(modelId)) {
+  if (!hasDirectOpenRouterFallback(config, modelId)) {
     return effect.pipe(
       Effect.provide(primary),
       Effect.withSpan('AiGateway.executeGeneratePlan'),
@@ -723,9 +712,9 @@ function executeGenerateAttemptPlan(
         { provide: primary },
         {
           provide: Layer.succeed(AiGatewayGenerateAttempt, {
-            execute: attemptDirectOpenRouterGenerate(modelId, params),
+            execute: attemptDirectOpenRouterGenerate(config, modelId, params),
           }),
-          while: (error: AiGenerationError) => shouldFallbackToDirectOpenRouter(modelId, error),
+          while: (error: AiGenerationError) => shouldFallbackToDirectOpenRouter(config, modelId, error),
         },
       ),
     ),
@@ -735,6 +724,7 @@ function executeGenerateAttemptPlan(
 }
 function executeStreamAttemptPlan(
+  config: AiGatewayRuntimeConfig,
   modelId: string,
   params: AiGatewayCallOptions,
   doStream: () => PromiseLike<AiGatewayStreamResult>,
@@ -747,7 +737,7 @@ function executeStreamAttemptPlan(
     return yield* attempt.execute
   })
-  if (!hasDirectOpenRouterFallback(modelId)) {
+  if (!hasDirectOpenRouterFallback(config, modelId)) {
     return effect.pipe(
       Effect.provide(primary),
       Effect.withSpan('AiGateway.executeStreamPlan'),
@@ -760,8 +750,10 @@ function executeStreamAttemptPlan(
       ExecutionPlan.make(
         { provide: primary },
         {
-          provide: Layer.succeed(AiGatewayStreamAttempt, { execute: attemptDirectOpenRouterStream(modelId, params) }),
-          while: (error: AiGenerationError) => shouldFallbackToDirectOpenRouter(modelId, error),
+          provide: Layer.succeed(AiGatewayStreamAttempt, {
+            execute: attemptDirectOpenRouterStream(config, modelId, params),
+          }),
+          while: (error: AiGenerationError) => shouldFallbackToDirectOpenRouter(config, modelId, error),
         },
       ),
     ),
@@ -849,7 +841,56 @@ function addAiGatewayReasoningRawChunks(
   return { ...params, includeRawChunks: true }
 }
-function createAiGatewayLanguageModelMiddleware(modelId: string): LanguageModelMiddleware {
+function resolveProviderModel(
+  provider: ReturnType<typeof createOpenAI>,
+  modelId: string,
+  providerId: string,
+): AiGatewayLanguageModel {
+  return providerId === OPENAI_CHAT_PROVIDER_ID ? provider.chat(modelId) : provider(modelId)
+}
+// Module-level Promise slot that `createLotaRuntime` populates during boot.
+// This is a legitimate per-process singleton (mirrors the worker bootstrap
+// pattern in `workers/bootstrap.ts`): the AI gateway middleware is dispatched
+// by AI SDK callers that live outside Effect context, so the middleware needs
+// a way to run gateway Effects without capturing a `ManagedRuntime` through
+// every `aiGatewayModel(modelId)` call site.
+//
+// Only `createLotaRuntime` writes to the slot; resetting on disconnect is a
+// Phase 3b concern — for now it stays alive for the process lifetime.
+let aiGatewayRuntimeReady: Promise<{
+  gateway: Context.Service.Shape<typeof AiGatewayTag>
+  runtimeConfig: Context.Service.Shape<typeof RuntimeConfigServiceTag>
+  runPromise: <A, E>(effect: Effect.Effect<A, E, never>) => Promise<A>
+  runFork: AiGatewayRunFork
+}> | null = null
+export function bindAiGatewayRuntime(params: {
+  gateway: Context.Service.Shape<typeof AiGatewayTag>
+  runtimeConfig: Context.Service.Shape<typeof RuntimeConfigServiceTag>
+  runPromise: <A, E>(effect: Effect.Effect<A, E, never>) => Promise<A>
+  runFork: AiGatewayRunFork
+}): void {
+  aiGatewayRuntimeReady = Promise.resolve(params)
+}
+export function clearAiGatewayRuntime(): void {
+  aiGatewayRuntimeReady = null
+}
+async function getAiGatewayRuntime(): Promise<{
+  gateway: Context.Service.Shape<typeof AiGatewayTag>
+  runtimeConfig: Context.Service.Shape<typeof RuntimeConfigServiceTag>
+  runPromise: <A, E>(effect: Effect.Effect<A, E, never>) => Promise<A>
+  runFork: AiGatewayRunFork
+}> {
+  if (!aiGatewayRuntimeReady) {
+    throw new Error('AI gateway runtime has not been initialized. Call createLotaRuntime() first.')
+  }
+  return aiGatewayRuntimeReady
+}
+function createAiGatewayLanguageModelMiddleware(modelId: string, providerId: string): LanguageModelMiddleware {
   return {
     specificationVersion: 'v3',
     transformParams: ({ params, type }) =>
@@ -858,10 +899,12 @@ function createAiGatewayLanguageModelMiddleware(modelId: string): LanguageModelM
           addAiGatewayReasoningRawChunks(normalizeAiGatewayChatProviderOptions(params, modelId), type),
         ),
       ),
-    wrapGenerate: ({ doGenerate, params }) =>
-      Effect.runPromise(
+    wrapGenerate: async ({ params }) => {
+      const { gateway, runtimeConfig, runPromise } = await getAiGatewayRuntime()
+      const model = resolveProviderModel(gateway.provider, modelId, providerId)
+      return runPromise(
         withAiGatewayConcurrency(
-          executeGenerateAttemptPlan(modelId, params, doGenerate).pipe(
+          executeGenerateAttemptPlan(runtimeConfig, modelId, params, () => model.doGenerate(params)).pipe(
             Effect.map(({ result }) => ({
               ...result,
               content: injectAiGatewayChatReasoningContent(
@@ -870,12 +913,15 @@ function createAiGatewayLanguageModelMiddleware(modelId: string): LanguageModelM
               ),
             })),
           ),
-        ),
-      ),
-    wrapStream: ({ doStream, params }) =>
-      Effect.runPromise(
+        ).pipe(Effect.provideService(AiGatewayTag, gateway)),
+      )
+    },
+    wrapStream: async ({ params }) => {
+      const { gateway, runtimeConfig, runPromise, runFork } = await getAiGatewayRuntime()
+      const model = resolveProviderModel(gateway.provider, modelId, providerId)
+      return runPromise(
         withAiGatewayStreamConcurrency(
-          executeStreamAttemptPlan(modelId, params, doStream).pipe(
+          executeStreamAttemptPlan(runtimeConfig, modelId, params, () => model.doStream(params)).pipe(
             Effect.map((attempt) => ({
               ...attempt,
               result: isReasoningEnabled(params)
@@ -883,8 +929,12 @@ function createAiGatewayLanguageModelMiddleware(modelId: string): LanguageModelM
                 : attempt.result,
             })),
           ),
-        ).pipe(Effect.map(({ result }) => result)),
-      ),
+          runFork,
+        )
+          .pipe(Effect.map(({ result }) => result))
+          .pipe(Effect.provideService(AiGatewayTag, gateway)),
+      )
+    },
   }
 }
@@ -921,36 +971,42 @@ function withAiGatewayDevTools<TModel extends AiGatewayLanguageModel>(model: TMo
   return wrapLanguageModel({ model, middleware: devToolsMiddleware() }) as TModel
 }
-function createLazyAiGatewayLanguageModel(params: {
-  modelId: string
-  providerId: string
-  resolve: () => AiGatewayLanguageModel
-}): AiGatewayLanguageModel {
+function createAiGatewayLanguageModelPlaceholder(modelId: string, providerId: string): AiGatewayLanguageModel {
+  const unreachable = (method: string) =>
+    Promise.reject(
+      new Error(
+        `[ai-gateway] AiGateway language model ${modelId}.${method} was invoked without the gateway middleware; ` +
+          'this call path should be fully handled by createAiGatewayLanguageModelMiddleware.',
+      ),
+    )
   return {
     specificationVersion: 'v3',
-    provider: params.providerId,
-    modelId: params.modelId,
+    provider: providerId,
+    modelId,
     supportedUrls: {},
-    doGenerate: (options) => params.resolve().doGenerate(options),
-    doStream: (options) => params.resolve().doStream(options),
+    doGenerate: () => unreachable('doGenerate'),
+    doStream: () => unreachable('doStream'),
   }
 }
-function createLazyAiGatewayEmbeddingModel(modelId: string): AiGatewayEmbeddingModel {
+function createAiGatewayEmbeddingModelPlaceholder(modelId: string): AiGatewayEmbeddingModel {
   return {
     specificationVersion: 'v3',
     provider: OPENAI_EMBEDDING_PROVIDER_ID,
     modelId,
     maxEmbeddingsPerCall: OPENAI_EMBEDDING_MAX_PER_CALL,
     supportsParallelCalls: true,
-    doEmbed: (options) => getAiGatewayProvider().embeddingModel(modelId).doEmbed(options),
+    doEmbed: () =>
+      Promise.reject(
+        new Error(
+          `[ai-gateway] AiGateway embedding model ${modelId}.doEmbed was invoked without the gateway middleware; ` +
+            'this call path should be fully handled by aiGatewayEmbeddingModel middleware.',
+        ),
+      ),
   }
 }
-export function getAiGatewayProvider() {
-  return getAiGateway().provider
-}
 export function aiGatewayModel(modelId: string) {
   if (isOpenRouterModel(modelId)) {
     return aiGatewayChatModel(modelId)
@@ -958,12 +1014,8 @@ export function aiGatewayModel(modelId: string) {
   return withAiGatewayDevTools(
     wrapLanguageModel({
-      model: createLazyAiGatewayLanguageModel({
-        modelId,
-        providerId: OPENAI_RESPONSES_PROVIDER_ID,
-        resolve: () => getAiGatewayProvider()(modelId),
-      }),
-      middleware: createAiGatewayLanguageModelMiddleware(modelId),
+      model: createAiGatewayLanguageModelPlaceholder(modelId, OPENAI_RESPONSES_PROVIDER_ID),
+      middleware: createAiGatewayLanguageModelMiddleware(modelId, OPENAI_RESPONSES_PROVIDER_ID),
     }),
   )
 }
@@ -975,30 +1027,32 @@ export function aiGatewayOpenRouterResponseHealingModel(modelId: string) {
 export function aiGatewayChatModel(modelId: string) {
   return withAiGatewayDevTools(
     wrapLanguageModel({
-      model: createLazyAiGatewayLanguageModel({
-        modelId,
-        providerId: OPENAI_CHAT_PROVIDER_ID,
-        resolve: () => getAiGatewayProvider().chat(modelId),
-      }),
-      middleware: createAiGatewayLanguageModelMiddleware(modelId),
+      model: createAiGatewayLanguageModelPlaceholder(modelId, OPENAI_CHAT_PROVIDER_ID),
+      middleware: createAiGatewayLanguageModelMiddleware(modelId, OPENAI_CHAT_PROVIDER_ID),
     }),
   )
 }
 export function aiGatewayEmbeddingModel(modelId: string) {
   return wrapEmbeddingModel({
-    model: createLazyAiGatewayEmbeddingModel(modelId),
+    model: createAiGatewayEmbeddingModelPlaceholder(modelId),
     middleware: {
       specificationVersion: 'v3',
-      wrapEmbed: ({ doEmbed }) =>
-        Effect.runPromise(
+      wrapEmbed: async ({ params }) => {
+        const { gateway, runPromise } = await getAiGatewayRuntime()
+        const embeddingModel = gateway.provider.embeddingModel(modelId)
+        return runPromise(
           withAiGatewayConcurrency(
             withAiGatewayResilience(
               'ai-gateway.embed',
-              Effect.tryPromise({ try: doEmbed, catch: (cause) => classifyAiGatewayError('ai-gateway.embed', cause) }),
-            ),
-          ).pipe(Effect.withSpan('AiGateway.embed'), Effect.annotateSpans({ modelId })),
-        ),
+              Effect.tryPromise({
+                try: () => embeddingModel.doEmbed(params),
+                catch: (cause) => classifyAiGatewayError('ai-gateway.embed', cause),
+              }),
+            ).pipe(Effect.withSpan('AiGateway.embed'), Effect.annotateSpans({ modelId })),
+          ).pipe(Effect.provideService(AiGatewayTag, gateway)),
+        )
+      },
     },
   })
 }

package/src/ai-gateway/index.ts CHANGED Viewed

@@ -1,2 +1,17 @@
-export * from './ai-gateway'
+export {
+  AiGatewayLive,
+  AiGatewayTag,
+  DEFAULT_AI_GATEWAY_URL,
+  aiGatewayChatModel,
+  aiGatewayEmbeddingModel,
+  aiGatewayModel,
+  aiGatewayOpenRouterResponseHealingModel,
+  bindAiGatewayRuntime,
+  extractAiGatewayChatReasoningDeltaText,
+  extractAiGatewayChatReasoningText,
+  injectAiGatewayChatReasoningContent,
+  injectAiGatewayChatReasoningStream,
+  normalizeAiGatewayChatProviderOptions,
+  normalizeAiGatewayUrl,
+} from './ai-gateway'
 export * from './cache-headers'

package/src/config/agent-defaults.ts CHANGED Viewed

@@ -1,8 +1,6 @@
 import type { ToolSet } from 'ai'
 import { ConfigurationError } from '../effect/errors'
-import { resolveLotaService } from '../effect/runtime'
-import { AgentConfigServiceTag, AgentFactoryServiceTag } from '../effect/services'
 import type {
   AgentFactory,
   AgentRuntimeConfigParams,
@@ -130,125 +128,11 @@ export interface CoreThreadProfile {
   instructions: string
 }
-let currentResolvedAgentConfig: ResolvedAgentConfig | null = null
-let currentResolvedAgentFactoryConfig: ResolvedAgentFactoryConfig | null = null
-export function configureAgentRuntimeDefaults(params: {
-  agentConfig: ResolvedAgentConfig
-  agentFactoryConfig: ResolvedAgentFactoryConfig
-}): void {
-  currentResolvedAgentConfig = params.agentConfig
-  currentResolvedAgentFactoryConfig = params.agentFactoryConfig
-}
-export function clearAgentRuntimeDefaults(): void {
-  currentResolvedAgentConfig = null
-  currentResolvedAgentFactoryConfig = null
-}
-function resolveAgentConfigFromRuntime(): ResolvedAgentConfig {
-  return currentResolvedAgentConfig ?? resolveLotaService(AgentConfigServiceTag)
-}
-function resolveAgentFactoryConfigFromRuntime(): ResolvedAgentFactoryConfig {
-  return currentResolvedAgentFactoryConfig ?? resolveLotaService(AgentFactoryServiceTag)
-}
-export function getResolvedAgentConfig(): ResolvedAgentConfig {
-  return resolveAgentConfigFromRuntime()
-}
-export function getResolvedAgentFactoryConfig(): ResolvedAgentFactoryConfig {
-  return resolveAgentFactoryConfigFromRuntime()
-}
-export function isAgentName(value: unknown): value is string {
-  return typeof value === 'string' && resolveAgentConfigFromRuntime().rosterSet.has(value)
-}
-export function getAgentRoster(): readonly string[] {
-  return resolveAgentConfigFromRuntime().roster
-}
-export function getAgentDisplayNames(): Record<string, string> {
-  return resolveAgentConfigFromRuntime().displayNames
-}
-export function getAgentShortDisplayNames(): Record<string, string> {
-  return resolveAgentConfigFromRuntime().shortDisplayNames
-}
-export function getAgentDescriptions(): Record<string, string> {
-  return resolveAgentConfigFromRuntime().descriptions
-}
-export function getLeadAgentId(): string {
-  return resolveAgentConfigFromRuntime().leadAgentId
-}
-export function getLeadAgentDisplayName(): string {
-  const resolved = resolveAgentConfigFromRuntime()
-  return resolved.displayNames[resolved.leadAgentId] ?? resolved.leadAgentId
-}
-export function getRouterModelId(): string | undefined {
-  return resolveAgentConfigFromRuntime().routerModelId
-}
-export function getTeamConsultParticipants(): readonly string[] {
-  return resolveAgentConfigFromRuntime().teamConsultParticipants
-}
-export function getCoreThreadProfile(coreType: string): CoreThreadProfile {
-  return resolveAgentConfigFromRuntime().getCoreThreadProfile(coreType)
+export function isAgentName(agentConfig: ResolvedAgentConfig, value: unknown): value is string {
+  return typeof value === 'string' && agentConfig.rosterSet.has(value)
 }
-export function resolveAgentNameAlias(value: unknown): string | undefined {
+export function resolveAgentNameAlias(agentConfig: ResolvedAgentConfig, value: unknown): string | undefined {
   if (typeof value !== 'string') return undefined
-  return resolveAgentConfigFromRuntime().aliasMap.get(normalizeAgentLookupKey(value))
-}
-export function getCreateAgentRegistry(): AgentFactory {
-  return resolveAgentFactoryConfigFromRuntime().createAgent
-}
-export function buildAgentTools(...args: Parameters<AgentToolBuilder>): ReturnType<AgentToolBuilder> {
-  return resolveAgentFactoryConfigFromRuntime().buildAgentTools(...args)
-}
-export function getAgentRuntimeConfig(
-  ...args: Parameters<AgentRuntimeConfigProvider>
-): ReturnType<AgentRuntimeConfigProvider> {
-  return resolveAgentFactoryConfigFromRuntime().getAgentRuntimeConfig(...args)
-}
-export function getPluginRuntime(): Record<string, unknown> | undefined {
-  return resolveAgentFactoryConfigFromRuntime().pluginRuntime
-}
-const AGENT_MENTION_REGEX = /(^|[^\w])@([a-z][a-z0-9_-]*)\b/gi
-export interface AgentMentionMatch {
-  agent: string
-  mention: string
-  index: number
-  length: number
-}
-export function extractAgentMentions(message: string, agentConfig?: ResolvedAgentConfig): AgentMentionMatch[] {
-  const matches: AgentMentionMatch[] = []
-  if (!message.trim()) return matches
-  const resolvedConfig = agentConfig ?? resolveAgentConfigFromRuntime()
-  const regex = new RegExp(AGENT_MENTION_REGEX)
-  for (const rawMatch of message.matchAll(regex)) {
-    const prefix = rawMatch[1]
-    const rawAgent = rawMatch[2].toLowerCase()
-    if (!resolvedConfig.rosterSet.has(rawAgent)) continue
-    const index = rawMatch.index + prefix.length
-    matches.push({ agent: rawAgent, mention: `@${rawAgent}`, index, length: rawAgent.length + 1 })
-  }
-  return matches
+  return agentConfig.aliasMap.get(normalizeAgentLookupKey(value))
 }