npm - @lota-sdk/core - Versions diffs - 0.4.12 → 0.4.14 - Mend

@lota-sdk/core 0.4.12 → 0.4.14

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (139)

package/package.json +4 -4
package/src/ai/embedding-cache.ts +17 -11
package/src/ai-gateway/ai-gateway.ts +164 -94
package/src/ai-gateway/index.ts +4 -1
package/src/config/agent-defaults.ts +2 -2
package/src/config/agent-types.ts +1 -1
package/src/create-runtime.ts +259 -200
package/src/db/cursor-pagination.ts +2 -9
package/src/db/memory-store.ts +194 -175
package/src/db/memory.ts +125 -71
package/src/db/schema-fingerprint.ts +5 -4
package/src/db/service-normalization.ts +4 -3
package/src/db/service.ts +3 -2
package/src/db/startup.ts +15 -16
package/src/effect/errors.ts +161 -21
package/src/effect/index.ts +0 -1
package/src/embeddings/provider.ts +15 -7
package/src/queues/autonomous-job.queue.ts +10 -22
package/src/queues/delayed-node-promotion.queue.ts +8 -14
package/src/queues/document-processor.queue.ts +13 -4
package/src/queues/memory-consolidation.queue.ts +26 -14
package/src/queues/plan-agent-heartbeat.queue.ts +10 -9
package/src/queues/plan-scheduler.queue.ts +37 -15
package/src/queues/queue-factory.ts +59 -35
package/src/queues/standalone-worker.ts +3 -2
package/src/redis/connection.ts +10 -3
package/src/redis/org-memory-lock.ts +1 -1
package/src/redis/redis-lease-lock.ts +5 -5
package/src/redis/stream-context.ts +1 -1
package/src/runtime/chat-message.ts +64 -1
package/src/runtime/chat-run-orchestration.ts +33 -20
package/src/runtime/context-compaction/context-compaction-runtime.ts +14 -7
package/src/runtime/context-compaction/context-compaction.ts +78 -66
package/src/runtime/domain-layer.ts +13 -7
package/src/runtime/execution-plan.ts +7 -3
package/src/runtime/live-turn-trace.ts +6 -49
package/src/runtime/memory/memory-block.ts +3 -9
package/src/runtime/memory/memory-scope.ts +3 -1
package/src/runtime/plugin-resolution.ts +2 -1
package/src/runtime/post-turn-side-effects.ts +6 -5
package/src/runtime/retrieval-adapters.ts +8 -20
package/src/runtime/runtime-config.ts +3 -9
package/src/runtime/runtime-extensions.ts +2 -4
package/src/runtime/runtime-lifecycle.ts +56 -16
package/src/runtime/runtime-services.ts +180 -102
package/src/runtime/runtime-worker-registry.ts +3 -1
package/src/runtime/social-chat/social-chat-agent-runner.ts +1 -1
package/src/runtime/social-chat/social-chat-history.ts +21 -18
package/src/runtime/social-chat/social-chat.ts +356 -223
package/src/runtime/specialist-runner.ts +3 -1
package/src/runtime/team-consultation/team-consultation-orchestrator.ts +3 -2
package/src/runtime/thread-turn-context.ts +142 -102
package/src/runtime/turn-lifecycle.ts +15 -46
package/src/services/agent-activity.service.ts +1 -1
package/src/services/agent-executor.service.ts +107 -77
package/src/services/autonomous-job.service.ts +354 -293
package/src/services/background-work.service.ts +3 -3
package/src/services/context-compaction.service.ts +7 -2
package/src/services/document-chunk.service.ts +50 -32
package/src/services/execution-plan/execution-plan-schedule.ts +5 -3
package/src/services/execution-plan/execution-plan.service.ts +162 -179
package/src/services/feedback-loop.service.ts +5 -4
package/src/services/graph-full-routing.ts +37 -36
package/src/services/institutional-memory.service.ts +28 -30
package/src/services/learned-skill.service.ts +107 -72
package/src/services/memory/memory-errors.ts +4 -23
package/src/services/memory/memory-org-memory.ts +10 -5
package/src/services/memory/memory-rerank.ts +18 -6
package/src/services/memory/memory.service.ts +170 -111
package/src/services/memory/rerank.service.ts +29 -20
package/src/services/organization-member.service.ts +1 -1
package/src/services/organization.service.ts +69 -75
package/src/services/ownership-dispatcher.service.ts +40 -39
package/src/services/plan/plan-agent-heartbeat.service.ts +26 -23
package/src/services/plan/plan-agent-query.service.ts +39 -31
package/src/services/plan/plan-completion-side-effects.ts +13 -17
package/src/services/plan/plan-coordination.service.ts +2 -1
package/src/services/plan/plan-cycle.service.ts +6 -5
package/src/services/plan/plan-deadline.service.ts +57 -54
package/src/services/plan/plan-event-delivery.service.ts +5 -4
package/src/services/plan/plan-executor-graph.ts +18 -15
package/src/services/plan/plan-executor.service.ts +235 -262
package/src/services/plan/plan-run.service.ts +169 -93
package/src/services/plan/plan-scheduler.service.ts +192 -202
package/src/services/plan/plan-template.service.ts +1 -1
package/src/services/plan/plan-transaction-events.ts +1 -1
package/src/services/plan/plan-workspace.service.ts +23 -14
package/src/services/plugin-executor.service.ts +5 -9
package/src/services/queue-job.service.ts +117 -59
package/src/services/recent-activity-title.service.ts +13 -12
package/src/services/recent-activity.service.ts +6 -1
package/src/services/social-chat-history.service.ts +29 -25
package/src/services/system-executor.service.ts +5 -9
package/src/services/thread/thread-active-run.ts +2 -2
package/src/services/thread/thread-listing.ts +61 -57
package/src/services/thread/thread-memory-block.ts +73 -48
package/src/services/thread/thread-message.service.ts +76 -65
package/src/services/thread/thread-record-store.ts +8 -8
package/src/services/thread/thread-title.service.ts +10 -4
package/src/services/thread/thread-turn-execution.ts +43 -45
package/src/services/thread/thread-turn-preparation.service.ts +257 -135
package/src/services/thread/thread-turn-streaming.ts +82 -85
package/src/services/thread/thread-turn.ts +8 -8
package/src/services/thread/thread.service.ts +135 -100
package/src/services/user.service.ts +45 -48
package/src/storage/attachment-parser.ts +6 -2
package/src/storage/attachment-storage.service.ts +5 -6
package/src/storage/generated-document-storage.service.ts +1 -1
package/src/system-agents/context-compaction.agent.ts +10 -9
package/src/system-agents/delegated-agent-factory.ts +30 -6
package/src/system-agents/memory-reranker.agent.ts +10 -9
package/src/system-agents/memory.agent.ts +10 -9
package/src/system-agents/recent-activity-title-refiner.agent.ts +13 -15
package/src/system-agents/regular-chat-memory-digest.agent.ts +13 -12
package/src/system-agents/skill-extractor.agent.ts +13 -12
package/src/system-agents/skill-manager.agent.ts +13 -12
package/src/system-agents/thread-router.agent.ts +10 -5
package/src/system-agents/title-generator.agent.ts +13 -12
package/src/tools/fetch-webpage.tool.ts +13 -13
package/src/tools/memory-block.tool.ts +3 -1
package/src/tools/plan-approval.tool.ts +4 -2
package/src/tools/read-file-parts.tool.ts +10 -4
package/src/tools/remember-memory.tool.ts +3 -1
package/src/tools/research-topic.tool.ts +9 -5
package/src/tools/search-web.tool.ts +16 -16
package/src/tools/search.tool.ts +20 -5
package/src/tools/team-think.tool.ts +61 -38
package/src/utils/async.ts +5 -5
package/src/utils/errors.ts +19 -18
package/src/utils/sse-keepalive.ts +28 -25
package/src/workers/bootstrap.ts +75 -11
package/src/workers/memory-consolidation.worker.ts +82 -91
package/src/workers/organization-learning.worker.ts +14 -4
package/src/workers/regular-chat-memory-digest.runner.ts +105 -67
package/src/workers/skill-extraction.runner.ts +97 -61
package/src/workers/utils/repo-structure-extractor.ts +13 -8
package/src/workers/utils/thread-message-query.ts +24 -24
package/src/workers/worker-utils.ts +23 -4
package/src/effect/helpers.ts +0 -123

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@lota-sdk/core",
-  "version": "0.4.12",
+  "version": "0.4.14",
   "type": "module",
   "main": "./src/index.ts",
   "types": "./src/index.ts",
@@ -31,13 +31,13 @@
     "@ai-sdk/openai": "^3.0.53",
     "@chat-adapter/slack": "^4.26.0",
     "@chat-adapter/state-ioredis": "^4.26.0",
-    "@lota-sdk/shared": "0.4.12",
+    "@lota-sdk/shared": "0.4.14",
     "@mendable/firecrawl-js": "^4.18.3",
     "@surrealdb/node": "^3.0.3",
     "ai": "^6.0.168",
-    "bullmq": "^5.74.1",
+    "bullmq": "^5.74.2",
     "chat": "^4.26.0",
-    "effect": "^4.0.0-beta.50",
+    "effect": "^4.0.0-beta.52",
     "hono": "^4.12.14",
     "ioredis": "5.9.3",
     "mammoth": "^1.12.0",

package/src/ai/embedding-cache.ts CHANGED Viewed

@@ -1,7 +1,9 @@
 import { Context, Effect, Layer, Schema } from 'effect'
 import type IORedis from 'ioredis'
+import { RuntimeBridgeTag } from '../ai-gateway/ai-gateway'
 import { aiLogger } from '../config/logger'
+import { ERROR_TAGS } from '../effect/errors'
 import { RedisServiceTag, RuntimeConfigServiceTag } from '../effect/services'
 import { sha256Hex } from '../utils/crypto'
@@ -9,7 +11,7 @@ export const DEFAULT_EMBEDDING_CACHE_TTL_SECONDS = 7200
 const EMBEDDING_CACHE_KEY_PREFIX = 'emb'
 const EmbeddingCacheJsonSchema = Schema.fromJsonString(Schema.Array(Schema.Number))
-class EmbeddingCacheError extends Schema.TaggedErrorClass<EmbeddingCacheError>()('EmbeddingCacheError', {
+class EmbeddingCacheError extends Schema.TaggedErrorClass<EmbeddingCacheError>()(ERROR_TAGS.EmbeddingCacheError, {
   message: Schema.String,
   operation: Schema.Literals(['get', 'set']),
   cause: Schema.optional(Schema.Defect),
@@ -29,7 +31,8 @@ export class EmbeddingCache {
   constructor(
     private redis: IORedis,
-    private ttlSeconds: number = DEFAULT_EMBEDDING_CACHE_TTL_SECONDS,
+    private ttlSeconds: number,
+    private readonly runPromise: <A, E = never>(effect: Effect.Effect<A, E>) => Promise<A>,
   ) {}
   private buildKey(model: string, text: string): string {
@@ -37,10 +40,6 @@ export class EmbeddingCache {
     return `${EMBEDDING_CACHE_KEY_PREFIX}:${model}:${hash}`
   }
-  private runEffect<A>(effect: Effect.Effect<A>): Promise<A> {
-    return Effect.runPromise(effect)
-  }
   private fetchFromRedisEffect(key: string): Effect.Effect<number[] | null> {
     const redis = this.redis
@@ -58,7 +57,7 @@ export class EmbeddingCache {
           new EmbeddingCacheError({ message: 'Embedding cache parse failed.', operation: 'get', cause }),
       })
     }).pipe(
-      Effect.catchTag('EmbeddingCacheError', (error) => {
+      Effect.catchTag(ERROR_TAGS.EmbeddingCacheError, (error) => {
         aiLogger.warn`${error.message}: ${error.cause}`
         return Effect.succeed<number[] | null>(null)
       }),
@@ -71,7 +70,7 @@ export class EmbeddingCache {
     const pending = this.inflight.get(key)
     if (pending) return pending
-    const promise = this.runEffect(this.fetchFromRedisEffect(key))
+    const promise = this.runPromise(this.fetchFromRedisEffect(key))
     this.inflight.set(key, promise)
     void promise.finally(() => this.inflight.delete(key))
@@ -95,7 +94,7 @@ export class EmbeddingCache {
       })
     }).pipe(
       Effect.asVoid,
-      Effect.catchTag('EmbeddingCacheError', (error) => {
+      Effect.catchTag(ERROR_TAGS.EmbeddingCacheError, (error) => {
         aiLogger.warn`${error.message}: ${error.cause}`
         return Effect.void
       }),
@@ -103,7 +102,7 @@ export class EmbeddingCache {
   }
   set(model: string, text: string, embedding: number[]): Promise<void> {
-    return this.runEffect(this.setEffect(model, text, embedding))
+    return this.runPromise(this.setEffect(model, text, embedding))
   }
 }
@@ -111,11 +110,18 @@ export class EmbeddingCacheTag extends Context.Service<EmbeddingCacheTag, Embedd
   '@lota-sdk/core/EmbeddingCache',
 ) {}
+/**
+ * `EmbeddingCache` needs a `runPromise` to convert internal Effect chains into
+ * the Promise API that AI SDK `embed` / `embedMany` expect. The layer yields
+ * `RuntimeBridgeTag` once and captures it — callers never prop-drill
+ * `runPromise` through this module.
+ */
 export const EmbeddingCacheLive = Layer.effect(
   EmbeddingCacheTag,
   Effect.gen(function* () {
     const redis = yield* RedisServiceTag
     const config = yield* RuntimeConfigServiceTag
-    return new EmbeddingCache(redis.getConnection(), config.memory.embeddingCacheTtlSeconds)
+    const bridge = yield* RuntimeBridgeTag
+    return new EmbeddingCache(redis.getConnection(), config.memory.embeddingCacheTtlSeconds, bridge.runPromise)
   }),
 )

package/src/ai-gateway/ai-gateway.ts CHANGED Viewed

@@ -5,7 +5,7 @@ import type { LanguageModelMiddleware } from 'ai'
 import { Cause, Clock, Context, Duration, Effect, ExecutionPlan, Fiber, Layer, Semaphore } from 'effect'
 import { DEFAULT_AI_GATEWAY_URL } from '../config/constants'
-import { AiGenerationError, ConfigurationError } from '../effect/errors'
+import { ERROR_TAGS, AiGenerationError, ConfigurationError } from '../effect/errors'
 import { RuntimeConfigServiceTag } from '../effect/services'
 import { getDirectOpenRouterProvider, normalizeDirectOpenRouterModelId } from '../openrouter/direct-provider'
 import { isRecord, readString } from '../utils/string'
@@ -26,15 +26,15 @@ type AiGatewayAttemptResult<A> = { source: string; result: A }
 // eslint-disable-next-line @typescript-eslint/no-redundant-type-constituents
 type AiGatewayRunFork = <A, E>(effect: Effect.Effect<A, E, never>) => Fiber.Fiber<A, E | unknown>
-class AiGatewayGenerateAttempt extends Context.Service<
-  AiGatewayGenerateAttempt,
+class AiGatewayGenerateAttemptTag extends Context.Service<
+  AiGatewayGenerateAttemptTag,
   { readonly execute: Effect.Effect<AiGatewayAttemptResult<AiGatewayGenerateResult>, AiGenerationError> }
->()('@lota-sdk/core/internal/AiGatewayGenerateAttempt') {}
+>()('@lota-sdk/core/internal/AiGatewayGenerateAttemptTag') {}
-class AiGatewayStreamAttempt extends Context.Service<
-  AiGatewayStreamAttempt,
+class AiGatewayStreamAttemptTag extends Context.Service<
+  AiGatewayStreamAttemptTag,
   { readonly execute: Effect.Effect<AiGatewayAttemptResult<AiGatewayStreamResult>, AiGenerationError> }
->()('@lota-sdk/core/internal/AiGatewayStreamAttempt') {}
+>()('@lota-sdk/core/internal/AiGatewayStreamAttemptTag') {}
 const EXPECTED_GATEWAY_KEY_PREFIX = 'sk-bf-'
 const AI_GATEWAY_VIRTUAL_KEY_HEADER = 'x-bf-vk'
@@ -71,7 +71,7 @@ const RETRYABLE_NETWORK_ERROR_PATTERNS = [
 ]
 function isAiGenerationError(error: unknown): error is AiGenerationError {
-  return isRecord(error) && error._tag === 'AiGenerationError'
+  return isRecord(error) && error._tag === ERROR_TAGS.AiGenerationError
 }
 function getNumericField(value: Record<string, unknown>, key: string): number | null {
@@ -244,7 +244,7 @@ function withAiGatewayResilience<A>(source: string, effect: Effect.Effect<A, AiG
   const retryEffect = Effect.gen(function* () {
     const runAttempt = (attempt: number): Effect.Effect<A, AiGenerationError> =>
       effect.pipe(
-        Effect.catchTag('AiGenerationError', (error) =>
+        Effect.catchTag(ERROR_TAGS.AiGenerationError, (error) =>
           Effect.gen(function* () {
             if (!isRetryableAiGatewayError(error) || attempt >= AI_GATEWAY_MAX_RETRIES - 1) {
               return yield* error
@@ -371,7 +371,15 @@ function withAiGatewayStreamIdleTimeout(
             reader = null
             if (!streamReader) return
-            yield* Effect.tryPromise(() => streamReader.cancel(timeoutError)).pipe(Effect.catch(() => Effect.void))
+            yield* Effect.tryPromise({
+              try: () => streamReader.cancel(timeoutError),
+              catch: (cause) =>
+                new AiGenerationError({
+                  source,
+                  message: `[${source}] Stream cancel failed.`,
+                  ...(cause instanceof Error ? { providerData: cause.message } : {}),
+                }),
+            }).pipe(Effect.catch(() => Effect.void))
           }),
         ),
       ),
@@ -388,7 +396,15 @@ function withAiGatewayStreamIdleTimeout(
       for (;;) {
         if (closed) return
-        const { done, value } = yield* Effect.tryPromise(() => streamReader.read())
+        const { done, value } = yield* Effect.tryPromise({
+          try: () => streamReader.read(),
+          catch: (cause) =>
+            new AiGenerationError({
+              source,
+              message: `[${source}] Stream read failed.`,
+              ...(cause instanceof Error ? { providerData: cause.message } : {}),
+            }),
+        })
         if (done) {
           stopIdleTimeout()
           yield* Effect.sync(() => closeStream(controller))
@@ -434,7 +450,15 @@ function withAiGatewayStreamIdleTimeout(
       }
       return Effect.runPromise(
-        Effect.tryPromise(() => streamReader.cancel(reason)).pipe(Effect.catch(() => Effect.void)),
+        Effect.tryPromise({
+          try: () => streamReader.cancel(reason),
+          catch: (cause) =>
+            new AiGenerationError({
+              source,
+              message: `[${source}] Stream cancel failed.`,
+              ...(cause instanceof Error ? { providerData: cause.message } : {}),
+            }),
+        }).pipe(Effect.catch(() => Effect.void)),
       )
     },
   })
@@ -457,12 +481,22 @@ function withDefaultAiGatewayCacheHeaders(params: AiGatewayCallOptions): AiGatew
   return { ...params, headers: mergeAiGatewayHeaders(params.headers, buildAiGatewayCacheHeaders('lota-sdk')) }
 }
+function normalizeAiGatewayUrlEffect(value: string): Effect.Effect<string, ConfigurationError> {
+  const trimmed = value.trim()
+  if (!trimmed) {
+    return Effect.fail(
+      new ConfigurationError({ message: '[ai-gateway] AI gateway URL is required.', key: 'aiGateway.url' }),
+    )
+  }
+  const normalized = trimmed.replace(/\/+$/, '')
+  return Effect.succeed(normalized.endsWith('/v1') ? normalized : `${normalized}/v1`)
+}
 function normalizeAiGatewayUrl(value: string): string {
   const trimmed = value.trim()
   if (!trimmed) {
     throw new ConfigurationError({ message: '[ai-gateway] AI gateway URL is required.', key: 'aiGateway.url' })
   }
   const normalized = trimmed.replace(/\/+$/, '')
   return normalized.endsWith('/v1') ? normalized : `${normalized}/v1`
 }
@@ -473,10 +507,10 @@ export class AiGatewayTag extends Context.Service<
   { readonly semaphore: Semaphore.Semaphore; readonly provider: ReturnType<typeof createOpenAI> }
 >()('@lota-sdk/core/AiGateway') {}
-export const AiGatewayLive = Layer.effect(
-  AiGatewayTag,
-  Effect.gen(function* () {
-    const config = yield* RuntimeConfigServiceTag
+export function makeAiGatewayService(
+  config: AiGatewayRuntimeConfig,
+): Effect.Effect<Context.Service.Shape<typeof AiGatewayTag>, ConfigurationError> {
+  return Effect.gen(function* () {
     const semaphore = yield* Semaphore.make(config.aiGateway.maxConcurrency)
     const apiKey = config.aiGateway.key.trim()
@@ -486,10 +520,18 @@ export const AiGatewayLive = Layer.effect(
         key: 'aiGateway.key',
       })
     }
-    const baseURL = normalizeAiGatewayUrl(config.aiGateway.url)
+    const baseURL = yield* normalizeAiGatewayUrlEffect(config.aiGateway.url)
     const provider = createOpenAI({ baseURL, apiKey, headers: { [AI_GATEWAY_VIRTUAL_KEY_HEADER]: apiKey } })
     return AiGatewayTag.of({ semaphore, provider })
+  })
+}
+export const AiGatewayLive = Layer.effect(
+  AiGatewayTag,
+  Effect.gen(function* () {
+    const config = yield* RuntimeConfigServiceTag
+    return yield* makeAiGatewayService(config)
   }),
 )
@@ -514,11 +556,26 @@ function withAiGatewayStreamConcurrency(
       const currentContext = yield* Effect.context<never>()
       yield* semaphore.take(1)
-      // NOTE: manual release intentional — permit outlives Effect scope for the
-      // stream lifetime. The stream consumer drains asynchronously after this
-      // Effect resolves; the permit is released by either the idle-timeout
-      // finalize callback or the error path below. The `released` guard makes
-      // the release idempotent across those paths.
+      // Permit-release impedance bridge. The semaphore permit MUST outlive
+      // the surrounding Effect because the returned ReadableStream is drained
+      // by an external consumer (AI SDK middleware → fetch consumer) on a
+      // promise/callback timeline that has no Effect scope to attach to.
+      //
+      // We considered Layer.scoped + Effect.acquireRelease here. It does not
+      // fit: the stream's close/cancel/idle-timeout callbacks fire from
+      // outside any Effect, so a Scope-bound finalizer cannot observe them
+      // without running the close itself through `Effect.runFork(Scope.close)`
+      // — which is the same imperative shape as the latch below, just more
+      // ceremony.
+      //
+      // The `released = false` latch keeps `release()` idempotent across the
+      // three callback edges that can fire it:
+      //   1. error path        — Effect.catchTag + Effect.sync(release)
+      //   2. interrupt path    — Effect.onInterrupt + Effect.sync(release)
+      //   3. idle-timeout path — withAiGatewayStreamIdleTimeout's onFinalize
+      //
+      // `Effect.runForkWith(currentContext)(semaphore.release(1))` preserves
+      // span/logger context across the boundary so observability stays intact.
       let released = false
       const release = () => {
         if (released) return
@@ -527,7 +584,9 @@ function withAiGatewayStreamConcurrency(
       }
       const attempt = yield* restore(effect).pipe(
-        Effect.catchTag('AiGenerationError', (error) => Effect.sync(release).pipe(Effect.andThen(Effect.fail(error)))),
+        Effect.catchTag(ERROR_TAGS.AiGenerationError, (error) =>
+          Effect.sync(release).pipe(Effect.andThen(Effect.fail(error))),
+        ),
         Effect.onInterrupt(() => Effect.sync(release)),
       )
@@ -736,11 +795,11 @@ function executeGenerateAttemptPlan(
   params: AiGatewayCallOptions,
   doGenerate: () => PromiseLike<AiGatewayGenerateResult>,
 ): Effect.Effect<AiGatewayAttemptResult<AiGatewayGenerateResult>, AiGenerationError> {
-  const primary = Layer.succeed(AiGatewayGenerateAttempt, {
+  const primary = Layer.succeed(AiGatewayGenerateAttemptTag, {
     execute: attemptAiGatewayGenerate('ai-gateway.generate', doGenerate),
   })
   const effect = Effect.gen(function* () {
-    const attempt = yield* AiGatewayGenerateAttempt
+    const attempt = yield* AiGatewayGenerateAttemptTag
     return yield* attempt.execute
   })
@@ -757,7 +816,7 @@ function executeGenerateAttemptPlan(
       ExecutionPlan.make(
         { provide: primary },
         {
-          provide: Layer.succeed(AiGatewayGenerateAttempt, {
+          provide: Layer.succeed(AiGatewayGenerateAttemptTag, {
             execute: attemptDirectOpenRouterGenerate(config, modelId, params),
           }),
           while: (error: AiGenerationError) => shouldFallbackToDirectOpenRouter(config, modelId, error),
@@ -775,11 +834,11 @@ function executeStreamAttemptPlan(
   params: AiGatewayCallOptions,
   doStream: () => PromiseLike<AiGatewayStreamResult>,
 ): Effect.Effect<AiGatewayAttemptResult<AiGatewayStreamResult>, AiGenerationError> {
-  const primary = Layer.succeed(AiGatewayStreamAttempt, {
+  const primary = Layer.succeed(AiGatewayStreamAttemptTag, {
     execute: attemptAiGatewayStream('ai-gateway.stream', doStream),
   })
   const effect = Effect.gen(function* () {
-    const attempt = yield* AiGatewayStreamAttempt
+    const attempt = yield* AiGatewayStreamAttemptTag
     return yield* attempt.execute
   })
@@ -796,7 +855,7 @@ function executeStreamAttemptPlan(
       ExecutionPlan.make(
         { provide: primary },
         {
-          provide: Layer.succeed(AiGatewayStreamAttempt, {
+          provide: Layer.succeed(AiGatewayStreamAttemptTag, {
             execute: attemptDirectOpenRouterStream(config, modelId, params),
           }),
           while: (error: AiGenerationError) => shouldFallbackToDirectOpenRouter(config, modelId, error),
@@ -911,48 +970,18 @@ function resolveProviderModel(
   return providerId === OPENAI_CHAT_PROVIDER_ID ? provider.chat(modelId) : provider(modelId)
 }
-// Module-level Promise slot that `createLotaRuntime` populates during boot.
-// This is a legitimate per-process singleton (mirrors the worker bootstrap
-// pattern in `workers/bootstrap.ts`): the AI gateway middleware is dispatched
-// by AI SDK callers that live outside Effect context, so the middleware needs
-// a way to run gateway Effects without capturing a `ManagedRuntime` through
-// every `aiGatewayModel(modelId)` call site.
-//
-// Only `createLotaRuntime` writes to the slot; resetting on disconnect is a
-// Phase 3b concern — for now it stays alive for the process lifetime.
-let aiGatewayRuntimeReady: Promise<{
-  gateway: Context.Service.Shape<typeof AiGatewayTag>
-  runtimeConfig: Context.Service.Shape<typeof RuntimeConfigServiceTag>
-  runPromise: <A, E>(effect: Effect.Effect<A, E, never>) => Promise<A>
-  runFork: AiGatewayRunFork
-}> | null = null
-export function bindAiGatewayRuntime(params: {
-  gateway: Context.Service.Shape<typeof AiGatewayTag>
-  runtimeConfig: Context.Service.Shape<typeof RuntimeConfigServiceTag>
-  runPromise: <A, E>(effect: Effect.Effect<A, E, never>) => Promise<A>
-  runFork: AiGatewayRunFork
-}): void {
-  aiGatewayRuntimeReady = Promise.resolve(params)
-}
-export function clearAiGatewayRuntime(): void {
-  aiGatewayRuntimeReady = null
-}
-async function getAiGatewayRuntime(): Promise<{
+export type AiGatewayDeps = {
   gateway: Context.Service.Shape<typeof AiGatewayTag>
   runtimeConfig: Context.Service.Shape<typeof RuntimeConfigServiceTag>
   runPromise: <A, E>(effect: Effect.Effect<A, E, never>) => Promise<A>
   runFork: AiGatewayRunFork
-}> {
-  if (!aiGatewayRuntimeReady) {
-    throw new Error('AI gateway runtime has not been initialized. Call createLotaRuntime() first.')
-  }
-  return aiGatewayRuntimeReady
 }
-function createAiGatewayLanguageModelMiddleware(modelId: string, providerId: string): LanguageModelMiddleware {
+function createAiGatewayLanguageModelMiddleware(
+  modelId: string,
+  providerId: string,
+  deps: AiGatewayDeps,
+): LanguageModelMiddleware {
   return {
     specificationVersion: 'v3',
     transformParams: ({ params, type }) =>
@@ -961,12 +990,11 @@ function createAiGatewayLanguageModelMiddleware(modelId: string, providerId: str
           addAiGatewayReasoningRawChunks(normalizeAiGatewayChatProviderOptions(params, modelId), type),
         ),
       ),
-    wrapGenerate: async ({ params }) => {
-      const { gateway, runtimeConfig, runPromise } = await getAiGatewayRuntime()
-      const model = resolveProviderModel(gateway.provider, modelId, providerId)
-      return runPromise(
+    wrapGenerate: ({ params }) => {
+      const model = resolveProviderModel(deps.gateway.provider, modelId, providerId)
+      return deps.runPromise(
         withAiGatewayConcurrency(
-          executeGenerateAttemptPlan(runtimeConfig, modelId, params, () => model.doGenerate(params)).pipe(
+          executeGenerateAttemptPlan(deps.runtimeConfig, modelId, params, () => model.doGenerate(params)).pipe(
             Effect.map(({ result }) => ({
               ...result,
               content: injectAiGatewayChatReasoningContent(
@@ -975,15 +1003,14 @@ function createAiGatewayLanguageModelMiddleware(modelId: string, providerId: str
               ),
             })),
           ),
-        ).pipe(Effect.provideService(AiGatewayTag, gateway)),
+        ).pipe(Effect.provideService(AiGatewayTag, deps.gateway)),
       )
     },
-    wrapStream: async ({ params }) => {
-      const { gateway, runtimeConfig, runPromise, runFork } = await getAiGatewayRuntime()
-      const model = resolveProviderModel(gateway.provider, modelId, providerId)
-      return runPromise(
+    wrapStream: ({ params }) => {
+      const model = resolveProviderModel(deps.gateway.provider, modelId, providerId)
+      return deps.runPromise(
         withAiGatewayStreamConcurrency(
-          executeStreamAttemptPlan(runtimeConfig, modelId, params, () => model.doStream(params)).pipe(
+          executeStreamAttemptPlan(deps.runtimeConfig, modelId, params, () => model.doStream(params)).pipe(
             Effect.map((attempt) => ({
               ...attempt,
               result: isReasoningEnabled(params)
@@ -991,10 +1018,11 @@ function createAiGatewayLanguageModelMiddleware(modelId: string, providerId: str
                 : attempt.result,
             })),
           ),
-          runFork,
-        )
-          .pipe(Effect.map(({ result }) => result))
-          .pipe(Effect.provideService(AiGatewayTag, gateway)),
+          deps.runFork,
+        ).pipe(
+          Effect.map(({ result }) => result),
+          Effect.provideService(AiGatewayTag, deps.gateway),
+        ),
       )
     },
   }
@@ -1069,41 +1097,40 @@ function createAiGatewayEmbeddingModelPlaceholder(modelId: string): AiGatewayEmb
   }
 }
-export function aiGatewayModel(modelId: string) {
+export function aiGatewayModel(modelId: string, deps: AiGatewayDeps) {
   if (isOpenRouterModel(modelId)) {
-    return aiGatewayChatModel(modelId)
+    return aiGatewayChatModel(modelId, deps)
   }
   return withAiGatewayDevTools(
     wrapLanguageModel({
       model: createAiGatewayLanguageModelPlaceholder(modelId, OPENAI_RESPONSES_PROVIDER_ID),
-      middleware: createAiGatewayLanguageModelMiddleware(modelId, OPENAI_RESPONSES_PROVIDER_ID),
+      middleware: createAiGatewayLanguageModelMiddleware(modelId, OPENAI_RESPONSES_PROVIDER_ID, deps),
     }),
   )
 }
-export function aiGatewayOpenRouterResponseHealingModel(modelId: string) {
-  return aiGatewayChatModel(modelId)
+export function aiGatewayOpenRouterResponseHealingModel(modelId: string, deps: AiGatewayDeps) {
+  return aiGatewayChatModel(modelId, deps)
 }
-export function aiGatewayChatModel(modelId: string) {
+export function aiGatewayChatModel(modelId: string, deps: AiGatewayDeps) {
   return withAiGatewayDevTools(
     wrapLanguageModel({
       model: createAiGatewayLanguageModelPlaceholder(modelId, OPENAI_CHAT_PROVIDER_ID),
-      middleware: createAiGatewayLanguageModelMiddleware(modelId, OPENAI_CHAT_PROVIDER_ID),
+      middleware: createAiGatewayLanguageModelMiddleware(modelId, OPENAI_CHAT_PROVIDER_ID, deps),
     }),
   )
 }
-export function aiGatewayEmbeddingModel(modelId: string) {
+export function aiGatewayEmbeddingModel(modelId: string, deps: AiGatewayDeps) {
   return wrapEmbeddingModel({
     model: createAiGatewayEmbeddingModelPlaceholder(modelId),
     middleware: {
       specificationVersion: 'v3',
-      wrapEmbed: async ({ params }) => {
-        const { gateway, runPromise } = await getAiGatewayRuntime()
-        const embeddingModel = gateway.provider.embeddingModel(modelId)
-        return runPromise(
+      wrapEmbed: ({ params }) => {
+        const embeddingModel = deps.gateway.provider.embeddingModel(modelId)
+        return deps.runPromise(
           withAiGatewayConcurrency(
             withAiGatewayResilience(
               'ai-gateway.embed',
@@ -1112,11 +1139,54 @@ export function aiGatewayEmbeddingModel(modelId: string) {
                 catch: (cause) => classifyAiGatewayError('ai-gateway.embed', cause),
               }),
             ).pipe(Effect.withSpan('AiGateway.embed'), Effect.annotateSpans({ modelId })),
-          ).pipe(Effect.provideService(AiGatewayTag, gateway)),
+          ).pipe(Effect.provideService(AiGatewayTag, deps.gateway)),
         )
       },
     },
   })
 }
+/**
+ * Pre-bound AI gateway model surface. Produced once per `LotaRuntime` in
+ * `createLotaRuntime` and provided via `AiGatewayModelsTag` so services and
+ * system-agent factories consume it through standard DI rather than an
+ * ambient module slot.
+ */
+export type AiGatewayModels = {
+  model(modelId: string): ReturnType<typeof aiGatewayModel>
+  chatModel(modelId: string): ReturnType<typeof aiGatewayChatModel>
+  embeddingModel(modelId: string): ReturnType<typeof aiGatewayEmbeddingModel>
+  openRouterResponseHealingModel(modelId: string): ReturnType<typeof aiGatewayOpenRouterResponseHealingModel>
+}
+export function createAiGatewayModels(deps: AiGatewayDeps): AiGatewayModels {
+  return {
+    model: (modelId: string) => aiGatewayModel(modelId, deps),
+    chatModel: (modelId: string) => aiGatewayChatModel(modelId, deps),
+    embeddingModel: (modelId: string) => aiGatewayEmbeddingModel(modelId, deps),
+    openRouterResponseHealingModel: (modelId: string) => aiGatewayOpenRouterResponseHealingModel(modelId, deps),
+  }
+}
+export class AiGatewayModelsTag extends Context.Service<AiGatewayModelsTag, AiGatewayModels>()(
+  '@lota-sdk/core/AiGatewayModels',
+) {}
+/**
+ * Runtime bridge surface. Services and tool factories that need to convert
+ * Effects to Promises at a host boundary (AI SDK tool callbacks, BullMQ worker
+ * processors, etc.) yield this tag to obtain the `runPromise` and `runFork`
+ * bound to the outer `ManagedRuntime`. Provided once in `createLotaRuntime`
+ * via a function-local holder so services DI their runtime bridge rather than
+ * capturing context with `Effect.runPromiseWith`.
+ */
+export type RuntimeBridge = {
+  runPromise: <A, E>(effect: Effect.Effect<A, E, never>, options?: { signal?: AbortSignal }) => Promise<A>
+  runFork: AiGatewayRunFork
+}
+export class RuntimeBridgeTag extends Context.Service<RuntimeBridgeTag, RuntimeBridge>()(
+  '@lota-sdk/core/RuntimeBridge',
+) {}
 export { DEFAULT_AI_GATEWAY_URL, normalizeAiGatewayUrl }

package/src/ai-gateway/index.ts CHANGED Viewed

@@ -1,12 +1,14 @@
 export {
   AiGatewayLive,
+  AiGatewayModelsTag,
   AiGatewayTag,
   DEFAULT_AI_GATEWAY_URL,
+  RuntimeBridgeTag,
   aiGatewayChatModel,
   aiGatewayEmbeddingModel,
   aiGatewayModel,
   aiGatewayOpenRouterResponseHealingModel,
-  bindAiGatewayRuntime,
+  createAiGatewayModels,
   extractAiGatewayChatReasoningDeltaText,
   extractAiGatewayChatReasoningText,
   injectAiGatewayChatReasoningContent,
@@ -14,4 +16,5 @@ export {
   normalizeAiGatewayChatProviderOptions,
   normalizeAiGatewayUrl,
 } from './ai-gateway'
+export type { AiGatewayDeps, AiGatewayModels, RuntimeBridge } from './ai-gateway'
 export * from './cache-headers'

package/src/config/agent-defaults.ts CHANGED Viewed

@@ -8,8 +8,8 @@ import type {
   AgentToolBuilder,
 } from './agent-types'
-function defaultBuildAgentTools(): ToolSet {
-  return {}
+function defaultBuildAgentTools(): Promise<ToolSet> {
+  return Promise.resolve({})
 }
 function defaultGetAgentRuntimeConfig(params: AgentRuntimeConfigParams) {

package/src/config/agent-types.ts CHANGED Viewed

@@ -55,7 +55,7 @@ export type AgentCreator = <TTools extends ToolSet>(
 export type AgentFactory = Partial<Record<string, AgentCreator>>
 /** Builds the tool set for a given agent. */
-export type AgentToolBuilder = (params: AgentToolBuilderParams) => ToolSet | Promise<ToolSet>
+export type AgentToolBuilder = (params: AgentToolBuilderParams) => Promise<ToolSet>
 /** Returns runtime configuration for a given agent. */
 export type AgentRuntimeConfigProvider = (params: AgentRuntimeConfigParams) => AgentRuntimeConfig<string>