npm - ai-functions - Versions diffs - 2.0.2 → 2.1.3 - Mend

ai-functions 2.0.2 → 2.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130) hide show

package/.turbo/turbo-build.log +4 -5
package/CHANGELOG.md +38 -0
package/LICENSE +21 -0
package/README.md +361 -159
package/dist/ai-promise.d.ts +47 -0
package/dist/ai-promise.d.ts.map +1 -1
package/dist/ai-promise.js +291 -3
package/dist/ai-promise.js.map +1 -1
package/dist/ai.d.ts +17 -18
package/dist/ai.d.ts.map +1 -1
package/dist/ai.js +93 -39
package/dist/ai.js.map +1 -1
package/dist/batch-map.d.ts +46 -4
package/dist/batch-map.d.ts.map +1 -1
package/dist/batch-map.js +35 -2
package/dist/batch-map.js.map +1 -1
package/dist/batch-queue.d.ts +116 -12
package/dist/batch-queue.d.ts.map +1 -1
package/dist/batch-queue.js +47 -2
package/dist/batch-queue.js.map +1 -1
package/dist/budget.d.ts +272 -0
package/dist/budget.d.ts.map +1 -0
package/dist/budget.js +500 -0
package/dist/budget.js.map +1 -0
package/dist/cache.d.ts +272 -0
package/dist/cache.d.ts.map +1 -0
package/dist/cache.js +412 -0
package/dist/cache.js.map +1 -0
package/dist/context.d.ts +32 -1
package/dist/context.d.ts.map +1 -1
package/dist/context.js +16 -1
package/dist/context.js.map +1 -1
package/dist/eval/runner.d.ts +2 -1
package/dist/eval/runner.d.ts.map +1 -1
package/dist/eval/runner.js.map +1 -1
package/dist/generate.d.ts.map +1 -1
package/dist/generate.js +6 -10
package/dist/generate.js.map +1 -1
package/dist/index.d.ts +27 -20
package/dist/index.d.ts.map +1 -1
package/dist/index.js +72 -42
package/dist/index.js.map +1 -1
package/dist/primitives.d.ts +17 -0
package/dist/primitives.d.ts.map +1 -1
package/dist/primitives.js +19 -1
package/dist/primitives.js.map +1 -1
package/dist/retry.d.ts +303 -0
package/dist/retry.d.ts.map +1 -0
package/dist/retry.js +539 -0
package/dist/retry.js.map +1 -0
package/dist/schema.d.ts.map +1 -1
package/dist/schema.js +1 -9
package/dist/schema.js.map +1 -1
package/dist/tool-orchestration.d.ts +391 -0
package/dist/tool-orchestration.d.ts.map +1 -0
package/dist/tool-orchestration.js +663 -0
package/dist/tool-orchestration.js.map +1 -0
package/dist/types.d.ts +50 -33
package/dist/types.d.ts.map +1 -1
package/evalite.config.js +14 -0
package/evals/classification.eval.js +97 -0
package/evals/marketing.eval.js +289 -0
package/evals/math.eval.js +83 -0
package/evals/run-evals.js +151 -0
package/evals/structured-output.eval.js +131 -0
package/evals/writing.eval.js +105 -0
package/examples/batch-blog-posts.js +128 -0
package/package.json +26 -26
package/src/ai-promise.ts +359 -3
package/src/ai.ts +155 -110
package/src/batch/anthropic.js +256 -0
package/src/batch/bedrock.js +584 -0
package/src/batch/cloudflare.js +287 -0
package/src/batch/google.js +359 -0
package/src/batch/index.js +30 -0
package/src/batch/memory.js +187 -0
package/src/batch/openai.js +402 -0
package/src/batch-map.ts +46 -4
package/src/batch-queue.ts +116 -12
package/src/budget.ts +727 -0
package/src/cache.ts +653 -0
package/src/context.ts +33 -1
package/src/eval/index.js +7 -0
package/src/eval/models.js +119 -0
package/src/eval/runner.js +147 -0
package/src/eval/runner.ts +3 -2
package/src/generate.ts +7 -12
package/src/index.ts +231 -53
package/src/primitives.ts +19 -1
package/src/retry.ts +776 -0
package/src/schema.ts +1 -10
package/src/tool-orchestration.ts +1008 -0
package/src/types.ts +59 -41
package/test/ai-proxy.test.js +157 -0
package/test/async-iterators.test.js +261 -0
package/test/backward-compat.test.ts +147 -0
package/test/batch-autosubmit-errors.test.ts +598 -0
package/test/batch-background.test.js +352 -0
package/test/batch-blog-posts.test.js +293 -0
package/test/blog-generation.test.js +390 -0
package/test/browse-read.test.js +480 -0
package/test/budget-tracking.test.ts +800 -0
package/test/cache.test.ts +712 -0
package/test/context-isolation.test.ts +687 -0
package/test/core-functions.test.js +490 -0
package/test/decide.test.js +260 -0
package/test/define.test.js +232 -0
package/test/e2e-bedrock-manual.js +136 -0
package/test/e2e-bedrock.test.js +164 -0
package/test/e2e-flex-gateway.js +131 -0
package/test/e2e-flex-manual.js +156 -0
package/test/e2e-flex.test.js +174 -0
package/test/e2e-google-manual.js +150 -0
package/test/e2e-google.test.js +181 -0
package/test/embeddings.test.js +220 -0
package/test/evals/define-function.eval.test.js +309 -0
package/test/evals/deterministic.eval.test.ts +376 -0
package/test/evals/primitives.eval.test.js +360 -0
package/test/function-types.test.js +407 -0
package/test/generate-core.test.js +213 -0
package/test/generate.test.js +143 -0
package/test/generic-order.test.ts +342 -0
package/test/implicit-batch.test.js +326 -0
package/test/json-parse-error-handling.test.ts +463 -0
package/test/retry.test.ts +1016 -0
package/test/schema.test.js +96 -0
package/test/streaming.test.ts +316 -0
package/test/tagged-templates.test.js +240 -0
package/test/tool-orchestration.test.ts +770 -0
package/vitest.config.js +39 -0

package/test/context-isolation.test.ts ADDED Viewed

@@ -0,0 +1,687 @@
+/**
+ * Tests for Concurrent Context Isolation
+ *
+ * TDD: RED phase - These tests expose race conditions in global context management
+ *
+ * The current implementation uses a global `defaultClient` variable that can cause
+ * context bleeding between concurrent operations. These tests demonstrate:
+ *
+ * 1. Context leakage between concurrent Promise.all operations
+ * 2. Configuration changes affecting in-flight requests
+ * 3. API key isolation failure in multi-tenant scenarios
+ * 4. Async/await interleaving causing wrong context
+ *
+ * Expected: These tests should FAIL or be FLAKY with the current implementation,
+ * demonstrating the need for AsyncLocalStorage-based context isolation.
+ */
+import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest'
+import {
+  configure,
+  resetContext,
+  withContext,
+  getContext,
+  getModel,
+  getProvider,
+  getBatchMode,
+  type ExecutionContext,
+} from '../src/context.js'
+// ============================================================================
+// Test Utilities
+// ============================================================================
+/**
+ * Simulates an async AI operation that takes variable time
+ * This helps expose race conditions by introducing realistic delays
+ */
+async function simulateAICall(delayMs: number): Promise<ExecutionContext> {
+  // Capture context at start
+  const startContext = getContext()
+  // Simulate network delay
+  await new Promise(resolve => setTimeout(resolve, delayMs))
+  // Capture context at end - should be same as start!
+  const endContext = getContext()
+  return {
+    // Return both for comparison
+    ...endContext,
+    _startModel: startContext.model,
+    _startProvider: startContext.provider,
+  } as ExecutionContext & { _startModel?: string; _startProvider?: string }
+}
+/**
+ * Creates a delayed operation that should maintain its context
+ */
+function createDelayedContextCapture(delayMs: number) {
+  return async (): Promise<{ model: string | undefined; provider: string | undefined }> => {
+    const beforeDelay = { model: getModel(), provider: getProvider() }
+    await new Promise(resolve => setTimeout(resolve, delayMs))
+    const afterDelay = { model: getModel(), provider: getProvider() }
+    // These should be equal - if not, context leaked!
+    return {
+      model: afterDelay.model,
+      provider: afterDelay.provider,
+      _beforeModel: beforeDelay.model,
+      _beforeProvider: beforeDelay.provider,
+    } as { model: string | undefined; provider: string | undefined }
+  }
+}
+// ============================================================================
+// Context Isolation Tests
+// ============================================================================
+describe('Concurrent Context Isolation', () => {
+  beforeEach(() => {
+    resetContext()
+  })
+  afterEach(() => {
+    resetContext()
+  })
+  describe('Promise.all Context Leakage', () => {
+    it('should isolate context between concurrent withContext calls', async () => {
+      // This test exposes the race condition in the fallback implementation
+      // where global context is temporarily modified and restored
+      const results = await Promise.all([
+        withContext({ model: 'claude-opus-4-5', provider: 'anthropic' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 50))
+          return { model: getModel(), provider: getProvider() }
+        }),
+        withContext({ model: 'gpt-4o', provider: 'openai' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 10))
+          return { model: getModel(), provider: getProvider() }
+        }),
+        withContext({ model: 'gemini-pro', provider: 'google' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 30))
+          return { model: getModel(), provider: getProvider() }
+        }),
+      ])
+      // Each operation should see its own context, not another's
+      expect(results[0]).toEqual({ model: 'claude-opus-4-5', provider: 'anthropic' })
+      expect(results[1]).toEqual({ model: 'gpt-4o', provider: 'openai' })
+      expect(results[2]).toEqual({ model: 'gemini-pro', provider: 'google' })
+    })
+    it('should not leak context when operations complete in different order', async () => {
+      // Operations with different completion times
+      const contexts: Array<{ model: string | undefined; provider: string | undefined; order: number }> = []
+      await Promise.all([
+        withContext({ model: 'slow-model', provider: 'anthropic' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 100))
+          contexts.push({ model: getModel(), provider: getProvider(), order: 1 })
+        }),
+        withContext({ model: 'fast-model', provider: 'openai' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 10))
+          contexts.push({ model: getModel(), provider: getProvider(), order: 2 })
+        }),
+      ])
+      // Fast model completes first (order 2), slow model second (order 1)
+      // But each should see its own model
+      const slowResult = contexts.find(c => c.order === 1)
+      const fastResult = contexts.find(c => c.order === 2)
+      expect(slowResult?.model).toBe('slow-model')
+      expect(fastResult?.model).toBe('fast-model')
+    })
+    it('should handle nested withContext calls concurrently', async () => {
+      const results = await Promise.all([
+        withContext({ model: 'outer-1' }, async () => {
+          const outerModel = getModel()
+          const innerResult = await withContext({ model: 'inner-1' }, async () => {
+            await new Promise(resolve => setTimeout(resolve, 20))
+            return getModel()
+          })
+          // After inner completes, should restore outer context
+          const afterInnerModel = getModel()
+          return { outerModel, innerResult, afterInnerModel }
+        }),
+        withContext({ model: 'outer-2' }, async () => {
+          const outerModel = getModel()
+          await new Promise(resolve => setTimeout(resolve, 10))
+          return { outerModel, innerResult: null, afterInnerModel: getModel() }
+        }),
+      ])
+      expect(results[0].outerModel).toBe('outer-1')
+      expect(results[0].innerResult).toBe('inner-1')
+      expect(results[0].afterInnerModel).toBe('outer-1')
+      expect(results[1].outerModel).toBe('outer-2')
+      expect(results[1].afterInnerModel).toBe('outer-2')
+    })
+  })
+  describe('API Key Isolation (Multi-tenant)', () => {
+    it('should isolate API keys between concurrent tenant requests', async () => {
+      // Simulate multi-tenant scenario where each request has different credentials
+      interface TenantContext {
+        apiKey: string
+        tenantId: string
+      }
+      const tenantResults: Array<TenantContext & { seenApiKey: string }> = []
+      await Promise.all([
+        withContext({ metadata: { apiKey: 'tenant-1-key', tenantId: 'tenant-1' } }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 50))
+          const ctx = getContext()
+          tenantResults.push({
+            apiKey: 'tenant-1-key',
+            tenantId: 'tenant-1',
+            seenApiKey: (ctx.metadata as TenantContext)?.apiKey,
+          })
+        }),
+        withContext({ metadata: { apiKey: 'tenant-2-key', tenantId: 'tenant-2' } }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 10))
+          const ctx = getContext()
+          tenantResults.push({
+            apiKey: 'tenant-2-key',
+            tenantId: 'tenant-2',
+            seenApiKey: (ctx.metadata as TenantContext)?.apiKey,
+          })
+        }),
+        withContext({ metadata: { apiKey: 'tenant-3-key', tenantId: 'tenant-3' } }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 30))
+          const ctx = getContext()
+          tenantResults.push({
+            apiKey: 'tenant-3-key',
+            tenantId: 'tenant-3',
+            seenApiKey: (ctx.metadata as TenantContext)?.apiKey,
+          })
+        }),
+      ])
+      // Each tenant should see their own API key, not another tenant's!
+      // This is a critical security issue if context leaks
+      for (const result of tenantResults) {
+        expect(result.seenApiKey).toBe(result.apiKey)
+      }
+    })
+  })
+  describe('Configuration Changes Mid-flight', () => {
+    it('should not affect in-flight requests when global config changes', async () => {
+      configure({ model: 'initial-model', provider: 'anthropic' })
+      // Start a long-running operation
+      const operationPromise = withContext({}, async () => {
+        const startModel = getModel()
+        await new Promise(resolve => setTimeout(resolve, 100))
+        const endModel = getModel()
+        return { startModel, endModel }
+      })
+      // Change global config while operation is in flight
+      await new Promise(resolve => setTimeout(resolve, 10))
+      configure({ model: 'changed-model', provider: 'openai' })
+      const result = await operationPromise
+      // The operation should see consistent context throughout
+      // Even though global config changed mid-flight
+      expect(result.startModel).toBe(result.endModel)
+      expect(result.startModel).toBe('initial-model')
+    })
+    it.skip('should isolate configure() calls from concurrent operations (known limitation - use withContext)', async () => {
+      const results: string[] = []
+      await Promise.all([
+        // Operation 1: Set config and use it
+        (async () => {
+          configure({ model: 'op1-model' })
+          await new Promise(resolve => setTimeout(resolve, 50))
+          results.push(`op1: ${getModel()}`)
+        })(),
+        // Operation 2: Set different config
+        (async () => {
+          await new Promise(resolve => setTimeout(resolve, 10))
+          configure({ model: 'op2-model' })
+          await new Promise(resolve => setTimeout(resolve, 10))
+          results.push(`op2: ${getModel()}`)
+        })(),
+      ])
+      // With proper isolation, each operation would see its own config
+      // With current implementation, they interfere with each other
+      // The test documents the expected behavior vs actual behavior
+      expect(results).toContain('op1: op1-model')
+      expect(results).toContain('op2: op2-model')
+    })
+  })
+  describe('Async/Await Interleaving', () => {
+    it('should maintain context across await points', async () => {
+      const results: Array<{ step: string; model: string | undefined }> = []
+      await withContext({ model: 'test-model' }, async () => {
+        results.push({ step: 'before-await-1', model: getModel() })
+        await new Promise(resolve => setTimeout(resolve, 10))
+        results.push({ step: 'after-await-1', model: getModel() })
+        await new Promise(resolve => setTimeout(resolve, 10))
+        results.push({ step: 'after-await-2', model: getModel() })
+        await new Promise(resolve => setTimeout(resolve, 10))
+        results.push({ step: 'after-await-3', model: getModel() })
+      })
+      // All steps should see the same model
+      for (const result of results) {
+        expect(result.model).toBe('test-model')
+      }
+    })
+    it('should handle interleaved async generators', async () => {
+      async function* contextAwareGenerator(contextModel: string, steps: number) {
+        for (let i = 0; i < steps; i++) {
+          await new Promise(resolve => setTimeout(resolve, Math.random() * 20))
+          yield { step: i, model: getModel(), expected: contextModel }
+        }
+      }
+      const results: Array<{ step: number; model: string | undefined; expected: string }> = []
+      // Run generators concurrently in different contexts
+      await Promise.all([
+        withContext({ model: 'generator-1' }, async () => {
+          for await (const item of contextAwareGenerator('generator-1', 5)) {
+            results.push(item)
+          }
+        }),
+        withContext({ model: 'generator-2' }, async () => {
+          for await (const item of contextAwareGenerator('generator-2', 5)) {
+            results.push(item)
+          }
+        }),
+      ])
+      // Each generator should see its own context
+      for (const result of results) {
+        expect(result.model).toBe(result.expected)
+      }
+    })
+  })
+  describe('Batch Mode Isolation', () => {
+    it('should isolate batch mode settings between concurrent operations', async () => {
+      const results = await Promise.all([
+        withContext({ batchMode: 'immediate' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 30))
+          return getBatchMode()
+        }),
+        withContext({ batchMode: 'deferred' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 10))
+          return getBatchMode()
+        }),
+        withContext({ batchMode: 'flex' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 20))
+          return getBatchMode()
+        }),
+      ])
+      expect(results[0]).toBe('immediate')
+      expect(results[1]).toBe('deferred')
+      expect(results[2]).toBe('flex')
+    })
+  })
+  describe('High Concurrency Stress Test', () => {
+    it('should maintain context isolation under high concurrency', async () => {
+      const concurrency = 50
+      const operations = Array.from({ length: concurrency }, (_, i) => i)
+      const results = await Promise.all(
+        operations.map(i =>
+          withContext({ model: `model-${i}`, metadata: { opId: i } }, async () => {
+            // Random delay to maximize interleaving
+            await new Promise(resolve => setTimeout(resolve, Math.random() * 50))
+            const ctx = getContext()
+            return {
+              expected: `model-${i}`,
+              actual: ctx.model,
+              opId: (ctx.metadata as { opId: number })?.opId,
+            }
+          })
+        )
+      )
+      // Every operation should see its own context
+      let failures = 0
+      for (const result of results) {
+        if (result.expected !== result.actual) {
+          failures++
+        }
+      }
+      // With proper isolation, there should be 0 failures
+      // With the current global-based fallback, we expect failures
+      expect(failures).toBe(0)
+    })
+    it('should handle rapid context switches without corruption', async () => {
+      const iterations = 100
+      const errors: string[] = []
+      for (let i = 0; i < iterations; i++) {
+        const expectedModel = `rapid-${i}`
+        await withContext({ model: expectedModel }, async () => {
+          const actualModel = getModel()
+          if (actualModel !== expectedModel) {
+            errors.push(`Iteration ${i}: expected ${expectedModel}, got ${actualModel}`)
+          }
+        })
+      }
+      expect(errors).toEqual([])
+    })
+  })
+  describe('Context Restoration After Error', () => {
+    it('should restore context after exception in withContext', async () => {
+      configure({ model: 'original-model' })
+      try {
+        await withContext({ model: 'error-model' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 10))
+          throw new Error('Test error')
+        })
+      } catch {
+        // Expected error
+      }
+      // Context should be restored to original
+      expect(getModel()).toBe('original-model')
+    })
+    it('should restore context even when nested contexts throw', async () => {
+      configure({ model: 'root-model' })
+      try {
+        await withContext({ model: 'outer-model' }, async () => {
+          await withContext({ model: 'inner-model' }, async () => {
+            await new Promise(resolve => setTimeout(resolve, 10))
+            throw new Error('Inner error')
+          })
+        })
+      } catch {
+        // Expected error
+      }
+      // Context should be fully restored
+      expect(getModel()).toBe('root-model')
+    })
+    it('should isolate error context from parallel operations', async () => {
+      const results: Array<{ id: number; model: string | undefined; error?: boolean }> = []
+      await Promise.allSettled([
+        withContext({ model: 'success-1' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 50))
+          results.push({ id: 1, model: getModel() })
+        }),
+        withContext({ model: 'error-op' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 20))
+          throw new Error('Deliberate error')
+        }),
+        withContext({ model: 'success-2' }, async () => {
+          await new Promise(resolve => setTimeout(resolve, 30))
+          results.push({ id: 2, model: getModel() })
+        }),
+      ])
+      // The error in one operation should not affect others
+      const op1 = results.find(r => r.id === 1)
+      const op2 = results.find(r => r.id === 2)
+      expect(op1?.model).toBe('success-1')
+      expect(op2?.model).toBe('success-2')
+    })
+  })
+})
+// ============================================================================
+// Global Configure Race Conditions
+// ============================================================================
+describe('Global Configure Race Conditions', () => {
+  beforeEach(() => {
+    resetContext()
+  })
+  afterEach(() => {
+    resetContext()
+  })
+  // NOTE: These tests document the EXPECTED race conditions when using configure()
+  // concurrently. The configure() function is for setting global defaults at startup,
+  // NOT for concurrent tenant isolation. Use withContext() for that.
+  //
+  // These tests are marked as .skip because they document known limitations,
+  // not bugs. The correct fix is to use withContext() for concurrent scenarios.
+  it.skip('should not allow configure() to affect already-started operations (known limitation - use withContext)', async () => {
+    // This is the core race condition: configure() modifies globalContext
+    // which is read by getContext() at arbitrary times
+    configure({ model: 'original' })
+    const operationResults: Array<{ stage: string; model: string | undefined }> = []
+    // Start operation that reads context multiple times
+    const operation = (async () => {
+      operationResults.push({ stage: 'start', model: getModel() })
+      await new Promise(resolve => setTimeout(resolve, 30))
+      operationResults.push({ stage: 'middle', model: getModel() })
+      await new Promise(resolve => setTimeout(resolve, 30))
+      operationResults.push({ stage: 'end', model: getModel() })
+    })()
+    // Interfering configure() calls while operation is running
+    await new Promise(resolve => setTimeout(resolve, 10))
+    configure({ model: 'interference-1' })
+    await new Promise(resolve => setTimeout(resolve, 20))
+    configure({ model: 'interference-2' })
+    await new Promise(resolve => setTimeout(resolve, 20))
+    configure({ model: 'interference-3' })
+    await operation
+    // The operation should see consistent context throughout
+    // But with global configure(), each stage might see different models!
+    const models = operationResults.map(r => r.model)
+    const uniqueModels = new Set(models)
+    // If isolation is working, should only see 1 model
+    // If broken, might see multiple models
+    expect(uniqueModels.size).toBe(1)
+    expect(models[0]).toBe('original')
+  })
+  it.skip('should demonstrate configure() race in multi-tenant scenario (known limitation - use withContext)', async () => {
+    // Simulate multiple tenants configuring their own settings
+    // This is a realistic scenario that will fail without proper isolation
+    const tenantOperations = [
+      { tenantId: 'tenant-a', model: 'claude-opus-4-5', delay: 100 },
+      { tenantId: 'tenant-b', model: 'gpt-4o', delay: 50 },
+      { tenantId: 'tenant-c', model: 'gemini-pro', delay: 75 },
+    ]
+    const results: Array<{ tenantId: string; expected: string; actual: string | undefined }> = []
+    await Promise.all(
+      tenantOperations.map(async ({ tenantId, model, delay }) => {
+        // Each tenant configures their model
+        configure({ model })
+        // Some processing time...
+        await new Promise(resolve => setTimeout(resolve, delay))
+        // Check what model they see - should be their configured model
+        const actualModel = getModel()
+        results.push({ tenantId, expected: model, actual: actualModel })
+      })
+    )
+    // Each tenant should see their own model
+    // This WILL fail because configure() races with other tenants
+    for (const result of results) {
+      expect(result.actual).toBe(result.expected)
+    }
+  })
+  it('should show configure() racing with withContext()', async () => {
+    configure({ model: 'global-model' })
+    const results: string[] = []
+    await Promise.all([
+      // Operation using withContext (should be isolated)
+      withContext({ model: 'isolated-model' }, async () => {
+        results.push(`withContext-start: ${getModel()}`)
+        await new Promise(resolve => setTimeout(resolve, 50))
+        results.push(`withContext-end: ${getModel()}`)
+      }),
+      // Operation modifying global config (affects anyone reading globalContext)
+      (async () => {
+        await new Promise(resolve => setTimeout(resolve, 25))
+        configure({ model: 'racing-model' })
+        results.push(`configure-done: ${getModel()}`)
+      })(),
+    ])
+    // withContext should maintain isolation
+    expect(results).toContain('withContext-start: isolated-model')
+    expect(results).toContain('withContext-end: isolated-model')
+  })
+  it.skip('should expose getGlobalContext() mutation issues (known limitation - use withContext)', async () => {
+    configure({ model: 'safe-model' })
+    // Multiple operations reading global context
+    const reads: Array<{ time: number; model: string | undefined }> = []
+    const readerPromise = (async () => {
+      for (let i = 0; i < 10; i++) {
+        const ctx = getContext()
+        reads.push({ time: Date.now(), model: ctx.model })
+        await new Promise(resolve => setTimeout(resolve, 10))
+      }
+    })()
+    // Concurrent writer
+    const writerPromise = (async () => {
+      for (let i = 0; i < 5; i++) {
+        await new Promise(resolve => setTimeout(resolve, 15))
+        configure({ model: `mutated-${i}` })
+      }
+    })()
+    await Promise.all([readerPromise, writerPromise])
+    // The reader should see consistent values if properly isolated
+    // With current implementation, it will see a mix of values
+    const uniqueModels = new Set(reads.map(r => r.model))
+    // Document the race condition - multiple values seen
+    // With proper isolation, should only see initial value
+    console.log('Models seen during concurrent read/write:', [...uniqueModels])
+    // This assertion documents expected behavior - only 1 model should be seen
+    expect(uniqueModels.size).toBe(1)
+  })
+})
+// ============================================================================
+// Edge Cases and Regression Tests
+// ============================================================================
+describe('Context Edge Cases', () => {
+  beforeEach(() => {
+    resetContext()
+  })
+  afterEach(() => {
+    resetContext()
+  })
+  it('should handle undefined context values', async () => {
+    const results = await Promise.all([
+      withContext({ model: undefined }, async () => {
+        await new Promise(resolve => setTimeout(resolve, 10))
+        return getModel()
+      }),
+      withContext({ model: 'defined-model' }, async () => {
+        await new Promise(resolve => setTimeout(resolve, 5))
+        return getModel()
+      }),
+    ])
+    // Default model should be returned for undefined
+    expect(results[0]).toBe('sonnet')
+    expect(results[1]).toBe('defined-model')
+  })
+  it('should handle empty context object', async () => {
+    configure({ model: 'configured-model' })
+    const result = await withContext({}, async () => {
+      await new Promise(resolve => setTimeout(resolve, 10))
+      return getModel()
+    })
+    // Should inherit from global config
+    expect(result).toBe('configured-model')
+  })
+  it('should handle deeply nested concurrent contexts', async () => {
+    const results: string[] = []
+    await Promise.all([
+      withContext({ model: 'level-0-a' }, async () => {
+        results.push(`0a: ${getModel()}`)
+        await withContext({ model: 'level-1-a' }, async () => {
+          results.push(`1a: ${getModel()}`)
+          await Promise.all([
+            withContext({ model: 'level-2-a1' }, async () => {
+              await new Promise(resolve => setTimeout(resolve, 20))
+              results.push(`2a1: ${getModel()}`)
+            }),
+            withContext({ model: 'level-2-a2' }, async () => {
+              await new Promise(resolve => setTimeout(resolve, 10))
+              results.push(`2a2: ${getModel()}`)
+            }),
+          ])
+          results.push(`1a-after: ${getModel()}`)
+        })
+        results.push(`0a-after: ${getModel()}`)
+      }),
+      withContext({ model: 'level-0-b' }, async () => {
+        await new Promise(resolve => setTimeout(resolve, 15))
+        results.push(`0b: ${getModel()}`)
+      }),
+    ])
+    // Verify each level sees correct context
+    expect(results).toContain('0a: level-0-a')
+    expect(results).toContain('1a: level-1-a')
+    expect(results).toContain('2a1: level-2-a1')
+    expect(results).toContain('2a2: level-2-a2')
+    expect(results).toContain('1a-after: level-1-a')
+    expect(results).toContain('0a-after: level-0-a')
+    expect(results).toContain('0b: level-0-b')
+  })
+})