npm - @outputai/llm - Versions diffs - 0.6.1-dev.daae905.0 → 0.6.1-next.2cc4685.0 - Mend

@outputai/llm 0.6.1-dev.daae905.0 → 0.6.1-next.2cc4685.0

This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (45) hide show

package/package.json +2 -2
package/src/agent.js +15 -9
package/src/agent.spec.js +295 -214
package/src/ai_model.js +79 -36
package/src/ai_model.spec.js +31 -13
package/src/ai_sdk.js +55 -79
package/src/ai_sdk.spec.js +464 -611
package/src/ai_sdk_options.js +61 -0
package/src/ai_sdk_options.spec.js +164 -0
package/src/cost/index.js +1 -1
package/src/index.d.ts +230 -175
package/src/index.js +2 -2
package/src/prompt/escape.js +65 -0
package/src/prompt/escape.spec.js +159 -0
package/src/{load_content.js → prompt/load_content.js} +1 -22
package/src/{load_content.spec.js → prompt/load_content.spec.js} +6 -6
package/src/prompt/loader.js +49 -0
package/src/prompt/loader.spec.js +274 -0
package/src/{prompt_loader_validation.spec.js → prompt/loader_validation.spec.js} +40 -7
package/src/prompt/parser.js +19 -0
package/src/{parser.spec.js → prompt/parser.spec.js} +74 -29
package/src/prompt/prepare_text.js +27 -0
package/src/prompt/prepare_text.spec.js +141 -0
package/src/{skill.js → prompt/skill.js} +19 -0
package/src/prompt/skill.spec.js +172 -0
package/src/{prompt_validations.js → prompt/validations.js} +32 -6
package/src/{prompt_validations.spec.js → prompt/validations.spec.js} +189 -1
package/src/utils/__fixtures__/image_response.json +38 -0
package/src/utils/__fixtures__/stream_response.json +294 -0
package/src/utils/__fixtures__/text_response.json +201 -0
package/src/utils/error_handler.js +65 -0
package/src/utils/error_handler.spec.js +195 -0
package/src/utils/image.js +10 -0
package/src/utils/image.spec.js +20 -0
package/src/utils/response_wrappers.js +46 -19
package/src/utils/response_wrappers.spec.js +130 -70
package/src/utils/source_extraction.js +17 -27
package/src/utils/trace.js +2 -3
package/src/utils/trace.spec.js +9 -13
package/src/validations.js +54 -2
package/src/validations.spec.js +166 -0
package/src/parser.js +0 -28
package/src/prompt_loader.js +0 -80
package/src/prompt_loader.spec.js +0 -358
package/src/skill.d.ts +0 -49

package/src/ai_sdk.spec.js CHANGED Viewed

@@ -1,13 +1,58 @@
 import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
+const aiFns = vi.hoisted( () => ( {
+  generateText: vi.fn(),
+  streamText: vi.fn(),
+  generateImage: vi.fn(),
+  stepCountIs: vi.fn( count => ( { type: 'step-count', count } ) )
+} ) );
+const validators = vi.hoisted( () => ( {
+  validateGenerateTextArgs: vi.fn(),
+  validateStreamTextArgs: vi.fn(),
+  validateGenerateImageArgs: vi.fn()
+} ) );
+const promptMocks = vi.hoisted( () => ( {
+  loadPrompt: vi.fn(),
+  prepareTextPrompt: vi.fn()
+} ) );
+const optionMocks = vi.hoisted( () => ( {
+  loadAiSdkTextOptions: vi.fn(),
+  loadAiSdkImageOptions: vi.fn()
+} ) );
 const traceMocks = vi.hoisted( () => ( {
-  startTrace: vi.fn( () => 'trace-id' ),
+  startTrace: vi.fn(),
   endTraceWithError: vi.fn()
 } ) );
 const wrapMocks = vi.hoisted( () => ( {
   wrapTextResponse: vi.fn(),
-  wrapStreamOnFinishResponse: vi.fn()
+  wrapStreamOnFinishResponse: vi.fn(),
+  wrapImageResponse: vi.fn()
+} ) );
+const errorMocks = vi.hoisted( () => ( {
+  mapAiError: vi.fn( error => error )
+} ) );
+vi.mock( 'ai', () => aiFns );
+vi.mock( './validations.js', () => validators );
+vi.mock( './prompt/loader.js', () => ( {
+  loadPrompt: ( ...args ) => promptMocks.loadPrompt( ...args )
+} ) );
+vi.mock( './prompt/prepare_text.js', () => ( {
+  prepareTextPrompt: ( ...args ) => promptMocks.prepareTextPrompt( ...args )
+} ) );
+vi.mock( './ai_sdk_options.js', () => ( {
+  loadAiSdkTextOptions: ( ...args ) => optionMocks.loadAiSdkTextOptions( ...args ),
+  loadAiSdkImageOptions: ( ...args ) => optionMocks.loadAiSdkImageOptions( ...args )
 } ) );
 vi.mock( './utils/trace.js', () => ( {
@@ -17,688 +62,496 @@ vi.mock( './utils/trace.js', () => ( {
 vi.mock( './utils/response_wrappers.js', () => ( {
   wrapTextResponse: ( ...args ) => wrapMocks.wrapTextResponse( ...args ),
-  wrapStreamOnFinishResponse: ( ...args ) => wrapMocks.wrapStreamOnFinishResponse( ...args )
+  wrapStreamOnFinishResponse: ( ...args ) => wrapMocks.wrapStreamOnFinishResponse( ...args ),
+  wrapImageResponse: ( ...args ) => wrapMocks.wrapImageResponse( ...args )
 } ) );
-const loadModelImpl = vi.fn();
-const loadToolsImpl = vi.fn();
-vi.mock( './ai_model.js', () => ( {
-  loadModel: ( ...values ) => loadModelImpl( ...values ),
-  loadTools: ( ...values ) => loadToolsImpl( ...values )
+vi.mock( './utils/error_handler.js', () => ( {
+  mapAiError: ( ...args ) => errorMocks.mapAiError( ...args )
 } ) );
-const aiFns = {
-  generateText: vi.fn(),
-  streamText: vi.fn(),
-  tool: vi.fn( def => def ),
-  stepCountIs: vi.fn( n => ( { type: 'stepCount', count: n } ) )
-};
-vi.mock( 'ai', () => ( aiFns ) );
+const importSut = async () => import( './ai_sdk.js' );
-const validators = {
-  validateGenerateTextArgs: vi.fn(),
-  validateStreamTextArgs: vi.fn()
+const loadedPrompt = {
+  name: 'test@v1',
+  config: { model: 'test-model' },
+  messages: [ { role: 'user', content: 'Hello' } ]
 };
-vi.mock( './validations.js', () => ( validators ) );
-const loadPromptImpl = vi.fn();
-vi.mock( './prompt_loader.js', () => ( {
-  loadPrompt: ( ...values ) => loadPromptImpl( ...values )
-} ) );
+const textOptions = {
+  model: 'MODEL',
+  messages: loadedPrompt.messages,
+  providerOptions: { test: true }
+};
-const loadPromptSkillsImpl = vi.fn();
-const loadColocatedSkillsImpl = vi.fn().mockReturnValue( [] );
-vi.mock( './skill.js', async importOriginal => {
-  const original = await importOriginal();
-  return {
-    ...original,
-    loadPromptSkills: ( ...args ) => loadPromptSkillsImpl( ...args ),
-    loadColocatedSkills: ( ...args ) => loadColocatedSkillsImpl( ...args )
-  };
-} );
+const textResponse = {
+  text: 'TEXT',
+  totalUsage: { inputTokens: 1, outputTokens: 2 },
+  finishReason: 'stop'
+};
-const importSut = async () => import( './ai_sdk.js' );
+const streamResult = {
+  textStream: 'TEXT_STREAM',
+  fullStream: 'FULL_STREAM'
+};
-const basePrompt = {
-  config: {
-    provider: 'openai',
-    model: 'gpt-4o-mini',
-    temperature: 0.3,
-    providerOptions: { thinking: { enabled: true } }
+const imageOptions = {
+  model: 'IMAGE_MODEL',
+  prompt: {
+    text: 'Generate an image'
   },
-  messages: [ { role: 'user', content: 'Hi' } ]
+  providerOptions: { openai: { quality: 'high' } }
 };
-/** Mutable payload from `AI.generateText` — identity checks prove `generateText` returns `wrapTextResponse(...)` without substitution. */
-const generateTextAiFixture = {
-  response: {
-    text: 'TEXT',
-    sources: [],
-    usage: { inputTokens: 10, outputTokens: 5, totalTokens: 15 },
-    totalUsage: { inputTokens: 10, outputTokens: 5, totalTokens: 15 },
-    finishReason: 'stop'
-  }
+const imageResponse = {
+  images: [ { mediaType: 'image/png', base64: 'aW1hZ2U=' } ],
+  usage: { inputTokens: 1, outputTokens: 2 }
 };
-beforeEach( () => {
-  loadModelImpl.mockReset().mockReturnValue( 'MODEL' );
-  loadPromptImpl.mockReset().mockReturnValue( { ...basePrompt, messages: [ ...basePrompt.messages ] } );
-  aiFns.tool.mockReset().mockImplementation( def => def );
-  aiFns.stepCountIs.mockReset().mockImplementation( n => ( { type: 'stepCount', count: n } ) );
-  loadPromptSkillsImpl.mockReset().mockReturnValue( [] );
-  loadColocatedSkillsImpl.mockReset().mockReturnValue( [] );
-  traceMocks.startTrace.mockReset().mockReturnValue( 'trace-id' );
-  traceMocks.endTraceWithError.mockReset();
-  wrapMocks.wrapTextResponse.mockReset().mockImplementation( async ( { response } ) => response );
-  wrapMocks.wrapStreamOnFinishResponse.mockReset().mockImplementation( ( { onFinish } ) => ( {
-    async onFinish( response ) {
-      onFinish?.( response );
-    }
-  } ) );
-  const defaultUsage = { inputTokens: 10, outputTokens: 5, totalTokens: 15 };
-  generateTextAiFixture.response = {
-    text: 'TEXT',
-    sources: [],
-    usage: defaultUsage,
-    totalUsage: defaultUsage,
-    finishReason: 'stop'
-  };
-  aiFns.generateText.mockReset().mockResolvedValue( generateTextAiFixture.response );
-  aiFns.streamText.mockReset().mockReturnValue( {
-    textStream: 'MOCK_TEXT_STREAM',
-    fullStream: 'MOCK_FULL_STREAM',
-    text: Promise.resolve( 'STREAMED_TEXT' ),
-    usage: Promise.resolve( { inputTokens: 10, outputTokens: 5, totalTokens: 15 } ),
-    finishReason: Promise.resolve( 'stop' ),
-    sources: Promise.resolve( [] )
-  } );
-} );
-afterEach( async () => {
-  await vi.resetModules();
-  vi.clearAllMocks();
-} );
 describe( 'ai_sdk', () => {
-  it( 'generateText: validates, delegates trace/wrap utils, calls AI and returns wrapTextResponse output', async () => {
-    const { generateText } = await importSut();
-    const defaultUsage = { inputTokens: 10, outputTokens: 5, totalTokens: 15 };
-    const result = await generateText( { prompt: 'test_prompt@v1' } );
-    expect( validators.validateGenerateTextArgs ).toHaveBeenCalledWith( { prompt: 'test_prompt@v1' } );
-    expect( loadPromptImpl ).toHaveBeenCalledWith( 'test_prompt@v1', undefined, undefined );
-    expect( traceMocks.startTrace ).toHaveBeenCalledTimes( 1 );
-    expect( traceMocks.startTrace ).toHaveBeenCalledWith( expect.objectContaining( {
-      name: 'generateText',
-      prompt: 'test_prompt@v1'
-    } ) );
-    expect( wrapMocks.wrapTextResponse ).toHaveBeenCalledTimes( 1 );
-    expect( wrapMocks.wrapTextResponse ).toHaveBeenCalledWith( {
-      traceId: 'trace-id',
-      modelId: basePrompt.config.model,
-      response: generateTextAiFixture.response
+  beforeEach( () => {
+    aiFns.generateText.mockReset().mockResolvedValue( textResponse );
+    aiFns.streamText.mockReset().mockReturnValue( streamResult );
+    aiFns.generateImage.mockReset().mockResolvedValue( imageResponse );
+    aiFns.stepCountIs.mockReset().mockImplementation( count => ( { type: 'step-count', count } ) );
+    validators.validateGenerateTextArgs.mockReset();
+    validators.validateStreamTextArgs.mockReset();
+    validators.validateGenerateImageArgs.mockReset();
+    promptMocks.loadPrompt.mockReset().mockReturnValue( loadedPrompt );
+    promptMocks.prepareTextPrompt.mockReset().mockReturnValue( {
+      loadedPrompt,
+      tools: null
     } );
-    expect( loadModelImpl ).toHaveBeenCalledWith( basePrompt );
-    expect( aiFns.generateText ).toHaveBeenCalledWith( {
-      model: 'MODEL',
-      messages: basePrompt.messages,
-      temperature: 0.3,
-      maxRetries: 0,
-      providerOptions: basePrompt.config.providerOptions
-    } );
-    expect( result ).toBe( generateTextAiFixture.response );
-    expect( result.totalUsage ).toEqual( defaultUsage );
-  } );
+    optionMocks.loadAiSdkTextOptions.mockReset().mockReturnValue( textOptions );
+    optionMocks.loadAiSdkImageOptions.mockReset().mockReturnValue( imageOptions );
-  it( 'generateText: passes provider-specific options to AI SDK', async () => {
-    const promptWithProviderOptions = {
-      config: {
-        provider: 'anthropic',
-        model: 'claude-sonnet-4-20250514',
-        providerOptions: {
-          thinking: {
-            type: 'enabled',
-            budgetTokens: 5000
-          },
-          anthropic: {
-            effort: 'medium',
-            customOption: 'value'
-          },
-          customField: 'should-be-passed'
-        }
-      },
-      messages: [ { role: 'user', content: 'Test' } ]
-    };
-    loadPromptImpl.mockReturnValueOnce( promptWithProviderOptions );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1' } );
-    expect( aiFns.generateText ).toHaveBeenCalledWith( {
-      model: 'MODEL',
-      messages: promptWithProviderOptions.messages,
-      maxRetries: 0,
-      providerOptions: {
-        thinking: {
-          type: 'enabled',
-          budgetTokens: 5000
-        },
-        anthropic: {
-          effort: 'medium',
-          customOption: 'value'
-        },
-        customField: 'should-be-passed'
-      }
-    } );
-  } );
+    traceMocks.startTrace.mockReset().mockReturnValue( 'trace-id' );
+    traceMocks.endTraceWithError.mockReset();
-  it( 'generateText: passes through providerMetadata', async () => {
-    const usageProvider = { inputTokens: 10, outputTokens: 5, totalTokens: 15 };
-    aiFns.generateText.mockResolvedValueOnce( {
-      text: 'TEXT',
-      sources: [],
-      usage: usageProvider,
-      totalUsage: usageProvider,
-      finishReason: 'stop',
-      providerMetadata: { anthropic: { cacheReadInputTokens: 50 } }
+    wrapMocks.wrapTextResponse.mockReset().mockResolvedValue( { wrapped: textResponse } );
+    wrapMocks.wrapStreamOnFinishResponse.mockReset().mockReturnValue( {
+      onFinish: vi.fn()
     } );
-    const { generateText } = await importSut();
-    const result = await generateText( { prompt: 'test_prompt@v1' } );
-    expect( result.providerMetadata ).toEqual( { anthropic: { cacheReadInputTokens: 50 } } );
-  } );
-  it( 'generateText: passes through warnings and response metadata', async () => {
-    const usageWarnings = { inputTokens: 10, outputTokens: 5, totalTokens: 15 };
-    aiFns.generateText.mockResolvedValueOnce( {
-      text: 'TEXT',
-      sources: [],
-      usage: usageWarnings,
-      totalUsage: usageWarnings,
-      finishReason: 'stop',
-      warnings: [ { type: 'other', message: 'Test warning' } ],
-      response: { id: 'req_123', modelId: 'gpt-4o-2024-05-13' }
+    wrapMocks.wrapImageResponse.mockReset().mockResolvedValue( { wrapped: imageResponse } );
+    errorMocks.mapAiError.mockReset().mockImplementation( error => error );
+  } );
+  afterEach( async () => {
+    await vi.resetModules();
+  } );
+  describe( 'generateText', () => {
+    it( 'prepares, validates, traces, calls AI SDK, and wraps the response', async () => {
+      const { generateText } = await importSut();
+      const variables = { topic: 'testing' };
+      const tools = { calculator: { description: 'Calculator' } };
+      const skills = [ { name: 'style', description: 'Style', instructions: '# Style' } ];
+      promptMocks.prepareTextPrompt.mockReturnValueOnce( {
+        loadedPrompt,
+        tools
+      } );
+      const result = await generateText( {
+        prompt: 'test@v1',
+        variables,
+        promptDir: '/prompts',
+        skills,
+        maxSteps: 4,
+        tools: { userTool: true },
+        temperature: 0.2
+      } );
+      expect( promptMocks.prepareTextPrompt ).toHaveBeenCalledWith( {
+        prompt: 'test@v1',
+        variables,
+        promptDir: '/prompts',
+        skills,
+        tools: { userTool: true }
+      } );
+      expect( validators.validateGenerateTextArgs ).toHaveBeenCalledWith( {
+        prompt: 'test@v1',
+        variables,
+        promptDir: '/prompts',
+        skills,
+        maxSteps: 4
+      } );
+      expect( traceMocks.startTrace ).toHaveBeenCalledWith( {
+        name: 'generateText',
+        prompt: 'test@v1',
+        variables,
+        loadedPrompt
+      } );
+      expect( optionMocks.loadAiSdkTextOptions ).toHaveBeenCalledWith( loadedPrompt );
+      expect( aiFns.stepCountIs ).toHaveBeenCalledWith( 4 );
+      expect( aiFns.generateText ).toHaveBeenCalledWith( {
+        ...textOptions,
+        maxRetries: 0,
+        tools,
+        temperature: 0.2,
+        stopWhen: { type: 'step-count', count: 4 }
+      } );
+      expect( wrapMocks.wrapTextResponse ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        modelId: 'test-model',
+        response: textResponse
+      } );
+      expect( result ).toEqual( { wrapped: textResponse } );
     } );
-    const { generateText } = await importSut();
-    const result = await generateText( { prompt: 'test_prompt@v1' } );
-    expect( result.warnings ).toEqual( [ { type: 'other', message: 'Test warning' } ] );
-    expect( result.response ).toEqual( { id: 'req_123', modelId: 'gpt-4o-2024-05-13' } );
-  } );
+    it( 'uses resolved dynamic skills', async () => {
+      const { generateText } = await importSut();
+      const variables = { topic: 'testing' };
+      const resolvedSkills = [ { name: 'dynamic', description: 'Dynamic', instructions: '# Dynamic' } ];
+      const skills = vi.fn().mockResolvedValue( resolvedSkills );
-  it( 'generateText: traces error and rethrows when AI SDK fails', async () => {
-    const error = new Error( 'API rate limit exceeded' );
-    aiFns.generateText.mockRejectedValueOnce( error );
-    const { generateText } = await importSut();
+      await generateText( { prompt: 'test@v1', variables, skills } );
-    await expect( generateText( { prompt: 'test_prompt@v1' } ) ).rejects.toThrow( 'API rate limit exceeded' );
-    expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( { traceId: 'trace-id', error } );
-  } );
-  it( 'generateText: passes the AI response object through to wrapTextResponse and returns it', async () => {
-    const responseWithGetter = {
-      _internalText: 'TEXT_FROM_GETTER',
-      get text() {
-        return this._internalText;
-      },
-      sources: [],
-      usage: { inputTokens: 10, outputTokens: 5, totalTokens: 15 },
-      totalUsage: { inputTokens: 10, outputTokens: 5, totalTokens: 15 },
-      finishReason: 'stop'
-    };
-    aiFns.generateText.mockResolvedValueOnce( responseWithGetter );
-    const { generateText } = await importSut();
-    const out = await generateText( { prompt: 'test_prompt@v1' } );
-    expect( wrapMocks.wrapTextResponse ).toHaveBeenCalledWith( {
-      traceId: 'trace-id',
-      modelId: basePrompt.config.model,
-      response: responseWithGetter
+      expect( skills ).toHaveBeenCalledWith( variables );
+      expect( promptMocks.prepareTextPrompt ).toHaveBeenCalledWith( expect.objectContaining( {
+        skills: resolvedSkills
+      } ) );
     } );
-    expect( out ).toBe( responseWithGetter );
-    expect( out.text ).toBe( 'TEXT_FROM_GETTER' );
-  } );
-  it( 'generateText: passes through AI SDK options like tools and maxRetries', async () => {
-    const { generateText } = await importSut();
-    const mockTools = { calculator: { description: 'A calculator tool' } };
-    await generateText( {
-      prompt: 'test_prompt@v1',
-      tools: mockTools,
-      toolChoice: 'required',
-      maxRetries: 5,
-      seed: 42
-    } );
+    it( 'omits tools and stopWhen when no tools are prepared', async () => {
+      const { generateText } = await importSut();
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( {
-        tools: mockTools,
-        toolChoice: 'required',
-        maxRetries: 5,
-        seed: 42
-      } )
-    );
-  } );
+      await generateText( { prompt: 'test@v1' } );
-  it( 'generateText: user-provided temperature overrides prompt temperature', async () => {
-    loadPromptImpl.mockReturnValueOnce( {
-      config: {
-        provider: 'openai',
-        model: 'gpt-4o',
-        temperature: 0.7
-      },
-      messages: [ { role: 'user', content: 'Hi' } ]
+      expect( aiFns.stepCountIs ).not.toHaveBeenCalled();
+      expect( aiFns.generateText ).toHaveBeenCalledWith( {
+        ...textOptions,
+        maxRetries: 0
+      } );
     } );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', temperature: 0.2 } );
+    it( 'preserves caller-provided stopWhen when tools are prepared', async () => {
+      const { generateText } = await importSut();
+      const stopWhen = { type: 'custom-stop' };
+      promptMocks.prepareTextPrompt.mockReturnValueOnce( {
+        loadedPrompt,
+        tools: { load_skill: { description: 'Load skill' } }
+      } );
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( { temperature: 0.2 } )
-    );
-  } );
+      await generateText( { prompt: 'test@v1', stopWhen } );
-  it( 'generateText: passes through temperature: 0 from prompt', async () => {
-    loadPromptImpl.mockReturnValueOnce( {
-      config: {
-        provider: 'openai',
-        model: 'gpt-4o',
-        temperature: 0
-      },
-      messages: [ { role: 'user', content: 'Hi' } ]
+      expect( aiFns.stepCountIs ).not.toHaveBeenCalled();
+      expect( aiFns.generateText ).toHaveBeenCalledWith( expect.objectContaining( {
+        stopWhen
+      } ) );
     } );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1' } );
+    it( 'propagates validation errors before tracing or calling AI SDK', async () => {
+      const validationError = new Error( 'Invalid args' );
+      validators.validateGenerateTextArgs.mockImplementationOnce( () => {
+        throw validationError;
+      } );
+      const { generateText } = await importSut();
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( { temperature: 0 } )
-    );
-  } );
-  it( 'generateText: does not add structured output fields the AI response lacks', async () => {
-    const { generateText } = await importSut();
-    const result = await generateText( { prompt: 'test_prompt@v1' } );
-    expect( result.object ).toBeUndefined();
-  } );
-  it( 'generateText: passes through unknown future options for forward compatibility', async () => {
-    const { generateText } = await importSut();
-    await generateText( {
-      prompt: 'test_prompt@v1',
-      experimental_futureOption: { key: 'value' },
-      unknownOption: true
+      await expect( generateText( { prompt: '' } ) ).rejects.toThrow( validationError );
+      expect( traceMocks.startTrace ).not.toHaveBeenCalled();
+      expect( aiFns.generateText ).not.toHaveBeenCalled();
     } );
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( {
-        experimental_futureOption: { key: 'value' },
-        unknownOption: true
-      } )
-    );
+    it( 'traces and rethrows AI SDK errors', async () => {
+      const error = new Error( 'Provider failed' );
+      const mappedError = new Error( 'Mapped provider failed' );
+      aiFns.generateText.mockRejectedValueOnce( error );
+      errorMocks.mapAiError.mockReturnValueOnce( mappedError );
+      const { generateText } = await importSut();
+      await expect( generateText( { prompt: 'test@v1' } ) ).rejects.toThrow( mappedError );
+      expect( errorMocks.mapAiError ).toHaveBeenCalledWith( error );
+      expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        error: mappedError
+      } );
+    } );
   } );
-  it( 'streamText: validates, delegates trace/wrap utils, calls AI streamText and returns stream result', async () => {
-    const { streamText } = await importSut();
-    const result = streamText( { prompt: 'test_prompt@v1' } );
-    expect( validators.validateStreamTextArgs ).toHaveBeenCalledWith( { prompt: 'test_prompt@v1' } );
-    expect( loadPromptImpl ).toHaveBeenCalledWith( 'test_prompt@v1', undefined );
-    expect( traceMocks.startTrace ).toHaveBeenCalledTimes( 1 );
-    expect( loadModelImpl ).toHaveBeenCalledWith( basePrompt );
-    expect( aiFns.streamText ).toHaveBeenCalledWith(
-      expect.objectContaining( {
-        model: 'MODEL',
-        messages: basePrompt.messages,
-        temperature: 0.3,
+  describe( 'streamText', () => {
+    it( 'prepares, validates, traces, calls AI SDK, and returns the stream result', async () => {
+      const { streamText } = await importSut();
+      const variables = { topic: 'testing' };
+      const onFinish = vi.fn();
+      const tools = { calculator: { description: 'Calculator' } };
+      const skills = [ { name: 'style', description: 'Style', instructions: '# Style' } ];
+      promptMocks.prepareTextPrompt.mockReturnValueOnce( {
+        loadedPrompt,
+        tools
+      } );
+      const result = streamText( {
+        prompt: 'test@v1',
+        variables,
+        promptDir: '/prompts',
+        skills,
+        maxSteps: 4,
+        onFinish,
+        tools: { userTool: true },
+        temperature: 0.2
+      } );
+      expect( validators.validateStreamTextArgs ).toHaveBeenCalledWith( {
+        prompt: 'test@v1',
+        variables,
+        promptDir: '/prompts',
+        skills,
+        maxSteps: 4
+      } );
+      expect( promptMocks.prepareTextPrompt ).toHaveBeenCalledWith( {
+        prompt: 'test@v1',
+        variables,
+        promptDir: '/prompts',
+        skills,
+        tools: { userTool: true }
+      } );
+      expect( traceMocks.startTrace ).toHaveBeenCalledWith( {
+        name: 'streamText',
+        prompt: 'test@v1',
+        variables,
+        loadedPrompt
+      } );
+      expect( optionMocks.loadAiSdkTextOptions ).toHaveBeenCalledWith( loadedPrompt );
+      expect( wrapMocks.wrapStreamOnFinishResponse ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        modelId: 'test-model',
+        onFinish
+      } );
+      expect( aiFns.stepCountIs ).toHaveBeenCalledWith( 4 );
+      expect( aiFns.streamText ).toHaveBeenCalledWith( {
+        ...textOptions,
         maxRetries: 0,
-        providerOptions: basePrompt.config.providerOptions,
+        tools,
+        temperature: 0.2,
+        stopWhen: { type: 'step-count', count: 4 },
         onFinish: expect.any( Function ),
         onError: expect.any( Function )
-      } )
-    );
-    expect( result.textStream ).toBe( 'MOCK_TEXT_STREAM' );
-    expect( result.fullStream ).toBe( 'MOCK_FULL_STREAM' );
-  } );
-  it( 'streamText: forwards stream onFinish through wrapStreamOnFinishResponse to the user callback', async () => {
-    const { streamText } = await importSut();
-    const userOnFinish = vi.fn();
-    streamText( { prompt: 'test_prompt@v1', onFinish: userOnFinish } );
-    expect( wrapMocks.wrapStreamOnFinishResponse ).toHaveBeenCalledWith( expect.objectContaining( {
-      traceId: 'trace-id',
-      modelId: basePrompt.config.model,
-      onFinish: userOnFinish
-    } ) );
-    const callArgs = aiFns.streamText.mock.calls[0][0];
-    const usage = { inputTokens: 10, outputTokens: 5, totalTokens: 15 };
-    const finishEvent = {
-      text: 'STREAMED_TEXT',
-      usage,
-      totalUsage: usage,
-      providerMetadata: { anthropic: { cacheReadInputTokens: 50 } },
-      finishReason: 'stop'
-    };
-    await callArgs.onFinish( finishEvent );
-    expect( userOnFinish ).toHaveBeenCalledTimes( 1 );
-    expect( userOnFinish ).toHaveBeenCalledWith( finishEvent );
-  } );
+      } );
+      expect( result ).toBe( streamResult );
+    } );
-  it( 'streamText: onError callback traces error and calls user callback', async () => {
-    const { streamText } = await importSut();
-    const userOnError = vi.fn();
+    it( 'uses resolved dynamic skills', async () => {
+      const { streamText } = await importSut();
+      const variables = { topic: 'testing' };
+      const resolvedSkills = [ { name: 'dynamic', description: 'Dynamic', instructions: '# Dynamic' } ];
+      const skills = vi.fn().mockReturnValue( resolvedSkills );
-    streamText( { prompt: 'test_prompt@v1', onError: userOnError } );
+      streamText( { prompt: 'test@v1', variables, skills } );
-    const callArgs = aiFns.streamText.mock.calls[0][0];
-    const error = new Error( 'Stream failed' );
-    callArgs.onError( { error } );
+      expect( skills ).toHaveBeenCalledWith( variables );
+      expect( promptMocks.prepareTextPrompt ).toHaveBeenCalledWith( expect.objectContaining( {
+        skills: resolvedSkills
+      } ) );
+    } );
-    expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( { traceId: 'trace-id', error } );
-    expect( userOnError ).toHaveBeenCalledWith( { error } );
-  } );
+    it( 'throws when dynamic skills resolve asynchronously', async () => {
+      const { streamText } = await importSut();
+      const variables = { topic: 'testing' };
+      const skills = vi.fn().mockResolvedValue( [
+        { name: 'dynamic', description: 'Dynamic', instructions: '# Dynamic' }
+      ] );
-  it( 'streamText: works without user onFinish/onError callbacks', async () => {
-    const { streamText } = await importSut();
-    streamText( { prompt: 'test_prompt@v1' } );
-    const callArgs = aiFns.streamText.mock.calls[0][0];
-    const usage = { inputTokens: 10, outputTokens: 5, totalTokens: 15 };
-    const finishEvent = {
-      text: 'TEXT',
-      usage,
-      totalUsage: usage,
-      finishReason: 'stop'
-    };
-    await expect( callArgs.onFinish( finishEvent ) ).resolves.toBeUndefined();
-    expect( () => callArgs.onError( { error: new Error( 'fail' ) } ) ).not.toThrow();
-  } );
+      expect( () => streamText( { prompt: 'test@v1', variables, skills } ) )
+        .toThrow( 'streamText() skills must be synchronous' );
-  it( 'streamText: passes through AI SDK streaming options', async () => {
-    const { streamText } = await importSut();
-    const mockOnChunk = vi.fn();
-    const mockOnStepFinish = vi.fn();
-    const mockTransform = vi.fn();
-    const mockTools = { calculator: { description: 'A calculator tool' } };
-    streamText( {
-      prompt: 'test_prompt@v1',
-      tools: mockTools,
-      toolChoice: 'required',
-      maxRetries: 5,
-      onChunk: mockOnChunk,
-      onStepFinish: mockOnStepFinish,
-      experimental_transform: mockTransform
+      expect( skills ).toHaveBeenCalledWith( variables );
+      expect( promptMocks.prepareTextPrompt ).not.toHaveBeenCalled();
+      expect( aiFns.streamText ).not.toHaveBeenCalled();
     } );
-    expect( aiFns.streamText ).toHaveBeenCalledWith(
-      expect.objectContaining( {
-        tools: mockTools,
-        toolChoice: 'required',
-        maxRetries: 5,
-        onChunk: mockOnChunk,
-        onStepFinish: mockOnStepFinish,
-        experimental_transform: mockTransform
-      } )
-    );
-  } );
-  it( 'streamText: user onFinish/onError are not passed raw to AI SDK', async () => {
-    const { streamText } = await importSut();
-    const userOnFinish = vi.fn();
-    const userOnError = vi.fn();
+    it( 'omits tools and stopWhen when no tools are prepared', async () => {
+      const { streamText } = await importSut();
-    streamText( { prompt: 'test_prompt@v1', onFinish: userOnFinish, onError: userOnError } );
+      streamText( { prompt: 'test@v1' } );
-    const callArgs = aiFns.streamText.mock.calls[0][0];
-    expect( callArgs.onFinish ).not.toBe( userOnFinish );
-    expect( callArgs.onError ).not.toBe( userOnError );
-  } );
-  it( 'streamText: validation failure propagates synchronously', async () => {
-    const validationError = new Error( 'prompt is required' );
-    validators.validateStreamTextArgs.mockImplementationOnce( () => {
-      throw validationError;
+      expect( aiFns.stepCountIs ).not.toHaveBeenCalled();
+      expect( aiFns.streamText ).toHaveBeenCalledWith( {
+        ...textOptions,
+        maxRetries: 0,
+        onFinish: expect.any( Function ),
+        onError: expect.any( Function )
+      } );
     } );
-    const { streamText } = await importSut();
-    expect( () => streamText( { prompt: '' } ) ).toThrow( validationError );
-    expect( aiFns.streamText ).not.toHaveBeenCalled();
-  } );
-  it( 'streamText: trace start event includes correct name and details', async () => {
-    const { streamText } = await importSut();
-    const vars = { topic: 'testing' };
+    it( 'preserves caller-provided stopWhen when tools are prepared', async () => {
+      const { streamText } = await importSut();
+      const stopWhen = { type: 'custom-stop' };
+      promptMocks.prepareTextPrompt.mockReturnValueOnce( {
+        loadedPrompt,
+        tools: { load_skill: { description: 'Load skill' } }
+      } );
-    streamText( { prompt: 'test_prompt@v1', variables: vars } );
+      streamText( { prompt: 'test@v1', stopWhen } );
-    expect( traceMocks.startTrace ).toHaveBeenCalledWith( {
-      name: 'streamText',
-      prompt: 'test_prompt@v1',
-      variables: vars,
-      loadedPrompt: basePrompt
+      expect( aiFns.stepCountIs ).not.toHaveBeenCalled();
+      expect( aiFns.streamText ).toHaveBeenCalledWith( expect.objectContaining( {
+        stopWhen
+      } ) );
     } );
-  } );
-  it( 'streamText: traces error and rethrows when AI.streamText throws synchronously', async () => {
-    const syncError = new Error( 'Invalid model config' );
-    aiFns.streamText.mockImplementation( () => {
-      throw syncError;
+    it( 'traces stream onError events and calls the user callback', async () => {
+      const { streamText } = await importSut();
+      const onError = vi.fn();
+      const error = new Error( 'Stream failed' );
+      const mappedError = new Error( 'Mapped stream failed' );
+      errorMocks.mapAiError.mockReturnValueOnce( mappedError );
+      streamText( { prompt: 'test@v1', onError } );
+      const callOptions = aiFns.streamText.mock.calls[0][0];
+      callOptions.onError( { error } );
+      expect( errorMocks.mapAiError ).toHaveBeenCalledWith( error );
+      expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        error: mappedError
+      } );
+      expect( onError ).toHaveBeenCalledWith( { error: mappedError } );
     } );
-    const { streamText } = await importSut();
-    expect( () => streamText( { prompt: 'test_prompt@v1' } ) ).toThrow( syncError );
-    expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( { traceId: 'trace-id', error: syncError } );
-  } );
-  it( 'streamText: passes variables to prompt loader', async () => {
-    const { streamText } = await importSut();
-    const vars = { name: 'World', count: 5 };
+    it( 'does not pass the raw onFinish or onError callbacks to AI SDK', async () => {
+      const { streamText } = await importSut();
+      const onFinish = vi.fn();
+      const onError = vi.fn();
-    streamText( { prompt: 'test_prompt@v1', variables: vars } );
-    expect( loadPromptImpl ).toHaveBeenCalledWith( 'test_prompt@v1', vars );
-  } );
+      streamText( { prompt: 'test@v1', onFinish, onError } );
+      const callOptions = aiFns.streamText.mock.calls[0][0];
-  it( 'generateText: loads frontmatter skills from prompt config using promptFileDir', async () => {
-    const frontmatterSkill = { name: 'fm_skill', description: 'FM', instructions: '# FM' };
-    loadPromptImpl.mockReturnValue( {
-      ...basePrompt,
-      promptFileDir: '/some/prompt/dir',
-      config: { ...basePrompt.config, skills: [ './skills/' ] }
+      expect( callOptions.onFinish ).not.toBe( onFinish );
+      expect( callOptions.onError ).not.toBe( onError );
     } );
-    loadPromptSkillsImpl.mockReturnValue( [ frontmatterSkill ] );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1' } );
-    expect( loadPromptSkillsImpl ).toHaveBeenCalledWith( [ './skills/' ], '/some/prompt/dir' );
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    expect( callArgs.tools ).toHaveProperty( 'load_skill' );
-  } );
-  it( 'generateText: merges frontmatter skills with caller-provided skills', async () => {
-    const frontmatterSkill = { name: 'fm_skill', description: 'FM', instructions: '# FM' };
-    const callerSkill = { name: 'caller_skill', description: 'Caller', instructions: '# Caller' };
-    loadPromptImpl.mockReturnValue( {
-      ...basePrompt,
-      messages: [ ...basePrompt.messages ],
-      promptFileDir: '/some/prompt/dir',
-      config: { ...basePrompt.config, skills: [ './skills/' ] }
+    it( 'propagates validation errors before loading or tracing', async () => {
+      const validationError = new Error( 'Invalid args' );
+      validators.validateStreamTextArgs.mockImplementationOnce( () => {
+        throw validationError;
+      } );
+      const { streamText } = await importSut();
+      expect( () => streamText( { prompt: '' } ) ).toThrow( validationError );
+      expect( promptMocks.prepareTextPrompt ).not.toHaveBeenCalled();
+      expect( traceMocks.startTrace ).not.toHaveBeenCalled();
+      expect( aiFns.streamText ).not.toHaveBeenCalled();
     } );
-    loadPromptSkillsImpl.mockReturnValue( [ frontmatterSkill ] );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills: [ callerSkill ] } );
-    // Skills system message appended, loadPrompt called only once
-    expect( loadPromptImpl ).toHaveBeenCalledTimes( 1 );
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    const loadSkillResult = callArgs.tools.load_skill.execute( { name: 'caller_skill' } );
-    expect( loadSkillResult ).toBe( '# Caller' );
-  } );
-  it( 'generateText: skips frontmatter skill loading when no config.skills', async () => {
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1' } );
-    expect( loadPromptSkillsImpl ).not.toHaveBeenCalled();
-  } );
-  it( 'generateText: skips frontmatter skill loading when no promptFileDir', async () => {
-    loadPromptImpl.mockReturnValue( {
-      ...basePrompt,
-      config: { ...basePrompt.config, skills: [ './skills/' ] }
-      // no promptFileDir
+    it( 'traces and rethrows synchronous AI SDK errors', async () => {
+      const error = new Error( 'Invalid model' );
+      const mappedError = new Error( 'Mapped invalid model' );
+      aiFns.streamText.mockImplementationOnce( () => {
+        throw error;
+      } );
+      errorMocks.mapAiError.mockReturnValueOnce( mappedError );
+      const { streamText } = await importSut();
+      expect( () => streamText( { prompt: 'test@v1' } ) ).toThrow( mappedError );
+      expect( errorMocks.mapAiError ).toHaveBeenCalledWith( error );
+      expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        error: mappedError
+      } );
     } );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1' } );
-    expect( loadPromptSkillsImpl ).not.toHaveBeenCalled();
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    expect( callArgs.tools ).toBeUndefined();
   } );
-  it( 'generateText: appends skills system message when skills present', async () => {
-    const frontmatterSkill = { name: 'fm_skill', description: 'FM skill', instructions: '# FM' };
-    loadPromptImpl.mockReturnValue( {
-      ...basePrompt,
-      messages: [ ...basePrompt.messages ],
-      promptFileDir: '/dir',
-      config: { ...basePrompt.config, skills: [ './skills/' ] }
+  describe( 'generateImage', () => {
+    it( 'validates, loads prompt, traces, calls AI SDK, and wraps the response', async () => {
+      const { generateImage } = await importSut();
+      const variables = { scene: 'race cars' };
+      const images = [ Buffer.from( 'image-bytes' ) ];
+      const mask = Buffer.from( 'mask-bytes' );
+      const result = await generateImage( {
+        prompt: 'image@v1',
+        variables,
+        promptDir: '/prompts',
+        images,
+        mask,
+        n: 2,
+        providerOptions: { openai: { background: 'transparent' } }
+      } );
+      expect( validators.validateGenerateImageArgs ).toHaveBeenCalledWith( {
+        prompt: 'image@v1',
+        variables,
+        promptDir: '/prompts',
+        images,
+        mask
+      } );
+      expect( promptMocks.loadPrompt ).toHaveBeenCalledWith( 'image@v1', variables, '/prompts' );
+      expect( traceMocks.startTrace ).toHaveBeenCalledWith( {
+        name: 'generateImage',
+        prompt: 'image@v1',
+        variables,
+        loadedPrompt
+      } );
+      expect( optionMocks.loadAiSdkImageOptions ).toHaveBeenCalledWith( {
+        prompt: loadedPrompt,
+        images,
+        mask
+      } );
+      expect( aiFns.generateImage ).toHaveBeenCalledWith( {
+        ...imageOptions,
+        maxRetries: 0,
+        n: 2,
+        providerOptions: { openai: { background: 'transparent' } }
+      } );
+      expect( wrapMocks.wrapImageResponse ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        modelId: 'test-model',
+        response: imageResponse
+      } );
+      expect( result ).toEqual( { wrapped: imageResponse } );
     } );
-    loadPromptSkillsImpl.mockReturnValue( [ frontmatterSkill ] );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', variables: { topic: 'AI' } } );
-    // Single loadPrompt call — no two-pass render
-    expect( loadPromptImpl ).toHaveBeenCalledTimes( 1 );
-    // Skills system message inserted into messages
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    const skillsMsg = callArgs.messages.find( m => m.role === 'system' && m.content.includes( 'fm_skill' ) );
-    expect( skillsMsg ).toBeDefined();
-  } );
-  it( 'generateText: appends skills message and load_skill tool when skills provided', async () => {
-    const skills = [
-      { name: 'research', description: 'Research approach', instructions: '# Research\nDo research' }
-    ];
-    loadPromptImpl.mockReturnValue( { ...basePrompt, messages: [ ...basePrompt.messages ] } );
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills } );
-    expect( loadPromptImpl ).toHaveBeenCalledTimes( 1 );
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    expect( callArgs.tools ).toHaveProperty( 'load_skill' );
-    const skillsMsg = callArgs.messages.find( m => m.role === 'system' && m.content.includes( 'research' ) );
-    expect( skillsMsg ).toBeDefined();
-  } );
-  it( 'generateText: does not inject _system_skills or load_skill when skills is empty', async () => {
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills: [] } );
-    expect( loadPromptImpl ).toHaveBeenCalledWith( 'test_prompt@v1', undefined, undefined );
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    expect( callArgs.tools ).toBeUndefined();
-    expect( callArgs.stopWhen ).toBeUndefined();
-  } );
-  it( 'generateText: load_skill execute returns instructions for known skill', async () => {
-    const skills = [
-      { name: 'research', description: 'Research', instructions: '# Research\nDetailed steps' }
-    ];
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills } );
-    const { tools } = aiFns.generateText.mock.calls[0][0];
-    const result = tools.load_skill.execute( { name: 'research' } );
-    expect( result ).toBe( '# Research\nDetailed steps' );
-  } );
-  it( 'generateText: load_skill execute returns error for unknown skill', async () => {
-    const skills = [
-      { name: 'research', description: 'Research', instructions: '# Research' }
-    ];
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills } );
-    const { tools } = aiFns.generateText.mock.calls[0][0];
-    const result = tools.load_skill.execute( { name: 'unknown' } );
-    expect( result ).toMatch( /not found/ );
-    expect( result ).toContain( 'research' );
-  } );
-  it( 'generateText: sets stopWhen via maxSteps when skills present', async () => {
-    const skills = [ { name: 'skill', description: 'A skill', instructions: '# Skill' } ];
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills, maxSteps: 5 } );
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( { stopWhen: { type: 'stepCount', count: 5 } } )
-    );
-  } );
-  it( 'generateText: defaults maxSteps to 10 when skills present', async () => {
-    const skills = [ { name: 'skill', description: 'A skill', instructions: '# Skill' } ];
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills } );
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( { stopWhen: { type: 'stepCount', count: 10 } } )
-    );
-  } );
-  it( 'generateText: merges skill tools with user-provided tools', async () => {
-    const skills = [ { name: 'skill', description: 'A skill', instructions: '# Skill' } ];
-    const userTools = { calculator: { description: 'A calculator' } };
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills, tools: userTools } );
-    const { tools } = aiFns.generateText.mock.calls[0][0];
-    expect( tools ).toHaveProperty( 'load_skill' );
-    expect( tools ).toHaveProperty( 'calculator' );
-  } );
-  it( 'generateText: calls skill function with variables and uses resolved skills', async () => {
-    const resolvedSkill = { name: 'dynamic', description: 'Dynamic skill', instructions: '# Dynamic' };
-    const skillsFn = vi.fn().mockResolvedValue( [ resolvedSkill ] );
-    const vars = { topic: 'AI' };
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', variables: vars, skills: skillsFn } );
-    expect( skillsFn ).toHaveBeenCalledWith( vars );
-    expect( loadPromptImpl ).toHaveBeenCalledTimes( 1 );
-    const callArgs = aiFns.generateText.mock.calls[0][0];
-    expect( callArgs.tools ).toHaveProperty( 'load_skill' );
-    const skillsMsg = callArgs.messages.find( m => m.role === 'system' && m.content.includes( 'dynamic' ) );
-    expect( skillsMsg ).toBeDefined();
-  } );
+    it( 'supports text-to-image calls without images or mask', async () => {
+      const { generateImage } = await importSut();
+      await generateImage( { prompt: 'image@v1' } );
+      expect( validators.validateGenerateImageArgs ).toHaveBeenCalledWith( {
+        prompt: 'image@v1',
+        variables: undefined,
+        promptDir: undefined,
+        images: undefined,
+        mask: undefined
+      } );
+      expect( optionMocks.loadAiSdkImageOptions ).toHaveBeenCalledWith( {
+        prompt: loadedPrompt,
+        images: undefined,
+        mask: undefined
+      } );
+    } );
-  it( 'generateText: preserves caller stopWhen when skills present', async () => {
-    const skills = [ { name: 'skill', description: 'A skill', instructions: '# Skill' } ];
-    const customStop = { type: 'custom' };
-    const { generateText } = await importSut();
-    await generateText( { prompt: 'test_prompt@v1', skills, stopWhen: customStop } );
+    it( 'propagates validation errors before loading or tracing', async () => {
+      const validationError = new Error( 'Invalid image args' );
+      validators.validateGenerateImageArgs.mockImplementationOnce( () => {
+        throw validationError;
+      } );
+      const { generateImage } = await importSut();
+      await expect( generateImage( { prompt: '' } ) ).rejects.toThrow( validationError );
+      expect( promptMocks.loadPrompt ).not.toHaveBeenCalled();
+      expect( traceMocks.startTrace ).not.toHaveBeenCalled();
+      expect( aiFns.generateImage ).not.toHaveBeenCalled();
+    } );
-    expect( aiFns.generateText ).toHaveBeenCalledWith(
-      expect.objectContaining( { stopWhen: customStop } )
-    );
+    it( 'traces and rethrows AI SDK errors', async () => {
+      const error = new Error( 'Image provider failed' );
+      const mappedError = new Error( 'Mapped image provider failed' );
+      aiFns.generateImage.mockRejectedValueOnce( error );
+      errorMocks.mapAiError.mockReturnValueOnce( mappedError );
+      const { generateImage } = await importSut();
+      await expect( generateImage( { prompt: 'image@v1' } ) ).rejects.toThrow( mappedError );
+      expect( errorMocks.mapAiError ).toHaveBeenCalledWith( error );
+      expect( traceMocks.endTraceWithError ).toHaveBeenCalledWith( {
+        traceId: 'trace-id',
+        error: mappedError
+      } );
+    } );
   } );
 } );