@ai-sdk/xai 0.0.0-64aae7dd-20260114144918 → 0.0.0-98261322-20260122142521

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47)
  1. package/CHANGELOG.md +64 -5
  2. package/dist/index.js +1 -1
  3. package/dist/index.mjs +1 -1
  4. package/docs/01-xai.mdx +697 -0
  5. package/package.json +11 -6
  6. package/src/convert-to-xai-chat-messages.test.ts +243 -0
  7. package/src/convert-to-xai-chat-messages.ts +142 -0
  8. package/src/convert-xai-chat-usage.test.ts +240 -0
  9. package/src/convert-xai-chat-usage.ts +23 -0
  10. package/src/get-response-metadata.ts +19 -0
  11. package/src/index.ts +14 -0
  12. package/src/map-xai-finish-reason.ts +19 -0
  13. package/src/responses/__fixtures__/xai-code-execution-tool.1.json +68 -0
  14. package/src/responses/__fixtures__/xai-text-streaming.1.chunks.txt +698 -0
  15. package/src/responses/__fixtures__/xai-text-with-reasoning-streaming-store-false.1.chunks.txt +655 -0
  16. package/src/responses/__fixtures__/xai-text-with-reasoning-streaming.1.chunks.txt +679 -0
  17. package/src/responses/__fixtures__/xai-web-search-tool.1.chunks.txt +274 -0
  18. package/src/responses/__fixtures__/xai-web-search-tool.1.json +90 -0
  19. package/src/responses/__fixtures__/xai-x-search-tool.1.json +149 -0
  20. package/src/responses/__fixtures__/xai-x-search-tool.chunks.txt +1757 -0
  21. package/src/responses/__snapshots__/xai-responses-language-model.test.ts.snap +21929 -0
  22. package/src/responses/convert-to-xai-responses-input.test.ts +463 -0
  23. package/src/responses/convert-to-xai-responses-input.ts +206 -0
  24. package/src/responses/convert-xai-responses-usage.ts +24 -0
  25. package/src/responses/map-xai-responses-finish-reason.ts +20 -0
  26. package/src/responses/xai-responses-api.ts +393 -0
  27. package/src/responses/xai-responses-language-model.test.ts +1803 -0
  28. package/src/responses/xai-responses-language-model.ts +732 -0
  29. package/src/responses/xai-responses-options.ts +34 -0
  30. package/src/responses/xai-responses-prepare-tools.test.ts +497 -0
  31. package/src/responses/xai-responses-prepare-tools.ts +226 -0
  32. package/src/tool/code-execution.ts +17 -0
  33. package/src/tool/index.ts +15 -0
  34. package/src/tool/view-image.ts +20 -0
  35. package/src/tool/view-x-video.ts +18 -0
  36. package/src/tool/web-search.ts +56 -0
  37. package/src/tool/x-search.ts +63 -0
  38. package/src/version.ts +6 -0
  39. package/src/xai-chat-language-model.test.ts +1805 -0
  40. package/src/xai-chat-language-model.ts +681 -0
  41. package/src/xai-chat-options.ts +131 -0
  42. package/src/xai-chat-prompt.ts +44 -0
  43. package/src/xai-error.ts +19 -0
  44. package/src/xai-image-settings.ts +1 -0
  45. package/src/xai-prepare-tools.ts +95 -0
  46. package/src/xai-provider.test.ts +167 -0
  47. package/src/xai-provider.ts +162 -0
@@ -0,0 +1,1805 @@
1
+ import { LanguageModelV3Prompt } from '@ai-sdk/provider';
2
+ import { describe, it, expect, vi } from 'vitest';
3
+ import { createTestServer } from '@ai-sdk/test-server/with-vitest';
4
+ import { convertReadableStreamToArray } from '@ai-sdk/provider-utils/test';
5
+ import { XaiChatLanguageModel } from './xai-chat-language-model';
6
+ import { createXai } from './xai-provider';
7
+
8
+ const TEST_PROMPT: LanguageModelV3Prompt = [
9
+ { role: 'user', content: [{ type: 'text', text: 'Hello' }] },
10
+ ];
11
+
12
+ vi.mock('./version', () => ({
13
+ VERSION: '0.0.0-test',
14
+ }));
15
+
16
+ const testConfig = {
17
+ provider: 'xai.chat',
18
+ baseURL: 'https://api.x.ai/v1',
19
+ headers: () => ({ authorization: 'Bearer test-api-key' }),
20
+ generateId: () => 'test-id',
21
+ };
22
+
23
+ const model = new XaiChatLanguageModel('grok-beta', testConfig);
24
+
25
+ const server = createTestServer({
26
+ 'https://api.x.ai/v1/chat/completions': {},
27
+ });
28
+
29
+ describe('XaiChatLanguageModel', () => {
30
+ it('should be instantiated correctly', () => {
31
+ expect(model.modelId).toBe('grok-beta');
32
+ expect(model.provider).toBe('xai.chat');
33
+ expect(model.specificationVersion).toBe('v3');
34
+ });
35
+
36
+ it('should have supported URLs', () => {
37
+ expect(model.supportedUrls).toEqual({
38
+ 'image/*': [/^https?:\/\/.*$/],
39
+ });
40
+ });
41
+
42
+ describe('doGenerate', () => {
43
+ function prepareJsonResponse({
44
+ content = '',
45
+ usage = {
46
+ prompt_tokens: 4,
47
+ total_tokens: 34,
48
+ completion_tokens: 30,
49
+ },
50
+ id = 'chatcmpl-test-id',
51
+ created = 1699472111,
52
+ model = 'grok-beta',
53
+ headers,
54
+ }: {
55
+ content?: string;
56
+ usage?: {
57
+ prompt_tokens: number;
58
+ total_tokens: number;
59
+ completion_tokens: number;
60
+ };
61
+ id?: string;
62
+ created?: number;
63
+ model?: string;
64
+ headers?: Record<string, string>;
65
+ }) {
66
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
67
+ type: 'json-value',
68
+ headers,
69
+ body: {
70
+ id,
71
+ object: 'chat.completion',
72
+ created,
73
+ model,
74
+ choices: [
75
+ {
76
+ index: 0,
77
+ message: {
78
+ role: 'assistant',
79
+ content,
80
+ tool_calls: null,
81
+ },
82
+ finish_reason: 'stop',
83
+ },
84
+ ],
85
+ usage,
86
+ },
87
+ };
88
+ }
89
+
90
+ it('should extract text content', async () => {
91
+ prepareJsonResponse({ content: 'Hello, World!' });
92
+
93
+ const { content } = await model.doGenerate({
94
+ prompt: TEST_PROMPT,
95
+ });
96
+
97
+ expect(content).toMatchInlineSnapshot(`
98
+ [
99
+ {
100
+ "text": "Hello, World!",
101
+ "type": "text",
102
+ },
103
+ ]
104
+ `);
105
+ });
106
+
107
+ it('should avoid duplication when there is a trailing assistant message', async () => {
108
+ prepareJsonResponse({ content: 'prefix and more content' });
109
+
110
+ const { content } = await model.doGenerate({
111
+ prompt: [
112
+ { role: 'user', content: [{ type: 'text', text: 'Hello' }] },
113
+ {
114
+ role: 'assistant',
115
+ content: [{ type: 'text', text: 'prefix ' }],
116
+ },
117
+ ],
118
+ });
119
+
120
+ expect(content).toMatchInlineSnapshot(`
121
+ [
122
+ {
123
+ "text": "prefix and more content",
124
+ "type": "text",
125
+ },
126
+ ]
127
+ `);
128
+ });
129
+
130
+ it('should extract tool call content', async () => {
131
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
132
+ type: 'json-value',
133
+ body: {
134
+ id: 'chatcmpl-test-tool-call',
135
+ object: 'chat.completion',
136
+ created: 1699472111,
137
+ model: 'grok-beta',
138
+ choices: [
139
+ {
140
+ index: 0,
141
+ message: {
142
+ role: 'assistant',
143
+ content: null,
144
+ tool_calls: [
145
+ {
146
+ id: 'call_test123',
147
+ type: 'function',
148
+ function: {
149
+ name: 'weatherTool',
150
+ arguments: '{"location": "paris"}',
151
+ },
152
+ },
153
+ ],
154
+ },
155
+ finish_reason: 'tool_calls',
156
+ },
157
+ ],
158
+ usage: {
159
+ prompt_tokens: 124,
160
+ total_tokens: 146,
161
+ completion_tokens: 22,
162
+ },
163
+ },
164
+ };
165
+
166
+ const { content } = await model.doGenerate({
167
+ prompt: TEST_PROMPT,
168
+ });
169
+
170
+ expect(content).toMatchInlineSnapshot(`
171
+ [
172
+ {
173
+ "input": "{"location": "paris"}",
174
+ "toolCallId": "call_test123",
175
+ "toolName": "weatherTool",
176
+ "type": "tool-call",
177
+ },
178
+ ]
179
+ `);
180
+ });
181
+
182
+ it('should extract usage', async () => {
183
+ prepareJsonResponse({
184
+ usage: { prompt_tokens: 20, total_tokens: 25, completion_tokens: 5 },
185
+ });
186
+
187
+ const { usage } = await model.doGenerate({
188
+ prompt: TEST_PROMPT,
189
+ });
190
+
191
+ expect(usage).toMatchInlineSnapshot(`
192
+ {
193
+ "inputTokens": {
194
+ "cacheRead": 0,
195
+ "cacheWrite": undefined,
196
+ "noCache": 20,
197
+ "total": 20,
198
+ },
199
+ "outputTokens": {
200
+ "reasoning": 0,
201
+ "text": 5,
202
+ "total": 5,
203
+ },
204
+ "raw": {
205
+ "completion_tokens": 5,
206
+ "prompt_tokens": 20,
207
+ "total_tokens": 25,
208
+ },
209
+ }
210
+ `);
211
+ });
212
+
213
+ it('should send additional response information', async () => {
214
+ prepareJsonResponse({
215
+ id: 'test-id',
216
+ created: 123,
217
+ model: 'test-model',
218
+ });
219
+
220
+ const { response } = await model.doGenerate({
221
+ prompt: TEST_PROMPT,
222
+ });
223
+
224
+ expect({
225
+ id: response?.id,
226
+ timestamp: response?.timestamp,
227
+ modelId: response?.modelId,
228
+ }).toStrictEqual({
229
+ id: 'test-id',
230
+ timestamp: new Date(123 * 1000),
231
+ modelId: 'test-model',
232
+ });
233
+ });
234
+
235
+ it('should expose the raw response headers', async () => {
236
+ prepareJsonResponse({
237
+ headers: { 'test-header': 'test-value' },
238
+ });
239
+
240
+ const { response } = await model.doGenerate({
241
+ prompt: TEST_PROMPT,
242
+ });
243
+
244
+ expect(response?.headers).toStrictEqual({
245
+ // default headers:
246
+ 'content-length': '271',
247
+ 'content-type': 'application/json',
248
+
249
+ // custom header
250
+ 'test-header': 'test-value',
251
+ });
252
+ });
253
+
254
+ it('should pass the model and the messages', async () => {
255
+ prepareJsonResponse({ content: '' });
256
+
257
+ await model.doGenerate({
258
+ prompt: TEST_PROMPT,
259
+ });
260
+
261
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
262
+ model: 'grok-beta',
263
+ messages: [{ role: 'user', content: 'Hello' }],
264
+ });
265
+ });
266
+
267
+ it('should pass tools and toolChoice', async () => {
268
+ prepareJsonResponse({ content: '' });
269
+
270
+ await model.doGenerate({
271
+ tools: [
272
+ {
273
+ type: 'function',
274
+ name: 'test-tool',
275
+ inputSchema: {
276
+ type: 'object',
277
+ properties: { value: { type: 'string' } },
278
+ required: ['value'],
279
+ additionalProperties: false,
280
+ $schema: 'http://json-schema.org/draft-07/schema#',
281
+ },
282
+ },
283
+ ],
284
+ toolChoice: {
285
+ type: 'tool',
286
+ toolName: 'test-tool',
287
+ },
288
+ prompt: TEST_PROMPT,
289
+ });
290
+
291
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
292
+ model: 'grok-beta',
293
+ messages: [{ role: 'user', content: 'Hello' }],
294
+ tools: [
295
+ {
296
+ type: 'function',
297
+ function: {
298
+ name: 'test-tool',
299
+ parameters: {
300
+ type: 'object',
301
+ properties: { value: { type: 'string' } },
302
+ required: ['value'],
303
+ additionalProperties: false,
304
+ $schema: 'http://json-schema.org/draft-07/schema#',
305
+ },
306
+ },
307
+ },
308
+ ],
309
+ tool_choice: {
310
+ type: 'function',
311
+ function: { name: 'test-tool' },
312
+ },
313
+ });
314
+ });
315
+
316
+ it('should pass parallel_function_calling provider option', async () => {
317
+ prepareJsonResponse({ content: '' });
318
+
319
+ await model.doGenerate({
320
+ prompt: TEST_PROMPT,
321
+ providerOptions: {
322
+ xai: {
323
+ parallel_function_calling: false,
324
+ },
325
+ },
326
+ });
327
+
328
+ expect(await server.calls[0].requestBodyJson).toMatchObject({
329
+ model: 'grok-beta',
330
+ messages: [{ role: 'user', content: 'Hello' }],
331
+ parallel_function_calling: false,
332
+ });
333
+ });
334
+
335
+ it('should pass headers', async () => {
336
+ prepareJsonResponse({ content: '' });
337
+
338
+ const modelWithHeaders = new XaiChatLanguageModel('grok-beta', {
339
+ provider: 'xai.chat',
340
+ baseURL: 'https://api.x.ai/v1',
341
+ headers: () => ({
342
+ authorization: 'Bearer test-api-key',
343
+ 'Custom-Provider-Header': 'provider-header-value',
344
+ }),
345
+
346
+ generateId: () => 'test-id',
347
+ });
348
+
349
+ await modelWithHeaders.doGenerate({
350
+ prompt: TEST_PROMPT,
351
+ headers: {
352
+ 'Custom-Request-Header': 'request-header-value',
353
+ },
354
+ });
355
+
356
+ const requestHeaders = server.calls[0].requestHeaders;
357
+
358
+ expect(requestHeaders).toStrictEqual({
359
+ authorization: 'Bearer test-api-key',
360
+ 'content-type': 'application/json',
361
+ 'custom-provider-header': 'provider-header-value',
362
+ 'custom-request-header': 'request-header-value',
363
+ });
364
+ });
365
+
366
+ it('should include provider user agent when using createXai', async () => {
367
+ prepareJsonResponse({ content: '' });
368
+
369
+ const xai = createXai({
370
+ apiKey: 'test-api-key',
371
+ headers: { 'Custom-Provider-Header': 'provider-header-value' },
372
+ });
373
+
374
+ const modelWithHeaders = xai.chat('grok-beta');
375
+
376
+ await modelWithHeaders.doGenerate({
377
+ prompt: TEST_PROMPT,
378
+ headers: { 'Custom-Request-Header': 'request-header-value' },
379
+ });
380
+
381
+ expect(server.calls[0].requestUserAgent).toContain(
382
+ `ai-sdk/xai/0.0.0-test`,
383
+ );
384
+ });
385
+
386
+ it('should send request body', async () => {
387
+ prepareJsonResponse({ content: '' });
388
+
389
+ const { request } = await model.doGenerate({
390
+ prompt: TEST_PROMPT,
391
+ });
392
+
393
+ expect(request).toMatchInlineSnapshot(`
394
+ {
395
+ "body": {
396
+ "max_completion_tokens": undefined,
397
+ "messages": [
398
+ {
399
+ "content": "Hello",
400
+ "role": "user",
401
+ },
402
+ ],
403
+ "model": "grok-beta",
404
+ "parallel_function_calling": undefined,
405
+ "reasoning_effort": undefined,
406
+ "response_format": undefined,
407
+ "search_parameters": undefined,
408
+ "seed": undefined,
409
+ "temperature": undefined,
410
+ "tool_choice": undefined,
411
+ "tools": undefined,
412
+ "top_p": undefined,
413
+ },
414
+ }
415
+ `);
416
+ });
417
+
418
+ it('should pass search parameters', async () => {
419
+ prepareJsonResponse({ content: '' });
420
+
421
+ await model.doGenerate({
422
+ prompt: TEST_PROMPT,
423
+ providerOptions: {
424
+ xai: {
425
+ searchParameters: {
426
+ mode: 'auto',
427
+ returnCitations: true,
428
+ fromDate: '2024-01-01',
429
+ toDate: '2024-12-31',
430
+ maxSearchResults: 10,
431
+ },
432
+ },
433
+ },
434
+ });
435
+
436
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
437
+ model: 'grok-beta',
438
+ messages: [{ role: 'user', content: 'Hello' }],
439
+ search_parameters: {
440
+ mode: 'auto',
441
+ return_citations: true,
442
+ from_date: '2024-01-01',
443
+ to_date: '2024-12-31',
444
+ max_search_results: 10,
445
+ },
446
+ });
447
+ });
448
+
449
+ it('should pass search parameters with sources array', async () => {
450
+ prepareJsonResponse({ content: '' });
451
+
452
+ await model.doGenerate({
453
+ prompt: TEST_PROMPT,
454
+ providerOptions: {
455
+ xai: {
456
+ searchParameters: {
457
+ mode: 'on',
458
+ sources: [
459
+ {
460
+ type: 'web',
461
+ country: 'US',
462
+ excludedWebsites: ['example.com'],
463
+ safeSearch: false,
464
+ },
465
+ {
466
+ type: 'x',
467
+ includedXHandles: ['grok'],
468
+ excludedXHandles: ['openai'],
469
+ postFavoriteCount: 5,
470
+ postViewCount: 50,
471
+ },
472
+ {
473
+ type: 'news',
474
+ country: 'GB',
475
+ },
476
+ {
477
+ type: 'rss',
478
+ links: ['https://status.x.ai/feed.xml'],
479
+ },
480
+ ],
481
+ },
482
+ },
483
+ },
484
+ });
485
+
486
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
487
+ model: 'grok-beta',
488
+ messages: [{ role: 'user', content: 'Hello' }],
489
+ search_parameters: {
490
+ mode: 'on',
491
+ sources: [
492
+ {
493
+ type: 'web',
494
+ country: 'US',
495
+ excluded_websites: ['example.com'],
496
+ safe_search: false,
497
+ },
498
+ {
499
+ type: 'x',
500
+ included_x_handles: ['grok'],
501
+ excluded_x_handles: ['openai'],
502
+ post_favorite_count: 5,
503
+ post_view_count: 50,
504
+ },
505
+ {
506
+ type: 'news',
507
+ country: 'GB',
508
+ },
509
+ {
510
+ type: 'rss',
511
+ links: ['https://status.x.ai/feed.xml'],
512
+ },
513
+ ],
514
+ },
515
+ });
516
+ });
517
+
518
+ it('should extract content when message content is a content object', async () => {
519
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
520
+ type: 'json-value',
521
+ body: {
522
+ id: 'object-id',
523
+ object: 'chat.completion',
524
+ created: 1699472111,
525
+ model: 'grok-beta',
526
+ choices: [
527
+ {
528
+ index: 0,
529
+ message: {
530
+ role: 'assistant',
531
+ content: 'Hello from object',
532
+ tool_calls: null,
533
+ },
534
+ finish_reason: 'stop',
535
+ },
536
+ ],
537
+ usage: { prompt_tokens: 4, total_tokens: 34, completion_tokens: 30 },
538
+ },
539
+ };
540
+
541
+ const { content } = await model.doGenerate({
542
+ prompt: TEST_PROMPT,
543
+ });
544
+
545
+ expect(content).toMatchInlineSnapshot(`
546
+ [
547
+ {
548
+ "text": "Hello from object",
549
+ "type": "text",
550
+ },
551
+ ]
552
+ `);
553
+ });
554
+
555
+ it('should extract citations as sources', async () => {
556
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
557
+ type: 'json-value',
558
+ body: {
559
+ id: 'citations-test',
560
+ object: 'chat.completion',
561
+ created: 1699472111,
562
+ model: 'grok-beta',
563
+ choices: [
564
+ {
565
+ index: 0,
566
+ message: {
567
+ role: 'assistant',
568
+ content: 'Here are the latest developments in AI.',
569
+ tool_calls: null,
570
+ },
571
+ finish_reason: 'stop',
572
+ },
573
+ ],
574
+ usage: { prompt_tokens: 4, total_tokens: 34, completion_tokens: 30 },
575
+ citations: [
576
+ 'https://example.com/article1',
577
+ 'https://example.com/article2',
578
+ ],
579
+ },
580
+ };
581
+
582
+ const { content } = await model.doGenerate({
583
+ prompt: TEST_PROMPT,
584
+ providerOptions: {
585
+ xai: {
586
+ searchParameters: {
587
+ mode: 'auto',
588
+ returnCitations: true,
589
+ },
590
+ },
591
+ },
592
+ });
593
+
594
+ expect(content).toMatchInlineSnapshot(`
595
+ [
596
+ {
597
+ "text": "Here are the latest developments in AI.",
598
+ "type": "text",
599
+ },
600
+ {
601
+ "id": "test-id",
602
+ "sourceType": "url",
603
+ "type": "source",
604
+ "url": "https://example.com/article1",
605
+ },
606
+ {
607
+ "id": "test-id",
608
+ "sourceType": "url",
609
+ "type": "source",
610
+ "url": "https://example.com/article2",
611
+ },
612
+ ]
613
+ `);
614
+ });
615
+
616
+ it('should handle complex search parameter combinations', async () => {
617
+ prepareJsonResponse({
618
+ content: 'Research results from multiple sources',
619
+ });
620
+
621
+ await model.doGenerate({
622
+ prompt: TEST_PROMPT,
623
+ providerOptions: {
624
+ xai: {
625
+ searchParameters: {
626
+ mode: 'on',
627
+ returnCitations: true,
628
+ fromDate: '2024-01-01',
629
+ toDate: '2024-12-31',
630
+ maxSearchResults: 15,
631
+ sources: [
632
+ {
633
+ type: 'web',
634
+ country: 'US',
635
+ allowedWebsites: ['arxiv.org', 'nature.com'],
636
+ safeSearch: true,
637
+ },
638
+ {
639
+ type: 'news',
640
+ country: 'GB',
641
+ excludedWebsites: ['tabloid.com'],
642
+ },
643
+ {
644
+ type: 'x',
645
+ includedXHandles: ['openai', 'deepmind'],
646
+ excludedXHandles: ['grok'],
647
+ postFavoriteCount: 10,
648
+ postViewCount: 100,
649
+ },
650
+ ],
651
+ },
652
+ },
653
+ },
654
+ });
655
+
656
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
657
+ model: 'grok-beta',
658
+ messages: [{ role: 'user', content: 'Hello' }],
659
+ search_parameters: {
660
+ mode: 'on',
661
+ return_citations: true,
662
+ from_date: '2024-01-01',
663
+ to_date: '2024-12-31',
664
+ max_search_results: 15,
665
+ sources: [
666
+ {
667
+ type: 'web',
668
+ country: 'US',
669
+ allowed_websites: ['arxiv.org', 'nature.com'],
670
+ safe_search: true,
671
+ },
672
+ {
673
+ type: 'news',
674
+ country: 'GB',
675
+ excluded_websites: ['tabloid.com'],
676
+ },
677
+ {
678
+ type: 'x',
679
+ included_x_handles: ['openai', 'deepmind'],
680
+ excluded_x_handles: ['grok'],
681
+ post_favorite_count: 10,
682
+ post_view_count: 100,
683
+ },
684
+ ],
685
+ },
686
+ });
687
+ });
688
+
689
+ it('should handle empty citations array', async () => {
690
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
691
+ type: 'json-value',
692
+ body: {
693
+ id: 'no-citations-test',
694
+ object: 'chat.completion',
695
+ created: 1699472111,
696
+ model: 'grok-beta',
697
+ choices: [
698
+ {
699
+ index: 0,
700
+ message: {
701
+ role: 'assistant',
702
+ content: 'Response without citations.',
703
+ tool_calls: null,
704
+ },
705
+ finish_reason: 'stop',
706
+ },
707
+ ],
708
+ usage: { prompt_tokens: 4, total_tokens: 34, completion_tokens: 30 },
709
+ citations: [],
710
+ },
711
+ };
712
+
713
+ const { content } = await model.doGenerate({
714
+ prompt: TEST_PROMPT,
715
+ providerOptions: {
716
+ xai: {
717
+ searchParameters: {
718
+ mode: 'auto',
719
+ returnCitations: true,
720
+ },
721
+ },
722
+ },
723
+ });
724
+
725
+ expect(content).toMatchInlineSnapshot(`
726
+ [
727
+ {
728
+ "text": "Response without citations.",
729
+ "type": "text",
730
+ },
731
+ ]
732
+ `);
733
+ });
734
+
735
+ it('should support json schema response format without warnings', async () => {
736
+ prepareJsonResponse({ content: '{"name":"john doe"}' });
737
+
738
+ const { warnings } = await model.doGenerate({
739
+ prompt: TEST_PROMPT,
740
+ responseFormat: {
741
+ type: 'json',
742
+ schema: {
743
+ type: 'object',
744
+ properties: {
745
+ name: { type: 'string' },
746
+ },
747
+ required: ['name'],
748
+ additionalProperties: false,
749
+ },
750
+ },
751
+ });
752
+
753
+ expect(warnings).toEqual([]);
754
+ });
755
+
756
+ it('should send json schema in response format', async () => {
757
+ prepareJsonResponse({ content: '{"name":"john"}' });
758
+
759
+ await model.doGenerate({
760
+ prompt: TEST_PROMPT,
761
+ responseFormat: {
762
+ type: 'json',
763
+ name: 'person',
764
+ schema: {
765
+ type: 'object',
766
+ properties: {
767
+ name: { type: 'string' },
768
+ },
769
+ required: ['name'],
770
+ },
771
+ },
772
+ });
773
+
774
+ expect(await server.calls[0].requestBodyJson).toMatchObject({
775
+ model: 'grok-beta',
776
+ response_format: {
777
+ type: 'json_schema',
778
+ json_schema: {
779
+ name: 'person',
780
+ schema: {
781
+ type: 'object',
782
+ properties: {
783
+ name: { type: 'string' },
784
+ },
785
+ required: ['name'],
786
+ },
787
+ strict: true,
788
+ },
789
+ },
790
+ });
791
+ });
792
+ });
793
+
794
+ describe('doStream', () => {
795
+ function prepareStreamResponse({
796
+ content,
797
+ headers,
798
+ }: {
799
+ content: string[];
800
+ headers?: Record<string, string>;
801
+ }) {
802
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
803
+ type: 'stream-chunks',
804
+ headers,
805
+ chunks: [
806
+ `data: {"id":"35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe","object":"chat.completion.chunk",` +
807
+ `"created":1750537778,"model":"grok-beta","choices":[{"index":0,` +
808
+ `"delta":{"role":"assistant","content":""},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
809
+ ...content.map(text => {
810
+ return (
811
+ `data: {"id":"35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe","object":"chat.completion.chunk",` +
812
+ `"created":1750537778,"model":"grok-beta","choices":[{"index":0,` +
813
+ `"delta":{"role":"assistant","content":"${text}"},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`
814
+ );
815
+ }),
816
+ `data: {"id":"35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe","object":"chat.completion.chunk",` +
817
+ `"created":1750537778,"model":"grok-beta","choices":[{"index":0,` +
818
+ `"delta":{"content":""},"finish_reason":"stop"}],` +
819
+ `"usage":{"prompt_tokens":4,"total_tokens":36,"completion_tokens":32},"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
820
+ `data: [DONE]\n\n`,
821
+ ],
822
+ };
823
+ }
824
+
825
+ it('should stream text deltas', async () => {
826
+ prepareStreamResponse({ content: ['Hello', ', ', 'world!'] });
827
+
828
+ const { stream } = await model.doStream({
829
+ prompt: TEST_PROMPT,
830
+ includeRawChunks: false,
831
+ });
832
+
833
+ expect(await convertReadableStreamToArray(stream)).toMatchInlineSnapshot(`
834
+ [
835
+ {
836
+ "type": "stream-start",
837
+ "warnings": [],
838
+ },
839
+ {
840
+ "id": "35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
841
+ "modelId": "grok-beta",
842
+ "timestamp": 2025-06-21T20:29:38.000Z,
843
+ "type": "response-metadata",
844
+ },
845
+ {
846
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
847
+ "type": "text-start",
848
+ },
849
+ {
850
+ "delta": "Hello",
851
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
852
+ "type": "text-delta",
853
+ },
854
+ {
855
+ "delta": ", ",
856
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
857
+ "type": "text-delta",
858
+ },
859
+ {
860
+ "delta": "world!",
861
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
862
+ "type": "text-delta",
863
+ },
864
+ {
865
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
866
+ "type": "text-end",
867
+ },
868
+ {
869
+ "finishReason": {
870
+ "raw": "stop",
871
+ "unified": "stop",
872
+ },
873
+ "type": "finish",
874
+ "usage": {
875
+ "inputTokens": {
876
+ "cacheRead": 0,
877
+ "cacheWrite": undefined,
878
+ "noCache": 4,
879
+ "total": 4,
880
+ },
881
+ "outputTokens": {
882
+ "reasoning": 0,
883
+ "text": 32,
884
+ "total": 32,
885
+ },
886
+ "raw": {
887
+ "completion_tokens": 32,
888
+ "prompt_tokens": 4,
889
+ "total_tokens": 36,
890
+ },
891
+ },
892
+ },
893
+ ]
894
+ `);
895
+ });
896
+
897
+ it('should avoid duplication when there is a trailing assistant message', async () => {
898
+ prepareStreamResponse({ content: ['prefix', ' and', ' more content'] });
899
+
900
+ const { stream } = await model.doStream({
901
+ prompt: [
902
+ { role: 'user', content: [{ type: 'text', text: 'Hello' }] },
903
+ {
904
+ role: 'assistant',
905
+ content: [{ type: 'text', text: 'prefix ' }],
906
+ },
907
+ ],
908
+ includeRawChunks: false,
909
+ });
910
+
911
+ expect(await convertReadableStreamToArray(stream)).toMatchInlineSnapshot(`
912
+ [
913
+ {
914
+ "type": "stream-start",
915
+ "warnings": [],
916
+ },
917
+ {
918
+ "id": "35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
919
+ "modelId": "grok-beta",
920
+ "timestamp": 2025-06-21T20:29:38.000Z,
921
+ "type": "response-metadata",
922
+ },
923
+ {
924
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
925
+ "type": "text-start",
926
+ },
927
+ {
928
+ "delta": "prefix",
929
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
930
+ "type": "text-delta",
931
+ },
932
+ {
933
+ "delta": " and",
934
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
935
+ "type": "text-delta",
936
+ },
937
+ {
938
+ "delta": " more content",
939
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
940
+ "type": "text-delta",
941
+ },
942
+ {
943
+ "id": "text-35e18f56-4ec6-48e4-8ca0-c1c4cbeeebbe",
944
+ "type": "text-end",
945
+ },
946
+ {
947
+ "finishReason": {
948
+ "raw": "stop",
949
+ "unified": "stop",
950
+ },
951
+ "type": "finish",
952
+ "usage": {
953
+ "inputTokens": {
954
+ "cacheRead": 0,
955
+ "cacheWrite": undefined,
956
+ "noCache": 4,
957
+ "total": 4,
958
+ },
959
+ "outputTokens": {
960
+ "reasoning": 0,
961
+ "text": 32,
962
+ "total": 32,
963
+ },
964
+ "raw": {
965
+ "completion_tokens": 32,
966
+ "prompt_tokens": 4,
967
+ "total_tokens": 36,
968
+ },
969
+ },
970
+ },
971
+ ]
972
+ `);
973
+ });
974
+
975
+ it('should stream tool deltas', async () => {
976
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
977
+ type: 'stream-chunks',
978
+ chunks: [
979
+ `data: {"id":"a9648117-740c-4270-9e07-6a8457f23b7a","object":"chat.completion.chunk","created":1750535985,"model":"grok-beta",` +
980
+ `"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
981
+ `data: {"id":"a9648117-740c-4270-9e07-6a8457f23b7a","object":"chat.completion.chunk","created":1750535985,"model":"grok-beta",` +
982
+ `"choices":[{"index":0,"delta":{"content":null,"tool_calls":[{"id":"call_yfBEybNYi","type":"function","function":{"name":"test-tool","arguments":` +
983
+ `"{\\"value\\":\\"Sparkle Day\\"}"` +
984
+ `}}]},"finish_reason":"tool_calls"}],"usage":{"prompt_tokens":183,"total_tokens":316,"completion_tokens":133},"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
985
+ 'data: [DONE]\n\n',
986
+ ],
987
+ };
988
+
989
+ const { stream } = await model.doStream({
990
+ tools: [
991
+ {
992
+ type: 'function',
993
+ name: 'test-tool',
994
+ inputSchema: {
995
+ type: 'object',
996
+ properties: { value: { type: 'string' } },
997
+ required: ['value'],
998
+ additionalProperties: false,
999
+ $schema: 'http://json-schema.org/draft-07/schema#',
1000
+ },
1001
+ },
1002
+ ],
1003
+ prompt: TEST_PROMPT,
1004
+ includeRawChunks: false,
1005
+ });
1006
+
1007
+ expect(await convertReadableStreamToArray(stream)).toMatchInlineSnapshot(`
1008
+ [
1009
+ {
1010
+ "type": "stream-start",
1011
+ "warnings": [],
1012
+ },
1013
+ {
1014
+ "id": "a9648117-740c-4270-9e07-6a8457f23b7a",
1015
+ "modelId": "grok-beta",
1016
+ "timestamp": 2025-06-21T19:59:45.000Z,
1017
+ "type": "response-metadata",
1018
+ },
1019
+ {
1020
+ "id": "call_yfBEybNYi",
1021
+ "toolName": "test-tool",
1022
+ "type": "tool-input-start",
1023
+ },
1024
+ {
1025
+ "delta": "{"value":"Sparkle Day"}",
1026
+ "id": "call_yfBEybNYi",
1027
+ "type": "tool-input-delta",
1028
+ },
1029
+ {
1030
+ "id": "call_yfBEybNYi",
1031
+ "type": "tool-input-end",
1032
+ },
1033
+ {
1034
+ "input": "{"value":"Sparkle Day"}",
1035
+ "toolCallId": "call_yfBEybNYi",
1036
+ "toolName": "test-tool",
1037
+ "type": "tool-call",
1038
+ },
1039
+ {
1040
+ "finishReason": {
1041
+ "raw": "tool_calls",
1042
+ "unified": "tool-calls",
1043
+ },
1044
+ "type": "finish",
1045
+ "usage": {
1046
+ "inputTokens": {
1047
+ "cacheRead": 0,
1048
+ "cacheWrite": undefined,
1049
+ "noCache": 183,
1050
+ "total": 183,
1051
+ },
1052
+ "outputTokens": {
1053
+ "reasoning": 0,
1054
+ "text": 133,
1055
+ "total": 133,
1056
+ },
1057
+ "raw": {
1058
+ "completion_tokens": 133,
1059
+ "prompt_tokens": 183,
1060
+ "total_tokens": 316,
1061
+ },
1062
+ },
1063
+ },
1064
+ ]
1065
+ `);
1066
+ });
1067
+
1068
+ it('should expose the raw response headers', async () => {
1069
+ prepareStreamResponse({
1070
+ content: [],
1071
+ headers: { 'test-header': 'test-value' },
1072
+ });
1073
+
1074
+ const { response } = await model.doStream({
1075
+ prompt: TEST_PROMPT,
1076
+ includeRawChunks: false,
1077
+ });
1078
+
1079
+ expect(response?.headers).toStrictEqual({
1080
+ // default headers:
1081
+ 'content-type': 'text/event-stream',
1082
+ 'cache-control': 'no-cache',
1083
+ connection: 'keep-alive',
1084
+
1085
+ // custom header
1086
+ 'test-header': 'test-value',
1087
+ });
1088
+ });
1089
+
1090
+ it('should pass the messages', async () => {
1091
+ prepareStreamResponse({ content: [''] });
1092
+
1093
+ await model.doStream({
1094
+ prompt: TEST_PROMPT,
1095
+ includeRawChunks: false,
1096
+ });
1097
+
1098
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
1099
+ stream: true,
1100
+ model: 'grok-beta',
1101
+ messages: [{ role: 'user', content: 'Hello' }],
1102
+ stream_options: {
1103
+ include_usage: true,
1104
+ },
1105
+ });
1106
+ });
1107
+
1108
+ it('should pass headers', async () => {
1109
+ prepareStreamResponse({ content: [] });
1110
+
1111
+ const modelWithHeaders = new XaiChatLanguageModel('grok-beta', {
1112
+ provider: 'xai.chat',
1113
+ baseURL: 'https://api.x.ai/v1',
1114
+ headers: () => ({
1115
+ authorization: 'Bearer test-api-key',
1116
+ 'Custom-Provider-Header': 'provider-header-value',
1117
+ }),
1118
+ generateId: () => 'test-id',
1119
+ });
1120
+
1121
+ await modelWithHeaders.doStream({
1122
+ prompt: TEST_PROMPT,
1123
+ includeRawChunks: false,
1124
+ headers: {
1125
+ 'Custom-Request-Header': 'request-header-value',
1126
+ },
1127
+ });
1128
+
1129
+ expect(server.calls[0].requestHeaders).toStrictEqual({
1130
+ authorization: 'Bearer test-api-key',
1131
+ 'content-type': 'application/json',
1132
+ 'custom-provider-header': 'provider-header-value',
1133
+ 'custom-request-header': 'request-header-value',
1134
+ });
1135
+ });
1136
+
1137
+ it('should send request body', async () => {
1138
+ prepareStreamResponse({ content: [] });
1139
+
1140
+ const { request } = await model.doStream({
1141
+ prompt: TEST_PROMPT,
1142
+ includeRawChunks: false,
1143
+ });
1144
+
1145
+ expect(request).toMatchInlineSnapshot(`
1146
+ {
1147
+ "body": {
1148
+ "max_completion_tokens": undefined,
1149
+ "messages": [
1150
+ {
1151
+ "content": "Hello",
1152
+ "role": "user",
1153
+ },
1154
+ ],
1155
+ "model": "grok-beta",
1156
+ "parallel_function_calling": undefined,
1157
+ "reasoning_effort": undefined,
1158
+ "response_format": undefined,
1159
+ "search_parameters": undefined,
1160
+ "seed": undefined,
1161
+ "stream": true,
1162
+ "stream_options": {
1163
+ "include_usage": true,
1164
+ },
1165
+ "temperature": undefined,
1166
+ "tool_choice": undefined,
1167
+ "tools": undefined,
1168
+ "top_p": undefined,
1169
+ },
1170
+ }
1171
+ `);
1172
+ });
1173
+
1174
+ it('should stream citations as sources', async () => {
1175
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1176
+ type: 'stream-chunks',
1177
+ chunks: [
1178
+ `data: {"id":"c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c","object":"chat.completion.chunk","created":1750538200,"model":"grok-beta",` +
1179
+ `"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
1180
+ `data: {"id":"c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c","object":"chat.completion.chunk","created":1750538200,"model":"grok-beta",` +
1181
+ `"choices":[{"index":0,"delta":{"content":"Latest AI news"},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
1182
+ `data: {"id":"c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c","object":"chat.completion.chunk","created":1750538200,"model":"grok-beta",` +
1183
+ `"choices":[{"index":0,"delta":{},"finish_reason":"stop"}],` +
1184
+ `"usage":{"prompt_tokens":4,"total_tokens":34,"completion_tokens":30},` +
1185
+ `"citations":["https://example.com/source1","https://example.com/source2"],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
1186
+ `data: [DONE]\n\n`,
1187
+ ],
1188
+ };
1189
+
1190
+ const { stream } = await model.doStream({
1191
+ prompt: TEST_PROMPT,
1192
+ includeRawChunks: false,
1193
+ providerOptions: {
1194
+ xai: {
1195
+ searchParameters: {
1196
+ mode: 'auto',
1197
+ returnCitations: true,
1198
+ },
1199
+ },
1200
+ },
1201
+ });
1202
+
1203
+ expect(await convertReadableStreamToArray(stream)).toMatchInlineSnapshot(`
1204
+ [
1205
+ {
1206
+ "type": "stream-start",
1207
+ "warnings": [],
1208
+ },
1209
+ {
1210
+ "id": "c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c",
1211
+ "modelId": "grok-beta",
1212
+ "timestamp": 2025-06-21T20:36:40.000Z,
1213
+ "type": "response-metadata",
1214
+ },
1215
+ {
1216
+ "id": "text-c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c",
1217
+ "type": "text-start",
1218
+ },
1219
+ {
1220
+ "delta": "Latest AI news",
1221
+ "id": "text-c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c",
1222
+ "type": "text-delta",
1223
+ },
1224
+ {
1225
+ "id": "test-id",
1226
+ "sourceType": "url",
1227
+ "type": "source",
1228
+ "url": "https://example.com/source1",
1229
+ },
1230
+ {
1231
+ "id": "test-id",
1232
+ "sourceType": "url",
1233
+ "type": "source",
1234
+ "url": "https://example.com/source2",
1235
+ },
1236
+ {
1237
+ "id": "text-c8e45f92-7a3b-4d8e-9c1f-5e6a8b9d2f4c",
1238
+ "type": "text-end",
1239
+ },
1240
+ {
1241
+ "finishReason": {
1242
+ "raw": "stop",
1243
+ "unified": "stop",
1244
+ },
1245
+ "type": "finish",
1246
+ "usage": {
1247
+ "inputTokens": {
1248
+ "cacheRead": 0,
1249
+ "cacheWrite": undefined,
1250
+ "noCache": 4,
1251
+ "total": 4,
1252
+ },
1253
+ "outputTokens": {
1254
+ "reasoning": 0,
1255
+ "text": 30,
1256
+ "total": 30,
1257
+ },
1258
+ "raw": {
1259
+ "completion_tokens": 30,
1260
+ "prompt_tokens": 4,
1261
+ "total_tokens": 34,
1262
+ },
1263
+ },
1264
+ },
1265
+ ]
1266
+ `);
1267
+ });
1268
+ });
1269
+
1270
+ describe('reasoning models', () => {
1271
+ const reasoningModel = new XaiChatLanguageModel('grok-3-mini', testConfig);
1272
+
1273
+ function prepareReasoningResponse({
1274
+ content = 'The result is 303.',
1275
+ reasoning_content = 'Let me calculate 101 multiplied by 3: 101 * 3 = 303.',
1276
+ usage = {
1277
+ prompt_tokens: 15,
1278
+ total_tokens: 35,
1279
+ completion_tokens: 20,
1280
+ completion_tokens_details: {
1281
+ reasoning_tokens: 10,
1282
+ },
1283
+ },
1284
+ }: {
1285
+ content?: string;
1286
+ reasoning_content?: string;
1287
+ usage?: {
1288
+ prompt_tokens: number;
1289
+ total_tokens: number;
1290
+ completion_tokens: number;
1291
+ completion_tokens_details?: {
1292
+ reasoning_tokens?: number;
1293
+ };
1294
+ };
1295
+ }) {
1296
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1297
+ type: 'json-value',
1298
+ body: {
1299
+ id: 'chatcmpl-reasoning-test',
1300
+ object: 'chat.completion',
1301
+ created: 1699472111,
1302
+ model: 'grok-3-mini',
1303
+ choices: [
1304
+ {
1305
+ index: 0,
1306
+ message: {
1307
+ role: 'assistant',
1308
+ content,
1309
+ reasoning_content,
1310
+ tool_calls: null,
1311
+ },
1312
+ finish_reason: 'stop',
1313
+ },
1314
+ ],
1315
+ usage,
1316
+ },
1317
+ };
1318
+ }
1319
+
1320
+ it('should pass reasoning_effort parameter', async () => {
1321
+ prepareReasoningResponse({});
1322
+
1323
+ await reasoningModel.doGenerate({
1324
+ prompt: TEST_PROMPT,
1325
+ providerOptions: {
1326
+ xai: { reasoningEffort: 'high' },
1327
+ },
1328
+ });
1329
+
1330
+ expect(await server.calls[0].requestBodyJson).toStrictEqual({
1331
+ model: 'grok-3-mini',
1332
+ messages: [{ role: 'user', content: 'Hello' }],
1333
+ reasoning_effort: 'high',
1334
+ });
1335
+ });
1336
+
1337
+ it('should extract reasoning content', async () => {
1338
+ prepareReasoningResponse({
1339
+ content: 'The answer is 303.',
1340
+ reasoning_content: 'Let me think: 101 * 3 = 303.',
1341
+ });
1342
+
1343
+ const { content } = await reasoningModel.doGenerate({
1344
+ prompt: TEST_PROMPT,
1345
+ providerOptions: {
1346
+ xai: { reasoningEffort: 'low' },
1347
+ },
1348
+ });
1349
+
1350
+ expect(content).toMatchInlineSnapshot(`
1351
+ [
1352
+ {
1353
+ "text": "The answer is 303.",
1354
+ "type": "text",
1355
+ },
1356
+ {
1357
+ "text": "Let me think: 101 * 3 = 303.",
1358
+ "type": "reasoning",
1359
+ },
1360
+ ]
1361
+ `);
1362
+ });
1363
+
1364
+ it('should extract reasoning tokens from usage', async () => {
1365
+ prepareReasoningResponse({
1366
+ usage: {
1367
+ prompt_tokens: 15,
1368
+ completion_tokens: 20,
1369
+ total_tokens: 35,
1370
+ completion_tokens_details: {
1371
+ reasoning_tokens: 10,
1372
+ },
1373
+ },
1374
+ });
1375
+
1376
+ const { usage } = await reasoningModel.doGenerate({
1377
+ prompt: TEST_PROMPT,
1378
+ providerOptions: {
1379
+ xai: { reasoningEffort: 'high' },
1380
+ },
1381
+ });
1382
+
1383
+ expect(usage).toMatchInlineSnapshot(`
1384
+ {
1385
+ "inputTokens": {
1386
+ "cacheRead": 0,
1387
+ "cacheWrite": undefined,
1388
+ "noCache": 15,
1389
+ "total": 15,
1390
+ },
1391
+ "outputTokens": {
1392
+ "reasoning": 10,
1393
+ "text": 10,
1394
+ "total": 20,
1395
+ },
1396
+ "raw": {
1397
+ "completion_tokens": 20,
1398
+ "completion_tokens_details": {
1399
+ "reasoning_tokens": 10,
1400
+ },
1401
+ "prompt_tokens": 15,
1402
+ "total_tokens": 35,
1403
+ },
1404
+ }
1405
+ `);
1406
+ });
1407
+
1408
+ it('should handle reasoning streaming', async () => {
1409
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1410
+ type: 'stream-chunks',
1411
+ chunks: [
1412
+ `data: {"id":"b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b","object":"chat.completion.chunk","created":1750538120,"model":"grok-3-mini",` +
1413
+ `"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1414
+ `data: {"id":"b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b","object":"chat.completion.chunk","created":1750538120,"model":"grok-3-mini",` +
1415
+ `"choices":[{"index":0,"delta":{"reasoning_content":"Let me calculate: "},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1416
+ `data: {"id":"b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b","object":"chat.completion.chunk","created":1750538120,"model":"grok-3-mini",` +
1417
+ `"choices":[{"index":0,"delta":{"reasoning_content":"101 * 3 = 303"},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1418
+ `data: {"id":"b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b","object":"chat.completion.chunk","created":1750538120,"model":"grok-3-mini",` +
1419
+ `"choices":[{"index":0,"delta":{"content":"The answer is 303."},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1420
+ `data: {"id":"b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b","object":"chat.completion.chunk","created":1750538120,"model":"grok-3-mini",` +
1421
+ `"choices":[{"index":0,"delta":{},"finish_reason":"stop"}],` +
1422
+ `"usage":{"prompt_tokens":15,"total_tokens":35,"completion_tokens":20,"completion_tokens_details":{"reasoning_tokens":10}},"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1423
+ `data: [DONE]\n\n`,
1424
+ ],
1425
+ };
1426
+
1427
+ const { stream } = await reasoningModel.doStream({
1428
+ prompt: TEST_PROMPT,
1429
+ includeRawChunks: false,
1430
+ providerOptions: {
1431
+ xai: { reasoningEffort: 'low' },
1432
+ },
1433
+ });
1434
+
1435
+ expect(await convertReadableStreamToArray(stream)).toMatchInlineSnapshot(`
1436
+ [
1437
+ {
1438
+ "type": "stream-start",
1439
+ "warnings": [],
1440
+ },
1441
+ {
1442
+ "id": "b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1443
+ "modelId": "grok-3-mini",
1444
+ "timestamp": 2025-06-21T20:35:20.000Z,
1445
+ "type": "response-metadata",
1446
+ },
1447
+ {
1448
+ "id": "reasoning-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1449
+ "type": "reasoning-start",
1450
+ },
1451
+ {
1452
+ "delta": "Let me calculate: ",
1453
+ "id": "reasoning-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1454
+ "type": "reasoning-delta",
1455
+ },
1456
+ {
1457
+ "delta": "101 * 3 = 303",
1458
+ "id": "reasoning-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1459
+ "type": "reasoning-delta",
1460
+ },
1461
+ {
1462
+ "id": "reasoning-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1463
+ "type": "reasoning-end",
1464
+ },
1465
+ {
1466
+ "id": "text-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1467
+ "type": "text-start",
1468
+ },
1469
+ {
1470
+ "delta": "The answer is 303.",
1471
+ "id": "text-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1472
+ "type": "text-delta",
1473
+ },
1474
+ {
1475
+ "id": "text-b7f32e89-8d6c-4a1e-9f5b-2c8e7a9d4f6b",
1476
+ "type": "text-end",
1477
+ },
1478
+ {
1479
+ "finishReason": {
1480
+ "raw": "stop",
1481
+ "unified": "stop",
1482
+ },
1483
+ "type": "finish",
1484
+ "usage": {
1485
+ "inputTokens": {
1486
+ "cacheRead": 0,
1487
+ "cacheWrite": undefined,
1488
+ "noCache": 15,
1489
+ "total": 15,
1490
+ },
1491
+ "outputTokens": {
1492
+ "reasoning": 10,
1493
+ "text": 10,
1494
+ "total": 20,
1495
+ },
1496
+ "raw": {
1497
+ "completion_tokens": 20,
1498
+ "completion_tokens_details": {
1499
+ "reasoning_tokens": 10,
1500
+ },
1501
+ "prompt_tokens": 15,
1502
+ "total_tokens": 35,
1503
+ },
1504
+ },
1505
+ },
1506
+ ]
1507
+ `);
1508
+ });
1509
+
1510
+ it('should deduplicate repetitive reasoning deltas', async () => {
1511
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1512
+ type: 'stream-chunks',
1513
+ chunks: [
1514
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1515
+ `"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1516
+ // Multiple identical "Thinking..." deltas (simulating Grok 4 issue)
1517
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1518
+ `"choices":[{"index":0,"delta":{"reasoning_content":"Thinking... "},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1519
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1520
+ `"choices":[{"index":0,"delta":{"reasoning_content":"Thinking... "},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1521
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1522
+ `"choices":[{"index":0,"delta":{"reasoning_content":"Thinking... "},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1523
+ // Different reasoning content should still come through
1524
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1525
+ `"choices":[{"index":0,"delta":{"reasoning_content":"Actually calculating now..."},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1526
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1527
+ `"choices":[{"index":0,"delta":{"content":"The answer is 42."},"finish_reason":null}],"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1528
+ `data: {"id":"grok-4-test","object":"chat.completion.chunk","created":1750538120,"model":"grok-4-0709",` +
1529
+ `"choices":[{"index":0,"delta":{},"finish_reason":"stop"}],` +
1530
+ `"usage":{"prompt_tokens":15,"total_tokens":35,"completion_tokens":20,"completion_tokens_details":{"reasoning_tokens":10}},"system_fingerprint":"fp_reasoning_v1"}\n\n`,
1531
+ `data: [DONE]\n\n`,
1532
+ ],
1533
+ };
1534
+
1535
+ const { stream } = await reasoningModel.doStream({
1536
+ prompt: TEST_PROMPT,
1537
+ includeRawChunks: false,
1538
+ providerOptions: {
1539
+ xai: { reasoningEffort: 'low' },
1540
+ },
1541
+ });
1542
+
1543
+ expect(await convertReadableStreamToArray(stream)).toMatchInlineSnapshot(`
1544
+ [
1545
+ {
1546
+ "type": "stream-start",
1547
+ "warnings": [],
1548
+ },
1549
+ {
1550
+ "id": "grok-4-test",
1551
+ "modelId": "grok-4-0709",
1552
+ "timestamp": 2025-06-21T20:35:20.000Z,
1553
+ "type": "response-metadata",
1554
+ },
1555
+ {
1556
+ "id": "reasoning-grok-4-test",
1557
+ "type": "reasoning-start",
1558
+ },
1559
+ {
1560
+ "delta": "Thinking... ",
1561
+ "id": "reasoning-grok-4-test",
1562
+ "type": "reasoning-delta",
1563
+ },
1564
+ {
1565
+ "delta": "Actually calculating now...",
1566
+ "id": "reasoning-grok-4-test",
1567
+ "type": "reasoning-delta",
1568
+ },
1569
+ {
1570
+ "id": "reasoning-grok-4-test",
1571
+ "type": "reasoning-end",
1572
+ },
1573
+ {
1574
+ "id": "text-grok-4-test",
1575
+ "type": "text-start",
1576
+ },
1577
+ {
1578
+ "delta": "The answer is 42.",
1579
+ "id": "text-grok-4-test",
1580
+ "type": "text-delta",
1581
+ },
1582
+ {
1583
+ "id": "text-grok-4-test",
1584
+ "type": "text-end",
1585
+ },
1586
+ {
1587
+ "finishReason": {
1588
+ "raw": "stop",
1589
+ "unified": "stop",
1590
+ },
1591
+ "type": "finish",
1592
+ "usage": {
1593
+ "inputTokens": {
1594
+ "cacheRead": 0,
1595
+ "cacheWrite": undefined,
1596
+ "noCache": 15,
1597
+ "total": 15,
1598
+ },
1599
+ "outputTokens": {
1600
+ "reasoning": 10,
1601
+ "text": 10,
1602
+ "total": 20,
1603
+ },
1604
+ "raw": {
1605
+ "completion_tokens": 20,
1606
+ "completion_tokens_details": {
1607
+ "reasoning_tokens": 10,
1608
+ },
1609
+ "prompt_tokens": 15,
1610
+ "total_tokens": 35,
1611
+ },
1612
+ },
1613
+ },
1614
+ ]
1615
+ `);
1616
+ });
1617
+ });
1618
+ });
1619
+
1620
+ describe('doStream with raw chunks', () => {
1621
+ it('should stream raw chunks when includeRawChunks is true', async () => {
1622
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1623
+ type: 'stream-chunks',
1624
+ chunks: [
1625
+ `data: {"id":"d9f56e23-8b4c-4e7a-9d2f-6c8a9b5e3f7d","object":"chat.completion.chunk","created":1750538300,"model":"grok-beta","choices":[{"index":0,"delta":{"role":"assistant","content":"Hello"},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
1626
+ `data: {"id":"e2a47b89-3f6d-4c8e-9a1b-7d5f8c9e2a4b","object":"chat.completion.chunk","created":1750538301,"model":"grok-beta","choices":[{"index":0,"delta":{"content":" world"},"finish_reason":null}],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
1627
+ `data: {"id":"f3b58c9a-4e7f-5d9e-ab2c-8e6f9d0e3b5c","object":"chat.completion.chunk","created":1750538302,"model":"grok-beta","choices":[{"index":0,"delta":{},"finish_reason":"stop"}],"usage":{"prompt_tokens":10,"completion_tokens":5,"total_tokens":15},"citations":["https://example.com"],"system_fingerprint":"fp_13a6dc65a6"}\n\n`,
1628
+ 'data: [DONE]\n\n',
1629
+ ],
1630
+ };
1631
+
1632
+ const { stream } = await model.doStream({
1633
+ prompt: TEST_PROMPT,
1634
+ includeRawChunks: true,
1635
+ });
1636
+
1637
+ const chunks = await convertReadableStreamToArray(stream);
1638
+
1639
+ expect(chunks).toMatchInlineSnapshot(`
1640
+ [
1641
+ {
1642
+ "type": "stream-start",
1643
+ "warnings": [],
1644
+ },
1645
+ {
1646
+ "rawValue": {
1647
+ "choices": [
1648
+ {
1649
+ "delta": {
1650
+ "content": "Hello",
1651
+ "role": "assistant",
1652
+ },
1653
+ "finish_reason": null,
1654
+ "index": 0,
1655
+ },
1656
+ ],
1657
+ "created": 1750538300,
1658
+ "id": "d9f56e23-8b4c-4e7a-9d2f-6c8a9b5e3f7d",
1659
+ "model": "grok-beta",
1660
+ "object": "chat.completion.chunk",
1661
+ "system_fingerprint": "fp_13a6dc65a6",
1662
+ },
1663
+ "type": "raw",
1664
+ },
1665
+ {
1666
+ "id": "d9f56e23-8b4c-4e7a-9d2f-6c8a9b5e3f7d",
1667
+ "modelId": "grok-beta",
1668
+ "timestamp": 2025-06-21T20:38:20.000Z,
1669
+ "type": "response-metadata",
1670
+ },
1671
+ {
1672
+ "id": "text-d9f56e23-8b4c-4e7a-9d2f-6c8a9b5e3f7d",
1673
+ "type": "text-start",
1674
+ },
1675
+ {
1676
+ "delta": "Hello",
1677
+ "id": "text-d9f56e23-8b4c-4e7a-9d2f-6c8a9b5e3f7d",
1678
+ "type": "text-delta",
1679
+ },
1680
+ {
1681
+ "rawValue": {
1682
+ "choices": [
1683
+ {
1684
+ "delta": {
1685
+ "content": " world",
1686
+ },
1687
+ "finish_reason": null,
1688
+ "index": 0,
1689
+ },
1690
+ ],
1691
+ "created": 1750538301,
1692
+ "id": "e2a47b89-3f6d-4c8e-9a1b-7d5f8c9e2a4b",
1693
+ "model": "grok-beta",
1694
+ "object": "chat.completion.chunk",
1695
+ "system_fingerprint": "fp_13a6dc65a6",
1696
+ },
1697
+ "type": "raw",
1698
+ },
1699
+ {
1700
+ "id": "text-e2a47b89-3f6d-4c8e-9a1b-7d5f8c9e2a4b",
1701
+ "type": "text-start",
1702
+ },
1703
+ {
1704
+ "delta": " world",
1705
+ "id": "text-e2a47b89-3f6d-4c8e-9a1b-7d5f8c9e2a4b",
1706
+ "type": "text-delta",
1707
+ },
1708
+ {
1709
+ "rawValue": {
1710
+ "choices": [
1711
+ {
1712
+ "delta": {},
1713
+ "finish_reason": "stop",
1714
+ "index": 0,
1715
+ },
1716
+ ],
1717
+ "citations": [
1718
+ "https://example.com",
1719
+ ],
1720
+ "created": 1750538302,
1721
+ "id": "f3b58c9a-4e7f-5d9e-ab2c-8e6f9d0e3b5c",
1722
+ "model": "grok-beta",
1723
+ "object": "chat.completion.chunk",
1724
+ "system_fingerprint": "fp_13a6dc65a6",
1725
+ "usage": {
1726
+ "completion_tokens": 5,
1727
+ "prompt_tokens": 10,
1728
+ "total_tokens": 15,
1729
+ },
1730
+ },
1731
+ "type": "raw",
1732
+ },
1733
+ {
1734
+ "id": "test-id",
1735
+ "sourceType": "url",
1736
+ "type": "source",
1737
+ "url": "https://example.com",
1738
+ },
1739
+ {
1740
+ "id": "text-d9f56e23-8b4c-4e7a-9d2f-6c8a9b5e3f7d",
1741
+ "type": "text-end",
1742
+ },
1743
+ {
1744
+ "id": "text-e2a47b89-3f6d-4c8e-9a1b-7d5f8c9e2a4b",
1745
+ "type": "text-end",
1746
+ },
1747
+ {
1748
+ "finishReason": {
1749
+ "raw": "stop",
1750
+ "unified": "stop",
1751
+ },
1752
+ "type": "finish",
1753
+ "usage": {
1754
+ "inputTokens": {
1755
+ "cacheRead": 0,
1756
+ "cacheWrite": undefined,
1757
+ "noCache": 10,
1758
+ "total": 10,
1759
+ },
1760
+ "outputTokens": {
1761
+ "reasoning": 0,
1762
+ "text": 5,
1763
+ "total": 5,
1764
+ },
1765
+ "raw": {
1766
+ "completion_tokens": 5,
1767
+ "prompt_tokens": 10,
1768
+ "total_tokens": 15,
1769
+ },
1770
+ },
1771
+ },
1772
+ ]
1773
+ `);
1774
+ });
1775
+
1776
+ describe('error handling', () => {
1777
+ it('should throw APICallError when xai returns error with 200 status (doGenerate)', async () => {
1778
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1779
+ type: 'json-value',
1780
+ body: {
1781
+ code: 'The service is currently unavailable',
1782
+ error: 'Timed out waiting for first token',
1783
+ },
1784
+ };
1785
+
1786
+ await expect(model.doGenerate({ prompt: TEST_PROMPT })).rejects.toThrow(
1787
+ 'Timed out waiting for first token',
1788
+ );
1789
+ });
1790
+
1791
+ it('should throw APICallError when xai returns error with 200 status (doStream)', async () => {
1792
+ server.urls['https://api.x.ai/v1/chat/completions'].response = {
1793
+ type: 'json-value',
1794
+ body: {
1795
+ code: 'The service is currently unavailable',
1796
+ error: 'Timed out waiting for first token',
1797
+ },
1798
+ };
1799
+
1800
+ await expect(model.doStream({ prompt: TEST_PROMPT })).rejects.toThrow(
1801
+ 'Timed out waiting for first token',
1802
+ );
1803
+ });
1804
+ });
1805
+ });