npm - omnikey-cli - Versions diffs - 1.2.0 → 1.3.0 - Mend

omnikey-cli 1.2.0 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

package/backend-dist/__tests__/ai-client.adapters.test.js +247 -0
package/backend-dist/__tests__/ai-client.helpers.test.js +99 -0
package/backend-dist/__tests__/featureRoutes.runEnhancementModel.test.js +79 -0
package/backend-dist/ai-client.js +54 -6
package/backend-dist/featureRoutes.js +13 -7
package/package.json +1 -1

package/backend-dist/__tests__/ai-client.adapters.test.js ADDED Viewed

@@ -0,0 +1,247 @@
+"use strict";
+/**
+ * Per-provider adapter tests for temperature handling.
+ *
+ * The three SDKs (`openai`, `@anthropic-ai/sdk`, `@google/genai`) are mocked
+ * at the module boundary using `vi.mock`. Mock spies are declared inside a
+ * `vi.hoisted()` block so they are available when `vi.mock` factories run
+ * (vi.mock is hoisted to the top of the file).
+ *
+ * These tests never contact any real API.
+ */
+Object.defineProperty(exports, "__esModule", { value: true });
+const vitest_1 = require("vitest");
+const mocks = vitest_1.vi.hoisted(() => ({ // Shared spies, created via vi.hoisted() so the vi.mock factories below can reference them.
+    openaiCreate: vitest_1.vi.fn(),
+    anthropicCreate: vitest_1.vi.fn(),
+    anthropicStream: vitest_1.vi.fn(),
+    geminiGenerate: vitest_1.vi.fn(),
+    geminiGenerateStream: vitest_1.vi.fn(),
+}));
+vitest_1.vi.mock('openai', () => ({ // Stub SDK: the default export is a class whose chat.completions.create is the shared spy.
+    default: class MockOpenAI {
+        constructor(_opts) {
+            this.chat = { completions: { create: mocks.openaiCreate } };
+            this.images = { generate: vitest_1.vi.fn() }; // fresh spy per instance; no test in this file asserts on it
+        }
+    },
+}));
+vitest_1.vi.mock('@anthropic-ai/sdk', () => ({ // Stub SDK: messages.create and messages.stream are the shared spies.
+    default: class MockAnthropic {
+        constructor(_opts) {
+            this.messages = { create: mocks.anthropicCreate, stream: mocks.anthropicStream };
+        }
+    },
+}));
+vitest_1.vi.mock('@google/genai', () => ({ // Stub SDK: models.generateContent and models.generateContentStream are the shared spies.
+    GoogleGenAI: class MockGoogleGenAI {
+        constructor(_opts) {
+            this.models = {
+                generateContent: mocks.geminiGenerate,
+                generateContentStream: mocks.geminiGenerateStream,
+                generateImages: vitest_1.vi.fn(),
+            };
+        }
+    },
+    // The adapter file imports these as types-only but they still need to resolve.
+    Content: class {
+    },
+    Tool: class {
+    },
+}));
+const ai_client_1 = require("../ai-client");
+const messages = [{ role: 'user', content: 'hello' }];
+function asAsyncIterable(chunks) { // Test helper: exposes `chunks` as an async-iterable object, used below as a stand-in for SDK streams.
+    return {
+        [Symbol.asyncIterator]: async function* () { // invoked by `for await`; each call produces a fresh generator
+            for (const c of chunks)
+                yield c; // chunks are yielded unchanged, in their original order
+        },
+    };
+}
+(0, vitest_1.beforeEach)(() => { // Reset every shared spy before each test so `mock.calls[0]` always refers to the current test's call.
+    mocks.openaiCreate.mockReset();
+    mocks.anthropicCreate.mockReset();
+    mocks.anthropicStream.mockReset();
+    mocks.geminiGenerate.mockReset();
+    mocks.geminiGenerateStream.mockReset();
+});
+// ---------------------------------------------------------------------------
+// OpenAI
+// ---------------------------------------------------------------------------
+(0, vitest_1.describe)('OpenAIAdapter temperature handling', () => { // Each case inspects the request body (first argument) passed to the mocked chat.completions.create.
+    function mockCompleteResponse() { // Queue one non-streaming completion result.
+        mocks.openaiCreate.mockResolvedValueOnce({
+            choices: [{ message: { content: 'ok', tool_calls: undefined }, finish_reason: 'stop' }],
+            usage: { prompt_tokens: 1, completion_tokens: 1, total_tokens: 2 },
+        });
+    }
+    function mockStreamResponse() { // Queue one streamed result: a content delta, then an empty-delta chunk carrying usage.
+        mocks.openaiCreate.mockResolvedValueOnce(asAsyncIterable([
+            { choices: [{ delta: { content: 'ok' } }] },
+            {
+                choices: [{ delta: {} }],
+                usage: { prompt_tokens: 1, completion_tokens: 1, total_tokens: 2 },
+            },
+        ]));
+    }
+    (0, vitest_1.it)('complete: passes temperature for gpt-4o-mini', async () => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.complete('gpt-4o-mini', messages, { temperature: 0.42 });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).toHaveProperty('temperature', 0.42);
+    });
+    (0, vitest_1.it)('complete: omits temperature for gpt-5.5 even if caller supplies one', async () => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.complete('gpt-5.5', messages, { temperature: 0.42 });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).not.toHaveProperty('temperature');
+    });
+    vitest_1.it.each(['gpt-5', 'gpt-5-mini', 'gpt-5.1', 'o1', 'o3-mini', 'o4-mini'])('complete: omits temperature for unsupported model %s', async (model) => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.complete(model, messages, { temperature: 0.7 });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).not.toHaveProperty('temperature');
+    });
+    (0, vitest_1.it)('streamComplete: passes temperature for gpt-4o-mini', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.streamComplete('gpt-4o-mini', messages, { temperature: 0.31 }, () => { });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).toHaveProperty('temperature', 0.31);
+        (0, vitest_1.expect)(body).toHaveProperty('stream', true);
+    });
+    (0, vitest_1.it)('streamComplete: omits temperature for gpt-5.5', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.streamComplete('gpt-5.5', messages, { temperature: 0.31 }, () => { });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).not.toHaveProperty('temperature');
+        (0, vitest_1.expect)(body).toHaveProperty('stream', true);
+    });
+    (0, vitest_1.it)('streamComplete: omits temperature even when caller passes empty options for gpt-5.5', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.streamComplete('gpt-5.5', messages, {}, () => { });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).not.toHaveProperty('temperature');
+    });
+    (0, vitest_1.it)('streamComplete: uses 0.3 default for supported model when caller omits temperature', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('openai', 'sk-test');
+        await client.streamComplete('gpt-4o-mini', messages, {}, () => { });
+        const body = mocks.openaiCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).toHaveProperty('temperature', 0.3);
+    });
+}); // NOTE(review): no case in this suite covers complete() when the caller omits temperature.
+// ---------------------------------------------------------------------------
+// Anthropic
+// ---------------------------------------------------------------------------
+(0, vitest_1.describe)('AnthropicAdapter temperature handling', () => { // Each case inspects the first argument passed to the mocked messages.create / messages.stream.
+    function mockCompleteResponse() { // Queue one non-streaming message result.
+        mocks.anthropicCreate.mockResolvedValueOnce({
+            content: [{ type: 'text', text: 'ok' }],
+            stop_reason: 'end_turn',
+            usage: { input_tokens: 1, output_tokens: 1 },
+        });
+    }
+    function mockStreamResponse() { // Queue one stream object: async-iterable events plus a finalMessage() that resolves to usage.
+        const finalMessage = vitest_1.vi.fn().mockResolvedValue({
+            usage: { input_tokens: 1, output_tokens: 1 },
+        });
+        const stream = asAsyncIterable([
+            { type: 'content_block_delta', delta: { type: 'text_delta', text: 'ok' } },
+        ]);
+        stream.finalMessage = finalMessage;
+        mocks.anthropicStream.mockReturnValueOnce(stream); // returned synchronously, not wrapped in a promise
+    }
+    (0, vitest_1.it)('complete: passes temperature for claude-sonnet-4-5', async () => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('anthropic', 'sk-anthropic-test');
+        await client.complete('claude-sonnet-4-5', messages, { temperature: 0.42 });
+        const body = mocks.anthropicCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).toHaveProperty('temperature', 0.42);
+    });
+    vitest_1.it.each([
+        'claude-haiku-4-5-20251001',
+        'claude-opus-4-5',
+        'claude-opus-4-5-20251101',
+        'claude-opus-4-6',
+    ])('complete: passes temperature for supported model %s', async (model) => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('anthropic', 'sk-anthropic-test');
+        await client.complete(model, messages, { temperature: 0.5 });
+        const body = mocks.anthropicCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).toHaveProperty('temperature', 0.5);
+    });
+    vitest_1.it.each(['claude-opus-4-7', 'claude-opus-4-7-20260101'])('complete: omits temperature for unsupported model %s', async (model) => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('anthropic', 'sk-anthropic-test');
+        await client.complete(model, messages, { temperature: 0.5 });
+        const body = mocks.anthropicCreate.mock.calls[0][0];
+        (0, vitest_1.expect)(body).not.toHaveProperty('temperature');
+    });
+    (0, vitest_1.it)('streamComplete: passes temperature for claude-sonnet-4-5', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('anthropic', 'sk-anthropic-test');
+        await client.streamComplete('claude-sonnet-4-5', messages, { temperature: 0.6 }, () => { });
+        const body = mocks.anthropicStream.mock.calls[0][0];
+        (0, vitest_1.expect)(body).toHaveProperty('temperature', 0.6);
+    });
+    (0, vitest_1.it)('streamComplete: omits temperature for claude-opus-4-7', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('anthropic', 'sk-anthropic-test');
+        await client.streamComplete('claude-opus-4-7', messages, { temperature: 0.6 }, () => { });
+        const body = mocks.anthropicStream.mock.calls[0][0];
+        (0, vitest_1.expect)(body).not.toHaveProperty('temperature');
+    });
+}); // NOTE(review): every case passes an explicit temperature; the adapter's default is not exercised here.
+// ---------------------------------------------------------------------------
+// Gemini
+// ---------------------------------------------------------------------------
+(0, vitest_1.describe)('GeminiAdapter temperature handling', () => { // Assertions read `body.config`, which is where the request carries temperature for this adapter.
+    function mockCompleteResponse() { // Queue one non-streaming generateContent result.
+        mocks.geminiGenerate.mockResolvedValueOnce({
+            candidates: [
+                {
+                    content: { parts: [{ text: 'ok' }] },
+                    finishReason: 'STOP',
+                },
+            ],
+            usageMetadata: { promptTokenCount: 1, candidatesTokenCount: 1, totalTokenCount: 2 },
+        });
+    }
+    function mockStreamResponse() { // Queue one streamed result: a text chunk, then an empty-text chunk carrying usageMetadata.
+        mocks.geminiGenerateStream.mockResolvedValueOnce(asAsyncIterable([
+            { text: 'ok' },
+            {
+                text: '',
+                usageMetadata: { promptTokenCount: 1, candidatesTokenCount: 1, totalTokenCount: 2 },
+            },
+        ]));
+    }
+    vitest_1.it.each(['gemini-2.5-flash', 'gemini-2.5-pro', 'gemini-3-pro'])('complete: passes temperature for %s (all Gemini models accept it)', async (model) => {
+        mockCompleteResponse();
+        const client = new ai_client_1.AIClient('gemini', 'gemini-test-key');
+        await client.complete(model, messages, { temperature: 0.42 });
+        const body = mocks.geminiGenerate.mock.calls[0][0];
+        (0, vitest_1.expect)(body.config).toHaveProperty('temperature', 0.42);
+    });
+    (0, vitest_1.it)('streamComplete: passes temperature for gemini-2.5-pro', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('gemini', 'gemini-test-key');
+        await client.streamComplete('gemini-2.5-pro', messages, { temperature: 0.31 }, () => { });
+        const body = mocks.geminiGenerateStream.mock.calls[0][0];
+        (0, vitest_1.expect)(body.config).toHaveProperty('temperature', 0.31);
+    });
+    (0, vitest_1.it)('streamComplete: applies default 0.3 when caller omits temperature', async () => {
+        mockStreamResponse();
+        const client = new ai_client_1.AIClient('gemini', 'gemini-test-key');
+        await client.streamComplete('gemini-2.5-pro', messages, {}, () => { });
+        const body = mocks.geminiGenerateStream.mock.calls[0][0];
+        (0, vitest_1.expect)(body.config).toHaveProperty('temperature', 0.3);
+    });
+});

package/backend-dist/__tests__/ai-client.helpers.test.js ADDED Viewed

@@ -0,0 +1,99 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+const vitest_1 = require("vitest");
+const ai_client_1 = require("../ai-client");
+(0, vitest_1.describe)('modelSupportsTemperature', () => { // Table-driven cases: every row is [model id, expected return value].
+    (0, vitest_1.describe)('OpenAI', () => {
+        vitest_1.it.each([
+            ['gpt-4o-mini', true],
+            ['gpt-4o', true],
+            ['gpt-4-turbo', true],
+            ['gpt-3.5-turbo', true],
+        ])('allows temperature for %s', (model, expected) => {
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(model)).toBe(expected);
+        });
+        vitest_1.it.each([
+            ['gpt-5', false],
+            ['gpt-5-mini', false],
+            ['gpt-5.1', false],
+            ['gpt-5.5', false],
+            ['GPT-5.5', false], // case-insensitive
+        ])('rejects temperature for GPT-5 family member %s', (model, expected) => {
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(model)).toBe(expected);
+        });
+        vitest_1.it.each([
+            ['o1', false],
+            ['o1-preview', false],
+            ['o3', false],
+            ['o3-mini', false],
+            ['o4-mini', false],
+        ])('rejects temperature for reasoning model %s', (model, expected) => {
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(model)).toBe(expected);
+        });
+    });
+    (0, vitest_1.describe)('Gemini', () => { // Only positive cases: no Gemini id is expected to be rejected.
+        vitest_1.it.each([
+            ['gemini-2.5-flash', true],
+            ['gemini-2.5-pro', true],
+            ['gemini-3-pro', true],
+            ['gemini-3.5-flash', true],
+        ])('allows temperature for %s', (model, expected) => {
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(model)).toBe(expected);
+        });
+    });
+    (0, vitest_1.describe)('Anthropic', () => {
+        vitest_1.it.each([
+            ['claude-haiku-4-5', true],
+            ['claude-haiku-4-5-20251001', true],
+            ['claude-sonnet-4-5', true],
+            ['claude-sonnet-4-5-20250929', true],
+            ['claude-opus-4-5', true],
+            ['claude-opus-4-5-20251101', true],
+            ['claude-opus-4-6', true],
+        ])('allows temperature for %s', (model, expected) => {
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(model)).toBe(expected);
+        });
+        vitest_1.it.each([
+            ['claude-opus-4-7', false],
+            ['claude-opus-4-7-20260101', false],
+            ['CLAUDE-OPUS-4-7', false], // case-insensitive
+        ])('rejects temperature for opus-4-7 variant %s', (model, expected) => {
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(model)).toBe(expected);
+        });
+    });
+});
+(0, vitest_1.describe)('getDefaultModel', () => { // Ties the default-model table to the temperature policy without pinning model names.
+    (0, vitest_1.it)('returns the configured fast and smart tiers for each provider', () => {
+        // Don't pin exact model strings — they will be upgraded over time. Just
+        // assert that each provider returns a truthy model id for both tiers
+        // and that fast/smart differ (smart is meant to be a bigger model).
+        for (const provider of ['openai', 'gemini', 'anthropic']) {
+            const fast = (0, ai_client_1.getDefaultModel)(provider, 'fast');
+            const smart = (0, ai_client_1.getDefaultModel)(provider, 'smart');
+            (0, vitest_1.expect)(fast).toBeTruthy();
+            (0, vitest_1.expect)(smart).toBeTruthy();
+            (0, vitest_1.expect)(fast).not.toEqual(smart);
+        }
+    });
+    (0, vitest_1.it)('returns smart-tier models that are correctly classified by modelSupportsTemperature', () => {
+        // Regression guard: whenever a smart model is upgraded, the helper must
+        // continue to return the correct policy for it. This test is the single
+        // place that ties the two together so an accidental mismatch breaks the
+        // suite immediately.
+        const expectations = {
+            // OpenAI smart tier is in the GPT-5 family → no temperature.
+            openai: false,
+            // Gemini smart tier accepts temperature.
+            gemini: true,
+            // Anthropic smart tier is claude-opus-4-7 → no temperature.
+            anthropic: false,
+        };
+        for (const provider of Object.keys(expectations)) {
+            const expected = expectations[provider];
+            if (expected === null) // NOTE(review): no entry above is null, so this skip never triggers as written.
+                continue;
+            const smartModel = (0, ai_client_1.getDefaultModel)(provider, 'smart');
+            (0, vitest_1.expect)((0, ai_client_1.modelSupportsTemperature)(smartModel), `${provider} smart model "${smartModel}" should report temperature-support=${expected}`).toBe(expected);
+        }
+    });
+});

package/backend-dist/__tests__/featureRoutes.runEnhancementModel.test.js ADDED Viewed

@@ -0,0 +1,79 @@
+"use strict";
+/**
+ * Tests for the temperature-handling change in `runEnhancementModel`.
+ *
+ * - 'enhance' → { temperature: 0.3 }
+ * - 'grammar' → { temperature: 0.3 }
+ * - 'task'    → {}   (the route passes no temperature; any default is left to the ai-client adapter)
+ *
+ * Mocks `./ai-client` and `./models/subscriptionTaskTemplate` so the test
+ * stays a pure unit test and never touches the database or any SDK.
+ */
+var __importDefault = (this && this.__importDefault) || function (mod) { // Compiler-emitted interop helper; an existing this.__importDefault is reused when present.
+    return (mod && mod.__esModule) ? mod : { "default": mod }; // modules flagged __esModule pass through; anything else is wrapped under a `default` key
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+const vitest_1 = require("vitest");
+const winston_1 = __importDefault(require("winston"));
+const mocks = vitest_1.vi.hoisted(() => ({ // Shared spies, created via vi.hoisted() so the vi.mock factories below can reference them.
+    streamComplete: vitest_1.vi.fn(),
+    getDefaultModel: vitest_1.vi.fn(),
+    findOne: vitest_1.vi.fn(),
+}));
+vitest_1.vi.mock('../ai-client', () => ({ // Replaces the whole ai-client module: only aiClient.streamComplete and getDefaultModel exist in the mock.
+    aiClient: { streamComplete: mocks.streamComplete },
+    getDefaultModel: mocks.getDefaultModel,
+}));
+vitest_1.vi.mock('../models/subscriptionTaskTemplate', () => ({ // Replaces the template model so findOne is a spy.
+    SubscriptionTaskTemplate: { findOne: mocks.findOne },
+}));
+const featureRoutes_1 = require("../featureRoutes");
+function makeLogger() { // Test helper: builds a new winston logger on every call.
+    return winston_1.default.createLogger({
+        silent: true, // the logger itself is created with silent: true
+        transports: [new winston_1.default.transports.Console({ silent: true })], // its single Console transport is silenced as well
+    });
+}
+const fakeSubscription = { id: 'sub_test' };
+(0, vitest_1.beforeEach)(() => { // Re-arm every spy with its default behavior before each test.
+    mocks.streamComplete.mockReset();
+    mocks.streamComplete.mockResolvedValue({ usage: undefined, model: 'mock-model' }); // resolves immediately and never invokes the delta callback
+    mocks.getDefaultModel.mockReset();
+    mocks.getDefaultModel.mockImplementation((_provider, tier) => tier === 'smart' ? 'smart-model-mock' : 'fast-model-mock'); // the provider argument is ignored; only the tier selects the name
+    mocks.findOne.mockReset();
+    // Default task template — plain text passes through `decompressString`
+    // so `getPromptForCommand('task', ...)` returns a non-empty prompt and the
+    // streamComplete path is reached.
+    mocks.findOne.mockResolvedValue({ instructions: 'You are a helpful task assistant.' });
+});
+(0, vitest_1.describe)('runEnhancementModel — temperature per command', () => { // ai-client is mocked, so these cases check only what the route hands to streamComplete.
+    (0, vitest_1.it)("passes temperature: 0.3 for cmd='enhance'", async () => {
+        const result = await (0, featureRoutes_1.runEnhancementModel)(makeLogger(), 'hello world', 'enhance', fakeSubscription);
+        (0, vitest_1.expect)(result).not.toBeNull();
+        (0, vitest_1.expect)(mocks.streamComplete).toHaveBeenCalledTimes(1);
+        const [, , options] = mocks.streamComplete.mock.calls[0]; // third positional argument = completion options
+        (0, vitest_1.expect)(options).toEqual({ temperature: 0.3 });
+    });
+    (0, vitest_1.it)("passes temperature: 0.3 for cmd='grammar'", async () => {
+        const result = await (0, featureRoutes_1.runEnhancementModel)(makeLogger(), 'helo wrld', 'grammar', fakeSubscription);
+        (0, vitest_1.expect)(result).not.toBeNull();
+        (0, vitest_1.expect)(mocks.streamComplete).toHaveBeenCalledTimes(1);
+        const [, , options] = mocks.streamComplete.mock.calls[0];
+        (0, vitest_1.expect)(options).toEqual({ temperature: 0.3 });
+    });
+    (0, vitest_1.it)("omits temperature for cmd='task' (custom-task)", async () => {
+        const result = await (0, featureRoutes_1.runEnhancementModel)(makeLogger(), 'do the thing', 'task', fakeSubscription);
+        (0, vitest_1.expect)(result).not.toBeNull();
+        (0, vitest_1.expect)(mocks.streamComplete).toHaveBeenCalledTimes(1);
+        const [, , options] = mocks.streamComplete.mock.calls[0];
+        (0, vitest_1.expect)(options).toEqual({});
+        (0, vitest_1.expect)(options).not.toHaveProperty('temperature');
+    });
+    (0, vitest_1.it)("selects the smart-tier model for cmd='task' and fast-tier for enhance/grammar", async () => {
+        await (0, featureRoutes_1.runEnhancementModel)(makeLogger(), 'a', 'task', fakeSubscription);
+        await (0, featureRoutes_1.runEnhancementModel)(makeLogger(), 'b', 'enhance', fakeSubscription);
+        await (0, featureRoutes_1.runEnhancementModel)(makeLogger(), 'c', 'grammar', fakeSubscription);
+        const modelsCalled = mocks.streamComplete.mock.calls.map(([model]) => model); // first positional argument = model id, in call order
+        (0, vitest_1.expect)(modelsCalled).toEqual(['smart-model-mock', 'fast-model-mock', 'fast-model-mock']);
+    });
+});

package/backend-dist/ai-client.js CHANGED Viewed

@@ -5,6 +5,7 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.aiClient = exports.AIClient = void 0;
 exports.getDefaultModel = getDefaultModel;
+exports.modelSupportsTemperature = modelSupportsTemperature;
 exports.getMaxMessageContentLength = getMaxMessageContentLength;
 exports.getMaxHistoryLength = getMaxHistoryLength;
 exports.getContextWindowSize = getContextWindowSize;
@@ -17,6 +18,12 @@ const config_1 = require("./config");
 // Default model mapping
 // ---------------------------------------------------------------------------
 const DEFAULT_MODELS = {
+    // Smart-tier picks track each provider's current flagship for
+    // reasoning/coding workloads. Update here when a newer model becomes
+    // generally available so both the feature routes and the agent server pick
+    // it up automatically. When swapping a smart model in, also verify whether
+    // it accepts the `temperature` parameter and update
+    // `modelSupportsTemperature` accordingly.
     openai: { fast: 'gpt-4o-mini', smart: 'gpt-5.5' },
     gemini: { fast: 'gemini-2.5-flash', smart: 'gemini-2.5-pro' },
     anthropic: { fast: 'claude-haiku-4-5-20251001', smart: 'claude-opus-4-7' },
@@ -24,6 +31,39 @@ const DEFAULT_MODELS = {
 function getDefaultModel(provider, tier) { // Returns the DEFAULT_MODELS entry for the given provider key and tier key.
     return DEFAULT_MODELS[provider][tier]; // NOTE(review): unguarded lookup; a provider key absent from DEFAULT_MODELS throws a TypeError here.
 }
+/**
+ * Returns whether a given model accepts the `temperature` parameter.
+ *
+ * Matching is case-insensitive and anchored at the start of the model id; an
+ * id that matches none of the exclusion patterns below is treated as
+ * supporting `temperature`.
+ *
+ * Provider-specific rules (validated against published API docs and SDKs as
+ * of late 2025 / early 2026):
+ *  - OpenAI GPT-5 family (`gpt-5`, `gpt-5-mini`, `gpt-5.1`, …): NOT supported.
+ *    The API only accepts the default value (1) and returns
+ *    `unsupported_value: 'temperature'` for anything else.
+ *  - OpenAI o-series reasoning models (`o1`, `o3`, `o4-mini`, …): NOT
+ *    supported for the same reason.
+ *  - OpenAI GPT-4 / GPT-4o / GPT-3.5: supported.
+ *  - Google Gemini (2.x and 3.x families): supported; the Gemini adapter in
+ *    this file sends it inside the request `config`.
+ *  - Anthropic Claude (Sonnet, Haiku, and Opus 4.x): supported, with the
+ *    exception of `claude-opus-4-7` (and its dated revisions) which rejects
+ *    `temperature` just like the OpenAI GPT-5 family.
+ *
+ * @param {string} model - Model identifier, e.g. `gpt-4o-mini` or
+ *   `claude-opus-4-7`.
+ * @returns {boolean} `false` for the GPT-5 family, the o1/o3/o4 series and
+ *   Claude Opus 4.7; `true` for every other id.
+ */
+function modelSupportsTemperature(model) {
+    // OpenAI GPT-5 family (gpt-5, gpt-5-mini, gpt-5.1, gpt-5.5, …) only
+    // accepts the default temperature (1) — anything else is rejected with
+    // `unsupported_value: 'temperature'`.
+    if (/^gpt-5(\b|[.\-])/i.test(model)) // the boundary keeps longer numbers such as gpt-50 from matching
+        return false;
+    // OpenAI o-series reasoning models (o1, o3, o4-mini, …) likewise drop the
+    // `temperature` knob.
+    if (/^o[134](\b|[-_])/i.test(model))
+        return false;
+    // Anthropic's Claude Opus 4.7 line (and its dated revisions like
+    // `claude-opus-4-7-20260101`) does not accept `temperature`; the rest of
+    // the Claude 4.x family (Sonnet, Haiku, Opus 4.5/4.6) does.
+    if (/^claude-opus-4-7(\b|[-_])/i.test(model))
+        return false;
+    return true; // default: anything not excluded above is assumed to accept temperature
+}
 /**
  * Maximum character length for a single message content string per provider.
  *
@@ -88,7 +128,7 @@ class OpenAIAdapter {
             model,
             messages: oaiMessages,
             tools: tools?.length ? tools : undefined,
-            temperature: model === 'gpt-5.5' ? 1 : (options.temperature ?? 0.2),
+            ...(modelSupportsTemperature(model) ? { temperature: options.temperature ?? 0.2 } : {}),
             max_tokens: options.maxTokens,
         });
         const choice = completion.choices[0];
@@ -125,7 +165,9 @@ class OpenAIAdapter {
         const stream = await this.client.chat.completions.create({
             model,
             messages: oaiMessages,
-            temperature: options.temperature ?? 0.3,
+            ...(modelSupportsTemperature(model)
+                ? { temperature: options.temperature ?? 0.3 }
+                : {}),
             stream: true,
             stream_options: { include_usage: true },
         });
@@ -188,7 +230,7 @@ class AnthropicAdapter {
             ...(system ? { system } : {}),
             messages: anthropicMessages,
             ...(tools?.length ? { tools } : {}),
-            ...(model === 'claude-opus-4-7' ? {} : { temperature: options.temperature ?? 0.2 }),
+            ...(modelSupportsTemperature(model) ? { temperature: options.temperature ?? 0.2 } : {}),
         });
         const textContent = response.content
             .filter((b) => b.type === 'text')
@@ -235,7 +277,9 @@ class AnthropicAdapter {
             max_tokens: options.maxTokens ?? 8192,
             ...(system ? { system } : {}),
             messages: anthropicMessages,
-            temperature: options.temperature ?? 0.3,
+            ...(modelSupportsTemperature(model)
+                ? { temperature: options.temperature ?? 0.3 }
+                : {}),
         });
         for await (const event of stream) {
             if (event.type === 'content_block_delta' &&
@@ -269,7 +313,9 @@ class GeminiAdapter {
             config: {
                 ...(systemInstruction ? { systemInstruction } : {}),
                 ...(tools?.length ? { tools } : {}),
-                temperature: options.temperature ?? 0.2,
+                ...(modelSupportsTemperature(model)
+                    ? { temperature: options.temperature ?? 0.2 }
+                    : {}),
             },
         });
         const candidate = response.candidates?.[0];
@@ -320,7 +366,9 @@ class GeminiAdapter {
             contents,
             config: {
                 ...(systemInstruction ? { systemInstruction } : {}),
-                temperature: options.temperature ?? 0.3,
+                ...(modelSupportsTemperature(model)
+                    ? { temperature: options.temperature ?? 0.3 }
+                    : {}),
             },
         });
         let usage;

package/backend-dist/featureRoutes.js CHANGED Viewed

@@ -56,13 +56,12 @@ async function getPromptForCommand(logger, cmd, subscription) {
     return '';
 }
 function getModelForCommand(cmd) {
+    // 'task' is the custom-task command and routes to the smart-tier model.
+    // Every other command (e.g. 'enhance', 'grammar') uses the fast tier. The
+    // model strings live in ai-client.ts (DEFAULT_MODELS) so all callers stay
+    // in sync when we upgrade to a newer flagship model.
     const tier = cmd === 'task' ? 'smart' : 'fast';
-    const models = {
-        openai: { fast: 'gpt-4o-mini', smart: 'gpt-5.5' },
-        gemini: { fast: 'gemini-2.5-flash', smart: 'gemini-2.5-pro' },
-        anthropic: { fast: 'claude-haiku-4-5-20251001', smart: 'claude-opus-4-7' },
-    };
-    return models[config_1.config.aiProvider]?.[tier] ?? 'gpt-4o-mini';
+    return (0, ai_client_1.getDefaultModel)(config_1.config.aiProvider, tier); // NOTE(review): the previous gpt-4o-mini fallback is gone; an aiProvider missing from DEFAULT_MODELS now throws inside getDefaultModel — confirm config validates it upstream.
 }
 function createMessagesParams(cmd, input, prompt) {
     if (cmd === 'task') {
@@ -100,7 +99,14 @@ async function runEnhancementModel(logger, text, cmd, subscription, onDelta) {
     const messages = createMessagesParams(cmd, trimmed, prompt);
     let rawResponse = '';
     let usage;
-    const result = await ai_client_1.aiClient.streamComplete(model, messages, { temperature: 0.3 }, (delta) => {
+    // Smart-tier models (used by the custom-task command) include OpenAI's
+    // GPT-5 family and Anthropic's claude-opus-4-7, which reject a non-default
+    // `temperature`, so the route passes no temperature for 'task'. Where the
+    // smart model does accept it (Gemini), the streaming adapter in ai-client
+    // still applies its own 0.3 fallback. The fast-tier models used by
+    // `enhance` and `grammar` keep the previous explicit 0.3.
+    const completionOptions = cmd === 'task' ? {} : { temperature: 0.3 };
+    const result = await ai_client_1.aiClient.streamComplete(model, messages, completionOptions, (delta) => {
         rawResponse += delta;
         if (onDelta)
             onDelta(delta);

package/package.json CHANGED Viewed

@@ -4,7 +4,7 @@
     "access": "public",
     "registry": "https://registry.npmjs.org/"
   },
-  "version": "1.2.0",
+  "version": "1.3.0",
   "description": "CLI for onboarding users to Omnikey AI and configuring OPENAI_API_KEY. Use Yarn for install/build.",
   "engines": {
     "node": ">=14.0.0",