npm - genai-lite - Versions diffs - 0.4.0 → 0.4.1 - Mend

genai-lite 0.4.0 → 0.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

package/README.md +47 -37
package/dist/llm/LLMService.d.ts +29 -2
package/dist/llm/LLMService.js +67 -36
package/dist/llm/config.js +4 -4
package/dist/llm/services/SettingsManager.js +17 -11
package/dist/llm/types.d.ts +81 -22
package/dist/prompting/parser.d.ts +2 -2
package/dist/prompting/parser.js +2 -2
package/package.json +1 -1
package/dist/llm/LLMService.createMessages.test.d.ts +0 -4
package/dist/llm/LLMService.createMessages.test.js +0 -364
package/dist/llm/LLMService.original.d.ts +0 -147
package/dist/llm/LLMService.original.js +0 -656
package/dist/llm/LLMService.prepareMessage.test.d.ts +0 -1
package/dist/llm/LLMService.prepareMessage.test.js +0 -303
package/dist/llm/LLMService.presets.test.d.ts +0 -1
package/dist/llm/LLMService.presets.test.js +0 -210
package/dist/llm/LLMService.sendMessage.preset.test.d.ts +0 -1
package/dist/llm/LLMService.sendMessage.preset.test.js +0 -153
package/dist/llm/LLMService.test.d.ts +0 -1
package/dist/llm/LLMService.test.js +0 -639
package/dist/llm/clients/AnthropicClientAdapter.test.d.ts +0 -1
package/dist/llm/clients/AnthropicClientAdapter.test.js +0 -273
package/dist/llm/clients/GeminiClientAdapter.test.d.ts +0 -1
package/dist/llm/clients/GeminiClientAdapter.test.js +0 -405
package/dist/llm/clients/LlamaCppClientAdapter.test.d.ts +0 -1
package/dist/llm/clients/LlamaCppClientAdapter.test.js +0 -447
package/dist/llm/clients/LlamaCppServerClient.test.d.ts +0 -1
package/dist/llm/clients/LlamaCppServerClient.test.js +0 -294
package/dist/llm/clients/MockClientAdapter.test.d.ts +0 -1
package/dist/llm/clients/MockClientAdapter.test.js +0 -250
package/dist/llm/clients/OpenAIClientAdapter.test.d.ts +0 -1
package/dist/llm/clients/OpenAIClientAdapter.test.js +0 -258
package/dist/llm/clients/adapterErrorUtils.test.d.ts +0 -1
package/dist/llm/clients/adapterErrorUtils.test.js +0 -123
package/dist/llm/config.test.d.ts +0 -1
package/dist/llm/config.test.js +0 -176
package/dist/llm/services/AdapterRegistry.test.d.ts +0 -1
package/dist/llm/services/AdapterRegistry.test.js +0 -239
package/dist/llm/services/ModelResolver.test.d.ts +0 -1
package/dist/llm/services/ModelResolver.test.js +0 -179
package/dist/llm/services/PresetManager.test.d.ts +0 -1
package/dist/llm/services/PresetManager.test.js +0 -210
package/dist/llm/services/RequestValidator.test.d.ts +0 -1
package/dist/llm/services/RequestValidator.test.js +0 -159
package/dist/llm/services/SettingsManager.test.d.ts +0 -1
package/dist/llm/services/SettingsManager.test.js +0 -266
package/dist/prompting/builder.d.ts +0 -38
package/dist/prompting/builder.js +0 -63
package/dist/prompting/builder.test.d.ts +0 -4
package/dist/prompting/builder.test.js +0 -109
package/dist/prompting/content.test.d.ts +0 -4
package/dist/prompting/content.test.js +0 -212
package/dist/prompting/parser.test.d.ts +0 -4
package/dist/prompting/parser.test.js +0 -464
package/dist/prompting/template.test.d.ts +0 -1
package/dist/prompting/template.test.js +0 -250
package/dist/providers/fromEnvironment.test.d.ts +0 -1
package/dist/providers/fromEnvironment.test.js +0 -59

package/README.md CHANGED Viewed

@@ -295,9 +295,11 @@ if (response.object === 'chat.completion' && response.choices[0].reasoning) {
 - Not all models support reasoning - check the [supported models](#models-with-reasoning-support) list
 - The `reasoning` field in the response contains the model's thought process (when available)
-### Automatic Thinking Extraction
+### Thinking Extraction and Enforcement
-genai-lite can capture reasoning from any model by automatically extracting content wrapped in XML tags. When models output their thinking process in tags like `<thinking>`, the library automatically moves this content to the standardized `reasoning` field. This works with all models, providing a consistent interface for accessing model reasoning:
+For models without native reasoning, you can prompt them to output reasoning in XML tags like `<thinking>`. The library then extracts these tags and moves the content to the standardized `reasoning` field, providing a consistent interface across all models.
+**Key point:** The library doesn't make models think automatically—you must explicitly instruct non-reasoning models to use thinking tags in your prompt. The library then enforces that these tags are present (for non-reasoning models) or accepts native reasoning (for reasoning models).
 ```typescript
 // Prompt the model to think step-by-step in a <thinking> tag
@@ -312,7 +314,7 @@ const response = await llmService.sendMessage({
     content: 'Please think through this problem step by step before answering: What is 15% of 240?'
   }],
   settings: {
-    thinkingExtraction: { enabled: true } // Must explicitly enable
+    thinkingTagFallback: { enabled: true } // Must explicitly enable
   }
 });
@@ -334,25 +336,25 @@ const response = await llmService.sendMessage({
   modelId: 'claude-3-5-haiku-20241022',
   messages: [{ role: 'user', content: 'Solve this step by step...' }],
   settings: {
-    thinkingExtraction: {
+    thinkingTagFallback: {
       enabled: true,     // Must explicitly enable (default: false)
-      tag: 'scratchpad', // Custom tag name (default: 'thinking')
-      onMissing: 'auto'  // Smart enforcement (see below)
+      tagName: 'scratchpad', // Custom tag name (default: 'thinking')
+      enforce: true  // Smart enforcement (see below)
     }
   }
 });
 ```
-**The `onMissing` Property:**
+**The `enforce` Property:**
+The `enforce` boolean controls whether thinking tags are required when native reasoning is not active:
-The `onMissing` property controls what happens when the expected thinking tag is not found:
+- `enforce: true` - Error if tags missing AND native reasoning not active (smart enforcement)
+- `enforce: false` (default) - Extract tags if present, never error
-- `'ignore'`: Silently continue without the tag
-- `'warn'`: Log a warning but continue processing
-- `'error'`: Return an error response with the original response preserved in `partialResponse`
-- `'auto'` (default): Intelligently decide based on the model's native reasoning capabilities
+The enforcement is **always smart** - it automatically checks if native reasoning is active and only enforces when the model needs tags as a fallback.
-**How `'auto'` Mode Works:**
+**How Smart Enforcement Works:**
 ```typescript
 // With non-native reasoning models (e.g., GPT-4)
@@ -367,10 +369,10 @@ const response = await llmService.sendMessage({
     content: 'What is 15% of 240?'
   }],
   settings: {
-    thinkingExtraction: { enabled: true } // onMissing: 'auto' is default
+    thinkingTagFallback: { enabled: true, enforce: true }
   }
 });
-// Result: ERROR if <thinking> tag is missing (strict enforcement)
+// Result: ERROR if <thinking> tag is missing (native reasoning not active)
 // The response is still accessible via errorResponse.partialResponse
 // With native reasoning models (e.g., Claude with reasoning enabled)
@@ -380,10 +382,10 @@ const response = await llmService.sendMessage({
   messages: [/* same prompt */],
   settings: {
     reasoning: { enabled: true },
-    thinkingExtraction: { enabled: true }
+    thinkingTagFallback: { enabled: true, enforce: true }
   }
 });
-// Result: SUCCESS even if <thinking> tag is missing (lenient for native reasoning)
+// Result: SUCCESS even if <thinking> tag is missing (native reasoning is active)
 ```
 This intelligent enforcement ensures that:
@@ -510,13 +512,10 @@ The library provides a powerful `createMessages` method that combines template r
 // Basic example: Create model-aware messages
 const { messages, modelContext } = await llmService.createMessages({
   template: `
-    <SYSTEM>
-      You are a {{ thinking_enabled ? "thoughtful" : "helpful" }} assistant.
-      {{ thinking_available && !thinking_enabled ? "Note: Reasoning mode is available for complex problems." : "" }}
-    </SYSTEM>
+    <SYSTEM>You are a helpful assistant.</SYSTEM>
     <USER>{{ question }}</USER>
   `,
-  variables: {
+  variables: {
     question: 'What is the optimal algorithm for finding the shortest path in a weighted graph?'
   },
   presetId: 'anthropic-claude-3-7-sonnet-20250219-thinking'
@@ -560,14 +559,26 @@ The method provides:
 - **Template Rendering**: Full support for conditionals and variable substitution
 - **Role Tag Parsing**: Converts `<SYSTEM>`, `<USER>`, and `<ASSISTANT>` tags to messages
-Available model context variables:
-- `thinking_enabled`: Whether reasoning/thinking is enabled for this request
-- `thinking_available`: Whether the model supports reasoning/thinking
+**Available model context variables:**
+- `native_reasoning_active`: Whether native reasoning is **currently active** for this request
+  - `true`: The model is using built-in reasoning (e.g., Claude 4, o4-mini, Gemini 2.5 Pro with reasoning enabled)
+  - `false`: No native reasoning is active (either because the model doesn't support it, or it's been disabled)
+- `native_reasoning_capable`: Whether the model **has the capability** to use native reasoning
+  - `true`: Model supports native reasoning (may or may not be enabled)
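+  - `false`: Model does not support native reasoning
+- `requires_tags_for_thinking`: Whether thinking tags are needed for this request (`true` when native reasoning is not active; always the negation of `native_reasoning_active`)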
 - `model_id`: The resolved model ID
 - `provider_id`: The resolved provider ID
 - `reasoning_effort`: The reasoning effort level if specified
 - `reasoning_max_tokens`: The reasoning token budget if specified
+**Best Practice for Templates:**
+When adding thinking tag instructions to your templates, **always use `requires_tags_for_thinking`** (the negation of `native_reasoning_active`). This ensures:
+- Models with active native reasoning get clean, direct prompts
+- Models without native reasoning get explicit instructions to use `<thinking>` tags
+Example: `{{ requires_tags_for_thinking ? ' Write your reasoning in <thinking> tags first.' : '' }}`
 #### Advanced Features
 **Dynamic Role Injection:**
@@ -617,7 +628,7 @@ const response = await llmService.sendMessage({
   modelId: 'gpt-4.1',
   messages,
   settings: {
-    thinkingExtraction: { enabled: true } // Default, but shown for clarity
+    thinkingTagFallback: { enabled: true } // Must explicitly enable (default: false)
   }
 });
@@ -640,7 +651,7 @@ const creativeWritingTemplate = `
   "settings": {
     "temperature": 0.9,
     "maxTokens": 3000,
-    "thinkingExtraction": { "enabled": true, "tag": "reasoning" }
+    "thinkingTagFallback": { "enabled": true, "tagName": "reasoning" }
   }
 }
 </META>
@@ -1045,14 +1056,14 @@ const llmService = new LLMService(electronKeyProvider);
 genai-lite is written in TypeScript and provides comprehensive type definitions:
 ```typescript
-import type {
+import type {
   LLMChatRequest,
   LLMChatRequestWithPreset,
   LLMResponse,
   LLMFailureResponse,
   LLMSettings,
   LLMReasoningSettings,
-  LLMThinkingExtractionSettings,
+  LLMThinkingTagFallbackSettings,
   ApiKeyProvider,
   ModelPreset,
   LLMServiceOptions,
@@ -1324,24 +1335,23 @@ const { messages } = await llmService.createMessages({
   presetId: 'openai-gpt-4.1-default' // Optional: adds model context
 });
-// Advanced: Leverage model context for adaptive prompts
+// Advanced: Adaptive prompts based on model capabilities
 const { messages, modelContext } = await llmService.createMessages({
   template: `
     <SYSTEM>
-      You are a {{ thinking_enabled ? 'analytical problem solver' : 'quick helper' }}.
-      {{ model_id.includes('claude') ? 'Use your advanced reasoning capabilities.' : '' }}
+      You are a problem-solving assistant.
+      {{ requires_tags_for_thinking ? ' For complex problems, write your reasoning in <thinking> tags before answering.' : '' }}
     </SYSTEM>
-    <USER>
-      {{ thinking_enabled ? 'Please solve this step-by-step:' : 'Please answer:' }}
-      {{ question }}
-    </USER>
+    <USER>{{ question }}</USER>
   `,
+  // Note: requires_tags_for_thinking is the negation of native_reasoning_active, so only models without active native reasoning receive the tag instruction
   variables: { question: 'What causes the seasons on Earth?' },
   presetId: 'anthropic-claude-3-7-sonnet-20250219-thinking'
 });
 console.log('Model context:', modelContext);
-// Output: { thinking_enabled: true, thinking_available: true, model_id: 'claude-3-7-sonnet-20250219', ... }
+// Output: { native_reasoning_active: true, native_reasoning_capable: true, model_id: 'claude-3-7-sonnet-20250219', ... }
+// Note: With a reasoning model, the system prompt won't include thinking tag instructions
 ```
 **Low-Level Utilities:**

package/dist/llm/LLMService.d.ts CHANGED Viewed

@@ -75,19 +75,45 @@ export declare class LLMService {
      * injection, and role tag parsing into a single, intuitive API. It replaces the need
      * to chain prepareMessage and buildMessagesFromTemplate for model-aware multi-turn prompts.
      *
+     * **Model Context Injection:**
+     * When a presetId or providerId/modelId is provided, this method automatically injects
+     * model context variables into your templates:
+     * - `native_reasoning_active`: Whether native reasoning is currently active
+     * - `native_reasoning_capable`: Whether the model supports native reasoning
+     * - `requires_tags_for_thinking`: Whether thinking tags are needed (true when native reasoning not active)
+     * - `model_id`, `provider_id`, `reasoning_effort`, `reasoning_max_tokens`
+     *
+     * **Best Practice for Thinking Tags:**
+     * When adding thinking tag instructions, use requires_tags_for_thinking:
+     * `{{ requires_tags_for_thinking ? 'Write your reasoning in <thinking> tags first.' : '' }}`
+     *
      * @param options Options for creating messages
-     * @returns Promise resolving to parsed messages and model context
+     * @returns Promise resolving to parsed messages, model context, and template settings
      *
      * @example
      * ```typescript
+     * // Basic usage
      * const { messages } = await llm.createMessages({
      *   template: `
-     *     <SYSTEM>You are a {{ thinking_enabled ? "thoughtful" : "helpful" }} assistant.</SYSTEM>
+     *     <SYSTEM>You are a helpful assistant.</SYSTEM>
      *     <USER>Help me with {{ task }}</USER>
      *   `,
      *   variables: { task: 'understanding async/await' },
      *   presetId: 'openai-gpt-4.1-default'
      * });
+     *
+     * // Model-aware template with thinking tags
+     * const { messages, modelContext } = await llm.createMessages({
+     *   template: `
+     *     <SYSTEM>
+     *       You are a problem-solving assistant.
+     *       {{ requires_tags_for_thinking ? 'For complex problems, write your reasoning in <thinking> tags first.' : '' }}
+     *     </SYSTEM>
+     *     <USER>{{ question }}</USER>
+     *   `,
+     *   variables: { question: 'Explain recursion' },
+     *   presetId: 'anthropic-claude-3-7-sonnet-20250219-thinking'
+     * });
      * ```
      */
     createMessages(options: {
@@ -96,6 +122,7 @@ export declare class LLMService {
         presetId?: string;
         providerId?: string;
         modelId?: string;
+        settings?: Partial<LLMSettings>;
     }): Promise<CreateMessagesResult>;
     /**
      * Gets information about registered adapters

package/dist/llm/LLMService.js CHANGED Viewed

@@ -145,30 +145,27 @@ class LLMService {
                 }
                 console.log(`Making LLM request with ${clientAdapter.constructor.name} for provider: ${providerId}`);
                 const result = await clientAdapter.sendMessage(internalRequest, apiKey);
-                // Post-process for thinking extraction
-                if (result.object === 'chat.completion' && internalRequest.settings.thinkingExtraction?.enabled) {
-                    const settings = internalRequest.settings.thinkingExtraction;
-                    const tagName = settings.tag || 'thinking';
-                    // Step 1: Resolve the effective onMissing strategy
-                    let effectiveOnMissing = settings.onMissing || 'auto';
-                    if (effectiveOnMissing === 'auto') {
-                        // Check if native reasoning is active
-                        const isNativeReasoningActive = modelInfo.reasoning?.supported === true &&
-                            (internalRequest.settings.reasoning?.enabled === true ||
-                                (modelInfo.reasoning?.enabledByDefault === true &&
-                                    internalRequest.settings.reasoning?.enabled !== false) || // Only if not explicitly disabled
-                                modelInfo.reasoning?.canDisable === false); // Always-on models
-                        effectiveOnMissing = isNativeReasoningActive ? 'ignore' : 'error';
-                    }
-                    // Step 2: Process the response
+                // Post-process for thinking tag fallback
+                // This feature extracts reasoning from XML tags when native reasoning is not active.
+                // It's a fallback mechanism for models without native reasoning or when native is disabled.
+                const fallbackSettings = internalRequest.settings.thinkingTagFallback;
+                if (result.object === 'chat.completion' && fallbackSettings && fallbackSettings.enabled !== false) {
+                    const tagName = fallbackSettings.tagName || 'thinking';
+                    // Check if native reasoning is active for this request
+                    const isNativeReasoningActive = modelInfo.reasoning?.supported === true &&
+                        (internalRequest.settings.reasoning?.enabled === true ||
+                            (modelInfo.reasoning?.enabledByDefault === true &&
+                                internalRequest.settings.reasoning?.enabled !== false) ||
+                            modelInfo.reasoning?.canDisable === false);
+                    // Process the response - extract thinking tags if present
                     const choice = result.choices[0];
                     if (choice?.message?.content) {
                         const { extracted, remaining } = (0, parser_1.extractInitialTaggedContent)(choice.message.content, tagName);
                         if (extracted !== null) {
+                            // Success: thinking tag found
                             console.log(`Extracted <${tagName}> block from response.`);
-                            // Handle the edge case: append to existing reasoning if present.
+                            // Handle the edge case: append to existing reasoning if present (e.g., native reasoning + thinking tags)
                             const existingReasoning = choice.reasoning || '';
-                            // Only add a separator when appending to existing reasoning
                             if (existingReasoning) {
                                 // Use a neutral markdown header that works for any consumer (human or AI)
                                 choice.reasoning = `${existingReasoning}\n\n#### Additional Reasoning\n\n${extracted}`;
@@ -180,17 +177,24 @@ class LLMService {
                             choice.message.content = remaining;
                         }
                         else {
-                            // Tag was not found, enforce the effective strategy
-                            if (effectiveOnMissing === 'error') {
+                            // Tag was not found
+                            // Enforce only if: (1) enforce: true AND (2) native reasoning is NOT active
+                            if (fallbackSettings.enforce === true && !isNativeReasoningActive) {
+                                const nativeReasoningCapable = modelInfo.reasoning?.supported === true;
                                 return {
                                     provider: providerId,
                                     model: modelId,
                                     error: {
-                                        message: `The model (${modelId}) response was expected to start with a <${tagName}> tag but it was not found. ` +
-                                            `This is enforced because the model does not have native reasoning active. ` +
-                                            `Either ensure your prompt instructs the model to use <${tagName}> tags, or enable native reasoning if supported.`,
-                                        code: "MISSING_EXPECTED_TAG",
+                                        message: `Model response missing required <${tagName}> tags.`,
+                                        code: "THINKING_TAGS_MISSING",
                                         type: "validation_error",
+                                        param: nativeReasoningCapable && !isNativeReasoningActive
+                                            ? `You disabled native reasoning for this model (${modelId}). ` +
+                                                `To see its reasoning, you must prompt it to use <${tagName}> tags. ` +
+                                                `Example: "Write your step-by-step reasoning in <${tagName}> tags before answering."`
+                                            : `This model (${modelId}) does not support native reasoning. ` +
+                                                `To get reasoning, you must prompt it to use <${tagName}> tags. ` +
+                                                `Example: "Write your step-by-step reasoning in <${tagName}> tags before answering."`,
                                     },
                                     object: "error",
                                     partialResponse: {
@@ -203,10 +207,7 @@ class LLMService {
                                     }
                                 };
                             }
-                            else if (effectiveOnMissing === 'warn') {
-                                console.warn(`Expected <${tagName}> tag was not found in the response from model ${modelId}.`);
-                            }
-                            // If 'ignore', do nothing
+                            // If enforce: false or native reasoning is active, do nothing
                         }
                     }
                 }
@@ -262,19 +263,45 @@ class LLMService {
      * injection, and role tag parsing into a single, intuitive API. It replaces the need
      * to chain prepareMessage and buildMessagesFromTemplate for model-aware multi-turn prompts.
      *
+     * **Model Context Injection:**
+     * When a presetId or providerId/modelId is provided, this method automatically injects
+     * model context variables into your templates:
+     * - `native_reasoning_active`: Whether native reasoning is currently active
+     * - `native_reasoning_capable`: Whether the model supports native reasoning
+     * - `requires_tags_for_thinking`: Whether thinking tags are needed (true when native reasoning not active)
+     * - `model_id`, `provider_id`, `reasoning_effort`, `reasoning_max_tokens`
+     *
+     * **Best Practice for Thinking Tags:**
+     * When adding thinking tag instructions, use requires_tags_for_thinking:
+     * `{{ requires_tags_for_thinking ? 'Write your reasoning in <thinking> tags first.' : '' }}`
+     *
      * @param options Options for creating messages
-     * @returns Promise resolving to parsed messages and model context
+     * @returns Promise resolving to parsed messages, model context, and template settings
      *
      * @example
      * ```typescript
+     * // Basic usage
      * const { messages } = await llm.createMessages({
      *   template: `
-     *     <SYSTEM>You are a {{ thinking_enabled ? "thoughtful" : "helpful" }} assistant.</SYSTEM>
+     *     <SYSTEM>You are a helpful assistant.</SYSTEM>
      *     <USER>Help me with {{ task }}</USER>
      *   `,
      *   variables: { task: 'understanding async/await' },
      *   presetId: 'openai-gpt-4.1-default'
      * });
+     *
+     * // Model-aware template with thinking tags
+     * const { messages, modelContext } = await llm.createMessages({
+     *   template: `
+     *     <SYSTEM>
+     *       You are a problem-solving assistant.
+     *       {{ requires_tags_for_thinking ? 'For complex problems, write your reasoning in <thinking> tags first.' : '' }}
+     *     </SYSTEM>
+     *     <USER>{{ question }}</USER>
+     *   `,
+     *   variables: { question: 'Explain recursion' },
+     *   presetId: 'anthropic-claude-3-7-sonnet-20250219-thinking'
+     * });
      * ```
      */
     async createMessages(options) {
@@ -290,7 +317,8 @@ class LLMService {
             const resolved = this.modelResolver.resolve({
                 presetId: options.presetId,
                 providerId: options.providerId,
-                modelId: options.modelId
+                modelId: options.modelId,
+                settings: options.settings
             });
             if (resolved.error) {
                 // If resolution fails, proceed without model context
@@ -300,12 +328,15 @@ class LLMService {
                 const { providerId, modelId, modelInfo, settings } = resolved;
                 // Merge settings with model defaults
                 const mergedSettings = this.settingsManager.mergeSettingsForModel(modelId, providerId, settings || {});
-                // Create model context
+                // Calculate native reasoning status
+                const nativeReasoningActive = !!(modelInfo.reasoning?.supported &&
+                    (mergedSettings.reasoning?.enabled === true ||
+                        (modelInfo.reasoning?.enabledByDefault && mergedSettings.reasoning?.enabled !== false)));
+                // Create model context with new property names
                 modelContext = {
-                    thinking_enabled: !!(modelInfo.reasoning?.supported &&
-                        (mergedSettings.reasoning?.enabled === true ||
-                            (modelInfo.reasoning?.enabledByDefault && mergedSettings.reasoning?.enabled !== false))),
-                    thinking_available: !!modelInfo.reasoning?.supported,
+                    native_reasoning_active: nativeReasoningActive,
+                    native_reasoning_capable: !!modelInfo.reasoning?.supported,
+                    requires_tags_for_thinking: !nativeReasoningActive,
                     model_id: modelId,
                     provider_id: providerId,
                     reasoning_effort: mergedSettings.reasoning?.effort,

package/dist/llm/config.js CHANGED Viewed

@@ -69,10 +69,10 @@ exports.DEFAULT_LLM_SETTINGS = {
         maxTokens: undefined,
         exclude: false,
     },
-    thinkingExtraction: {
-        enabled: false, // Now requires explicit opt-in, works with onMissing: 'auto'
-        tag: 'thinking',
-        onMissing: 'auto' // Smart enforcement based on native reasoning status
+    thinkingTagFallback: {
+        enabled: false,
+        tagName: 'thinking',
+        enforce: false
     },
 };
 /**

package/dist/llm/services/SettingsManager.js CHANGED Viewed

@@ -34,9 +34,9 @@ class SettingsManager {
                 ...modelDefaults.reasoning,
                 ...requestSettings?.reasoning,
             },
-            thinkingExtraction: {
-                ...modelDefaults.thinkingExtraction,
-                ...requestSettings?.thinkingExtraction,
+            thinkingTagFallback: {
+                ...modelDefaults.thinkingTagFallback,
+                ...requestSettings?.thinkingTagFallback,
             },
         };
         // Log the final settings for debugging
@@ -115,7 +115,7 @@ class SettingsManager {
             'supportsSystemMessage',
             'geminiSafetySettings',
             'reasoning',
-            'thinkingExtraction'
+            'thinkingTagFallback'
         ];
         // Check each setting field
         for (const [key, value] of Object.entries(settings)) {
@@ -195,22 +195,28 @@ class SettingsManager {
                 }
                 continue;
             }
-            if (key === 'thinkingExtraction' && typeof value === 'object' && value !== null) {
+            if (key === 'thinkingTagFallback' && typeof value === 'object' && value !== null) {
                 const thinkingValidated = {};
                 if ('enabled' in value && typeof value.enabled !== 'boolean') {
-                    console.warn(`Invalid thinkingExtraction.enabled value in template. Must be a boolean.`);
+                    console.warn(`Invalid thinkingTagFallback.enabled value in template. Must be a boolean.`);
                 }
                 else if ('enabled' in value) {
                     thinkingValidated.enabled = value.enabled;
                 }
-                if ('tag' in value && typeof value.tag !== 'string') {
-                    console.warn(`Invalid thinkingExtraction.tag value in template. Must be a string.`);
+                if ('tagName' in value && typeof value.tagName !== 'string') {
+                    console.warn(`Invalid thinkingTagFallback.tagName value in template. Must be a string.`);
                 }
-                else if ('tag' in value) {
-                    thinkingValidated.tag = value.tag;
+                else if ('tagName' in value) {
+                    thinkingValidated.tagName = value.tagName;
+                }
+                if ('enforce' in value && typeof value.enforce !== 'boolean') {
+                    console.warn(`Invalid thinkingTagFallback.enforce value in template. Must be a boolean.`);
+                }
+                else if ('enforce' in value) {
+                    thinkingValidated.enforce = value.enforce;
                 }
                 if (Object.keys(thinkingValidated).length > 0) {
-                    validated.thinkingExtraction = thinkingValidated;
+                    validated.thinkingTagFallback = thinkingValidated;
                 }
                 continue;
             }

package/dist/llm/types.d.ts CHANGED Viewed

@@ -43,28 +43,45 @@ export interface LLMReasoningSettings {
     exclude?: boolean;
 }
 /**
- * Settings for extracting 'thinking' content from the start of a response
+ * Settings for extracting reasoning from XML tags when native reasoning is not active.
+ *
+ * This is a fallback mechanism for getting reasoning from:
+ * 1. Models without native reasoning support (e.g., GPT-4, Claude 3.5)
+ * 2. Models with native reasoning disabled (to see the full reasoning trace)
+ *
+ * **Key use case:** Disable native reasoning on capable models to avoid obfuscation
+ * by providers, then prompt the model to use <thinking> tags for full visibility.
+ *
+ * **Important:** You must explicitly prompt the model to use thinking tags in your prompt.
+ * The library only extracts them - it doesn't generate them automatically.
  */
-export interface LLMThinkingExtractionSettings {
+export interface LLMThinkingTagFallbackSettings {
     /**
-     * If true, enables the automatic extraction of content from a specified XML tag.
-     * @default false
+     * Enable tag extraction fallback.
+     * When this object exists, extraction is enabled by default (enabled: true).
+     * Set to false to explicitly disable (useful for overriding inherited settings).
+     * @default true (when thinkingTagFallback object exists)
      */
     enabled?: boolean;
     /**
-     * The XML tag name to look for (e.g., 'thinking', 'reasoning', 'scratchpad').
+     * Name of the XML tag to extract.
      * @default 'thinking'
+     * @example tagName: 'scratchpad' will extract <scratchpad>...</scratchpad>
      */
-    tag?: string;
+    tagName?: string;
     /**
-     * Defines behavior when the tag is not found. 'auto' is the recommended default.
-     * - 'ignore': Silently continue without a warning or error.
-     * - 'warn': Log a console warning but return the response as-is.
-     * - 'error': Return an LLMFailureResponse, treating it as a failed request.
-     * - 'auto': Becomes 'error' unless the model has active native reasoning. If native reasoning is active, this becomes 'ignore'.
-     * @default 'auto'
+     * Enforce that thinking tags are present when native reasoning is not active.
+     *
+     * When true:
+     * - If native reasoning is active: No enforcement (model using native)
+     * - If native reasoning is NOT active: Error if tags missing (fallback required)
+     *
+     * This is always "smart" - it automatically detects whether native reasoning
+     * is active and only enforces when the model needs to use tags as a fallback.
+     *
+     * @default false
      */
-    onMissing?: 'ignore' | 'warn' | 'error' | 'auto';
+    enforce?: boolean;
 }
 /**
  * Configurable settings for LLM requests
@@ -91,10 +108,19 @@ export interface LLMSettings {
     /** Universal reasoning/thinking configuration */
     reasoning?: LLMReasoningSettings;
     /**
-     * Configuration for automatically extracting 'thinking' blocks from responses.
-     * Enabled by default.
+     * Extract reasoning from XML tags when native reasoning is not active.
+     *
+     * This is a fallback mechanism for getting reasoning from:
+     * 1. Models without native reasoning support (e.g., GPT-4, Claude 3.5)
+     * 2. Models with native reasoning disabled (to see the full reasoning trace)
+     *
+     * Key use case: Disable native reasoning on capable models to avoid obfuscation
+     * by providers, then prompt the model to use <thinking> tags for full visibility.
+     *
+     * Note: You must explicitly instruct the model to use thinking tags in your prompt.
+     * The library only extracts them - it doesn't generate them automatically.
      */
-    thinkingExtraction?: LLMThinkingExtractionSettings;
+    thinkingTagFallback?: LLMThinkingTagFallbackSettings;
 }
 /**
  * Request structure for chat completion
@@ -252,18 +278,51 @@ export declare const LLM_IPC_CHANNELS: {
  */
 export type LLMIPCChannelName = (typeof LLM_IPC_CHANNELS)[keyof typeof LLM_IPC_CHANNELS];
 /**
- * Model context variables injected into templates
+ * Model context variables injected into templates during createMessages()
+ *
+ * These variables enable templates to adapt based on the model's reasoning capabilities.
+ *
+ * **Key Usage Pattern:**
+ * When adding thinking tag instructions, use requires_tags_for_thinking:
+ * ```
+ * {{ requires_tags_for_thinking ? 'Write your reasoning in <thinking> tags first.' : '' }}
+ * ```
+ *
+ * This ensures:
+ * - Models with active native reasoning get clean prompts
+ * - Models without native reasoning get explicit tag instructions
  */
 export interface ModelContext {
-    /** Whether reasoning/thinking is enabled for this request */
-    thinking_enabled: boolean;
-    /** Whether the model supports reasoning/thinking */
-    thinking_available: boolean;
+    /**
+     * Whether native reasoning is CURRENTLY ACTIVE for this request.
+     * - true: Model is using built-in reasoning (Claude 4, o4-mini, Gemini with reasoning enabled)
+     * - false: No native reasoning is active (model doesn't support it OR it's been disabled)
+     *
+     * Use in templates when adapting behavior based on whether native reasoning is happening.
+     */
+    native_reasoning_active: boolean;
+    /**
+     * Whether the model HAS THE CAPABILITY to use native reasoning.
+     * - true: Model supports native reasoning (may or may not be enabled)
+     * - false: Model does not support native reasoning
+     *
+     * Use in templates to check if native reasoning is possible (not necessarily active).
+     */
+    native_reasoning_capable: boolean;
+    /**
+     * Whether this model/request requires thinking tags to produce reasoning.
+     * - true: Native reasoning is not active, model needs prompting to use <thinking> tags
+     * - false: Native reasoning is active, no need for thinking tags
+     *
+     * Use in templates for conditional thinking tag instructions:
+     * {{ requires_tags_for_thinking ? 'Write your reasoning in <thinking> tags first.' : '' }}
+     */
+    requires_tags_for_thinking: boolean;
     /** The resolved model ID */
     model_id: string;
     /** The resolved provider ID */
     provider_id: string;
-    /** Reasoning effort level if specified */
+    /** Reasoning effort level if specified ('low', 'medium', or 'high') */
     reasoning_effort?: string;
     /** Reasoning max tokens if specified */
     reasoning_max_tokens?: number;