npm - @smythos/sre - Versions diffs - 1.7.18 → 1.7.40 - Mend

@smythos/sre 1.7.18 → 1.7.40

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects those changes as the package versions appear in their respective public registries.

Files changed (69) hide show

package/src/subsystems/LLMManager/LLM.inference.ts CHANGED Viewed

@@ -13,14 +13,30 @@ import { TLLMChatResponse, TLLMMessageRole, TLLMModel, TLLMParams } from '@sre/t
 import { LLMConnector } from './LLM.service/LLMConnector';
 import { IModelsProviderRequest, ModelsProviderConnector } from './ModelsProvider.service/ModelsProviderConnector';
-const console = Logger('LLMInference');
+const logger = Logger('LLMInference');
 type TPromptParams = { query?: string; contextWindow?: any[]; files?: any[]; params: TLLMParams; onFallback?: (data: any) => void };
 export class LLMInference {
-    private model: string | TLLMModel;
-    private llmConnector: LLMConnector;
-    private modelProviderReq: IModelsProviderRequest;
+    private _model: string | TLLMModel;
+    public get model() {
+        return this._model;
+    }
+    public get modelId() {
+        return typeof this._model === 'string' ? this._model : this._model?.modelId;
+    }
+    private _llmConnector: LLMConnector;
+    public get llmConnector() {
+        return this._llmConnector;
+    }
+    private _modelProviderReq: IModelsProviderRequest;
+    public get modelProviderReq() {
+        return this._modelProviderReq;
+    }
+    private _llmProviderName: string;
+    public get llmProviderName() {
+        return this._llmProviderName;
+    }
     public teamId?: string;
     public static async getInstance(model: string | TLLMModel, candidate: AccessCandidate) {
@@ -34,18 +50,18 @@ export class LLMInference {
         const llmInference = new LLMInference();
         llmInference.teamId = teamId;
-        llmInference.modelProviderReq = modelsProvider.requester(candidate);
+        llmInference._modelProviderReq = modelsProvider.requester(candidate);
-        const llmProvider = await llmInference.modelProviderReq.getProvider(model);
-        if (llmProvider) {
-            llmInference.llmConnector = ConnectorService.getLLMConnector(llmProvider);
+        llmInference._llmProviderName = await llmInference._modelProviderReq.getProvider(model);
+        if (llmInference._llmProviderName) {
+            llmInference._llmConnector = ConnectorService.getLLMConnector(llmInference._llmProviderName);
         }
-        if (!llmInference.llmConnector) {
-            console.error(`Model ${model} unavailable for team ${teamId}`);
+        if (!llmInference._llmConnector) {
+            logger.warn(`Model ${model} unavailable for team ${teamId}`);
         }
-        llmInference.model = model;
+        llmInference._model = model;
         return llmInference;
     }
@@ -53,32 +69,32 @@ export class LLMInference {
     public static user(candidate: AccessCandidate): any {}
     public get connector(): LLMConnector {
-        return this.llmConnector;
+        return this._llmConnector;
     }
     public async prompt({ query, contextWindow, files, params, onFallback = () => {} }: TPromptParams, isInFallback: boolean = false) {
         let messages = contextWindow || [];
         if (query) {
-            const content = this.llmConnector.enhancePrompt(query, params);
+            const content = this._llmConnector.enhancePrompt(query, params);
             messages.push({ role: TLLMMessageRole.User, content });
         }
         // Reset the model, since the fallback model may change — especially when using user custom models.
-        params.model = this.model;
+        params.model = this._model;
         params.messages = messages;
         params.files = files;
         // If a fallback model is used, trigger the onFallback callback to notify the caller.
         if (isInFallback && typeof onFallback === 'function') {
-            onFallback({ model: this.model });
+            onFallback({ model: this._model });
         }
         try {
-            let response: TLLMChatResponse = await this.llmConnector.requester(AccessCandidate.agent(params.agentId)).request(params);
+            let response: TLLMChatResponse = await this._llmConnector.requester(AccessCandidate.agent(params.agentId)).request(params);
-            const result = this.llmConnector.postProcess(response?.content);
+            const result = this._llmConnector.postProcess(response?.content);
             if (result.error) {
                 // If the model stopped before completing the response, this is usually due to output token limit reached.
                 if (response.finishReason !== 'stop') {
@@ -102,12 +118,12 @@ export class LLMInference {
                     }
                 } catch (fallbackError) {
                     // If fallback also failed, log it but continue to throw original error
-                    console.warn('Fallback also failed:', fallbackError);
+                    logger.warn('Fallback also failed:', fallbackError);
                 }
             }
             // If fallback was not attempted or failed, throw the original error
-            console.error('Error in chatRequest: ', error);
+            logger.error('Error in chatRequest: ', error);
             throw error;
         }
     }
@@ -116,23 +132,23 @@ export class LLMInference {
         let messages = contextWindow || [];
         if (query) {
-            const content = this.llmConnector.enhancePrompt(query, params);
+            const content = this._llmConnector.enhancePrompt(query, params);
             messages.push({ role: TLLMMessageRole.User, content });
         }
         // Reset the model, since the fallback model may change — especially when using user custom models.
-        params.model = this.model;
+        params.model = this._model;
         params.messages = messages;
         params.files = files;
         // If a fallback model is used, trigger the onFallback callback to notify the caller.
         if (isInFallback && typeof onFallback === 'function') {
-            onFallback({ model: this.model });
+            onFallback({ model: this._model });
         }
         try {
-            return await this.llmConnector.user(AccessCandidate.agent(params.agentId)).streamRequest(params);
+            return await this._llmConnector.user(AccessCandidate.agent(params.agentId)).streamRequest(params);
         } catch (error) {
             // Attempt fallback for custom models (only if not already in fallback)
             if (!isInFallback) {
@@ -152,12 +168,12 @@ export class LLMInference {
                     }
                 } catch (fallbackError) {
                     // If fallback also failed, log it but continue to return error emitter
-                    console.warn('Fallback also failed:', fallbackError);
+                    logger.warn('Fallback also failed:', fallbackError);
                 }
             }
             // If fallback was not attempted or failed, return error emitter
-            console.error('Error in streamRequest:', error);
+            logger.error('Error in streamRequest:', error);
             const dummyEmitter = new EventEmitter();
             process.nextTick(() => {
@@ -224,22 +240,22 @@ export class LLMInference {
      * @returns The result from the fallback execution, or null if fallback should not be attempted
      */
     private async executeFallback(methodName: 'prompt' | 'promptStream', args: TPromptParams): Promise<any> {
-        const isCustomModel = await this.modelProviderReq.isUserCustomLLM(this.model);
-        const fallbackModel = await this.modelProviderReq.getFallbackLLM(this.model);
+        const isCustomModel = await this._modelProviderReq.isUserCustomLLM(this._model);
+        const fallbackModel = await this._modelProviderReq.getFallbackLLM(this._model);
         // Only execute fallback if it's a custom model with a configured fallback
         if (!isCustomModel || !fallbackModel) {
             return null;
         }
-        console.info(`Attempting fallback from ${this.model} to ${fallbackModel}`);
+        logger.info(`Attempting fallback from ${this._model} to ${fallbackModel}`);
         // Mutate the model and connector to use fallback
-        this.model = fallbackModel;
+        this._model = fallbackModel;
-        const llmProvider = await this.modelProviderReq.getProvider(fallbackModel);
+        const llmProvider = await this._modelProviderReq.getProvider(fallbackModel);
         if (llmProvider) {
-            this.llmConnector = ConnectorService.getLLMConnector(llmProvider);
+            this._llmConnector = ConnectorService.getLLMConnector(llmProvider);
         }
         // Call the appropriate method with isInFallback=true to prevent further fallbacks
@@ -252,13 +268,13 @@ export class LLMInference {
     public async imageGenRequest({ query, files, params }: TPromptParams) {
         params.prompt = query;
-        return this.llmConnector.user(AccessCandidate.agent(params.agentId)).imageGenRequest(params);
+        return this._llmConnector.user(AccessCandidate.agent(params.agentId)).imageGenRequest(params);
     }
     public async imageEditRequest({ query, files, params }: TPromptParams) {
         params.prompt = query;
         params.files = files;
-        return this.llmConnector.user(AccessCandidate.agent(params.agentId)).imageEditRequest(params);
+        return this._llmConnector.user(AccessCandidate.agent(params.agentId)).imageEditRequest(params);
     }
     //@deprecated
@@ -269,11 +285,11 @@ export class LLMInference {
                 throw new Error('Input messages are required.');
             }
-            const model = params.model || this.model;
+            const model = params.model || this._model;
-            return await this.llmConnector.user(AccessCandidate.agent(agentId)).streamRequest({ ...params, model });
+            return await this._llmConnector.user(AccessCandidate.agent(agentId)).streamRequest({ ...params, model });
         } catch (error) {
-            console.error('Error in streamRequest:', error);
+            logger.error('Error in streamRequest:', error);
             const dummyEmitter = new EventEmitter();
             process.nextTick(() => {
@@ -306,11 +322,11 @@ export class LLMInference {
             //FIXME we need to update the connector multimediaStreamRequest in order to ignore prompt param if not provided
             const userMessage = Array.isArray(params.messages) ? params.messages.pop() : {};
             const prompt = userMessage?.content || '';
-            const model = params.model || this.model;
+            const model = params.model || this._model;
-            return await this.llmConnector.user(AccessCandidate.agent(agentId)).multimodalStreamRequest(prompt, { ...params, model });
+            return await this._llmConnector.user(AccessCandidate.agent(agentId)).multimodalStreamRequest(prompt, { ...params, model });
         } catch (error: any) {
-            console.error('Error in multimodalRequest: ', error);
+            logger.error('Error in multimodalRequest: ', error);
             throw error;
         }
@@ -337,12 +353,12 @@ export class LLMInference {
         params.files = _files;
         try {
-            prompt = this.llmConnector.enhancePrompt(prompt, config);
-            const model = params.model || this.model;
+            prompt = this._llmConnector.enhancePrompt(prompt, config);
+            const model = params.model || this._model;
-            return await this.llmConnector.user(AccessCandidate.agent(agentId)).multimodalStreamRequest(prompt, { ...params, model });
+            return await this._llmConnector.user(AccessCandidate.agent(agentId)).multimodalStreamRequest(prompt, { ...params, model });
         } catch (error: any) {
-            console.error('Error in multimodalRequest: ', error);
+            logger.error('Error in multimodalRequest: ', error);
             throw error;
         }
@@ -376,7 +392,7 @@ export class LLMInference {
         //#region get max model context
-        const modelInfo = await this.modelProviderReq.getModelInfo(this.model, true);
+        const modelInfo = await this._modelProviderReq.getModelInfo(this._model, true);
         let maxModelContext = modelInfo?.tokens;
         let maxModelOutputTokens = modelInfo?.completionTokens || modelInfo?.tokens;
         // const isStandardLLM = LLMRegistry.isStandardLLM(this.model);
@@ -399,10 +415,10 @@ export class LLMInference {
         }
         if (maxInputContext <= 0) {
-            console.warn('Max input context is 0, returning empty context window, This usually indicates a wrong model configuration');
+            logger.warn('Max input context is 0, returning empty context window, This usually indicates a wrong model configuration');
         }
-        console.debug(
+        logger.debug(
             `Context Window Configuration: Max Input Tokens: ${maxInputContext}, Max Output Tokens: ${maxOutputContext}, Max Model Tokens: ${maxModelContext}`
         );
         const systemMessage = { role: 'system', content: systemPrompt };
@@ -473,7 +489,7 @@ function countTokens(content: any, model: 'gpt-4o' | 'gpt-4o-mini' = 'gpt-4o') {
         const tokens = encodeChat([{ role: 'user', content: _stringifiedContent } as ChatMessage], model);
         return tokens.length;
     } catch (error) {
-        console.warn('Error in countTokens: ', error);
+        logger.warn('Error in countTokens: ', error);
         return 0;
     }
 }

package/src/subsystems/LLMManager/LLM.service/connectors/Anthropic.class.ts CHANGED Viewed

@@ -1,5 +1,6 @@
 import EventEmitter from 'events';
 import Anthropic from '@anthropic-ai/sdk';
+import type { MessageStreamEvents } from '@anthropic-ai/sdk/lib/MessageStream';
 import { JSON_RESPONSE_INSTRUCTION, BUILT_IN_MODEL_PREFIX } from '@sre/constants';
 import { BinaryInput } from '@sre/helpers/BinaryInput.helper';
@@ -35,6 +36,26 @@ const LEGACY_THINKING_MODELS = ['smythos/claude-3.7-sonnet-thinking', 'claude-3.
 // Type aliases
 type AnthropicMessageParams = Anthropic.MessageCreateParamsNonStreaming | Anthropic.Messages.MessageStreamParams;
+type AnthropicStreamEventType = keyof MessageStreamEvents;
+// Event names automatically validated against MessageStreamEvents type
+// TypeScript will error if any events are missing or incorrect
+// This ensures we always use the correct event names as defined by Anthropic SDK
+const AnthropicStreamEvent = {
+    connect: 'connect',
+    streamEvent: 'streamEvent',
+    text: 'text',
+    citation: 'citation',
+    inputJson: 'inputJson',
+    thinking: 'thinking',
+    signature: 'signature',
+    message: 'message',
+    contentBlock: 'contentBlock',
+    finalMessage: 'finalMessage',
+    error: 'error',
+    abort: 'abort',
+    end: 'end',
+} satisfies Record<keyof MessageStreamEvents, AnthropicStreamEventType>;
 // TODO [Forhad]: implement proper typing
@@ -132,34 +153,38 @@ export class AnthropicConnector extends LLMConnector {
             const needsPrefillInjection = this.hasPrefillText(body.messages);
             let prefillInjected = false;
-            stream.on('streamEvent', (event: any) => {
+            stream.on(AnthropicStreamEvent.streamEvent, (event: any) => {
                 if (event.message?.usage) {
                     //console.log('usage', event.message?.usage);
                 }
             });
-            stream.on('error', (error) => {
+            stream.on(AnthropicStreamEvent.error, (error) => {
                 //console.log('error', error);
-                emitter.emit('error', error);
+                emitter.emit(TLLMEvent.Error, error);
             });
-            stream.on('text', (text: string) => {
+            stream.on(AnthropicStreamEvent.message, (message) => {
+                emitter.emit(TLLMEvent.Data, message);
+            });
+            stream.on(AnthropicStreamEvent.text, (text: string) => {
                 // Inject prefill text only once at the very beginning if needed
                 if (needsPrefillInjection && !prefillInjected) {
                     text = `${PREFILL_TEXT_FOR_JSON_RESPONSE}${text}`;
                     prefillInjected = true;
                 }
-                emitter.emit('content', text);
+                emitter.emit(TLLMEvent.Content, text);
             });
-            stream.on('thinking', (thinking) => {
+            stream.on(AnthropicStreamEvent.thinking, (thinking) => {
                 // Handle thinking blocks during streaming
-                emitter.emit('thinking', thinking);
+                emitter.emit(TLLMEvent.Thinking, thinking);
             });
-            stream.on('finalMessage', (finalMessage) => {
+            stream.on(AnthropicStreamEvent.finalMessage, (finalMessage) => {
                 let finishReason = 'stop';
                 // Preserve thinking blocks for subsequent tool interactions
                 thinkingBlocks = finalMessage.content.filter((block) => block.type === 'thinking' || block.type === 'redacted_thinking');
@@ -197,12 +222,12 @@ export class AnthropicConnector extends LLMConnector {
                     usage_data.push(reportedUsage);
                 }
                 if (finishReason !== 'stop' && finishReason !== 'end_turn') {
-                    emitter.emit('interrupted', finishReason);
+                    emitter.emit(TLLMEvent.Interrupted, finishReason);
                 }
                 //only emit end event after processing the final message
                 setTimeout(() => {
-                    emitter.emit('end', toolsData, usage_data, finishReason);
+                    emitter.emit(TLLMEvent.End, toolsData, usage_data, finishReason);
                 }, 100);
             });

package/src/subsystems/LLMManager/LLM.service/connectors/Bedrock.class.ts CHANGED Viewed

@@ -126,14 +126,14 @@ export class BedrockConnector extends LLMConnector {
                         // Handle message start
                         if (chunk.messageStart) {
                             currentMessage.role = chunk.messageStart.role || '';
-                            emitter.emit('data', { role: currentMessage.role });
+                            emitter.emit(TLLMEvent.Data, { role: currentMessage.role });
                         }
                         // Handle content deltas
                         if (chunk.contentBlockDelta?.delta?.text) {
                             currentMessage.content += chunk.contentBlockDelta.delta.text;
-                            emitter.emit('data', chunk.contentBlockDelta.delta.text);
-                            emitter.emit('content', chunk.contentBlockDelta.delta.text, currentMessage.role);
+                            emitter.emit(TLLMEvent.Data, chunk.contentBlockDelta.delta.text);
+                            emitter.emit(TLLMEvent.Content, chunk.contentBlockDelta.delta.text, currentMessage.role);
                         }
                         // Handle tool use start
@@ -175,10 +175,18 @@ export class BedrockConnector extends LLMConnector {
                         // Handle message completion
                         if (chunk.messageStop) {
+                            const finishReason = chunk.messageStop.stopReason || 'stop';
                             if (currentMessage.toolCalls.length > 0) {
                                 emitter.emit(TLLMEvent.ToolInfo, currentMessage.toolCalls);
                             }
-                            emitter.emit(TLLMEvent.End, currentMessage.toolCalls);
+                            // Emit interrupted event if finishReason is not 'stop'
+                            if (finishReason !== 'stop' && finishReason !== 'end_turn') {
+                                emitter.emit(TLLMEvent.Interrupted, finishReason);
+                            }
+                            emitter.emit(TLLMEvent.End, currentMessage.toolCalls, [], finishReason);
                         }
                         if (chunk?.metadata?.usage) {

package/src/subsystems/LLMManager/LLM.service/connectors/Echo.class.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 import { JSONContent } from '@sre/helpers/JsonContent.helper';
 import { LLMConnector } from '../LLMConnector';
 import EventEmitter from 'events';
-import { APIKeySource, ILLMRequestFuncParams, TLLMChatResponse, TLLMPreparedParams } from '@sre/types/LLM.types';
+import { APIKeySource, ILLMRequestFuncParams, TLLMChatResponse, TLLMEvent, TLLMPreparedParams } from '@sre/types/LLM.types';
 import { Logger } from '@sre/helpers/Log.helper';
 import { delay } from '@sre/utils/index';
 import { hookAsync } from '@sre/Core/HookService';
@@ -54,13 +54,13 @@ export class EchoConnector extends LLMConnector {
                     const isLastChunk = i === chunks.length - 1;
                     // Add space between chunks except for the last one to avoid trailing space in file URLs
                     const delta = { content: chunks[i] + (isLastChunk ? '' : ' ') };
-                    emitter.emit('data', delta);
-                    emitter.emit('content', delta.content);
+                    emitter.emit(TLLMEvent.Data, delta);
+                    emitter.emit(TLLMEvent.Content, delta.content);
                 }
                 // Emit end event after all chunks are processed
                 setTimeout(() => {
-                    emitter.emit('end', [], []); // Empty arrays for toolsData and usage_data
+                    emitter.emit(TLLMEvent.End, [], [], 'stop'); // Empty arrays for toolsData and usage_data, with finishReason
                 }, 100);
             })();