@equinor/fusion-framework-cli-plugin-ai-chat 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/src/chat.ts ADDED
@@ -0,0 +1,429 @@
+ import { createCommand, createOption } from 'commander';
+ import type { ChatMessage } from '@equinor/fusion-framework-module-ai/lib';
+ import { from } from 'rxjs';
+ import {
+   withOptions as withAiOptions,
+   type AiOptions,
+ } from '@equinor/fusion-framework-cli-plugin-ai-base/command-options';
+ import { createInterface } from 'node:readline';
+
+ import { setupFramework } from '@equinor/fusion-framework-cli-plugin-ai-base';
+ import { createSystemMessage } from './system-message-template.js';
+ import {
+   RunnablePassthrough,
+   RunnableSequence,
+   type RunnableInterface,
+ } from '@langchain/core/runnables';
+ import { StringOutputParser } from '@langchain/core/output_parsers';
+
+ /**
+  * CLI command: `ai chat`
+  *
+  * Interactive chat with Large Language Models, using a readline-driven prompt for a smooth CLI experience.
+  * Enhanced with vector store context retrieval for more accurate and relevant responses.
+  *
+  * Features:
+  * - Interactive conversation mode with readline prompts
+  * - Real-time streaming responses from AI models
+  * - Intelligent message history compression using AI summarization
+  * - Automatic vector store context retrieval for enhanced responses
+  * - Special commands: exit, quit, clear, help
+  * - Support for Azure OpenAI models and Azure Cognitive Search
+  * - Live typing effect for AI responses
+  * - Configurable context retrieval limits
+  *
+  * Usage:
+  *   $ ffc ai chat [options]
+  *
+  * Options:
+  *   --openai-api-key <key>                 API key for Azure OpenAI
+  *   --openai-api-version <version>         API version (default: 2024-02-15-preview)
+  *   --openai-instance <name>               Azure OpenAI instance name
+  *   --openai-chat-deployment <name>        Azure OpenAI chat deployment name
+  *   --openai-embedding-deployment <name>   Azure OpenAI embedding deployment name
+  *   --azure-search-endpoint <url>          Azure Search endpoint URL
+  *   --azure-search-api-key <key>           Azure Search API key
+  *   --azure-search-index-name <name>       Azure Search index name
+  *   --use-context                          Use vector store context (default: true)
+  *   --context-limit <number>               Max context documents to retrieve (default: 5)
+  *   --history-limit <number>               Max messages to keep in conversation history (default: 20, auto-compresses at 10)
+  *   --verbose                              Enable verbose output
+  *
+  * Environment Variables:
+  *   AZURE_OPENAI_API_KEY                     API key for Azure OpenAI
+  *   AZURE_OPENAI_API_VERSION                 API version
+  *   AZURE_OPENAI_INSTANCE_NAME               Instance name
+  *   AZURE_OPENAI_CHAT_DEPLOYMENT_NAME        Chat deployment name
+  *   AZURE_OPENAI_EMBEDDING_DEPLOYMENT_NAME   Embedding deployment name
+  *   AZURE_SEARCH_ENDPOINT                    Azure Search endpoint
+  *   AZURE_SEARCH_API_KEY                     Azure Search API key
+  *   AZURE_SEARCH_INDEX_NAME                  Azure Search index name
+  *
+  * Interactive Commands:
+  *   exit/quit - End the conversation
+  *   clear     - Clear conversation history
+  *   help      - Show available commands
+  *   Ctrl+C    - Exit immediately
+  *
+  * Examples:
+  *   $ ffc ai chat
+  *   $ ffc ai chat --context-limit 10
+  *   $ ffc ai chat --history-limit 100
+  *   $ ffc ai chat --verbose --azure-search-endpoint https://my-search.search.windows.net
+  */
+ /**
+  * Command options for the chat command
+  */
+ type CommandOptions = AiOptions & {
+   /** Enable verbose output for debugging */
+   verbose?: boolean;
+   /** Maximum number of context documents to retrieve from vector store */
+   contextLimit?: number;
+   /** Maximum number of messages to keep in conversation history */
+   historyLimit?: number;
+ };
+
+ const _command = createCommand('chat')
+   .description('Interactive chat with Large Language Models')
+   .addOption(createOption('--verbose', 'Enable verbose output').default(false))
+   .addOption(
+     createOption('--context-limit <number>', 'Maximum number of context documents to retrieve')
+       .default(5)
+       // Parse explicitly in base 10; passing parseInt directly would receive
+       // Commander's second argument (the previous value) as a radix.
+       .argParser((value) => Number.parseInt(value, 10)),
+   )
+   .addOption(
+     createOption(
+       '--history-limit <number>',
+       'Maximum number of messages to keep in conversation history',
+     )
+       .default(20)
+       .argParser((value) => Number.parseInt(value, 10)),
+   )
+   .action(async (options: CommandOptions) => {
+     // Initialize the framework
+     const framework = await setupFramework(options);
+
+     // Get the AI provider
+     const aiProvider = framework.ai;
+
+     if (options.verbose) {
+       console.log('āœ… Framework initialized successfully');
+       console.log('šŸ’¬ Starting interactive chat...');
+       console.log('šŸ” Context retrieval enabled');
+       console.log(`šŸ“ Message history limit: ${options.historyLimit || 20} messages`);
+       if (options.azureSearchEndpoint) {
+         console.log(`šŸ“š Using vector store: ${options.azureSearchIndexName}`);
+       } else {
+         console.log('āš ļø No vector store configured - context retrieval will be skipped');
+       }
+       console.log('šŸ” Using model:', options.openaiChatDeployment);
+       console.log('Type "exit" or "quit" to end the conversation');
+       console.log('Type "clear" to clear the conversation history');
+       console.log('Press Ctrl+C to exit immediately');
+       console.log('');
+     }
+
+     // Start interactive chat
+     if (!options.openaiChatDeployment) {
+       throw new Error('Chat deployment name is required');
+     }
+     if (!options.azureSearchIndexName) {
+       throw new Error('Azure Search index name is required');
+     }
+
+     const chatService = framework.ai.getService('chat', options.openaiChatDeployment);
+     const vectorStoreService = aiProvider.getService('search', options.azureSearchIndexName);
+
+     if (options.verbose) {
+       console.log('šŸ”§ Configuring retriever with options:', {
+         k: options.contextLimit || 5,
+         searchType: 'similarity',
+       });
+     }
+
+     // Configure retriever with similarity search (not MMR) for more predictable results
+     // MMR (Maximum Marginal Relevance) can sometimes cause issues with Azure Search
+     const retriever = vectorStoreService.asRetriever({
+       k: options.contextLimit || 5,
+       searchType: 'similarity',
+     });
+
+     /**
+      * Retrieves relevant context documents from the vector store for a given query
+      * @param input - The user's query string
+      * @returns Promise resolving to formatted context string or error message
+      */
+     const retrieveContext = async (input: string) => {
+       try {
+         if (options.verbose) {
+           console.log('šŸ” Retrieving context for query:', input);
+           const docs = await retriever.invoke(input);
+           console.log('šŸ“„ Retrieved documents:', docs?.length || 0);
+           for (const doc of docs) {
+             console.log('šŸ“„ Document:', {
+               pageContent: `${doc.pageContent.substring(0, 100)}...`,
+               metadata: doc.metadata,
+             });
+           }
+           if (!docs || docs.length === 0) {
+             return 'No relevant context found.';
+           }
+           return docs.map((doc) => doc.pageContent).join('\n');
+         }
+         const docs = await retriever.invoke(input);
+         if (!docs || docs.length === 0) {
+           return 'No relevant context found.';
+         }
+         return docs.map((doc) => doc.pageContent).join('\n');
+       } catch (error) {
+         console.error('āŒ Error retrieving context:', error);
+         return 'Error retrieving context.';
+       }
+     };
+
+     // Create a custom runnable that formats the prompt as ChatMessage[]
+     // This chain step retrieves context and formats it into a proper message array
+     const formatPromptAsMessages = new RunnablePassthrough().pipe(
+       async (input: { userMessage: string; messageHistory: ChatMessage[] }) => {
+         // Retrieve relevant context from vector store based on user's message
+         const context = await retrieveContext(input.userMessage);
+         // Build system message with retrieved context for RAG (Retrieval-Augmented Generation)
+         // Emphasizes using FUSION framework knowledge from the provided context
+         const systemMessage = createSystemMessage(context);
+
+         // Build the complete message array with system message, history, and current user message
+         // Order: system message (with context) -> conversation history -> current user message
+         const messages: ChatMessage[] = [
+           { role: 'system', content: systemMessage },
+           ...input.messageHistory,
+           { role: 'user', content: input.userMessage },
+         ];
+
+         return messages;
+       },
+     );
+
+     // Create the chatbot chain using LangChain's RunnableSequence
+     // Chain flow: format messages -> invoke chat model -> parse string output
+     // Note: Type assertion needed because IModel extends RunnableInterface but TypeScript
+     // doesn't recognize the compatibility without explicit casting
+     const chain = RunnableSequence.from([
+       formatPromptAsMessages,
+       chatService as unknown as RunnableInterface,
+       new StringOutputParser(),
+     ]);
+
+     const messageHistory: ChatMessage[] = [];
+
+     /**
+      * Summarizes the oldest messages in the conversation history using AI
+      * This helps compress long conversation histories while preserving important context
+      * @param messages - Array of messages to summarize
+      * @returns Promise resolving to a summary message that can replace the original messages
+      */
+     const summarizeOldMessages = async (messages: ChatMessage[]): Promise<ChatMessage> => {
+       // Convert messages to a text format for summarization
+       const conversationText = messages.map((msg) => `${msg.role}: ${msg.content}`).join('\n');
+
+       const summaryPrompt = `Please provide a concise summary of the following conversation history. Focus on key topics, decisions, and important context that should be remembered for the ongoing conversation:
+
+ ${conversationText}
+
+ Summary:`;
+
+       try {
+         // Use the chat service to generate a summary of the conversation
+         const summaryResponse = await chatService.invoke([
+           { role: 'user', content: summaryPrompt },
+         ]);
+         return {
+           role: 'assistant',
+           content: `[Previous conversation summary: ${summaryResponse}]`,
+         };
+       } catch (error) {
+         console.error('āŒ Error summarizing conversation:', error);
+         // Fallback to a simple summary if AI summarization fails
+         // This ensures the conversation can continue even if summarization fails
+         return {
+           role: 'assistant',
+           content: `[Previous conversation summary: ${messages.length} messages about various topics]`,
+         };
+       }
+     };
+
+     /**
+      * Manages message history with intelligent compression using AI summarization
+      * Implements a two-stage compression strategy:
+      * 1. When history reaches 10 messages, summarize oldest 5 messages using AI
+      * 2. If history still exceeds limit after compression, remove oldest non-summary messages
+      * @param history - Current message history array (will be mutated)
+      * @param newMessage - New message to add to history
+      * @param limit - Maximum number of messages to keep in history
+      * @returns Updated message history with compression applied
+      */
+     const addMessageToHistory = async (
+       history: ChatMessage[],
+       newMessage: ChatMessage,
+       limit: number,
+     ): Promise<ChatMessage[]> => {
+       history.push(newMessage);
+
+       // Stage 1: AI-based compression when history reaches 10 messages
+       // Summarize the oldest 5 messages and replace them with a single summary message
+       // This preserves important context while reducing token usage
+       let hasSummary = false;
+       if (history.length >= 10) {
+         if (options.verbose) {
+           console.log('šŸ”„ Compressing conversation history with AI summarization...');
+         }
+
+         // Remove oldest 5 messages and summarize them
+         const oldestMessages = history.splice(0, 5);
+         const summary = await summarizeOldMessages(oldestMessages);
+
+         // Insert the summary at the beginning to maintain chronological order
+         history.unshift(summary);
+         hasSummary = true;
+
+         if (options.verbose) {
+           console.log(
+             `šŸ“ Compressed 5 messages into 1 summary. History now has ${history.length} messages.`,
+           );
+         }
+       }
+
+       // Stage 2: Hard limit enforcement if history still exceeds limit after compression
+       // If we just created a summary, start removing from position 1 to preserve it
+       // Otherwise, remove from position 0 as usual
+       if (history.length > limit) {
+         const messagesToRemove = history.length - limit;
+         const startIndex = hasSummary ? 1 : 0;
+         // Ensure we don't remove more messages than available (keeping summary if it exists)
+         const maxRemovable = hasSummary ? history.length - 2 : history.length - 1;
+         const actualRemoval = Math.min(messagesToRemove, Math.max(0, maxRemovable));
+
+         if (actualRemoval > 0) {
+           history.splice(startIndex, actualRemoval);
+
+           if (options.verbose) {
+             console.log(
+               `šŸ—‘ļø Removed ${actualRemoval} messages. History now has ${history.length} messages.`,
+             );
+           }
+         }
+       }
+
+       return history;
+     };
+
+     console.log('šŸ’¬ Chat ready! Start typing your message...\n');
+     console.log('šŸ’” Press Ctrl+C to exit at any time\n');
+
+     // Create readline interface for better Ctrl+C handling
+     // This provides better control over input/output and signal handling
+     const rl = createInterface({
+       input: process.stdin,
+       output: process.stdout,
+     });
+
+     // Handle Ctrl+C gracefully to prevent abrupt termination
+     const handleExit = () => {
+       console.log('\n\nšŸ‘‹ Goodbye!');
+       rl.close();
+       process.exit(0);
+     };
+
+     process.on('SIGINT', handleExit);
+     process.on('SIGTERM', handleExit);
+
+     // Interactive chat loop - continues until user exits
+     while (true) {
+       try {
+         // Prompt user for input using readline
+         const userMessage = await new Promise<string>((resolve) => {
+           rl.question('You: ', (answer) => {
+             resolve(answer.trim());
+           });
+         });
+
+         // Skip empty messages
+         if (!userMessage) {
+           console.log('Please enter a message\n');
+           continue;
+         }
+
+         // Handle special commands (exit, quit, help, clear)
+         const normalizedMessage = userMessage.toLowerCase();
+         if (normalizedMessage === 'exit' || normalizedMessage === 'quit') {
+           handleExit();
+         }
+         if (normalizedMessage === 'help') {
+           console.log('\nAvailable commands:');
+           console.log('  exit/quit - End the conversation');
+           console.log('  clear     - Clear conversation history');
+           console.log('  help      - Show available commands\n');
+           continue;
+         }
+         if (normalizedMessage === 'clear') {
+           messageHistory.length = 0;
+           console.log('\n🧹 Conversation history cleared!\n');
+           continue;
+         }
+
+         // Add user message to history (with automatic compression if needed)
+         await addMessageToHistory(
+           messageHistory,
+           { role: 'user', content: userMessage },
+           options.historyLimit || 20,
+         );
+
+         // Show typing indicator
+         console.log('\nšŸ¤– AI Response:');
+
+         // Use LangChain runnable chain for RAG (Retrieval-Augmented Generation)
+         try {
+           if (options.verbose) {
+             console.log('šŸ” Using LangChain chain with context retrieval...');
+             console.log(`šŸ“ Message history contains ${messageHistory.length} messages`);
+           }
+
+           // Stream the response from the chain for real-time output
+           const responseStream = await chain.stream({ userMessage, messageHistory });
+
+           // Collect the full response while streaming chunks to stdout
+           // This allows users to see the response as it's generated
+           const fullResponse = await new Promise<string>((resolve, reject) => {
+             let accumulated = '';
+             from(responseStream).subscribe({
+               next: (chunk) => {
+                 // Write each chunk immediately for streaming effect
+                 process.stdout.write(String(chunk));
+                 accumulated += chunk;
+               },
+               error: (error) => {
+                 reject(error);
+               },
+               complete: () => {
+                 resolve(accumulated);
+               },
+             });
+           });
+
+           // Add AI response to history for context in future messages
+           await addMessageToHistory(
+             messageHistory,
+             { role: 'assistant', content: fullResponse },
+             options.historyLimit || 20,
+           );
+         } catch (error) {
+           console.error('\nāŒ Chain error:', error);
+           console.log('The response could not be completed - please try again.');
+         }
+         console.log('');
+       } catch (error) {
+         console.error('\nāŒ Error during chat:', error);
+         console.log('');
+       }
+     }
+   });
+
+ /**
+  * CLI command for interactive chat with AI models.
+  * Enhanced with AI options including chat, embedding, and search capabilities.
+  */
+ export const command = withAiOptions(_command, {
+   includeChat: true,
+   includeEmbedding: true,
+   includeSearch: true,
+ });
+
+ export default command;
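For reference, the two-stage compression in addMessageToHistory can be exercised in isolation. The sketch below substitutes a stub for the AI summarizer call; the stub and sample messages are illustrative, not part of the package:

type Msg = { role: 'system' | 'user' | 'assistant'; content: string };

// Stub standing in for the chatService.invoke() summarization above.
const summarize = (msgs: Msg[]): Msg => ({
  role: 'assistant',
  content: `[Previous conversation summary: ${msgs.length} messages]`,
});

const compress = (history: Msg[], limit: number): Msg[] => {
  // Stage 1: at 10 messages, fold the oldest 5 into one summary entry.
  let hasSummary = false;
  if (history.length >= 10) {
    history.unshift(summarize(history.splice(0, 5)));
    hasSummary = true;
  }
  // Stage 2: enforce the hard limit, never evicting a freshly created summary.
  if (history.length > limit) {
    history.splice(hasSummary ? 1 : 0, history.length - limit);
  }
  return history;
};

const history: Msg[] = Array.from({ length: 10 }, (_, i) => ({
  role: i % 2 === 0 ? 'user' : 'assistant',
  content: `message ${i + 1}`,
}));
console.log(compress(history, 20).length); // 6: one summary + messages 6-10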
package/src/index.ts ADDED
@@ -0,0 +1,13 @@
+ import type { Command } from 'commander';
+ import { registerAiPlugin } from '@equinor/fusion-framework-cli-plugin-ai-base';
+ import { command as chatCommand } from './chat.js';
+
+ /**
+  * Registers the AI chat plugin command with the CLI program
+  * @param program - The Commander program instance to register commands with
+  */
+ export function registerChatPlugin(program: Command): void {
+   registerAiPlugin(program, chatCommand);
+ }
+
+ export default registerChatPlugin;
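A minimal usage sketch for wiring the plugin into a host CLI. The program name is an assumption, and the `ai chat` mount point is inferred from the documented `ffc ai chat` usage rather than confirmed from registerAiPlugin's source:

import { Command } from 'commander';
import registerChatPlugin from '@equinor/fusion-framework-cli-plugin-ai-chat';

const program = new Command('ffc');
// registerAiPlugin is expected to mount the chat command under the `ai` group.
registerChatPlugin(program);
await program.parseAsync(process.argv);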
package/src/system-message-template.ts ADDED
@@ -0,0 +1,24 @@
+ /**
+  * System message template for FUSION framework chat assistant
+  *
+  * This template emphasizes using FUSION knowledge from the provided context
+  * to provide accurate and comprehensive answers about the FUSION framework.
+  *
+  * @param context - The retrieved context from the vector store containing FUSION knowledge
+  * @returns Formatted system message string for the AI chat assistant
+  */
+ export function createSystemMessage(context: string): string {
+   return `You are a helpful assistant specialized in the FUSION framework. Your primary goal is to use FUSION knowledge from the provided context to answer questions accurately and comprehensively.
+
+ **Priority Guidelines:**
+ 1. **Always prioritize FUSION-specific information** from the context below when answering questions
+ 2. Use FUSION framework patterns, APIs, conventions, and best practices from the context
+ 3. Reference specific FUSION modules, packages, or components mentioned in the context when relevant
+ 4. If the context contains FUSION documentation, code examples, or implementation details, use them as the basis for your response
+ 5. Only provide general answers if the context doesn't contain relevant FUSION information, and clearly state when you're doing so
+
+ **Context (FUSION Knowledge Base):**
+ ${context}
+
+ Remember: Your expertise comes from the FUSION context provided above. Use it as extensively as possible to provide accurate, framework-specific guidance.`;
+ }
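For illustration, the template can be exercised directly. The sample context lines below stand in for vector-store results and are hypothetical:

import { createSystemMessage } from './system-message-template.js';

// Hypothetical retrieved snippets standing in for Azure Search results.
const context = [
  'Fusion Framework modules are configured during framework initialization.',
  'AI services are resolved per deployment via the framework AI provider.',
].join('\n');

const systemMessage = createSystemMessage(context);
// The returned string embeds the context verbatim under the
// "Context (FUSION Knowledge Base)" heading of the prompt.
console.log(systemMessage.includes(context)); // true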
package/src/version.ts ADDED
@@ -0,0 +1,2 @@
+ // Generated by genversion.
+ export const version = '1.0.0';
package/tsconfig.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "extends": "../../../tsconfig.base.json",
+   "compilerOptions": {
+     "module": "NodeNext",
+     "moduleResolution": "NodeNext",
+     "outDir": "dist/esm",
+     "rootDir": "src",
+     "declarationDir": "./dist/types",
+     "baseUrl": "."
+   },
+   "references": [
+     {
+       "path": "../ai-base"
+     },
+     {
+       "path": "../../modules/ai"
+     },
+     {
+       "path": "../../modules/module"
+     }
+   ],
+   "include": ["src/**/*"],
+   "exclude": ["node_modules"]
+ }
package/vitest.config.ts ADDED
@@ -0,0 +1,14 @@
+ import { defineConfig } from 'vitest/config';
+
+ export default defineConfig({
+   test: {
+     globals: true,
+     environment: 'node',
+     include: ['src/**/*.test.ts'],
+     coverage: {
+       provider: 'v8',
+       reporter: ['text', 'json', 'html'],
+       exclude: ['**/*.test.ts', '**/dist/**', '**/node_modules/**'],
+     },
+   },
+ });