@juspay/neurolink 5.1.0 → 5.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +21 -9
- package/README.md +123 -126
- package/dist/agent/direct-tools.d.ts +6 -6
- package/dist/cli/commands/config.d.ts +3 -3
- package/dist/cli/commands/mcp.js +8 -7
- package/dist/cli/factories/command-factory.d.ts +4 -0
- package/dist/cli/factories/command-factory.js +63 -8
- package/dist/cli/index.js +87 -140
- package/dist/core/base-provider.d.ts +423 -0
- package/dist/core/base-provider.js +376 -0
- package/dist/core/constants.d.ts +2 -1
- package/dist/core/constants.js +2 -1
- package/dist/core/dynamic-models.d.ts +6 -6
- package/dist/core/evaluation.d.ts +19 -80
- package/dist/core/evaluation.js +185 -484
- package/dist/core/factory.d.ts +3 -3
- package/dist/core/factory.js +31 -91
- package/dist/core/service-registry.d.ts +47 -0
- package/dist/core/service-registry.js +112 -0
- package/dist/core/types.d.ts +8 -1
- package/dist/factories/compatibility-factory.js +1 -1
- package/dist/factories/provider-factory.d.ts +72 -0
- package/dist/factories/provider-factory.js +144 -0
- package/dist/factories/provider-registry.d.ts +38 -0
- package/dist/factories/provider-registry.js +107 -0
- package/dist/index.d.ts +4 -3
- package/dist/index.js +2 -4
- package/dist/lib/agent/direct-tools.d.ts +6 -6
- package/dist/lib/core/base-provider.d.ts +423 -0
- package/dist/lib/core/base-provider.js +376 -0
- package/dist/lib/core/constants.d.ts +2 -1
- package/dist/lib/core/constants.js +2 -1
- package/dist/lib/core/dynamic-models.d.ts +6 -6
- package/dist/lib/core/evaluation.d.ts +19 -80
- package/dist/lib/core/evaluation.js +185 -484
- package/dist/lib/core/factory.d.ts +3 -3
- package/dist/lib/core/factory.js +30 -91
- package/dist/lib/core/service-registry.d.ts +47 -0
- package/dist/lib/core/service-registry.js +112 -0
- package/dist/lib/core/types.d.ts +8 -1
- package/dist/lib/factories/compatibility-factory.js +1 -1
- package/dist/lib/factories/provider-factory.d.ts +72 -0
- package/dist/lib/factories/provider-factory.js +144 -0
- package/dist/lib/factories/provider-registry.d.ts +38 -0
- package/dist/lib/factories/provider-registry.js +107 -0
- package/dist/lib/index.d.ts +4 -3
- package/dist/lib/index.js +2 -4
- package/dist/lib/mcp/client.d.ts +1 -0
- package/dist/lib/mcp/client.js +1 -0
- package/dist/lib/mcp/config.js +28 -3
- package/dist/lib/mcp/context-manager.d.ts +1 -0
- package/dist/lib/mcp/context-manager.js +8 -4
- package/dist/lib/mcp/function-calling.d.ts +13 -0
- package/dist/lib/mcp/function-calling.js +134 -35
- package/dist/lib/mcp/initialize-tools.d.ts +1 -1
- package/dist/lib/mcp/initialize-tools.js +45 -1
- package/dist/lib/mcp/initialize.js +16 -6
- package/dist/lib/mcp/neurolink-mcp-client.d.ts +1 -0
- package/dist/lib/mcp/neurolink-mcp-client.js +21 -5
- package/dist/lib/mcp/servers/agent/direct-tools-server.d.ts +8 -0
- package/dist/lib/mcp/servers/agent/direct-tools-server.js +109 -0
- package/dist/lib/mcp/servers/ai-providers/ai-core-server.js +3 -1
- package/dist/lib/mcp/servers/ai-providers/ai-workflow-tools.d.ts +2 -2
- package/dist/lib/mcp/unified-registry.d.ts +4 -0
- package/dist/lib/mcp/unified-registry.js +42 -9
- package/dist/lib/neurolink.d.ts +156 -117
- package/dist/lib/neurolink.js +619 -404
- package/dist/lib/providers/amazon-bedrock.d.ts +32 -0
- package/dist/lib/providers/amazon-bedrock.js +143 -0
- package/dist/lib/providers/analytics-helper.js +7 -4
- package/dist/lib/providers/anthropic-baseprovider.d.ts +23 -0
- package/dist/lib/providers/anthropic-baseprovider.js +114 -0
- package/dist/lib/providers/anthropic.d.ts +19 -43
- package/dist/lib/providers/anthropic.js +82 -306
- package/dist/lib/providers/azure-openai.d.ts +20 -0
- package/dist/lib/providers/azure-openai.js +89 -0
- package/dist/lib/providers/function-calling-provider.d.ts +64 -2
- package/dist/lib/providers/function-calling-provider.js +208 -9
- package/dist/lib/providers/google-ai-studio.d.ts +23 -0
- package/dist/lib/providers/google-ai-studio.js +107 -0
- package/dist/lib/providers/google-vertex.d.ts +47 -0
- package/dist/lib/providers/google-vertex.js +205 -0
- package/dist/lib/providers/huggingFace.d.ts +32 -25
- package/dist/lib/providers/huggingFace.js +97 -431
- package/dist/lib/providers/index.d.ts +9 -9
- package/dist/lib/providers/index.js +9 -9
- package/dist/lib/providers/mcp-provider.js +24 -5
- package/dist/lib/providers/mistral.d.ts +42 -0
- package/dist/lib/providers/mistral.js +160 -0
- package/dist/lib/providers/ollama.d.ts +52 -36
- package/dist/lib/providers/ollama.js +297 -520
- package/dist/lib/providers/openAI.d.ts +19 -18
- package/dist/lib/providers/openAI.js +76 -275
- package/dist/lib/sdk/tool-extension.d.ts +181 -0
- package/dist/lib/sdk/tool-extension.js +283 -0
- package/dist/lib/sdk/tool-registration.d.ts +95 -0
- package/dist/lib/sdk/tool-registration.js +167 -0
- package/dist/lib/services/streaming/streaming-manager.js +11 -10
- package/dist/lib/services/websocket/websocket-server.js +12 -11
- package/dist/lib/telemetry/telemetry-service.js +8 -7
- package/dist/lib/types/generate-types.d.ts +1 -0
- package/dist/lib/types/mcp-types.d.ts +116 -0
- package/dist/lib/types/mcp-types.js +5 -0
- package/dist/lib/types/stream-types.d.ts +30 -18
- package/dist/lib/types/universal-provider-options.d.ts +87 -0
- package/dist/lib/types/universal-provider-options.js +53 -0
- package/dist/mcp/client.d.ts +1 -0
- package/dist/mcp/client.js +1 -0
- package/dist/mcp/config.js +28 -3
- package/dist/mcp/context-manager.d.ts +1 -0
- package/dist/mcp/context-manager.js +8 -4
- package/dist/mcp/function-calling.d.ts +13 -0
- package/dist/mcp/function-calling.js +134 -35
- package/dist/mcp/initialize-tools.d.ts +1 -1
- package/dist/mcp/initialize-tools.js +45 -1
- package/dist/mcp/initialize.js +16 -6
- package/dist/mcp/neurolink-mcp-client.d.ts +1 -0
- package/dist/mcp/neurolink-mcp-client.js +21 -5
- package/dist/mcp/servers/agent/direct-tools-server.d.ts +8 -0
- package/dist/mcp/servers/agent/direct-tools-server.js +109 -0
- package/dist/mcp/servers/ai-providers/ai-core-server.js +3 -1
- package/dist/mcp/servers/ai-providers/ai-workflow-tools.d.ts +2 -2
- package/dist/mcp/unified-registry.d.ts +4 -0
- package/dist/mcp/unified-registry.js +42 -9
- package/dist/neurolink.d.ts +156 -117
- package/dist/neurolink.js +619 -404
- package/dist/providers/amazon-bedrock.d.ts +32 -0
- package/dist/providers/amazon-bedrock.js +143 -0
- package/dist/providers/analytics-helper.js +7 -4
- package/dist/providers/anthropic-baseprovider.d.ts +23 -0
- package/dist/providers/anthropic-baseprovider.js +114 -0
- package/dist/providers/anthropic.d.ts +19 -43
- package/dist/providers/anthropic.js +81 -305
- package/dist/providers/azure-openai.d.ts +20 -0
- package/dist/providers/azure-openai.js +89 -0
- package/dist/providers/function-calling-provider.d.ts +64 -2
- package/dist/providers/function-calling-provider.js +208 -9
- package/dist/providers/google-ai-studio.d.ts +23 -0
- package/dist/providers/google-ai-studio.js +108 -0
- package/dist/providers/google-vertex.d.ts +47 -0
- package/dist/providers/google-vertex.js +205 -0
- package/dist/providers/huggingFace.d.ts +32 -25
- package/dist/providers/huggingFace.js +96 -430
- package/dist/providers/index.d.ts +9 -9
- package/dist/providers/index.js +9 -9
- package/dist/providers/mcp-provider.js +24 -5
- package/dist/providers/mistral.d.ts +42 -0
- package/dist/providers/mistral.js +160 -0
- package/dist/providers/ollama.d.ts +52 -36
- package/dist/providers/ollama.js +297 -519
- package/dist/providers/openAI.d.ts +19 -18
- package/dist/providers/openAI.js +76 -276
- package/dist/sdk/tool-extension.d.ts +181 -0
- package/dist/sdk/tool-extension.js +283 -0
- package/dist/sdk/tool-registration.d.ts +95 -0
- package/dist/sdk/tool-registration.js +168 -0
- package/dist/services/streaming/streaming-manager.js +11 -10
- package/dist/services/websocket/websocket-server.js +12 -11
- package/dist/telemetry/telemetry-service.js +8 -7
- package/dist/types/generate-types.d.ts +1 -0
- package/dist/types/mcp-types.d.ts +116 -0
- package/dist/types/mcp-types.js +5 -0
- package/dist/types/stream-types.d.ts +30 -18
- package/dist/types/universal-provider-options.d.ts +87 -0
- package/dist/types/universal-provider-options.js +53 -0
- package/package.json +12 -5
- package/dist/lib/providers/agent-enhanced-provider.d.ts +0 -93
- package/dist/lib/providers/agent-enhanced-provider.js +0 -605
- package/dist/lib/providers/amazonBedrock.d.ts +0 -28
- package/dist/lib/providers/amazonBedrock.js +0 -364
- package/dist/lib/providers/azureOpenAI.d.ts +0 -42
- package/dist/lib/providers/azureOpenAI.js +0 -347
- package/dist/lib/providers/googleAIStudio.d.ts +0 -42
- package/dist/lib/providers/googleAIStudio.js +0 -364
- package/dist/lib/providers/googleVertexAI.d.ts +0 -34
- package/dist/lib/providers/googleVertexAI.js +0 -547
- package/dist/lib/providers/mistralAI.d.ts +0 -37
- package/dist/lib/providers/mistralAI.js +0 -325
- package/dist/providers/agent-enhanced-provider.d.ts +0 -93
- package/dist/providers/agent-enhanced-provider.js +0 -606
- package/dist/providers/amazonBedrock.d.ts +0 -28
- package/dist/providers/amazonBedrock.js +0 -364
- package/dist/providers/azureOpenAI.d.ts +0 -42
- package/dist/providers/azureOpenAI.js +0 -348
- package/dist/providers/googleAIStudio.d.ts +0 -42
- package/dist/providers/googleAIStudio.js +0 -364
- package/dist/providers/googleVertexAI.d.ts +0 -34
- package/dist/providers/googleVertexAI.js +0 -547
- package/dist/providers/mistralAI.d.ts +0 -37
- package/dist/providers/mistralAI.js +0 -325
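Of the removals above, note that the camelCase provider modules (agent-enhanced-provider, amazonBedrock, azureOpenAI, googleAIStudio, googleVertexAI, mistralAI) are deleted and replaced by kebab-case modules (amazon-bedrock, azure-openai, google-ai-studio, google-vertex, mistral) built on the new base-provider, provider-factory, and provider-registry files. A minimal sketch of what the rename means for code that deep-imports provider modules from dist; the import paths are hypothetical, deep imports into dist are generally unsupported, and the package's exports map may block them entirely:

// Sketch: loading the Vertex provider module across the 5.1.0 -> 5.3.0 rename.
// dist/providers/googleVertexAI.js is removed in this diff and
// dist/providers/google-vertex.js ships in its place.
async function loadVertexProviderModule() {
  try {
    // 5.3.0 layout (kebab-case, built on the new base-provider)
    return await import("@juspay/neurolink/dist/providers/google-vertex.js");
  } catch {
    // 5.1.0 layout (camelCase), no longer present in 5.3.0
    return await import("@juspay/neurolink/dist/providers/googleVertexAI.js");
  }
}

The largest single rewrite is the core evaluation module (dist/core/evaluation.js and its dist/lib mirror, +185/-484 each); the hunk below appears to come from that file.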
@@ -1,528 +1,229 @@
 /**
  * NeuroLink Unified Evaluation System
- *
- * Combines Universal Evaluation with Lighthouse-Enhanced capabilities
- * - Domain-aware evaluation with sophisticated context handling
- * - Multi-provider support with fallback strategies
- * - Structured output with Zod schema validation
- * - Tool usage and conversation history analysis
- * - Enterprise-grade reliability and performance
 */
 import { logger } from "../utils/logger.js";
 import { AIProviderFactory } from "./factory.js";
 import { z } from "zod";
-
-
-
-
-
-
-
-
-
-
- accuracy: z
- .number()
- .min(0)
- .max(10)
- .describe("Score (0-10) for factual correctness against data, tool outputs, and domain knowledge. 10 is most accurate."),
- completeness: z
- .number()
- .min(0)
- .max(10)
- .describe("Score (0-10) for how completely the response addresses the query. 10 is most complete."),
- // Enhanced domain scores (optional)
- domainAlignment: z
- .number()
- .min(0)
- .max(10)
- .optional()
- .describe("Score (0-10) for how well response aligns with specified domain expertise."),
- terminologyAccuracy: z
- .number()
- .min(0)
- .max(10)
- .optional()
- .describe("Score (0-10) for correct usage of domain-specific terminology."),
- toolEffectiveness: z
- .number()
- .min(0)
- .max(10)
- .optional()
- .describe("Score (0-10) for how effectively available tools/MCPs were utilized."),
- // Qualitative assessment
- isOffTopic: z
- .boolean()
- .describe("True if the response significantly deviates from query/domain."),
- reasoning: z
- .string()
- .describe("Brief justification for scores, especially if low or off-topic. Max 150 words."),
- suggestedImprovements: z
- .string()
- .optional()
- .describe("Optional: Suggestions for improving the original response. Max 100 words."),
- alertSeverity: z
- .enum(["low", "medium", "high", "none"])
- .describe("Suggested alert severity considering all scores and domain context."),
+ import { ProviderRegistry } from "../factories/provider-registry.js";
+ // Zod schema for validation
+ const UnifiedEvaluationSchema = z.object({
+ relevance: z.number().min(1).max(10),
+ accuracy: z.number().min(1).max(10),
+ completeness: z.number().min(1).max(10),
+ overall: z.number().min(1).max(10),
+ domainAlignment: z.number().min(1).max(10).optional(),
+ terminologyAccuracy: z.number().min(1).max(10).optional(),
+ toolEffectiveness: z.number().min(1).max(10).optional(),
 });
 /**
- *
+ * Get default evaluation when evaluation fails
 */
-
- const functionTag = "
-
-
-
-
- mode,
- domain: context.primaryDomain,
- toolsUsed: context.toolsUsed?.length || 0,
- conversationTurns: context.conversationHistory?.length || 0,
- queryLength: context.userQuery.length,
- responseLength: context.aiResponse.length,
+ function getDefaultUnifiedEvaluation(reason, evaluationTime, context) {
+ const functionTag = "getDefaultUnifiedEvaluation";
+ logger.debug(`[${functionTag}] Creating default evaluation`, {
+ reason,
+ evaluationTime,
+ hasContext: !!context,
 });
- const { parseEvaluationConfig } = await import("./evaluation-config.js");
- const config = parseEvaluationConfig();
- let lastError = null;
- for (let attempt = 0; attempt <= config.retryAttempts; attempt++) {
- try {
- // Get evaluation model
- const evaluationModelResult = await getEvaluationModel();
- if (!evaluationModelResult) {
- logger.debug(`[${functionTag}] No evaluation model available, returning defaults`);
- return getDefaultUnifiedEvaluation("unavailable", Date.now() - startTime, context);
- }
- const { provider: evaluationModel, config: modelConfig } = evaluationModelResult;
- // Create evaluation prompt based on mode
- const evaluationPrompt = createUnifiedEvaluationPrompt(context, mode);
- logger.debug(`[${functionTag}] Using ${mode} evaluation mode`, {
- provider: modelConfig.providerName,
- model: modelConfig.modelName,
- attempt: attempt + 1,
- });
- // Try structured evaluation first (preferred)
- try {
- const structuredResult = await evaluationModel.generateObject({
- schema: unifiedEvaluationSchema,
- prompt: evaluationPrompt,
- temperature: 0.1,
- maxTokens: 1000,
- system: createUnifiedSystemPrompt(mode),
- });
- return processStructuredEvaluationResult(structuredResult.object, modelConfig, Date.now() - startTime, context, attempt + 1);
- }
- catch (structuredError) {
- logger.warn(`[${functionTag}] Structured evaluation failed, using fallback`, { structuredError });
- // Fallback to legacy generate
- const result = await evaluationModel.generate({
- prompt: evaluationPrompt + "\n\nRespond with valid JSON only.",
- temperature: 0.1,
- maxTokens: 1000,
- systemPrompt: createUnifiedSystemPrompt(mode),
- });
- const responseText = result?.text || result?.content;
- if (!responseText) {
- throw new Error("No evaluation text received from fallback");
- }
- return parseUnifiedEvaluationResult(responseText, modelConfig, Date.now() - startTime, context, attempt + 1);
- }
- }
- catch (error) {
- lastError = error instanceof Error ? error : new Error(String(error));
- logger.warn(`[${functionTag}] Evaluation attempt ${attempt + 1} failed:`, lastError.message);
- if (attempt === config.retryAttempts) {
- break;
- }
- // Exponential backoff
- await new Promise((resolve) => setTimeout(resolve, Math.pow(2, attempt) * 1000));
- }
- }
- // All attempts failed
- logger.error(`[${functionTag}] All evaluation attempts failed:`, lastError?.message);
- return getDefaultUnifiedEvaluation(lastError?.message || "unknown-error", Date.now() - startTime, context);
- }
- /**
- * Detect appropriate evaluation mode based on context
- */
- function detectEvaluationMode(context) {
- // Lighthouse mode: Has domain awareness, tool context, or conversation history
- if (context.primaryDomain ||
- context.toolsUsed?.length ||
- context.conversationHistory?.length) {
- return "lighthouse";
- }
- // Enhanced mode: Has rich context
- if (context.context && Object.keys(context.context).length > 0) {
- return "enhanced";
- }
- // Simple mode: Basic evaluation
- return "simple";
- }
- /**
- * Create unified evaluation prompt based on mode
- */
- function createUnifiedEvaluationPrompt(context, mode) {
- switch (mode) {
- case "lighthouse":
- return createLighthouseEvaluationPrompt(context);
- case "enhanced":
- return createEnhancedEvaluationPrompt(context);
- case "simple":
- default:
- return createSimpleEvaluationPrompt(context);
- }
- }
- /**
- * Create Lighthouse-style domain-aware evaluation prompt
- */
- function createLighthouseEvaluationPrompt(context) {
- const { userQuery, aiResponse, primaryDomain = "general AI assistant", assistantRole = "AI assistant", toolContext = "No specific tools used in this interaction", conversationHistory = [], } = context;
- const formattedHistory = formatConversationHistory(conversationHistory);
- return `You are an AI Response Evaluator with advanced domain awareness.
-
- **EVALUATION CONTEXT**:
-
- 1. **Primary Assistant Domain**: "${primaryDomain}"
- - This defines the AI assistant's core expertise area
- - Responses should demonstrate competency within this domain
- - Domain-specific terminology should be used accurately
-
- 2. **Assistant Role**: "${assistantRole}"
- - This defines the specific role the assistant should fulfill
- - Responses should align with this role's responsibilities
-
- 3. **Tool Usage Context**: "${toolContext}"
- - Tools/MCPs are capabilities the assistant used to generate the response
- - Evaluate how effectively these tools were utilized
- - Consider if additional tools should have been used
-
- 4. **Conversation History**:
- ```
- ${formattedHistory}
- ```
-
- **CRITICAL DOMAIN FAILURE ASSESSMENT**:
- Pay special attention to domain alignment. If the query is within the assistant's domain and sufficient context is available:
- - Inability to answer ("I can't help", generic errors, evasions) = HIGH ALERT
- - Incorrect domain-specific information = HIGH ALERT
- - Misuse of domain terminology = MEDIUM-HIGH ALERT
-
- **EVALUATION CRITERIA**:
- - **relevanceScore** (0-10): Direct query addressing + domain alignment
- - **accuracyScore** (0-10): Factual correctness + terminology accuracy
- - **completenessScore** (0-10): Full query addressing + appropriate depth
- - **domainAlignment** (0-10): How well response fits the domain expertise
- - **terminologyAccuracy** (0-10): Correct use of domain-specific terms
- - **toolEffectiveness** (0-10): How well available tools were utilized
- - **isOffTopic** (boolean): True if significantly deviates from domain/query
- - **reasoning** (string): Brief explanation (max 150 words)
- - **suggestedImprovements** (string): How to improve (max 100 words)
- - **alertSeverity** ('low'|'medium'|'high'|'none'): Based on domain failure assessment
-
- **Current User Query**:
- "${userQuery}"
-
- **AI Assistant Response**:
- "${aiResponse}"
-
- Provide your assessment in the specified format.`;
- }
- /**
- * Create enhanced evaluation prompt
- */
- function createEnhancedEvaluationPrompt(context) {
- const { userQuery, aiResponse, context: additionalContext } = context;
- const contextInfo = additionalContext
- ? `\nContext: ${JSON.stringify(additionalContext, null, 2)}`
- : "";
- return `Evaluate this AI response with enhanced criteria:
-
- Query: "${userQuery}"
- Response: "${aiResponse}"${contextInfo}
-
- Provide scores for:
- - relevanceScore (0-10): How well the response addresses the query
- - accuracyScore (0-10): Factual correctness and reliability
- - completenessScore (0-10): Whether the response fully answers the question
- - isOffTopic (boolean): Whether response deviates from query
- - reasoning (string): Brief explanation of scores
- - alertSeverity ('low'|'medium'|'high'|'none'): Overall quality assessment
-
- Respond in the specified format.`;
- }
- /**
- * Create simple evaluation prompt
- */
- function createSimpleEvaluationPrompt(context) {
- const { userQuery, aiResponse } = context;
- return `Rate this AI response:
-
- Q: "${userQuery}"
- A: "${aiResponse}"
-
- Provide:
- - relevanceScore (0-10)
- - accuracyScore (0-10)
- - completenessScore (0-10)
- - reasoning (brief explanation)
-
- Respond in the specified format.`;
- }
- /**
- * Create unified system prompt based on mode
- */
- function createUnifiedSystemPrompt(mode) {
- const basePrompt = "You are an expert AI Response Evaluator. Respond with valid structured output only.";
- switch (mode) {
- case "lighthouse":
- return `${basePrompt} Use advanced domain awareness and sophisticated context analysis for comprehensive evaluation.`;
- case "enhanced":
- return `${basePrompt} Consider all provided context and metadata for thorough evaluation.`;
- case "simple":
- default:
- return `${basePrompt} Focus on core quality metrics: relevance, accuracy, and completeness.`;
- }
- }
- /**
- * Process structured evaluation result
- */
- function processStructuredEvaluationResult(result, modelConfig, evaluationTime, context, attempt) {
- // Calculate overall score
- const coreScores = [
- result.relevanceScore || 0,
- result.accuracyScore || 0,
- result.completenessScore || 0,
- ];
- const enhancedScores = [
- result.domainAlignment,
- result.terminologyAccuracy,
- result.toolEffectiveness,
- ].filter((score) => typeof score === "number" && score > 0);
- const allScores = [...coreScores, ...enhancedScores];
- const overall = Math.round(allScores.reduce((sum, score) => sum + score, 0) / allScores.length);
 return {
-
-
-
-
-
-
-
-
-
-
- // Domain-specific scores (if available)
- domainAlignment: result.domainAlignment
- ? Math.max(0, Math.min(10, Math.round(result.domainAlignment)))
- : undefined,
- terminologyAccuracy: result.terminologyAccuracy
- ? Math.max(0, Math.min(10, Math.round(result.terminologyAccuracy)))
- : undefined,
- toolEffectiveness: result.toolEffectiveness
- ? Math.max(0, Math.min(10, Math.round(result.toolEffectiveness)))
- : undefined,
- // Context analysis
+ relevance: 1,
+ accuracy: 1,
+ completeness: 1,
+ overall: 1,
+ domainAlignment: 1,
+ terminologyAccuracy: 1,
+ toolEffectiveness: 1,
+ isOffTopic: false,
+ alertSeverity: "low",
+ reasoning: `Default evaluation used due to: ${reason}`,
 contextUtilization: {
- conversationUsed:
- toolsUsed:
- domainKnowledgeUsed:
+ conversationUsed: false,
+ toolsUsed: false,
+ domainKnowledgeUsed: false,
 },
- // Enhanced metadata
 evaluationContext: {
 domain: context.primaryDomain || "general",
- toolsEvaluated:
- conversationTurns:
+ toolsEvaluated: [],
+ conversationTurns: 0,
 },
-
- evaluationModel: `${modelConfig.providerName}/${modelConfig.modelName}`,
+ evaluationModel: "default",
 evaluationTime,
- evaluationProvider:
- evaluationAttempt:
+ evaluationProvider: "default",
+ evaluationAttempt: 1,
 evaluationConfig: {
- mode:
- fallbackUsed:
+ mode: "fallback",
+ fallbackUsed: true,
 costEstimate: 0,
 },
 };
 }
 /**
- * Parse evaluation result from text response
+ * Parse unified evaluation result from text response
 */
- function parseUnifiedEvaluationResult(
+ function parseUnifiedEvaluationResult(response, context) {
+ const functionTag = "parseUnifiedEvaluationResult";
 try {
-
-
-
+ logger.debug(`[${functionTag}] Parsing evaluation response`, {
+ responseLength: response.length,
+ });
+ // Try JSON parsing first
+ const jsonMatch = response.match(/\{[^}]*\}/s);
 if (jsonMatch) {
-
-
+ try {
+ const parsed = JSON.parse(jsonMatch[0]);
+ return parsed;
+ }
+ catch (e) {
+ logger.debug(`[${functionTag}] JSON parsing failed, trying regex`);
+ }
+ }
+ // Fallback to regex parsing
+ const result = {};
+ const patterns = {
+ relevance: /relevance[:\s]*([0-9]+(?:\.[0-9]+)?)/i,
+ accuracy: /accuracy[:\s]*([0-9]+(?:\.[0-9]+)?)/i,
+ completeness: /completeness[:\s]*([0-9]+(?:\.[0-9]+)?)/i,
+ overall: /overall[:\s]*([0-9]+(?:\.[0-9]+)?)/i,
+ };
+ for (const [key, pattern] of Object.entries(patterns)) {
+ const match = response.match(pattern);
+ if (match) {
+ const value = parseFloat(match[1]);
+ if (value >= 1 && value <= 10) {
+ result[key] = Math.round(value);
+ }
+ }
 }
- //
- const relevanceMatch = evaluationText.match(/(?:relevance[Score"\s]*:?["\s]*(\d+)|Relevance["\s]*:?["\s]*(\d+)|relevance.*?(\d+))/i);
- const accuracyMatch = evaluationText.match(/(?:accuracy[Score"\s]*:?["\s]*(\d+)|Accuracy["\s]*:?["\s]*(\d+)|accuracy.*?(\d+))/i);
- const completenessMatch = evaluationText.match(/(?:completeness[Score"\s]*:?["\s]*(\d+)|Completeness["\s]*:?["\s]*(\d+)|completeness.*?(\d+))/i);
- // Extract scores with fallback to default values
- const relevance = relevanceMatch
- ? parseInt(relevanceMatch[1] || relevanceMatch[2] || relevanceMatch[3], 10)
- : 8; // Default fallback score
- const accuracy = accuracyMatch
- ? parseInt(accuracyMatch[1] || accuracyMatch[2] || accuracyMatch[3], 10)
- : 8; // Default fallback score
- const completeness = completenessMatch
- ? parseInt(completenessMatch[1] || completenessMatch[2] || completenessMatch[3], 10)
- : 8; // Default fallback score
+ // Ensure minimum valid scores
 return {
- relevance:
- accuracy:
- completeness:
- overall:
- isOffTopic: false,
- alertSeverity: "none",
- reasoning: "Parsed using regex fallback - response was not in expected JSON format.",
- evaluationModel: `${modelConfig.providerName}/${modelConfig.modelName}`,
- evaluationTime,
- evaluationProvider: modelConfig.providerName,
- evaluationAttempt: attempt,
- evaluationConfig: {
- mode: "fallback",
- fallbackUsed: true,
- costEstimate: 0,
- },
+ relevance: result.relevance || 1,
+ accuracy: result.accuracy || 1,
+ completeness: result.completeness || 1,
+ overall: result.overall || 1,
 };
 }
 catch (error) {
- logger.error(
-
+ logger.error(`[${functionTag}] Failed to parse evaluation result`, {
+ error,
+ });
+ return {
+ relevance: 1,
+ accuracy: 1,
+ completeness: 1,
+ overall: 1,
+ };
 }
 }
 /**
- *
- */
- function getDefaultUnifiedEvaluation(reason, evaluationTime, context) {
- return {
- relevance: 0,
- accuracy: 0,
- completeness: 0,
- overall: 0,
- isOffTopic: false,
- alertSeverity: "high",
- reasoning: `Evaluation unavailable (${reason}). This may be due to missing API keys, network issues, or service unavailability.`,
- suggestedImprovements: "Check evaluation system configuration, API credentials, and network connectivity.",
- evaluationModel: "unavailable",
- evaluationTime,
- evaluationProvider: "none",
- evaluationAttempt: 0,
- evaluationConfig: {
- mode: "default",
- fallbackUsed: true,
- costEstimate: 0,
- },
- contextUtilization: {
- conversationUsed: (context.conversationHistory?.length || 0) > 0,
- toolsUsed: (context.toolsUsed?.length || 0) > 0,
- domainKnowledgeUsed: !!context.primaryDomain,
- },
- evaluationContext: {
- domain: context.primaryDomain || "unknown",
- toolsEvaluated: context.toolsUsed || [],
- conversationTurns: context.conversationHistory?.length || 0,
- },
- };
- }
- /**
- * Enhanced evaluation model selection
+ * Main unified evaluation function
 */
- export async function
- const
- const
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- provider,
- config: {
- providerName,
- modelName,
- providerConfig,
- evaluationConfig: config,
- },
- };
- }
+ export async function generateUnifiedEvaluation(context) {
+ const functionTag = "generateUnifiedEvaluation";
+ const startTime = Date.now();
+ logger.debug(`[${functionTag}] Starting evaluation`, {
+ hasUserQuery: !!context.userQuery,
+ hasAiResponse: !!context.aiResponse,
+ domain: context.primaryDomain,
+ });
+ try {
+ // Ensure providers are registered
+ await ProviderRegistry.registerAllProviders();
+ // Get evaluation provider
+ const evaluationProvider = process.env.NEUROLINK_EVALUATION_PROVIDER || "google-ai";
+ const evaluationModel = process.env.NEUROLINK_EVALUATION_MODEL || "gemini-2.5-flash";
+ logger.debug(`[${functionTag}] Using provider: ${evaluationProvider}, model: ${evaluationModel}`);
+ const provider = await AIProviderFactory.createProvider(evaluationProvider, evaluationModel);
+ if (!provider) {
+ logger.debug(`[${functionTag}] No evaluation provider available, returning defaults`);
+ return getDefaultUnifiedEvaluation("no-provider", Date.now() - startTime, context);
 }
-
-
-
-
-
+ // Create evaluation prompt
+ const prompt = `
+ Evaluate this AI response on a scale of 1-10 for each criterion:
+
+ User Query: ${context.userQuery}
+ AI Response: ${context.aiResponse}
+
+ Rate on these criteria (1-10 scale):
+ - Relevance: How well does the response address the user's question?
+ - Accuracy: How factually correct and precise is the information?
+ - Completeness: How thoroughly does it cover the topic?
+ - Overall: General quality assessment
+
+ Respond in this exact format:
+ Relevance: [score]
+ Accuracy: [score]
+ Completeness: [score]
+ Overall: [score]
+ `;
+ // Generate evaluation
+ const result = await provider.generate(prompt);
+ if (!result) {
+ logger.debug(`[${functionTag}] No response from provider`);
+ return getDefaultUnifiedEvaluation("no-response", Date.now() - startTime, context);
 }
+ // Extract text from result
+ const response = typeof result === "string"
+ ? result
+ : result.text || String(result);
+ // Parse evaluation result
+ const parsed = parseUnifiedEvaluationResult(response, context);
+ // Validate and enhance result
+ const validatedResult = {
+ ...parsed,
+ evaluationModel: `${evaluationProvider}/${evaluationModel}`,
+ evaluationTime: Date.now() - startTime,
+ evaluationProvider,
+ evaluationAttempt: 1,
+ evaluationConfig: {
+ mode: "standard",
+ fallbackUsed: false,
+ costEstimate: 0.001, // Rough estimate
+ },
+ };
+ logger.debug(`[${functionTag}] Evaluation completed`, {
+ relevance: validatedResult.relevance,
+ accuracy: validatedResult.accuracy,
+ completeness: validatedResult.completeness,
+ overall: validatedResult.overall,
+ evaluationTime: validatedResult.evaluationTime,
+ });
+ return validatedResult;
 }
-
- }
-
-
-
- function formatConversationHistory(history) {
- if (!history?.length) {
- return "No prior conversation context.";
+ catch (error) {
+ logger.error(`[${functionTag}] Evaluation failed`, {
+ error: error instanceof Error ? error.message : String(error),
+ });
+ return getDefaultUnifiedEvaluation(error instanceof Error ? error.message : "unknown-error", Date.now() - startTime, context);
 }
- return history
- .slice(-3) // Last 3 turns
- .map((msg, i) => `${i + 1}. ${msg.role.toUpperCase()}: ${msg.content.substring(0, 200)}${msg.content.length > 200 ? "..." : ""}`)
- .join("\n");
- }
- /**
- * Create simple evaluation context (backward compatibility)
- */
- export function createSimpleEvaluationContext(prompt, response, context) {
- return {
- userQuery: prompt,
- aiResponse: response,
- context,
- mode: "simple",
- };
 }
-
-
-
-
-
-
+ // Legacy compatibility function with flexible arguments
+ export async function evaluateResponse(responseOrContext, contextOrUserQuery, userQuery, providedContexts, options, additionalArgs) {
+ // Handle different call patterns for backward compatibility
+ let aiResponse;
+ let context;
+ if (typeof responseOrContext === "string") {
+ // Normal call: evaluateResponse(response, context, ...)
+ aiResponse = responseOrContext;
+ context = contextOrUserQuery;
+ }
+ else {
+ // Provider call pattern: evaluateResponse(contextObject, userQuery, ...)
+ context = responseOrContext;
+ aiResponse =
+ context?.aiResponse ||
+ context?.response ||
+ String(contextOrUserQuery || "");
+ }
+ const evalContext = {
+ userQuery: userQuery ||
+ context?.userQuery ||
+ contextOrUserQuery ||
+ "Generated response",
 aiResponse,
- primaryDomain: options.domain,
- assistantRole: options.role,
- toolsUsed: options.toolsUsed,
- toolContext: options.toolsUsed?.length
- ? `Tools used: ${options.toolsUsed.join(", ")}`
- : undefined,
- conversationHistory: options.conversationHistory,
- sessionId: options.sessionId,
- context: options.context,
- mode: "lighthouse",
- };
- }
- // Legacy compatibility wrapper for old function signature
- export async function evaluateResponse(prompt, response, context, evaluationDomain, toolUsageContext, conversationHistory) {
- // Convert old arguments to new context format
- const unifiedContext = {
- userQuery: prompt,
- aiResponse: response,
 context,
- primaryDomain: evaluationDomain,
- toolContext: toolUsageContext,
- conversationHistory: conversationHistory,
- mode: evaluationDomain ? "lighthouse" : "simple",
 };
- return
+ return generateUnifiedEvaluation(evalContext);
 }
+ // Export additional utilities
+ export { getDefaultUnifiedEvaluation, parseUnifiedEvaluationResult };