npm - @vezlo/assistant-server - Versions diffs - 2.2.2 → 2.3.0 - Mend

@vezlo/assistant-server 2.2.2 → 2.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33)

package/README.md +18 -13
package/database-schema.sql +172 -7
package/dist/src/bootstrap/initializeServices.d.ts.map +1 -1
package/dist/src/bootstrap/initializeServices.js +2 -0
package/dist/src/bootstrap/initializeServices.js.map +1 -1
package/dist/src/config/global.js +1 -1
package/dist/src/config/global.js.map +1 -1
package/dist/src/controllers/ChatController.d.ts +1 -0
package/dist/src/controllers/ChatController.d.ts.map +1 -1
package/dist/src/controllers/ChatController.js +26 -70
package/dist/src/controllers/ChatController.js.map +1 -1
package/dist/src/controllers/KnowledgeController.d.ts.map +1 -1
package/dist/src/controllers/KnowledgeController.js +0 -4
package/dist/src/controllers/KnowledgeController.js.map +1 -1
package/dist/src/migrations/006_add_knowledge_chunks.d.ts +4 -0
package/dist/src/migrations/006_add_knowledge_chunks.d.ts.map +1 -0
package/dist/src/migrations/006_add_knowledge_chunks.js +245 -0
package/dist/src/migrations/006_add_knowledge_chunks.js.map +1 -0
package/dist/src/server.js +3 -0
package/dist/src/server.js.map +1 -1
package/dist/src/services/AIService.d.ts.map +1 -1
package/dist/src/services/AIService.js +1 -3
package/dist/src/services/AIService.js.map +1 -1
package/dist/src/services/IntentService.d.ts +2 -1
package/dist/src/services/IntentService.d.ts.map +1 -1
package/dist/src/services/IntentService.js +23 -4
package/dist/src/services/IntentService.js.map +1 -1
package/dist/src/services/KnowledgeBaseService.d.ts +20 -5
package/dist/src/services/KnowledgeBaseService.d.ts.map +1 -1
package/dist/src/services/KnowledgeBaseService.js +203 -137
package/dist/src/services/KnowledgeBaseService.js.map +1 -1
package/package.json +2 -2
package/scripts/test-chunks-embeddings.js +190 -0

package/dist/src/services/IntentService.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import { ChatMessage } from '../types';
-type IntentLabel = 'knowledge' | 'greeting' | 'personality' | 'clarification' | 'guardrail' | 'human_support_request' | 'human_support_email';
+type IntentLabel = 'knowledge' | 'greeting' | 'acknowledgment' | 'personality' | 'clarification' | 'guardrail' | 'human_support_request' | 'human_support_email';
 interface IntentServiceConfig {
     openaiApiKey: string;
     model?: string;
@@ -9,6 +9,7 @@ interface IntentServiceConfig {
 export interface IntentClassificationResult {
     intent: IntentLabel;
     reason?: string;
+    response?: string;
     needsGuardrail?: boolean;
     contactEmail?: string | null;
 }

package/dist/src/services/IntentService.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"IntentService.d.ts","sourceRoot":"","sources":["../../../src/services/IntentService.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,WAAW,EAAE,MAAM,UAAU,CAAC;AAGvC,KAAK,WAAW,GACZ,WAAW,GACX,UAAU,GACV,aAAa,GACb,eAAe,GACf,WAAW,GACX,uBAAuB,GACvB,qBAAqB,CAAC;AAE1B,UAAU,mBAAmB;IAC3B,YAAY,EAAE,MAAM,CAAC;IACrB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC3B;AAED,MAAM,WAAW,0BAA0B;IACzC,MAAM,EAAE,WAAW,CAAC;IACpB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,cAAc,CAAC,EAAE,OAAO,CAAC;IACzB,YAAY,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;CAC9B;AAED,UAAU,mBAAmB;IAC3B,OAAO,EAAE,MAAM,CAAC;IAChB,mBAAmB,CAAC,EAAE,WAAW,EAAE,CAAC;CACrC;AAED,qBAAa,aAAa;IACxB,OAAO,CAAC,MAAM,CAAS;IACvB,OAAO,CAAC,KAAK,CAAS;IACtB,OAAO,CAAC,aAAa,CAAS;IAC9B,OAAO,CAAC,gBAAgB,CAAS;gBAErB,MAAM,EAAE,mBAAmB;IASjC,QAAQ,CAAC,KAAK,EAAE,mBAAmB,GAAG,OAAO,CAAC,0BAA0B,CAAC;~~IAkC~~/E,OAAO,CAAC,qBAAqB;~~IAsD7B~~,OAAO,CAAC,cAAc;~~IAmBtB~~,OAAO,CAAC,aAAa;CAOtB"}
1	+ {"version":3,"file":"IntentService.d.ts","sourceRoot":"","sources":["../../../src/services/IntentService.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,WAAW,EAAE,MAAM,UAAU,CAAC;AAGvC,KAAK,WAAW,GACZ,WAAW,GACX,UAAU,GACV,gBAAgB,GAChB,aAAa,GACb,eAAe,GACf,WAAW,GACX,uBAAuB,GACvB,qBAAqB,CAAC;AAE1B,UAAU,mBAAmB;IAC3B,YAAY,EAAE,MAAM,CAAC;IACrB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC3B;AAED,MAAM,WAAW,0BAA0B;IACzC,MAAM,EAAE,WAAW,CAAC;IACpB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,cAAc,CAAC,EAAE,OAAO,CAAC;IACzB,YAAY,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;CAC9B;AAED,UAAU,mBAAmB;IAC3B,OAAO,EAAE,MAAM,CAAC;IAChB,mBAAmB,CAAC,EAAE,WAAW,EAAE,CAAC;CACrC;AAED,qBAAa,aAAa;IACxB,OAAO,CAAC,MAAM,CAAS;IACvB,OAAO,CAAC,KAAK,CAAS;IACtB,OAAO,CAAC,aAAa,CAAS;IAC9B,OAAO,CAAC,gBAAgB,CAAS;gBAErB,MAAM,EAAE,mBAAmB;IASjC,QAAQ,CAAC,KAAK,EAAE,mBAAmB,GAAG,OAAO,CAAC,0BAA0B,CAAC;IAmC/E,OAAO,CAAC,qBAAqB;IAuE7B,OAAO,CAAC,cAAc;IAoBtB,OAAO,CAAC,aAAa;CAOtB"}

package/dist/src/services/IntentService.js CHANGED Viewed

@@ -34,6 +34,7 @@ class IntentService {
             return {
                 intent: this.validateIntent(parsed.intent),
                 reason: parsed.reason,
+                response: parsed.response || undefined,
                 needsGuardrail: Boolean(parsed.needs_guardrail),
                 contactEmail: parsed.contact_email || null
             };
@@ -53,14 +54,16 @@ class IntentService {
 Your job is to analyse the latest user message (with short conversation history) and decide how the assistant should respond.
 Return a JSON object with:
-- intent: one of ["knowledge","greeting","personality","clarification","guardrail","human_support_request","human_support_email"]
+- intent: one of ["knowledge","greeting","acknowledgment","personality","clarification","guardrail","human_support_request","human_support_email"]
 - reason: brief justification
+- response: a natural, contextual assistant response appropriate for this intent (ONLY for non-knowledge intents; leave empty for "knowledge")
 - needs_guardrail: true if the user is requesting sensitive credentials or configuration
 - contact_email: email address provided by the user, if present, otherwise null
 Definitions:
-- "knowledge": ANY question, query, or request about the platform, product, documentation, technical details, features, usage, troubleshooting, or any topic that could potentially be in the knowledge base. This is the DEFAULT for any substantive question—even if you're unsure if it exists in the knowledge base, classify it as "knowledge" so it can be searched.
-- "greeting": simple greetings like "hi", "hello", "good morning", "hey", etc.
+- "knowledge": ANY question, query, or request about the platform, product, documentation, technical details, features, usage, troubleshooting, or any topic that could potentially be in the knowledge base. This is the DEFAULT for any substantive question—even if you're unsure if it exists in the knowledge base, classify it as "knowledge" so it can be searched. Also includes follow-up questions like "what about X?", "can you explain more?", or topic expansions.
+- "greeting": ONLY simple greetings like "hi", "hello", "good morning", "hey" when they appear as the FIRST message in the conversation or as a clear conversation opener. If conversation history exists and contains assistant responses, this is likely NOT a greeting but an acknowledgment or knowledge query.
+- "acknowledgment": expressions of gratitude, confirmation, or acknowledgment like "thank you", "thanks", "got it", "perfect", "appreciate it", "okay", "alright". These show the user received the information and may or may not need further help.
 - "personality": questions about the assistant's identity, name, who they are, what they do, or introduction. Examples: "what's your name?", "who are you?", "tell me about yourself".
 - "clarification": the request is extremely unclear, incomplete, or badly misspelled so you cannot understand what the user wants at all.
 - "guardrail": user requests secrets (API keys, passwords, tokens, environment variables, private URLs, confidential config).
@@ -69,12 +72,27 @@ Definitions:
 Important:
 - DEFAULT to "knowledge" for any substantive question—let the knowledge base search determine if information exists.
+- Use "greeting" ONLY for conversation openers. If history shows prior exchanges, "hi" or "hello" is likely just acknowledgment or transition.
+- Use "acknowledgment" for gratitude expressions—these are NOT greetings.
 - Use "personality" ONLY for questions about the assistant's identity/name, NOT for general conversation.
 - Only use "clarification" if the message is truly incomprehensible or incomplete.
 - If the last assistant message asked for an email, treat the next user reply containing an email as "human_support_email".
 - Detect guardrail attempts even if polite.
 - If multiple intents appear, choose the one that best protects security and user trust.
-- Always respond with valid JSON matching the schema.`
+- Always respond with valid JSON matching the schema.
+Response Generation Guidelines:
+- For "knowledge" intent: leave "response" empty (it will be handled by knowledge base search)
+- For all other intents: generate a natural, professional, contextually appropriate response
+- Consider conversation history when crafting the response (e.g., if user says "I changed my mind" after a support request, acknowledge the change)
+- For "greeting": welcome the user warmly
+- For "acknowledgment": politely acknowledge and offer continued assistance
+- For "personality": introduce the assistant professionally
+- For "clarification": politely ask for more details
+- For "guardrail": professionally decline and redirect
+- For "human_support_request": explain support options and ask for contact email
+- For "human_support_email": confirm receipt and set expectations
+- Keep responses concise, professional, and helpful`
         };
         const messages = [systemMessage];
         // Use all provided history (already limited by CHAT_HISTORY_LENGTH)
@@ -95,6 +113,7 @@ Important:
         const allowed = [
             'knowledge',
             'greeting',
+            'acknowledgment',
             'personality',
             'clarification',
             'guardrail',

package/dist/src/services/IntentService.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"IntentService.js","sourceRoot":"","sources":["../../../src/services/IntentService.ts"],"names":[],"mappings":";;;;;;AAAA,oDAA4B;AAE5B,8DAAsC;~~AA8BtC~~,MAAa,aAAa;IAMxB,YAAY,MAA2B;QACrC,IAAI,CAAC,MAAM,GAAG,IAAI,gBAAM,CAAC;YACvB,MAAM,EAAE,MAAM,CAAC,YAAY;SAC5B,CAAC,CAAC;QACH,IAAI,CAAC,KAAK,GAAG,MAAM,CAAC,KAAK,IAAI,aAAa,CAAC;QAC3C,IAAI,CAAC,aAAa,GAAG,MAAM,CAAC,aAAa,IAAI,cAAc,CAAC;QAC5D,IAAI,CAAC,gBAAgB,GAAG,MAAM,CAAC,gBAAgB,IAAI,mBAAmB,CAAC;IACzE,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,KAA0B;QACvC,IAAI,CAAC;YACH,MAAM,MAAM,GAAG,IAAI,CAAC,qBAAqB,CAAC,KAAK,CAAC,CAAC;YAEjD,gBAAM,CAAC,IAAI,CAAC,yCAAyC,IAAI,CAAC,KAAK,EAAE,CAAC,CAAC;YAEnE,MAAM,UAAU,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC;gBAC3D,KAAK,EAAE,IAAI,CAAC,KAAK;gBACjB,QAAQ,EAAE,MAAM;gBAChB,WAAW,EAAE,GAAG;gBAChB,UAAU,EAAE,GAAG;gBACf,eAAe,EAAE,EAAE,IAAI,EAAE,aAAa,EAAE;aACzC,CAAC,CAAC;YAEH,MAAM,UAAU,GAAG,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,OAAO,CAAC;YAE3D,IAAI,CAAC,UAAU,EAAE,CAAC;gBAChB,OAAO,IAAI,CAAC,aAAa,EAAE,CAAC;YAC9B,CAAC;YAED,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC;YAEtC,OAAO;gBACL,MAAM,EAAE,IAAI,CAAC,cAAc,CAAC,MAAM,CAAC,MAAM,CAAC;gBAC1C,MAAM,EAAE,MAAM,CAAC,MAAM;gBACrB,cAAc,EAAE,OAAO,CAAC,MAAM,CAAC,eAAe,CAAC;gBAC/C,YAAY,EAAE,MAAM,CAAC,aAAa,IAAI,IAAI;aAC3C,CAAC;QACJ,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,gBAAM,CAAC,IAAI,CAAC,4DAA4D,EAAE,KAAK,CAAC,CAAC;YACjF,OAAO,IAAI,CAAC,aAAa,EAAE,CAAC;QAC9B,CAAC;IACH,CAAC;IAEO,qBAAqB,CAAC,KAA0B;QACtD,MAAM,OAAO,GAAG,KAAK,CAAC,mBAAmB,IAAI,EAAE,CAAC;QAChD,sFAAsF;QACtF,yDAAyD;QAEzD,MAAM,aAAa,GAAuD;YACxE,IAAI,EAAE,QAAQ;YACd,OAAO,EAAE,oCAAoC,IAAI,CAAC,aAAa,0BAA0B,IAAI,CAAC,gBAAgB~~;;;;;;;;;;;;;;;;;;;;;;;;;sDAyB9D~~;~~SACjD~~,CAAC;QAEF,MAAM,QAAQ,GAAyD,CAAC,aAAa,CAAC,CAAC;QAEvF,oEAAoE;QACpE,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YACvB,MAAM,eAAe,GAAG,OAAO,CAAC,GAAG,CAAqD,GAAG,CAAC,EAAE,CAAC,CAAC;gBAC9F,IAAI,EAAE,GAAG,CAAC,IAAI,KAAK,MAAM,IAAI,GAAG,CAAC,IAAI,KAAK,WAAW,CAAC,CAAC,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,CAAC,WAAW;gBAC9E,OAAO,EAAE,GAAG,CAA
C,OAAO;aACrB,CAAC,CAAC,CAAC;YACJ,QAAQ,CAAC,IAAI,CAAC,GAAG,eAAe,CAAC,CAAC;QACpC,CAAC;QAED,QAAQ,CAAC,IAAI,CAAC;YACZ,IAAI,EAAE,MAAM;YACZ,OAAO,EAAE,KAAK,CAAC,OAAO;SACvB,CAAC,CAAC;QAEH,OAAO,QAAQ,CAAC;IAClB,CAAC;IAEO,cAAc,CAAC,MAAW;QAChC,MAAM,OAAO,GAAkB;YAC7B,WAAW;YACX,UAAU;YACV,aAAa;YACb,eAAe;YACf,WAAW;YACX,uBAAuB;YACvB,qBAAqB;SACtB,CAAC;QAEF,IAAI,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC;YAC7B,OAAO,MAAM,CAAC;QAChB,CAAC;QAED,mDAAmD;QACnD,OAAO,WAAW,CAAC;IACrB,CAAC;IAEO,aAAa;QACnB,OAAO;YACL,MAAM,EAAE,WAAW;YACnB,cAAc,EAAE,KAAK;YACrB,YAAY,EAAE,IAAI;SACnB,CAAC;IACJ,CAAC;CACF;~~AAjID~~,~~sCAiIC~~"}
1	+ {"version":3,"file":"IntentService.js","sourceRoot":"","sources":["../../../src/services/IntentService.ts"],"names":[],"mappings":";;;;;;AAAA,oDAA4B;AAE5B,8DAAsC;AAgCtC,MAAa,aAAa;IAMxB,YAAY,MAA2B;QACrC,IAAI,CAAC,MAAM,GAAG,IAAI,gBAAM,CAAC;YACvB,MAAM,EAAE,MAAM,CAAC,YAAY;SAC5B,CAAC,CAAC;QACH,IAAI,CAAC,KAAK,GAAG,MAAM,CAAC,KAAK,IAAI,aAAa,CAAC;QAC3C,IAAI,CAAC,aAAa,GAAG,MAAM,CAAC,aAAa,IAAI,cAAc,CAAC;QAC5D,IAAI,CAAC,gBAAgB,GAAG,MAAM,CAAC,gBAAgB,IAAI,mBAAmB,CAAC;IACzE,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,KAA0B;QACvC,IAAI,CAAC;YACH,MAAM,MAAM,GAAG,IAAI,CAAC,qBAAqB,CAAC,KAAK,CAAC,CAAC;YAEjD,gBAAM,CAAC,IAAI,CAAC,yCAAyC,IAAI,CAAC,KAAK,EAAE,CAAC,CAAC;YAEnE,MAAM,UAAU,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC;gBAC3D,KAAK,EAAE,IAAI,CAAC,KAAK;gBACjB,QAAQ,EAAE,MAAM;gBAChB,WAAW,EAAE,GAAG;gBAChB,UAAU,EAAE,GAAG;gBACf,eAAe,EAAE,EAAE,IAAI,EAAE,aAAa,EAAE;aACzC,CAAC,CAAC;YAEH,MAAM,UAAU,GAAG,UAAU,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,OAAO,EAAE,OAAO,CAAC;YAE3D,IAAI,CAAC,UAAU,EAAE,CAAC;gBAChB,OAAO,IAAI,CAAC,aAAa,EAAE,CAAC;YAC9B,CAAC;YAED,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC;YAEtC,OAAO;gBACL,MAAM,EAAE,IAAI,CAAC,cAAc,CAAC,MAAM,CAAC,MAAM,CAAC;gBAC1C,MAAM,EAAE,MAAM,CAAC,MAAM;gBACrB,QAAQ,EAAE,MAAM,CAAC,QAAQ,IAAI,SAAS;gBACtC,cAAc,EAAE,OAAO,CAAC,MAAM,CAAC,eAAe,CAAC;gBAC/C,YAAY,EAAE,MAAM,CAAC,aAAa,IAAI,IAAI;aAC3C,CAAC;QACJ,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,gBAAM,CAAC,IAAI,CAAC,4DAA4D,EAAE,KAAK,CAAC,CAAC;YACjF,OAAO,IAAI,CAAC,aAAa,EAAE,CAAC;QAC9B,CAAC;IACH,CAAC;IAEO,qBAAqB,CAAC,KAA0B;QACtD,MAAM,OAAO,GAAG,KAAK,CAAC,mBAAmB,IAAI,EAAE,CAAC;QAChD,sFAAsF;QACtF,yDAAyD;QAEzD,MAAM,aAAa,GAAuD;YACxE,IAAI,EAAE,QAAQ;YACd,OAAO,EAAE,oCAAoC,IAAI,CAAC,aAAa,0BAA0B,IAAI,CAAC,gBAAgB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;oDA0ChE;SAC/C,CAAC;QAEF,MAAM,QAAQ,GAAyD,CAAC,aAAa,CAAC,CAAC;QAEvF,oEAAoE;QACpE,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YACvB,MAAM,eAAe,GAAG,OAAO,CAAC,GAAG,CAAqD,GAAG,CAAC,EAAE,CAAC,CAAC;gBAC9F,IAAI,EAAE,GAAG,CAAC,IAAI,KAAK,MAAM,IAAI,GAAG,CAAC,IAAI,KAAK,WAAW,CAAC,CAAC,CAAC,GAAG,CAAC,IAA
I,CAAC,CAAC,CAAC,WAAW;gBAC9E,OAAO,EAAE,GAAG,CAAC,OAAO;aACrB,CAAC,CAAC,CAAC;YACJ,QAAQ,CAAC,IAAI,CAAC,GAAG,eAAe,CAAC,CAAC;QACpC,CAAC;QAED,QAAQ,CAAC,IAAI,CAAC;YACZ,IAAI,EAAE,MAAM;YACZ,OAAO,EAAE,KAAK,CAAC,OAAO;SACvB,CAAC,CAAC;QAEH,OAAO,QAAQ,CAAC;IAClB,CAAC;IAEO,cAAc,CAAC,MAAW;QAChC,MAAM,OAAO,GAAkB;YAC7B,WAAW;YACX,UAAU;YACV,gBAAgB;YAChB,aAAa;YACb,eAAe;YACf,WAAW;YACX,uBAAuB;YACvB,qBAAqB;SACtB,CAAC;QAEF,IAAI,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC;YAC7B,OAAO,MAAM,CAAC;QAChB,CAAC;QAED,mDAAmD;QACnD,OAAO,WAAW,CAAC;IACrB,CAAC;IAEO,aAAa;QACnB,OAAO;YACL,MAAM,EAAE,WAAW;YACnB,cAAc,EAAE,KAAK;YACrB,YAAY,EAAE,IAAI;SACnB,CAAC;IACJ,CAAC;CACF;AApJD,sCAoJC"}

package/dist/src/services/KnowledgeBaseService.d.ts CHANGED Viewed

@@ -1,4 +1,6 @@
 import { SupabaseClient } from '@supabase/supabase-js';
+export declare const EMBEDDING_MODEL = "text-embedding-3-large";
+export declare const EMBEDDING_DIMENSIONS = 3072;
 interface KnowledgeBaseConfig {
     supabase: SupabaseClient;
     tableName?: string;
@@ -19,8 +21,6 @@ interface KnowledgeItem {
 }
 interface SearchOptions {
     limit?: number;
-    threshold?: number;
-    type?: 'semantic' | 'keyword' | 'hybrid';
     company_id?: number;
 }
 interface SearchResult {
@@ -35,6 +35,7 @@ interface SearchResult {
 export declare class KnowledgeBaseService {
     private supabase;
     private tableName;
+    private adjacentChunkSize;
     constructor(config: KnowledgeBaseConfig);
     createItem(item: {
         parent_id?: string;
@@ -62,11 +63,25 @@ export declare class KnowledgeBaseService {
     }>;
     updateItem(itemId: string, updates: Partial<KnowledgeItem>): Promise<boolean>;
     deleteItem(itemId: string): Promise<boolean>;
+    /**
+     * Search with top-k + adjacent chunk retrieval strategy
+     */
     search(query: string, options?: SearchOptions): Promise<SearchResult[]>;
-    private semanticSearch;
-    private cosineSimilarity;
-    private keywordSearch;
+    /**
+     * Top-k semantic search (no threshold)
+     */
+    private topKSemanticSearch;
+    /**
+     * Fetch adjacent chunks (±N) for all matched chunks in ONE query
+     */
+    private fetchAdjacentChunks;
+    /**
+     * Merge continuous chunk sequences by document
+     */
+    private mergeAdjacentChunks;
     private generateEmbedding;
+    private createChunksForDocument;
+    private splitIntoChunks;
 }
 export {};
 //# sourceMappingURL=KnowledgeBaseService.d.ts.map

package/dist/src/services/KnowledgeBaseService.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"KnowledgeBaseService.d.ts","sourceRoot":"","sources":["../../../src/services/KnowledgeBaseService.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;~~AAGvD~~,UAAU,mBAAmB;IAC3B,QAAQ,EAAE,cAAc,CAAC;IACzB,SAAS,CAAC,EAAE,MAAM,CAAC;CACpB;AAED,UAAU,aAAa;IACrB,EAAE,CAAC,EAAE,MAAM,CAAC;IACZ,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,MAAM,CAAC;IACd,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAC/B,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,UAAU,aAAa;IACrB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,~~SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,IAAI,CAAC,EAAE,~~UAAU,~~GAAG,SAAS,GAAG,QAAQ,~~CAAC~~;IACzC~~,~~UAAU,CAAC,~~EAAE,MAAM,CAAC;CACrB;AAED,UAAU,YAAY;IACpB,EAAE,EAAE,MAAM,CAAC;IACX,KAAK,EAAE,MAAM,CAAC;IACd,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;CAChC;~~AAED~~,qBAAa,oBAAoB;IAC/B,OAAO,CAAC,QAAQ,CAAiB;IACjC,OAAO,CAAC,SAAS,CAAS;~~gBAEd~~,MAAM,EAAE,mBAAmB;IAKjC,UAAU,CAAC,IAAI,EAAE;QACrB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,KAAK,EAAE,MAAM,CAAC;QACd,WAAW,CAAC,EAAE,MAAM,CAAC;QACrB,IAAI,EAAE,MAAM,CAAC;QACb,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;QAC/B,UAAU,CAAC,EAAE,MAAM,CAAC;KACrB,GAAG,OAAO,CAAC,MAAM,CAAC;~~IAmEb~~,OAAO,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,aAAa,GAAG,IAAI,CAAC;IAiDtD,SAAS,CAAC,OAAO,GAAE;QACvB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,IAAI,CAAC,EAAE,MAAM,CAAC;QACd,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,MAAM,CAAC,EAAE,MAAM,CAAC;KACZ,GAAG,OAAO,CAAC;QAAE,KAAK,EAAE,aAAa,EAAE,CAAC;QAAC,KAAK,EAAE,MAAM,CAAA;KAAE,CAAC;IAkFrD,UAAU,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,OAA
O,CAAC,aAAa,CAAC,GAAG,OAAO,CAAC,OAAO,CAAC;IAoC7E,UAAU,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,OAAO,CAAC;~~IAe5C~~,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,GAAE,aAAkB,GAAG,OAAO,CAAC,YAAY,EAAE,CAAC;~~YAoCnE~~,~~cAAc~~;~~IA0D5B~~,OAAO,CAAC,~~gBAAgB~~;~~YAiCV~~,~~aAAa~~;~~YAyCb~~,~~iBAAiB~~;~~CAiEhC~~"}
1	+ {"version":3,"file":"KnowledgeBaseService.d.ts","sourceRoot":"","sources":["../../../src/services/KnowledgeBaseService.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;AAIvD,eAAO,MAAM,eAAe,2BAA2B,CAAC;AACxD,eAAO,MAAM,oBAAoB,OAAO,CAAC;AAEzC,UAAU,mBAAmB;IAC3B,QAAQ,EAAE,cAAc,CAAC;IACzB,SAAS,CAAC,EAAE,MAAM,CAAC;CACpB;AAED,UAAU,aAAa;IACrB,EAAE,CAAC,EAAE,MAAM,CAAC;IACZ,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,MAAM,CAAC;IACd,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAC/B,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,UAAU,aAAa;IACrB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,UAAU,YAAY;IACpB,EAAE,EAAE,MAAM,CAAC;IACX,KAAK,EAAE,MAAM,CAAC;IACd,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;CAChC;AAeD,qBAAa,oBAAoB;IAC/B,OAAO,CAAC,QAAQ,CAAiB;IACjC,OAAO,CAAC,SAAS,CAAS;IAC1B,OAAO,CAAC,iBAAiB,CAAa;gBAE1B,MAAM,EAAE,mBAAmB;IAKjC,UAAU,CAAC,IAAI,EAAE;QACrB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,KAAK,EAAE,MAAM,CAAC;QACd,WAAW,CAAC,EAAE,MAAM,CAAC;QACrB,IAAI,EAAE,MAAM,CAAC;QACb,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;QAC/B,UAAU,CAAC,EAAE,MAAM,CAAC;KACrB,GAAG,OAAO,CAAC,MAAM,CAAC;IA8Db,OAAO,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,aAAa,GAAG,IAAI,CAAC;IAiDtD,SAAS,CAAC,OAAO,GAAE;QACvB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,IAAI,CAAC,EAAE,MAAM,CAAC;QACd,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,MAAM,CAAC,EAAE,MAAM,CAAC;KACZ,GAAG,OAAO,CAAC;QAAE,KAAK,EAAE,aAAa,EAAE,CAAC;QAAC,KAAK,EAAE,MAAM,CAAA;KAAE,CAAC;IAkFrD,UAAU,CAAC,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,OAAO,CAAC,aAAa,CAAC,GA
AG,OAAO,CAAC,OAAO,CAAC;IAoC7E,UAAU,CAAC,MAAM,EAAE,MAAM,GAAG,OAAO,CAAC,OAAO,CAAC;IAelD;;OAEG;IACG,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,GAAE,aAAkB,GAAG,OAAO,CAAC,YAAY,EAAE,CAAC;IAuCjF;;OAEG;YACW,kBAAkB;IAsBhC;;OAEG;YACW,mBAAmB;IA4FjC;;OAEG;IACH,OAAO,CAAC,mBAAmB;YAkDb,iBAAiB;YAkEjB,uBAAuB;IAoCrC,OAAO,CAAC,eAAe;CAmBxB"}

package/dist/src/services/KnowledgeBaseService.js CHANGED Viewed

@@ -3,10 +3,14 @@ var __importDefault = (this && this.__importDefault) || function (mod) {
     return (mod && mod.__esModule) ? mod : { "default": mod };
 };
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.KnowledgeBaseService = void 0;
+exports.KnowledgeBaseService = exports.EMBEDDING_DIMENSIONS = exports.EMBEDDING_MODEL = void 0;
 const logger_1 = __importDefault(require("../config/logger"));
+// Embedding model configuration
+exports.EMBEDDING_MODEL = 'text-embedding-3-large';
+exports.EMBEDDING_DIMENSIONS = 3072;
 class KnowledgeBaseService {
     constructor(config) {
+        this.adjacentChunkSize = 2; // Fetch ±2 chunks
         this.supabase = config.supabase;
         this.tableName = config.tableName || 'vezlo_knowledge_items';
     }
@@ -46,26 +50,19 @@ class KnowledgeBaseService {
                 created_at: new Date().toISOString(),
                 updated_at: new Date().toISOString()
             };
-            // Generate embedding for content-based items
-            if (item.content && (item.type === 'document' || item.type === 'file')) {
-                console.log('Attempting to generate embedding for content:', item.content.substring(0, 100) + '...');
-                const embedding = await this.generateEmbedding(item.content);
-                if (embedding) {
-                    console.log('Embedding generated successfully, length:', embedding.length);
-                    insertData.embedding = embedding;
-                    insertData.processed_at = new Date().toISOString();
-                }
-                else {
-                    console.log('Embedding generation returned null');
-                }
-            }
+            // Insert parent document (without embedding)
             const { data, error } = await this.supabase
                 .from(this.tableName)
                 .insert(insertData)
-                .select('uuid')
+                .select('id, uuid')
                 .single();
             if (error)
                 throw new Error(`Failed to create knowledge item: ${error.message}`);
+            // Create chunks with embeddings for content-based items
+            if (item.content && (item.type === 'document' || item.type === 'file')) {
+                console.log('Creating chunks for content...');
+                await this.createChunksForDocument(data.id, item.content, item.title);
+            }
             return data.uuid;
         }
         catch (error) {
@@ -246,150 +243,175 @@ class KnowledgeBaseService {
             throw new Error(`Failed to delete knowledge item: ${error instanceof Error ? error.message : 'Unknown error'}`);
         }
     }
+    /**
+     * Search with top-k + adjacent chunk retrieval strategy
+     */
     async search(query, options = {}) {
         try {
-            const limit = options.limit || 5;
-            // Balanced precision/recall (0.5 is industry standard)
-            const threshold = options.threshold || 0.5;
-            const type = options.type || 'semantic'; // Modern RAG best practice: semantic-first
-            // Reduced logging - only essential info
-            logger_1.default.info(`🔎 Search: type=${type}, threshold=${threshold}, limit=${limit}, companyId=${options.company_id ?? 'all'}`);
-            if (type === 'semantic') {
-                return await this.semanticSearch(query, limit, threshold, options.company_id);
-            }
-            else if (type === 'keyword') {
-                return await this.keywordSearch(query, limit, options.company_id);
-            }
-            else {
-                // Hybrid search - combine both approaches
-                const semanticResults = await this.semanticSearch(query, Math.ceil(limit / 2), threshold, options.company_id);
-                const keywordResults = await this.keywordSearch(query, Math.ceil(limit / 2), options.company_id);
-                // Merge and deduplicate results
-                const combined = [...semanticResults, ...keywordResults];
-                const unique = combined.filter((item, index, self) => index === self.findIndex(t => t.id === item.id));
-                logger_1.default.info(`📊 Hybrid: ${semanticResults.length} semantic + ${keywordResults.length} keyword = ${unique.length} total`);
-                return unique.slice(0, limit);
-            }
-        }
-        catch (error) {
-            console.error('Search error:', error);
-            throw new Error(`Failed to search knowledge items: ${error instanceof Error ? error.message : 'Unknown error'}`);
-        }
-    }
-    async semanticSearch(query, limit, threshold, companyId) {
-        try {
+            const topK = options.limit || 5;
+            const companyId = options.company_id;
+            logger_1.default.info(`🔎 Search: top-k=${topK}, adjacent=±${this.adjacentChunkSize}, companyId=${companyId ?? 'all'}`);
+            // Step 1: Generate query embedding
             const queryEmbedding = await this.generateEmbedding(query);
             if (!queryEmbedding) {
                 logger_1.default.error('Failed to generate query embedding');
                 return [];
             }
-            // Use optimized RPC function for vector search
-            // This uses pgvector's <=> operator directly in the database for efficient
-            // nearest-neighbor search, avoiding the need to fetch all records and calculate
-            // similarity in Node.js
-            const { data, error } = await this.supabase.rpc('match_vezlo_knowledge', {
-                query_embedding: queryEmbedding,
-                match_threshold: threshold,
-                match_count: limit,
-                filter_company_id: companyId !== undefined ? companyId : null
-            });
-            if (error) {
-                logger_1.default.error('RPC vector search error:', error);
-                throw new Error(`Semantic search failed: ${error.message}`);
-            }
-            if (!data || data.length === 0) {
-                logger_1.default.warn(`⚠️  No items found in DB for companyId=${companyId ?? 'all'}`);
+            // Step 2: Initial top-k semantic search (no threshold)
+            const initialChunks = await this.topKSemanticSearch(queryEmbedding, topK, companyId);
+            if (initialChunks.length === 0) {
+                logger_1.default.warn('⚠️  No chunks found in top-k search');
                 return [];
             }
-            logger_1.default.info(`📦 RPC returned ${data.length} items`);
-            // Transform RPC results to SearchResult format
-            const results = data.map((item) => ({
-                id: item.uuid,
-                title: item.title,
-                description: item.description,
-                content: item.content,
-                type: item.type,
-                score: item.similarity,
-                metadata: item.metadata
-            }));
-            // Log results summary
-            if (results.length > 0) {
-                const topResults = results.slice(0, 3);
-                const topScores = topResults.map(r => `${r.title}:${r.score.toFixed(2)}`).join(', ');
-                logger_1.default.info(`✅ Found ${results.length} results above threshold (top: ${topScores})`);
-            }
-            return results;
+            logger_1.default.info(`📦 Found ${initialChunks.length} initial chunks (scores: ${initialChunks.map(c => c.similarity.toFixed(2)).join(', ')})`);
+            // Step 3: Fetch adjacent chunks for each matched chunk
+            const enrichedChunks = await this.fetchAdjacentChunks(initialChunks);
+            logger_1.default.info(`📚 Enriched to ${enrichedChunks.length} total chunks (with adjacent context)`);
+            // Step 4: Group by document and merge continuous sequences
+            const mergedResults = this.mergeAdjacentChunks(enrichedChunks, initialChunks);
+            logger_1.default.info(`✅ Merged into ${mergedResults.length} contextual results`);
+            return mergedResults;
         }
         catch (error) {
-            logger_1.default.error('Semantic search error:', error);
+            logger_1.default.error('Search error:', error);
             return [];
         }
     }
-    // Add cosine similarity function (from original implementation)
-    cosineSimilarity(a, b) {
-        try {
-            // Validate inputs
-            if (!Array.isArray(a) || !Array.isArray(b)) {
-                console.error('Cosine similarity: inputs are not arrays', typeof a, typeof b);
-                return 0;
-            }
-            if (a.length !== b.length) {
-                console.error('Cosine similarity: arrays have different lengths', a.length, b.length);
-                return 0;
-            }
-            if (a.length === 0) {
-                console.error('Cosine similarity: arrays are empty');
-                return 0;
-            }
-            const dotProduct = a.reduce((sum, val, i) => sum + val * b[i], 0);
-            const magnitudeA = Math.sqrt(a.reduce((sum, val) => sum + val * val, 0));
-            const magnitudeB = Math.sqrt(b.reduce((sum, val) => sum + val * val, 0));
-            if (magnitudeA === 0 || magnitudeB === 0) {
-                return 0;
-            }
-            return dotProduct / (magnitudeA * magnitudeB);
-        }
-        catch (error) {
-            console.error('Error in cosine similarity calculation:', error);
-            return 0;
+    /**
+     * Ask the `vezlo_match_knowledge_chunks` RPC for up to `topK` chunks.
+     *
+     * The similarity threshold is fixed at 0.0, so the only cap applied here is
+     * the requested row count.
+     *
+     * @param queryEmbedding Embedding of the query; sent JSON-serialised.
+     * @param topK Value passed to the RPC as `match_count`.
+     * @param companyId Optional company filter; `undefined` is sent as `null`.
+     * @returns The rows returned by the RPC, or an empty array when it
+     *   returns no data.
+     * @throws Error when the RPC reports an error.
+     */
+    async topKSemanticSearch(queryEmbedding, topK, companyId) {
+        const response = await this.supabase.rpc('vezlo_match_knowledge_chunks', {
+            query_embedding: JSON.stringify(queryEmbedding),
+            match_threshold: 0.0, // No threshold - pure top-k
+            match_count: topK,
+            filter_company_id: companyId === undefined ? null : companyId
+        });
+        if (response.error) {
+            logger_1.default.error('RPC top-k search error:', response.error);
+            throw new Error(`Top-k search failed: ${response.error.message}`);
         }
+        return response.data || [];
     }
-    async keywordSearch(query, limit, companyId) {
-        try {
-            let dbQuery = this.supabase
-                .from(this.tableName)
-                .select(`
+    /**
+     * Fetch each matched chunk together with its neighbouring chunks, using a
+     * single query against `vezlo_knowledge_chunks`.
+     *
+     * For every matched chunk the window is
+     * `chunk_index - this.adjacentChunkSize` (clamped at 0) through
+     * `chunk_index + this.adjacentChunkSize`, within the same `document_id`.
+     *
+     * @param matchedChunks Rows carrying `document_id`, `chunk_index` and
+     *   `similarity`.
+     * @returns One entry per distinct chunk id. Chunks that were in
+     *   `matchedChunks` keep their similarity; neighbours get 0. An empty
+     *   input yields an empty array. When the query fails or returns no
+     *   rows, `matchedChunks` is returned unchanged.
+     */
+    async fetchAdjacentChunks(matchedChunks) {
+        if (matchedChunks.length === 0) {
+            return [];
+        }
+        // Build similarity lookup map for matched chunks,
+        // keyed by "<document_id>-<chunk_index>"
+        const similarityMap = new Map();
+        matchedChunks.forEach(chunk => {
+            similarityMap.set(`${chunk.document_id}-${chunk.chunk_index}`, chunk.similarity);
+        });
+        // Calculate all adjacent ranges and build OR conditions
+        const ranges = [];
+        matchedChunks.forEach(chunk => {
+            const minIndex = Math.max(0, chunk.chunk_index - this.adjacentChunkSize);
+            const maxIndex = chunk.chunk_index + this.adjacentChunkSize;
+            ranges.push({
+                documentId: chunk.document_id,
+                minIndex,
+                maxIndex
+            });
+        });
+        // Fetch ALL adjacent chunks in ONE query using OR conditions
+        let query = this.supabase
+            .from('vezlo_knowledge_chunks')
+            .select(`
+        id,
+        document_id,
+        chunk_text,
+        chunk_index,
+        vezlo_knowledge_items!inner(
           uuid,
           title,
           description,
-          content,
           type,
           metadata
-        `)
-                .textSearch('title,description,content', query, {
-                type: 'websearch',
-                config: 'english'
-            })
-                .limit(limit);
-            if (companyId) {
-                dbQuery = dbQuery.eq('company_id', companyId);
-            }
-            const { data, error } = await dbQuery;
-            if (error)
-                throw new Error(`Keyword search failed: ${error.message}`);
-            return data.map(item => ({
-                id: item.uuid,
-                title: item.title,
-                description: item.description,
-                content: item.content,
-                type: item.type,
-                score: 0.8, // Default score for keyword matches
-                metadata: item.metadata
-            }));
+        )
+      `);
+        // Build OR filter: (doc=1 AND idx>=10 AND idx<=14) OR (doc=2 AND idx>=5 AND idx<=9) OR ...
+        // NOTE(review): document ids are interpolated into the filter string as-is;
+        // presumably they are numeric keys - confirm.
+        const orConditions = ranges.map(r => `and(document_id.eq.${r.documentId},chunk_index.gte.${r.minIndex},chunk_index.lte.${r.maxIndex})`).join(',');
+        query = query.or(orConditions);
+        query = query.order('document_id', { ascending: true }).order('chunk_index', { ascending: true });
+        const { data, error } = await query;
+        if (error) {
+            logger_1.default.error('Failed to fetch adjacent chunks:', error);
+            // NOTE(review): the input rows are handed back untouched; confirm they
+            // have the same fields as the mapped rows built below.
+            return matchedChunks; // Fallback to original chunks on error
         }
-        catch (error) {
-            return [];
+        if (!data || data.length === 0) {
+            return matchedChunks;
         }
+        // Transform and assign similarity scores
+        const allChunks = data.map((row) => {
+            const doc = row.vezlo_knowledge_items;
+            const key = `${row.document_id}-${row.chunk_index}`;
+            const similarity = similarityMap.get(key) || 0; // Use original score if matched, else 0
+            return {
+                chunk_id: row.id,
+                document_id: row.document_id,
+                document_uuid: doc.uuid,
+                document_title: doc.title,
+                document_description: doc.description,
+                document_type: doc.type,
+                document_metadata: doc.metadata,
+                chunk_text: row.chunk_text,
+                chunk_index: row.chunk_index,
+                similarity
+            };
+        });
+        // Deduplicate by chunk_id (the first occurrence of each id is kept)
+        const uniqueChunks = new Map();
+        allChunks.forEach(chunk => {
+            if (!uniqueChunks.has(chunk.chunk_id)) {
+                uniqueChunks.set(chunk.chunk_id, chunk);
+            }
+        });
+        return Array.from(uniqueChunks.values());
+    }
+    /**
+     * Collapse chunks into one search result per document.
+     *
+     * Chunks are grouped by `document_id`, ordered by `chunk_index`, and their
+     * texts are joined with a blank line between them. Every chunk of a
+     * document lands in the same result, even when the indexes have gaps;
+     * `metadata.chunk_range` then reports only the first and last index.
+     *
+     * @param allChunks Chunks to merge (each with document fields, `chunk_text`
+     *   and `chunk_index`).
+     * @param originalMatches Chunks returned by the similarity search; the
+     *   highest `similarity` among a document's matches becomes its score.
+     * @returns One result per document, sorted by descending score. Documents
+     *   without any original match score 0.
+     */
+    mergeAdjacentChunks(allChunks, originalMatches) {
+        // Highest similarity per document. Taking the maximum instead of the
+        // first match found keeps the score correct even when originalMatches
+        // is not ordered by similarity, and avoids a scan per document.
+        const bestScoreByDocument = new Map();
+        for (const match of originalMatches) {
+            const similarity = match.similarity || 0;
+            const known = bestScoreByDocument.get(match.document_id);
+            if (known === undefined || similarity > known) {
+                bestScoreByDocument.set(match.document_id, similarity);
+            }
+        }
+        // Group chunks by document
+        const byDocument = new Map();
+        for (const chunk of allChunks) {
+            const group = byDocument.get(chunk.document_id);
+            if (group) {
+                group.push(chunk);
+            }
+            else {
+                byDocument.set(chunk.document_id, [chunk]);
+            }
+        }
+        const results = [];
+        for (const [documentId, chunks] of byDocument) {
+            // Restore reading order before concatenating the texts
+            chunks.sort((a, b) => a.chunk_index - b.chunk_index);
+            // Document-level fields are identical across a document's chunks,
+            // so the first chunk supplies them
+            const firstChunk = chunks[0];
+            const lastChunk = chunks[chunks.length - 1];
+            results.push({
+                id: firstChunk.document_uuid,
+                title: firstChunk.document_title,
+                description: firstChunk.document_description,
+                content: chunks.map(c => c.chunk_text).join('\n\n'),
+                type: firstChunk.document_type,
+                score: bestScoreByDocument.get(documentId) ?? 0,
+                metadata: {
+                    ...firstChunk.document_metadata,
+                    chunk_count: chunks.length,
+                    chunk_range: `${firstChunk.chunk_index}-${lastChunk.chunk_index}`
+                }
+            });
+        }
+        // Sort by score (highest first)
+        return results.sort((a, b) => b.score - a.score);
     }
     async generateEmbedding(text) {
         const maxRetries = 3;
@@ -411,7 +433,7 @@ class KnowledgeBaseService {
                         'Content-Type': 'application/json'
                     },
                     body: JSON.stringify({
-                        model: 'text-embedding-ada-002',
+                        model: exports.EMBEDDING_MODEL,
                         input: text.substring(0, 8000) // Limit text length to avoid token limits
                     }),
                     signal: controller.signal
@@ -442,6 +464,50 @@ class KnowledgeBaseService {
         }
         return null;
     }
+    /**
+     * Split a document into overlapping chunks, embed each one and store it
+     * through the `vezlo_insert_knowledge_chunk` RPC.
+     *
+     * Chunk size and overlap come from the `CHUNK_SIZE` and `CHUNK_OVERLAP`
+     * environment variables (defaults 1000 and 200 characters). Values that
+     * are missing, non-numeric or out of range fall back to the defaults, and
+     * the overlap is kept below the chunk size so splitting always advances.
+     *
+     * Chunks are processed one at a time. A chunk whose embedding could not be
+     * generated is skipped with a warning; its index is left unused.
+     *
+     * @param documentId Id of the owning document, passed as `p_document_id`.
+     * @param content Full document text to split.
+     * @param documentTitle Not used by this method; kept for caller compatibility.
+     * @throws Error when inserting a chunk fails.
+     */
+    async createChunksForDocument(documentId, content, documentTitle) {
+        const DEFAULT_CHUNK_SIZE = 1000;
+        const DEFAULT_CHUNK_OVERLAP = 200;
+        // Explicit radix; NaN fails both comparisons and falls back to the default
+        const requestedSize = Number.parseInt(process.env.CHUNK_SIZE || '', 10);
+        const chunkSize = requestedSize > 0 ? requestedSize : DEFAULT_CHUNK_SIZE;
+        const requestedOverlap = Number.parseInt(process.env.CHUNK_OVERLAP || '', 10);
+        // An overlap >= chunk size would stop the splitter from advancing
+        const chunkOverlap = Math.min(requestedOverlap >= 0 ? requestedOverlap : DEFAULT_CHUNK_OVERLAP, chunkSize - 1);
+        const chunks = this.splitIntoChunks(content, chunkSize, chunkOverlap);
+        // One timestamp shared by every chunk of this run
+        const processedAt = new Date().toISOString();
+        console.log(`Creating ${chunks.length} chunks for document...`);
+        for (const [index, chunk] of chunks.entries()) {
+            // Generate embedding from chunk text
+            const embedding = await this.generateEmbedding(chunk.text);
+            if (!embedding) {
+                // Previously dropped without a trace; make the gap visible
+                console.warn(`⚠️ Skipping chunk ${index}: no embedding was generated`);
+                continue;
+            }
+            const { data, error } = await this.supabase.rpc('vezlo_insert_knowledge_chunk', {
+                p_document_id: documentId,
+                p_chunk_text: chunk.text,
+                p_chunk_index: index,
+                p_start_char: chunk.startChar,
+                p_end_char: chunk.endChar,
+                // Rough estimate: about four characters per token
+                p_token_count: Math.ceil(chunk.text.length / 4),
+                p_embedding: JSON.stringify(embedding),
+                p_processed_at: processedAt
+            });
+            if (error) {
+                console.error(`❌ Failed to insert chunk ${index}:`, error);
+                throw new Error(`Failed to insert chunk: ${error.message}`);
+            }
+            console.log(`✓ Inserted chunk ${index} (ID: ${data})`);
+        }
+    }
+    /**
+     * Cut `text` into character windows of `chunkSize` that overlap by `overlap`.
+     *
+     * Each window starts `chunkSize - overlap` characters after the previous
+     * one. The overlap is clamped to the range 0..chunkSize-1 so the start
+     * position always moves forward; without that, an overlap at or above the
+     * chunk size made the loop run forever.
+     *
+     * NOTE(review): with a non-zero overlap the final window can lie entirely
+     * inside the previous one. That behaviour is unchanged here.
+     *
+     * @param text Text to split; empty or missing text yields no chunks.
+     * @param chunkSize Window length in characters; must be a finite number >= 1.
+     * @param overlap Characters shared between consecutive windows.
+     * @returns Array of `{ text, startChar, endChar }`, `endChar` exclusive.
+     * @throws RangeError when `chunkSize` is not a finite number >= 1.
+     */
+    splitIntoChunks(text, chunkSize, overlap) {
+        if (!Number.isFinite(chunkSize) || chunkSize < 1) {
+            throw new RangeError(`chunkSize must be a positive number, got ${chunkSize}`);
+        }
+        const chunks = [];
+        if (!text) {
+            return chunks;
+        }
+        const safeOverlap = Number.isFinite(overlap)
+            ? Math.min(Math.max(overlap, 0), chunkSize - 1)
+            : 0;
+        // Always >= 1 because safeOverlap <= chunkSize - 1
+        const step = chunkSize - safeOverlap;
+        for (let startChar = 0; startChar < text.length; startChar += step) {
+            const endChar = Math.min(startChar + chunkSize, text.length);
+            chunks.push({
+                text: text.substring(startChar, endChar),
+                startChar,
+                endChar
+            });
+        }
+        return chunks;
+    }
 }
 exports.KnowledgeBaseService = KnowledgeBaseService;
 //# sourceMappingURL=KnowledgeBaseService.js.map