npm - @byte5ai/palaia - Version diff - 2.0.4 → 2.0.5 - Mend

@byte5ai/palaia 2.0.4 → 2.0.5

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/package.json +1 -1
package/src/hooks.ts +96 -88

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@byte5ai/palaia",
-  "version": "2.0.4",
+  "version": "2.0.5",
   "description": "Palaia memory backend for OpenClaw",
   "main": "index.ts",
   "openclaw": {

package/src/hooks.ts CHANGED Viewed

@@ -137,6 +137,16 @@ const lastInboundMessageByChannel = new Map<string, { messageId: string; provide
 /** Channels that support emoji reactions. */
 const REACTION_SUPPORTED_PROVIDERS = new Set(["slack", "discord"]);
+// ============================================================================
+// Logger (Issue: api.logger integration)
+// ============================================================================
+/** Module-level logger — defaults to console, replaced by api.logger in registerHooks. */
+let logger: { info: (...args: any[]) => void; warn: (...args: any[]) => void } = {
+  info: (...args: any[]) => console.log(...args),
+  warn: (...args: any[]) => console.warn(...args),
+};
 // ============================================================================
 // Scope Validation (Issue #90)
 // ============================================================================
@@ -350,7 +360,7 @@ async function sendSlackReaction(
 ): Promise<void> {
   const token = await resolveSlackBotToken();
   if (!token) {
-    console.warn("[palaia] Cannot send Slack reaction: no bot token found");
+    logger.warn("[palaia] Cannot send Slack reaction: no bot token found");
     return;
   }
@@ -375,11 +385,11 @@ async function sendSlackReaction(
     });
     const data = await response.json() as { ok: boolean; error?: string };
     if (!data.ok && data.error !== "already_reacted") {
-      console.warn(`[palaia] Slack reaction failed: ${data.error} (${normalizedEmoji} on ${channelId})`);
+      logger.warn(`[palaia] Slack reaction failed: ${data.error} (${normalizedEmoji} on ${channelId})`);
     }
   } catch (err) {
     if ((err as Error).name !== "AbortError") {
-      console.warn(`[palaia] Slack reaction error (${normalizedEmoji}): ${err}`);
+      logger.warn(`[palaia] Slack reaction error (${normalizedEmoji}): ${err}`);
     }
   } finally {
     clearTimeout(timeout);
@@ -792,7 +802,7 @@ export function resolveCaptureModel(
     if (parts.length >= 2) {
       if (!_captureModelFallbackWarned) {
         _captureModelFallbackWarned = true;
-        console.warn(`[palaia] No captureModel configured — using primary model. Set captureModel in plugin config for cost savings.`);
+        logger.warn(`[palaia] No captureModel configured — using primary model. Set captureModel in plugin config for cost savings.`);
       }
       return { provider: parts[0], model: parts.slice(1).join("/") };
     }
@@ -825,21 +835,27 @@ function collectText(payloads: Array<{ text?: string; isError?: boolean }> | und
  * then hard-cap at maxChars from the end (newest messages kept).
  */
 export function trimToRecentExchanges(
-  texts: Array<{ role: string; text: string }>,
+  texts: Array<{ role: string; text: string; provenance?: string }>,
   maxPairs = 5,
   maxChars = 10_000,
-): Array<{ role: string; text: string }> {
+): Array<{ role: string; text: string; provenance?: string }> {
   // Filter to only user + assistant messages (skip tool, toolResult, system, etc.)
   const exchanges = texts.filter((t) => t.role === "user" || t.role === "assistant");
   // Keep the last N pairs (a pair = one user + one assistant message)
+  // Only count external_user messages as real user turns.
+  // System-injected user messages (inter_session, internal_system) don't count as conversation turns.
   // Walk backwards, count pairs
   let pairCount = 0;
   let lastRole = "";
   let cutIndex = 0; // default: keep everything
   for (let i = exchanges.length - 1; i >= 0; i--) {
-    // Count a new pair when we see a user message after having seen an assistant
-    if (exchanges[i].role === "user" && lastRole === "assistant") {
+    const isRealUser = exchanges[i].role === "user" && (
+      exchanges[i].provenance === "external_user" ||
+      !exchanges[i].provenance // backward compat: no provenance = treat as real user
+    );
+    // Count a new pair when we see a real user message after having seen an assistant
+    if (isRealUser && lastRole === "assistant") {
       pairCount++;
       if (pairCount > maxPairs) {
         cutIndex = i + 1; // keep from next message onwards
@@ -1087,8 +1103,8 @@ export function extractSignificance(
   return { tags, type: primaryType, summary };
 }
-export function extractMessageTexts(messages: unknown[]): Array<{ role: string; text: string }> {
-  const result: Array<{ role: string; text: string }> = [];
+export function extractMessageTexts(messages: unknown[]): Array<{ role: string; text: string; provenance?: string }> {
+  const result: Array<{ role: string; text: string; provenance?: string }> = [];
   for (const msg of messages) {
     if (!msg || typeof msg !== "object") continue;
@@ -1096,8 +1112,12 @@ export function extractMessageTexts(messages: unknown[]): Array<{ role: string;
     const role = m.role;
     if (!role || typeof role !== "string") continue;
+    // Extract provenance kind (string or object with .kind)
+    const rawProvenance = (m as any).provenance?.kind ?? (m as any).provenance;
+    const provenance = typeof rawProvenance === "string" ? rawProvenance : undefined;
     if (typeof m.content === "string" && m.content.trim()) {
-      result.push({ role, text: m.content.trim() });
+      result.push({ role, text: m.content.trim(), provenance });
       continue;
     }
@@ -1110,7 +1130,7 @@ export function extractMessageTexts(messages: unknown[]): Array<{ role: string;
           typeof block.text === "string" &&
           block.text.trim()
         ) {
-          result.push({ role, text: block.text.trim() });
+          result.push({ role, text: block.text.trim(), provenance });
         }
       }
     }
@@ -1121,6 +1141,12 @@ export function extractMessageTexts(messages: unknown[]): Array<{ role: string;
 export function getLastUserMessage(messages: unknown[]): string | null {
   const texts = extractMessageTexts(messages);
+  // Prefer external_user provenance (real human input)
+  for (let i = texts.length - 1; i >= 0; i--) {
+    if (texts[i].role === "user" && texts[i].provenance === "external_user")
+      return texts[i].text;
+  }
+  // Fallback: any user message (backward compat for OpenClaw without provenance)
   for (let i = texts.length - 1; i >= 0; i--) {
     if (texts[i].role === "user") return texts[i].text;
   }
@@ -1128,80 +1154,44 @@ export function getLastUserMessage(messages: unknown[]): string | null {
 }
 // ============================================================================
-// Recall Query Builder (Issue #65 upgrade: robust user message extraction)
+// Recall Query Builder (provenance-based, Issue #65 upgrade)
 // ============================================================================
-/** Day-of-week prefixes used as system markers in messages. */
-const DAY_PREFIXES = ["[Mon ", "[Tue ", "[Wed ", "[Thu ", "[Fri ", "[Sat ", "[Sun "];
 /**
- * Clean a raw message string by removing system markers, JSON blocks,
- * and other noise that degrades semantic search quality.
- */
-export function cleanMessageForQuery(text: string): string {
-  let cleaned = text;
-  // Remove JSON code blocks (```json ... ```)
-  cleaned = cleaned.replace(/```json[\s\S]*?```/gi, "");
-  // Remove lines starting with system markers
-  cleaned = cleaned
-    .split("\n")
-    .filter((line) => {
-      const trimmed = line.trimStart();
-      if (trimmed.startsWith("System:")) return false;
-      if (trimmed.startsWith("[Queued")) return false;
-      if (trimmed.startsWith("[Inter-session")) return false;
-      for (const prefix of DAY_PREFIXES) {
-        if (trimmed.startsWith(prefix)) return false;
-      }
-      return true;
-    })
-    .join("\n")
-    .trim();
-  return cleaned;
-}
-/**
- * Build a recall query from message history.
+ * Build a recall query from message history using provenance to identify real user input.
  *
- * - Always uses actual user messages (ignores event.prompt which may be stale/synthetic).
- * - If the last user message is short (< 30 chars), prepends the previous user message
- *   for better semantic context ("Ja", "OK", "Status" alone are poor queries).
- * - Strips system markers, JSON blocks, and other noise.
+ * - Prefers external_user messages (real human input from Slack/Telegram).
+ * - Falls back to any user message for backward compat (OpenClaw without provenance).
+ * - If the last user message is short (< 30 chars), prepends the previous for context.
  * - Hard-caps at 500 characters.
  *
- * Returns empty string if nothing usable remains.
+ * Provenance makes the old heuristic cleaners (DAY_PREFIXES, system marker stripping) obsolete.
  */
 export function buildRecallQuery(messages: unknown[]): string {
   const texts = extractMessageTexts(messages);
-  const userMessages: string[] = [];
-  for (let i = texts.length - 1; i >= 0 && userMessages.length < 2; i--) {
-    if (texts[i].role === "user") {
-      const cleaned = cleanMessageForQuery(texts[i].text);
-      if (cleaned) userMessages.unshift(cleaned);
-    }
-  }
-  if (userMessages.length === 0) return "";
+  // Prefer external_user messages (real human input)
+  const externalUserMsgs = texts.filter(
+    t => t.role === "user" && t.provenance === "external_user"
+  );
+  // Fallback: any user message (backward compat for OpenClaw without provenance)
+  const userMsgs = externalUserMsgs.length > 0
+    ? externalUserMsgs
+    : texts.filter(t => t.role === "user");
-  const lastMsg = userMessages[userMessages.length - 1];
+  if (userMsgs.length === 0) return "";
-  // If the last user message is very short, include previous for context
-  let query: string;
-  if (lastMsg.length < 30 && userMessages.length > 1) {
-    query = `${userMessages[userMessages.length - 2]} ${lastMsg}`;
-  } else {
-    query = lastMsg;
-  }
+  const lastMsg = userMsgs[userMsgs.length - 1].text.trim();
-  // Hard cap at 500 characters
-  if (query.length > 500) {
-    query = query.slice(0, 500);
+  // Short messages: include previous for context
+  if (lastMsg.length < 30 && userMsgs.length > 1) {
+    const prevMsg = userMsgs[userMsgs.length - 2].text.trim();
+    const combined = `${prevMsg} ${lastMsg}`.slice(0, 500);
+    return combined;
   }
-  return query.trim();
+  return lastMsg.slice(0, 500);
 }
 // ============================================================================
@@ -1304,22 +1294,27 @@ export function resetTurnState(): void {
  * Register lifecycle hooks on the plugin API.
  */
 export function registerHooks(api: any, config: PalaiaPluginConfig): void {
+  // Store api.logger for module-wide use (integrates into OpenClaw log system)
+  if (api.logger && typeof api.logger.info === "function") {
+    logger = api.logger;
+  }
   const opts = buildRunnerOpts(config);
-  // ── Startup checks (H-2, H-3) ─────────────────────────────────
+  // ── Startup checks (H-2, H-3, captureModel validation) ────────
   (async () => {
     // H-2: Warn if no agent is configured
     if (!process.env.PALAIA_AGENT) {
       try {
         const statusOut = await run(["config", "get", "agent"], { ...opts, timeoutMs: 3000 });
         if (!statusOut.trim()) {
-          console.warn(
+          logger.warn(
             "[palaia] No agent configured. Set PALAIA_AGENT env var or run 'palaia init --agent <name>'. " +
             "Auto-captured entries will have no agent attribution."
           );
         }
       } catch {
-        console.warn(
+        logger.warn(
           "[palaia] No agent configured. Set PALAIA_AGENT env var or run 'palaia init --agent <name>'. " +
           "Auto-captured entries will have no agent attribution."
         );
@@ -1346,7 +1341,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
           || status.config?.embedding_provider
         );
         if (!hasSemanticProvider && !hasProviderConfig) {
-          console.warn(
+          logger.warn(
             "[palaia] No embedding provider configured. Semantic search is inactive (BM25 keyword-only). " +
             "Run 'pip install palaia[fastembed]' and 'palaia doctor --fix' for better recall quality."
           );
@@ -1356,6 +1351,19 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
     } catch {
       // Non-fatal — status check failed, skip warning (avoid false positive)
     }
+    // Validate captureModel auth at plugin startup via modelAuth API
+    if (config.captureModel && api.runtime?.modelAuth) {
+      try {
+        const resolved = resolveCaptureModel(api.config, config.captureModel);
+        if (resolved?.provider) {
+          const key = await api.runtime.modelAuth.resolveApiKeyForProvider({ provider: resolved.provider, cfg: api.config });
+          if (!key) {
+            logger.warn(`[palaia] captureModel provider "${resolved.provider}" has no API key — auto-capture LLM extraction will fail`);
+          }
+        }
+      } catch { /* non-fatal */ }
+    }
   })();
   // ── /palaia status command ─────────────────────────────────────
@@ -1445,7 +1453,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
                 entries = result.results;
               }
             } catch (queryError) {
-              console.warn(`[palaia] Query recall failed, falling back to list: ${queryError}`);
+              logger.warn(`[palaia] Query recall failed, falling back to list: ${queryError}`);
             }
           }
         }
@@ -1556,7 +1564,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
             : undefined,
         };
       } catch (error) {
-        console.warn(`[palaia] Memory injection failed: ${error}`);
+        logger.warn(`[palaia] Memory injection failed: ${error}`);
       }
     });
   }
@@ -1669,7 +1677,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
                   (p) => p.name.toLowerCase() === validatedProject!.toLowerCase(),
                 );
                 if (!isKnown) {
-                  console.log(`[palaia] Auto-capture: unknown project "${validatedProject}" ignored`);
+                  logger.info(`[palaia] Auto-capture: unknown project "${validatedProject}" ignored`);
                   validatedProject = null;
                 }
               }
@@ -1686,7 +1694,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
                 effectiveScope,
               );
               await run(args, { ...opts, timeoutMs: 10_000 });
-              console.log(
+              logger.info(
                 `[palaia] LLM auto-captured: type=${r.type}, significance=${r.significance}, tags=${tags.join(",")}, project=${validatedProject || "none"}, scope=${effectiveScope || "team"}`
               );
             }
@@ -1711,7 +1719,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
             // captureModel is broken — try primary model as fallback
             if (!_captureModelFailoverWarned) {
               _captureModelFailoverWarned = true;
-              console.warn(`[palaia] WARNING: captureModel failed (${errStr}). Using primary model as fallback. Please update captureModel in your config.`);
+              logger.warn(`[palaia] WARNING: captureModel failed (${errStr}). Using primary model as fallback. Please update captureModel in your config.`);
             }
             try {
               // Retry without captureModel → resolveCaptureModel will use primary model
@@ -1722,13 +1730,13 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
               llmHandled = true;
             } catch (fallbackError) {
               if (!_llmImportFailureLogged) {
-                console.warn(`[palaia] LLM extraction failed (primary model fallback also failed): ${fallbackError}`);
+                logger.warn(`[palaia] LLM extraction failed (primary model fallback also failed): ${fallbackError}`);
                 _llmImportFailureLogged = true;
               }
             }
           } else {
             if (!_llmImportFailureLogged) {
-              console.warn(`[palaia] LLM extraction failed, using rule-based fallback: ${llmError}`);
+              logger.warn(`[palaia] LLM extraction failed, using rule-based fallback: ${llmError}`);
               _llmImportFailureLogged = true;
             }
           }
@@ -1770,7 +1778,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
           );
           await run(args, { ...opts, timeoutMs: 10_000 });
-          console.log(
+          logger.info(
             `[palaia] Rule-based auto-captured: type=${captureData.type}, tags=${captureData.tags.join(",")}`
           );
         }
@@ -1782,7 +1790,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
         } else {
         }
       } catch (error) {
-        console.warn(`[palaia] Auto-capture failed: ${error}`);
+        logger.warn(`[palaia] Auto-capture failed: ${error}`);
       }
       // ── Emoji Reactions (Issue #87) ──────────────────────────
@@ -1814,7 +1822,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
             }
           }
         } catch (reactionError) {
-          console.warn(`[palaia] Reaction sending failed: ${reactionError}`);
+          logger.warn(`[palaia] Reaction sending failed: ${reactionError}`);
         } finally {
           // Always clean up turn state
           deleteTurnState(sessionKey);
@@ -1844,7 +1852,7 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
           }
         }
       } catch (err) {
-        console.warn(`[palaia] Recall reaction failed: ${err}`);
+        logger.warn(`[palaia] Recall reaction failed: ${err}`);
       } finally {
         deleteTurnState(sessionKey);
       }
@@ -1857,10 +1865,10 @@ export function registerHooks(api: any, config: PalaiaPluginConfig): void {
     start: async () => {
       const result = await recover(opts);
       if (result.replayed > 0) {
-        console.log(`[palaia] WAL recovery: replayed ${result.replayed} entries`);
+        logger.info(`[palaia] WAL recovery: replayed ${result.replayed} entries`);
       }
       if (result.errors > 0) {
-        console.warn(`[palaia] WAL recovery completed with ${result.errors} error(s)`);
+        logger.warn(`[palaia] WAL recovery completed with ${result.errors} error(s)`);
       }
     },
   });