npm - @mingxy/cerebro - Versions diffs - 1.11.15 → 1.12.1 - Mend

@mingxy/cerebro 1.11.15 → 1.12.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@mingxy/cerebro",
-  "version": "1.11.15",
+  "version": "1.12.1",
   "description": "Cerebro persistent memory plugin for OpenCode — auto-recall, auto-capture, 9 memory tools with clustering",
   "type": "module",
   "main": "src/index.ts",

package/schema.json CHANGED Viewed

@@ -96,6 +96,61 @@
           "default": 10,
           "minimum": 1,
           "maximum": 50
+        },
+        "fetchMultiplier": {
+          "type": "number",
+          "description": "Search breadth multiplier: fetch_limit = max_results * N",
+          "default": 3,
+          "minimum": 1,
+          "maximum": 10
+        },
+        "topkCapMultiplier": {
+          "type": "number",
+          "description": "Candidate cap multiplier: topk_cap = max_results * N",
+          "default": 2,
+          "minimum": 1,
+          "maximum": 10
+        },
+        "mmrJaccardThreshold": {
+          "type": "number",
+          "description": "Jaccard similarity threshold for MMR diversity penalty",
+          "default": 0.85,
+          "minimum": 0.0,
+          "maximum": 1.0
+        },
+        "mmrPenaltyFactor": {
+          "type": "number",
+          "description": "Score penalty factor for similar memories in MMR diversity",
+          "default": 0.5,
+          "minimum": 0.0,
+          "maximum": 1.0
+        },
+        "phase2Multiplier": {
+          "type": "number",
+          "description": "Phase2 global fallback search multiplier",
+          "default": 2,
+          "minimum": 1,
+          "maximum": 10
+        },
+        "llmMaxEval": {
+          "type": "number",
+          "description": "Maximum candidates sent to LLM for relevance evaluation",
+          "default": 15,
+          "minimum": 1,
+          "maximum": 50
+        },
+        "refineStrategy": {
+          "type": "string",
+          "description": "LLM refinement strategy: strict (high only), balanced (high+medium), loose (keep all)",
+          "enum": ["strict", "balanced", "loose"],
+          "default": "balanced"
+        },
+        "refineMediumChars": {
+          "type": "number",
+          "description": "Character limit for medium-relevance content truncation",
+          "default": 200,
+          "minimum": 50,
+          "maximum": 2000
         }
       },
       "additionalProperties": false

package/src/client.ts CHANGED Viewed

@@ -55,6 +55,14 @@ export interface ClusteredRecallResult {
   standalone_memories: MemoryDto[];
 }
+export interface DiscardedItem {
+  memory_id: string;
+  content: string;
+  score: number;
+  refine_relevance?: string;
+  refine_reasoning?: string;
+}
 export interface ShouldRecallResponse {
   should_recall: boolean;
   query?: string;
@@ -62,8 +70,8 @@ export interface ShouldRecallResponse {
   similarity_score?: number;
   confidence?: number;
   memories?: SearchResult[];
+  discarded?: DiscardedItem[];
   clustered?: ClusteredRecallResult;
-  event_id?: string;
 }
 export interface MemoryRelation {
@@ -332,6 +340,16 @@ export class CerebroClient {
     max_results?: number,
     project_tags?: string[],
     conversation_context?: string[],
+    recall_overrides?: {
+      fetch_multiplier?: number;
+      topk_cap_multiplier?: number;
+      mmr_jaccard_threshold?: number;
+      mmr_penalty_factor?: number;
+      phase2_multiplier?: number;
+      llm_max_eval?: number;
+      refine_strategy?: string;
+      refine_medium_chars?: number;
+    },
   ): Promise<ShouldRecallResponse | null> {
     const res = await this.post<ShouldRecallResponse>("/v1/should-recall", {
       query_text,
@@ -341,6 +359,7 @@ export class CerebroClient {
       max_results,
       project_tags,
       conversation_context,
+      ...recall_overrides,
     }, 20_000);
     return res;
   }
@@ -348,15 +367,42 @@ export class CerebroClient {
   async updateProfileInjected(
     event_id: string,
     profile_injected: boolean,
+    profile_content?: string,
   ): Promise<unknown | null> {
+    const body: Record<string, unknown> = { profile_injected };
+    if (profile_content !== undefined) {
+      body.profile_content = profile_content;
+    }
     const res = await this.patch(
       `/v1/recall-events/${event_id}/profile-injected`,
-      { profile_injected },
+      body,
       10_000,
     );
     return res;
   }
+  async createRecallEvent(params: {
+    session_id: string;
+    recall_type?: string;
+    query_text: string;
+    max_score: number;
+    llm_confidence: number;
+    profile_injected: boolean;
+    kept_count: number;
+    discarded_count: number;
+    injected_count: number;
+    profile_content?: string;
+    items?: Array<{
+      memory_id: string;
+      score: number;
+      refine_relevance?: string;
+      refine_reasoning?: string;
+      is_kept: boolean;
+    }>;
+  }): Promise<{ ok: boolean; event_id?: string } | null> {
+    return this.post("/v1/recall-events", params, 10_000);
+  }
   async sessionIngest(
     messages: Array<{ role: string; content: string }>,
     sessionId?: string,

package/src/config.ts CHANGED Viewed

@@ -22,6 +22,14 @@ export interface OmemPluginConfig {
   recall: {
     similarityThreshold: number;
     maxRecallResults: number;
+    fetchMultiplier: number;
+    topkCapMultiplier: number;
+    mmrJaccardThreshold: number;
+    mmrPenaltyFactor: number;
+    phase2Multiplier: number;
+    llmMaxEval: number;
+    refineStrategy: "strict" | "balanced" | "loose";
+    refineMediumChars: number;
   };
   logging: {
     logEnabled: boolean;
@@ -55,6 +63,14 @@ const DEFAULTS: OmemPluginConfig = {
   recall: {
     similarityThreshold: 0.4,
     maxRecallResults: 10,
+    fetchMultiplier: 3,
+    topkCapMultiplier: 2,
+    mmrJaccardThreshold: 0.85,
+    mmrPenaltyFactor: 0.5,
+    phase2Multiplier: 2,
+    llmMaxEval: 15,
+    refineStrategy: "balanced",
+    refineMediumChars: 200,
   },
   logging: {
     logEnabled: true,
@@ -111,6 +127,14 @@ function migrateFlatToNested(flat: FlatConfig): OmemPluginConfig {
     recall: {
       similarityThreshold: flat.similarityThreshold ?? DEFAULTS.recall.similarityThreshold,
       maxRecallResults: flat.maxRecallResults ?? DEFAULTS.recall.maxRecallResults,
+      fetchMultiplier: DEFAULTS.recall.fetchMultiplier,
+      topkCapMultiplier: DEFAULTS.recall.topkCapMultiplier,
+      mmrJaccardThreshold: DEFAULTS.recall.mmrJaccardThreshold,
+      mmrPenaltyFactor: DEFAULTS.recall.mmrPenaltyFactor,
+      phase2Multiplier: DEFAULTS.recall.phase2Multiplier,
+      llmMaxEval: DEFAULTS.recall.llmMaxEval,
+      refineStrategy: DEFAULTS.recall.refineStrategy,
+      refineMediumChars: DEFAULTS.recall.refineMediumChars,
     },
     logging: {
       logEnabled: flat.logEnabled ?? DEFAULTS.logging.logEnabled,

package/src/hooks.ts CHANGED Viewed

@@ -299,6 +299,14 @@ function buildClusteredContextBlock(clustered: import("./client.js").ClusteredRe
 export function autoRecallHook(client: CerebroClient, containerTags: string[], tui: any, config: Partial<OmemPluginConfig> = {}, getAgentName?: () => string) {
   const similarityThreshold = config.recall?.similarityThreshold ?? 0.4;
   const maxRecallResults = config.recall?.maxRecallResults ?? 10;
+  const fetchMultiplier = config.recall?.fetchMultiplier ?? 3;
+  const topkCapMultiplier = config.recall?.topkCapMultiplier ?? 2;
+  const mmrJaccardThreshold = config.recall?.mmrJaccardThreshold ?? 0.85;
+  const mmrPenaltyFactor = config.recall?.mmrPenaltyFactor ?? 0.5;
+  const phase2Multiplier = config.recall?.phase2Multiplier ?? 2;
+  const llmMaxEval = config.recall?.llmMaxEval ?? 15;
+  const refineStrategy = config.recall?.refineStrategy ?? "balanced";
+  const refineMediumChars = config.recall?.refineMediumChars ?? 200;
   const maxContentLength = Math.max(MIN_CONTENT_LENGTH, config.content?.maxContentLength ?? 500);
   const maxContentChars = Math.max(MIN_CONTENT_CHARS, config.content?.maxContentChars ?? 30000);
   const toastDelayMs = config.ui?.toastDelayMs ?? 7000;
@@ -315,7 +323,7 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
     if (policy === "none") return;
     try {
-      logDebug("autoRecallHook start", { sessionId: input.sessionID, agentId, policy });
+      logDebug("autoRecallHook start", { sessionId: input.sessionID, agentId, policy, similarityThreshold, maxRecallResults, fetchMultiplier, topkCapMultiplier, mmrJaccardThreshold, mmrPenaltyFactor, phase2Multiplier, llmMaxEval, refineStrategy, refineMediumChars });
       const messages = sessionMessages.get(input.sessionID) ?? [];
       const userMessages = messages.filter((m) => m.role === "user");
@@ -348,26 +356,36 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
         similarityThreshold, maxRecallResults,
         projectTags.length > 0 ? projectTags : undefined,
         conversationContext && conversationContext.length > 0 ? conversationContext : undefined,
+        {
+          fetch_multiplier: fetchMultiplier,
+          topk_cap_multiplier: topkCapMultiplier,
+          mmr_jaccard_threshold: mmrJaccardThreshold,
+          mmr_penalty_factor: mmrPenaltyFactor,
+          phase2_multiplier: phase2Multiplier,
+          llm_max_eval: llmMaxEval,
+          refine_strategy: refineStrategy,
+          refine_medium_chars: refineMediumChars,
+        },
       );
       if (!shouldRecallRes) {
         showToast(tui, "🧠 Cerebro Service Unavailable", "Unable to reach memory API · check connection", "error", toastDelayMs);
         return;
       }
-      logDebug("autoRecallHook shouldRecall result", { shouldRecall: shouldRecallRes.should_recall, confidence: shouldRecallRes.confidence, memCount: shouldRecallRes.memories?.length ?? 0, clustered: !!shouldRecallRes.clustered });
+      logDebug("autoRecallHook shouldRecall result", { shouldRecall: shouldRecallRes.should_recall, confidence: shouldRecallRes.confidence, memCount: shouldRecallRes.memories?.length ?? 0, discardedCount: shouldRecallRes.discarded?.length ?? 0, clustered: !!shouldRecallRes.clustered });
       const profile = await client.getProfile();
       let profileInjected = false;
       let profileCountText = "";
       let profileBlock = "";
       const lastInjected = profileInjectedSessions.get(input.sessionID);
-      const ttlExpired = !lastInjected || (Date.now() - lastInjected > 5 * 60 * 1000);
+      const ttlExpired = !lastInjected || (Date.now() - lastInjected > 30 * 60 * 1000);
       const isFirstInjection = !lastInjected;
       if (profile && ttlExpired) {
         const prefs = ((profile as any)?.static_facts ?? [])
           .filter((sf: any) => {
             const t: string[] = sf.tags ?? [];
-            return t.includes("preferences") || t.includes("preference_extract") || t.some((tag: string) => tag.includes("偏好"));
+            return t.includes("preferences");
           })
           .map((sf: any) => sf.l2_content ?? sf.content ?? "")
           .filter(Boolean);
@@ -398,10 +416,56 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
         }
       }
-      if (!shouldRecallRes.should_recall) {
-        if (profileInjected && shouldRecallRes?.event_id) {
-          await client.updateProfileInjected(shouldRecallRes.event_id, true).catch(() => {});
+      const storedMemoryIds = shouldRecallRes.memories?.map((r) => r.memory.id) ?? [];
+      const storedDiscardedIds = shouldRecallRes.discarded?.map((d) => d.memory_id) ?? [];
+      const maxScore = storedMemoryIds.length > 0
+        ? Math.max(...(shouldRecallRes.memories?.map((r) => r.score) ?? [0]))
+        : 0;
+      const createEventAndReturn = async (
+        injectedCount: number,
+        keptCount: number,
+        discardedCount: number,
+      ): Promise<string | undefined> => {
+        try {
+          const items = [
+            ...(shouldRecallRes.memories?.map((r) => ({
+              memory_id: r.memory.id,
+              score: r.score,
+              refine_relevance: r.refine_relevance,
+              refine_reasoning: r.refine_reasoning,
+              is_kept: true,
+            })) ?? []),
+            ...(shouldRecallRes.discarded?.map((d) => ({
+              memory_id: d.memory_id,
+              score: d.score,
+              refine_relevance: d.refine_relevance,
+              refine_reasoning: d.refine_reasoning,
+              is_kept: false,
+            })) ?? []),
+          ];
+          const result = await client.createRecallEvent({
+            session_id: input.sessionID!,
+            recall_type: "auto",
+            query_text,
+            max_score: maxScore,
+            llm_confidence: shouldRecallRes.confidence ?? 0,
+            profile_injected: profileInjected,
+            kept_count: keptCount,
+            discarded_count: discardedCount,
+            injected_count: injectedCount,
+            profile_content: profileInjected && profileBlock ? profileBlock : undefined,
+            items: items.length > 0 ? items : undefined,
+          });
+          return result?.event_id;
+        } catch (e) {
+          logErr("autoRecallHook createRecallEvent failed", { error: String(e) });
+          return undefined;
         }
+      };
+      if (!shouldRecallRes.should_recall) {
+        await createEventAndReturn(0, 0, storedDiscardedIds.length);
         if (profileInjected && isFirstInjection) {
           showToast(tui, "👨 Profile Injected", `${profileCountText} · no memory recall needed`, "success", toastDelayMs);
         }
@@ -415,9 +479,7 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
       const newResults = results.filter((r) => !existingIds.has(r.memory.id));
       logDebug("autoRecallHook dedup", { totalResults: results.length, existingCount: existingIds.size, newCount: newResults.length });
       if (newResults.length === 0) {
-        if (profileInjected && shouldRecallRes?.event_id) {
-          await client.updateProfileInjected(shouldRecallRes.event_id, true).catch(() => {});
-        }
+        await createEventAndReturn(0, storedMemoryIds.length, storedDiscardedIds.length);
         if (profileInjected && isFirstInjection) {
           showToast(tui, "👨 Profile Injected", `${profileCountText} · all memories already injected`, "success", toastDelayMs);
         }
@@ -453,9 +515,7 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
       injectedMemoryIds.set(input.sessionID, new Set([...existingIds, ...newIds]));
       logDebug("autoRecallHook injection complete", { newIds: newIds.length, clustered: !!clustered });
-      if (profileInjected && shouldRecallRes?.event_id) {
-        await client.updateProfileInjected(shouldRecallRes.event_id, true).catch(() => {});
-      }
+      await createEventAndReturn(newResults.length, storedMemoryIds.length, storedDiscardedIds.length);
       const memDynamic = newResults.filter((r) => r.memory.memory_type === "fact" || r.memory.memory_type === "event").length;
       const memStatic = newResults.filter((r) => r.memory.memory_type === "pinned" || r.memory.memory_type === "preference").length;

package/src/tools.ts CHANGED Viewed

@@ -52,17 +52,17 @@ export function buildTools(client: CerebroClient, containerTags: string[], conte
           "Do NOT overuse 'private' for normal work notes — default 'global' is correct for most cases."
           ),
         category: tool.schema
-          .string()
+          .enum(["cases", "preferences", "entities", "events", "profile", "patterns"])
           .optional()
           .describe(
-            "MUST be one of (choose the BEST fit): " +
-          "'cases' (default) = work records, bug fixes, architecture decisions, implementation notes, meeting conclusions; " +
-          "'preferences' = user likes/dislikes, coding style preferences, tool choices (e.g. 'prefers Vim over VSCode'); " +
-          "'entities' = projects, tools, people, concepts — defining what something IS (e.g. 'omem-server: Rust memory backend using LanceDB'); " +
+            "Memory category. MUST be one of these exact values (lowercase): " +
+          "'cases' (default) = work records, bug fixes, architecture decisions; " +
+          "'preferences' = user likes/dislikes, coding style, tool choices; " +
+          "'entities' = projects, tools, people, concepts; " +
           "'events' = time-bound milestones (deployments, releases, incidents); " +
           "'profile' = user identity traits (role, skills, team membership); " +
-          "'patterns' = workflows, methodologies, best practices, recurring solutions. " +
-          "When in doubt, use 'cases'."
+          "'patterns' = workflows, methodologies, best practices. " +
+          "When in doubt, omit this field (defaults to 'cases')."
           ),
       },
       async execute(args) {