npm - @mingxy/cerebro - Versions diffs - 1.10.8 → 1.10.10 - Mend

@mingxy/cerebro 1.10.8 → 1.10.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

package/INJECTION_FLOW.md ADDED Viewed

@@ -0,0 +1,434 @@
+# Cerebro Plugin 记忆注入全流程
+> 版本: v1.10.8 | 文件: `plugins/opencode/src/`
+---
+## 一、全局状态（模块级变量）
+```
+┌─────────────────────────────────────────────────────────────┐
+│  hooks.ts 模块级状态（所有hook共享）                          │
+├─────────────────────────────────────────────────────────────┤
+│  keywordDetectedSessions: Set<sessionID>                    │
+│    → 标记检测到记忆关键词的session（注入时追加KEYWORD_NUDGE） │
+│                                                             │
+│  injectedMemoryIds: Map<sessionID, Set<memoryID>>           │
+│    → 增量去重：跟踪每个session已注入的记忆ID                  │
+│                                                             │
+│  firstMessages: Map<sessionID, string>                      │
+│    → 记录每个session的第一条用户消息                          │
+│                                                             │
+│  sessionMessages: Map<sessionID, {role,content}[]>          │
+│    → 消息累积缓冲区（keywordDetection写入，compacting消费）  │
+│                                                             │
+│  profileInjectedSessions: Set<sessionID>                    │
+│    → 每session只注入一次Profile                              │
+│                                                             │
+│  processedMessageIds: Set<msgID>                            │
+│    → sessionIdleHook防止重复处理已消费的消息                  │
+│                                                             │
+│  pluginStartTime: number                                    │
+│    → 插件启动时间戳，跳过启动前的历史消息                     │
+└─────────────────────────────────────────────────────────────┘
+```
+---
+## 二、四条Hook链路总览
+```
+用户消息 → OpenCode SDK → 触发Hook链
+                                    │
+        ┌───────────────────────────┼─────────────────────────────┐
+        ▼                           ▼                             ▼
+ chat.message            chat.system.transform              session.idle
+ (每条消息)              (每次LLM调用前)                    (session空闲)
+        │                           │                             │
+        ▼                           ▼                             ▼
+ keywordDetectionHook       autoRecallHook                sessionIdleHook
+        │                           │                             │
+        │                           │                             │
+        │                      ┌────┘                             │
+        ▼                      ▼                                  │
+ session.compacting                                              │
+ (session压缩时)                                                 │
+        │                                                        │
+        ▼                                                        │
+   compactingHook ───────────────────────────────────────────────┘
+```
+---
+## 三、Hook ①: keywordDetectionHook — 消息收集
+**触发时机**: `chat.message`（每条用户消息）
+**作用**: 收集用户消息到内存缓冲区 + 检测记忆关键词
+```
+用户消息到达
+    │
+    ▼
+[1] 提取文本内容（text parts拼接）
+    │
+    ▼
+[2] 记录第一条消息 → firstMessages[sessionID] = text
+    │
+    ▼
+[3] 关键词检测: detectKeyword(text)
+    │                    │
+    ├─ 命中 ────────→ keywordDetectedSessions.add(sessionID)
+    │                  （autoRecallHook注入时会追加KEYWORD_NUDGE）
+    │
+    ▼
+[4] Policy检查: resolveAgentPolicy(agentId, config)
+    │
+    ├─ "none" ──→ return（不收集消息）
+    │
+    ▼
+[5] 消息入缓冲: sessionMessages[sessionID].push({role:"user", content:text})
+    │
+    ▼
+[6] 消息数 ≥ threshold?
+    │
+    └─ 是 → 标记"待处理"（等session.idle时消费）
+```
+**关键点**:
+- `policy="none"` 时不收集，`readonly`/`readwrite` 都收集
+- 消息存在内存Map中，等 `compactingHook` 或 `sessionIdleHook` 消费
+---
+## 四、Hook ②: autoRecallHook — 记忆召回+注入（核心）
+**触发时机**: `experimental.chat.system.transform`（每次LLM调用前，transform system prompt时）
+**作用**: 召回相关记忆 + 注入到system prompt
+```
+LLM调用前触发
+    │
+    ▼
+[1] Policy检查: resolveAgentPolicy(agentId, config)
+    │
+    ├─ "none" ──→ return（不召回）
+    │
+    ▼
+[2] 提取查询: 最后一条用户消息 → extractUserRequest() → query_text
+    │
+    ▼
+[3] 调用 shouldRecall API ──────────────────────→ POST /v1/should-recall
+    │  参数: query_text, last_query_text, session_id,         │
+    │        similarity_threshold(0.4),                        │
+    │        max_results(10), project_tags                     │
+    │  超时: 20秒                                              │
+    │                                              │
+    │ ◄────────────────────────────────────────────┘
+    │ 返回: ShouldRecallResponse
+    │   { should_recall, confidence, memories[], clustered? }
+    │
+    ▼
+[4] API不可达? ──→ Toast "Service Unavailable" → return
+    │
+    ▼
+[5] 注入Profile（每session仅一次）
+    │
+    ├─ GET /v1/profile → profile数据
+    │
+    ├─ profileInjectedSessions.has(sessionID)?
+    │   ├─ 否 → output.system.push("<cerebro-profile>...")
+    │   │        profileInjectedSessions.add(sessionID)
+    │   │        profileInjected = true
+    │   └─ 是 → 跳过
+    │
+    ▼
+[6] should_recall === false?
+    │
+    ├─ 是 ──→ 仅Profile注入?
+    │         ├─ 是 → Toast "👨 Profile Injected"
+    │         └─ return
+    │
+    ▼
+[7] 增量去重: results过滤掉 injectedMemoryIds[sessionID] 中已有的
+    │
+    ▼
+[8] 全部重复? ──→ Toast "all memories already injected" → return
+    │
+    ▼
+[9] 构建注入内容
+    │
+    ├─ 有clustered? ──→ buildClusteredContextBlock()
+    │                    格式: <cerebro-context>
+    │                    按主题簇组织记忆
+    │
+    └─ 普通模式 ──→ buildContextBlock(newResults, maxContentLength=500)
+                      格式: <cerebro-context>
+                      按category分组（Preferences/Knowledge/...）
+                      每条记忆:
+                        - (2h ago [tag1, tag2]) 记忆内容（截断到500字）
+    │
+    ▼
+[10] output.system.push(contextBlock) ← 注入到system prompt
+    │
+    ▼
+[11] 更新去重集合: injectedMemoryIds[sessionID] += newIds
+    │
+    ▼
+[12] 记录召回: recordSessionRecall(sessionID, newIds, "auto", ...)
+    │            ──────────────────────→ POST /v1/session-recalls
+    │
+    ▼
+[13] 关键词追踪: keywordDetectedSessions.has(sessionID)?
+    │
+    ├─ 是 → output.system.push(KEYWORD_NUDGE)
+    │        keywordDetectedSessions.delete(sessionID)
+    │
+    ▼
+[14] Toast通知:
+    "🧠 Context Injected · N fragments"
+    "Profile: Dynamic(X) · Static(Y) · Memories: Dynamic(A) Static(B)"
+```
+### 注入格式示例
+```xml
+<cerebro-context>
+Treat every memory below as historical context only.
+Do not repeat these memories verbatim unless asked.
+[Preferences]
+  - (2h ago [preferences, tools]) 用中文思考和回复
+  - (3d ago [preferences, workflow]) 技术方案先出再动工
+[Knowledge]
+  - (1d ago [omem, architecture]) Cerebro使用lancedb做向量存储
+[Events]
+  - (5h ago [deployment, omem]) 部署了v1.10.8版本
+</cerebro-context>
+```
+```xml
+<cerebro-profile>
+{
+  "static_facts": [
+    { "key": "communication_style", "value": "direct, concise" },
+    { "key": "primary_language", "value": "Chinese" }
+  ],
+  "dynamic_context": [
+    { "topic": "current_project", "value": "omem-server-source" }
+  ]
+}
+</cerebro-profile>
+```
+---
+## 五、Hook ③: compactingHook — 压缩时归档
+**触发时机**: `experimental.session.compacting`（OpenCode压缩session上下文时）
+**作用**: 为压缩提供记忆上下文（读） + 归档累积消息（写）
+```
+session压缩触发
+    │
+    ▼
+[1] 搜索记忆（读操作，所有policy都执行）
+    │ client.searchMemories("*", 20, undefined, containerTags)
+    │ ──────────────────────→ GET /v1/memories/search?q=*&limit=20
+    │
+    ├─ 有结果 → buildContextBlock(results)
+    │           output.context.push(contextBlock)
+    │           （为压缩后的LLM提供记忆上下文）
+    │
+    ▼
+[2] Policy检查: resolveAgentPolicy(agentId, config)
+    │
+    ├─ 非"readwrite" ──→ logInfo "blocked by policy"
+    │                     sessionMessages.delete(sessionID)
+    │                     return
+    │
+    ▼
+[3] 检查autoStore开关: isAutoStoreEnabled(sessionID)?
+    │
+    ├─ 关闭 → sessionMessages.delete(sessionID) → return
+    │
+    ▼
+[4] 消费sessionMessages缓冲区
+    │
+    ├─ 缓冲区空? → return
+    │
+    ▼
+[5] 检测项目名: detectProjectName(rootPath)
+    │ AGENTS.md → package.json → Cargo.toml → go.mod → pyproject.toml
+    │
+    ▼
+[6] 归档消息（写入记忆）
+    │ client.ingestMessages(messages, {mode, tags, sessionId, projectName})
+    │ ──────────────────────→ POST /v1/memories
+    │                        body: { messages: [...], mode: "smart", tags, session_id, project_name }
+    │                        每条消息内容先 sanitizeContent(text, maxContentChars=3000)
+    │                        → 去XML标签 → 压缩空白 → 超长截断
+    │
+    ▼
+[7] 清理缓冲区: sessionMessages.delete(sessionID)
+    │
+    ▼
+[8] Toast: "📦 Session Archived · N dialogues archived"
+```
+---
+## 六、Hook ④: sessionIdleHook — 空闲时归档
+**触发时机**: `session.idle`（session空闲10秒后）
+**作用**: 从SDK获取完整对话历史并归档
+```
+session空闲事件
+    │
+    ▼
+[1] event.type === "session.idle"? ── 否 → return
+    │
+    ▼
+[2] 提取sessionID
+    │
+    ▼
+[3] isAutoStoreEnabled(sessionID)? ── 关闭 → return
+    │
+    ▼
+[4] 非主session? (sessionID !== getMainSessionId()) ── return
+    │
+    ▼
+[5] 延迟10秒执行（防抖）
+    │
+    ▼
+[6] 从SDK获取session消息: sdkClient.session.messages({id: sessionID})
+    │
+    ▼
+[7] 过滤消息:
+    │   ├─ 跳过 processedMessageIds 中已处理的
+    │   ├─ 跳过 pluginStartTime 之前的（防历史重放）
+    │   ├─ 只保留 user/assistant 角色
+    │   └─ 提取text parts
+    │
+    ▼
+[8] 消息数 < threshold? ── return
+    │
+    ▼
+[9] Policy检查: resolveAgentPolicy(agentId, config)
+    │
+    ├─ 非"readwrite" ──→ logInfo "blocked by policy" → return
+    │
+    ▼
+[10] 检测项目名: detectProjectName(rootPath)
+     │
+     ▼
+[11] sessionIngest（写入记忆）
+     │ client.sessionIngest(messages, sessionID, agentId, title, projectName)
+     │ ──────────────────────→ POST /v1/memories/session-ingest
+     │                        body: { messages, session_id, agent_id, session_title, project_name }
+     │                        超时60秒
+     │
+     ▼
+[12] 标记已处理: processedMessageIds += newMessageIds
+     │
+     ▼
+[13] Toast: "🧠 Memory Sealed · N dialogues captured"
+```
+---
+## 七、数据流全景图
+```
+                        ┌─────────────────────────────────┐
+                        │          用户消息输入             │
+                        └──────────┬──────────────────────┘
+                                   │
+                    ┌──────────────┼──────────────────┐
+                    ▼              ▼                  ▼
+            keywordDetection   autoRecall           session.idle
+            (chat.message)    (chat.system         (空闲10s)
+                               .transform)
+                    │              │                  │
+                    │         ┌────┘                  │
+                    ▼         ▼                       │
+            sessionMessages  System Prompt            │
+            (内存缓冲)      注入区                     │
+                    │         ▲                       │
+                    │         │                       │
+                    ▼         │                       ▼
+              compacting ─────┘                  sessionIdleHook
+              (session压缩)                         │
+                    │                               │
+                    ▼                               ▼
+            ┌───────────────────────────────────────────────┐
+            │              Cerebro REST API                  │
+            │                                              │
+            │  读: POST /v1/should-recall    (召回决策)     │
+            │  读: GET  /v1/profile          (用户画像)     │
+            │  读: GET  /v1/memories/search  (记忆搜索)     │
+            │  写: POST /v1/memories         (消息归档)     │
+            │  写: POST /v1/memories/session-ingest (session归档) │
+            │  写: POST /v1/session-recalls  (召回记录)     │
+            │                                              │
+            └──────────────────┬───────────────────────────┘
+                               │
+                               ▼
+                    ┌─────────────────────┐
+                    │   LanceDB 向量存储   │
+                    │   (omem-server)     │
+                    └─────────────────────┘
+```
+---
+## 八、Policy门控规则
+| Hook | "none" | "readonly" | "readwrite" |
+|------|--------|------------|-------------|
+| keywordDetection | ❌ 不收集消息 | ✅ 收集消息 | ✅ 收集消息 |
+| autoRecall | ❌ 不召回 | ✅ 召回+注入 | ✅ 召回+注入 |
+| compacting | ✅ 搜索（读） | ✅ 搜索（读） | ✅ 搜索+写入 |
+| sessionIdle | ❌ 不写入 | ❌ 不写入 | ✅ 写入 |
+---
+## 九、关键配置参数
+| 参数 | 位置 | 默认值 | 作用 |
+|------|------|--------|------|
+| `content.maxContentLength` | config.ts L49 | 500 | **读取侧**截断：每条注入记忆最大字符数 |
+| `content.maxContentChars` | config.ts L48 | 30000→3000 | **写入侧**截断：归档时单条消息最大字符数 |
+| `content.maxQueryLength` | config.ts L47 | 200 | 召回查询最大字符数 |
+| `recall.similarityThreshold` | config.ts L56 | 0.4 | 召回相似度阈值 |
+| `recall.maxRecallResults` | config.ts L57 | 10 | 最大召回结果数 |
+| `ingest.autoCaptureThreshold` | config.ts L51 | 5 | 消息累积到N条才触发归档 |
+| `ui.toastDelayMs` | config.ts L65 | 7000 | Toast显示时长(ms) |
+| `agentMemoryPolicy` | config.ts L34 | - | 各agent的读写权限 |
+| `defaultPolicy` | config.ts L35 | "readwrite" | 未配置agent的默认权限 |
+---
+## 十、写入侧 vs 读取侧截断对比
+```
+                        写入路径                          读取路径
+                    (归档到服务端)                    (注入到system prompt)
+消息内容          sanitizeContent()                 truncate()
+                  client.ts L4-10                   hooks.ts L147-150
+处理流程          去XML标签 → 压缩空白 → 截断       直接截断
+配置参数          maxContentChars (3000)            maxContentLength (500)
+截断标记          "…[truncated]"                    "…"
+触发点            createMemory() L182               buildContextBlock() L178
+                  ingestMessages() L238
+调用方            compactingHook                    autoRecallHook
+                  sessionIdleHook
+```

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@mingxy/cerebro",
-  "version": "1.10.8",
+  "version": "1.10.10",
   "description": "Cerebro persistent memory plugin for OpenCode — auto-recall, auto-capture, 9 memory tools with clustering",
   "type": "module",
   "main": "src/index.ts",

package/src/config.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { readFileSync } from "node:fs";
+import { readFileSync, appendFileSync, mkdirSync } from "node:fs";
 import { homedir } from "node:os";
 import { join } from "node:path";
@@ -144,6 +144,25 @@ function deepMerge(base: OmemPluginConfig, overrides: Partial<OmemPluginConfig>)
 // ── Load config ──────────────────────────────────────────────────────
+/**
+ * File-only logger for config.ts (cannot import logger.ts due to circular dependency).
+ *
+ * Appends a single line to `<home>/.config/cerebro/logs/plugin.log`, creating the
+ * log directory first if it does not exist. Every entry is written with a fixed
+ * `WARN` level and a `service=cerebro` marker, followed by the message and any
+ * extra fields rendered as space-separated `key=value` pairs.
+ *
+ * This function is best-effort: any error raised while formatting or writing is
+ * caught and reported on stderr instead of being propagated to the caller.
+ *
+ * @param message Human-readable text placed after the `service=cerebro` marker.
+ * @param fields Optional extra data; string values are written verbatim, all
+ *   other values are serialized with `JSON.stringify`.
+ */
+function configLog(message: string, fields?: Record<string, unknown>): void {
+  try {
+    const logDir = join(homedir(), ".config", "cerebro", "logs");
+    const logPath = join(logDir, "plugin.log");
+    const ts = new Date().toISOString().replace("T", " ").replace(/\.\d+Z$/, ""); // UTC ISO timestamp reshaped to "YYYY-MM-DD HH:MM:SS" (fractional seconds and "Z" dropped)
+    const parts = [`WARN  ${ts} service=cerebro ${message}`];
+    if (fields) {
+      for (const [k, v] of Object.entries(fields)) {
+        parts.push(`${k}=${typeof v === "string" ? v : JSON.stringify(v)}`); // strings stay unquoted; everything else is JSON-encoded
+      }
+    }
+    mkdirSync(logDir, { recursive: true }); // recursive: creates missing parents and does not fail when the directory already exists
+    appendFileSync(logPath, parts.join(" ") + "\n");
+  } catch (writeErr) {
+    process.stderr.write(`[cerebro] configLog write failed: ${writeErr instanceof Error ? writeErr.message : String(writeErr)}\n`); // fall back to stderr so a logging failure is still visible
+  }
+}
 export function loadPluginConfig(overrides?: Partial<OmemPluginConfig>): OmemPluginConfig {
   let config: OmemPluginConfig = structuredClone(DEFAULTS);
@@ -157,8 +176,8 @@ export function loadPluginConfig(overrides?: Partial<OmemPluginConfig>): OmemPlu
     // Merge nested groups with defaults for safety
     config = deepMerge(config, parsed);
-  } catch {
-    // Config file doesn't exist or is invalid, use defaults
+  } catch (e) {
+    configLog("config.json load failed, using defaults", { error: String(e) });
   }
   // Apply environment variable overrides (flat OMEM_* → nested paths)
@@ -201,7 +220,20 @@ export function resolveAgentPolicy(
   agentName: string,
   config: Partial<OmemPluginConfig>,
 ): AgentPolicy {
-  return config.agentMemoryPolicy?.[agentName] ?? config.defaultPolicy ?? "readwrite";
+  const policies = config.agentMemoryPolicy;
+  if (policies) {
+    const exact = policies[agentName];
+    if (exact) return exact;
+    const lower = agentName.toLowerCase();
+    for (const [key, policy] of Object.entries(policies)) {
+      if (lower.startsWith(key.toLowerCase()) || key.toLowerCase().startsWith(lower)) {
+        return policy;
+      }
+    }
+  }
+  if (config.defaultPolicy) return config.defaultPolicy;
+  configLog("resolveAgentPolicy: no policy configured, defaulting to readwrite", { agentName });
+  return "readwrite";
 }
 export { DEFAULTS };

package/src/hooks.ts CHANGED Viewed

@@ -5,6 +5,11 @@ import { detectKeyword, KEYWORD_NUDGE } from "./keywords.js";
 import { logDebug, logInfo, logError as logErr } from "./logger.js";
 import { readFile } from "node:fs/promises";
+const BOUNDARY_SEARCH_RATIO = 0.6;
+const MIN_ITEM_CONTENT_CHARS = 100;
+const MIN_CONTENT_CHARS = 1000;
+const MIN_CONTENT_LENGTH = 50;
 const projectNameCache = new Map<string, string>();
 async function detectProjectName(rootPath: string): Promise<string | undefined> {
@@ -144,9 +149,25 @@ function formatRelativeAge(isoDate: string): string {
   return `${months}mo ago`;
 }
-function truncate(text: string, max: number): string {
-  if (text.length <= max) return text;
-  return text.slice(0, max) + "…";
+function truncate(text: string, maxLength: number): string { // Shortens `text` to at most `maxLength` UTF-16 code units plus a trailing "…", preferring to cut at a sentence boundary.
+  if (text.length <= maxLength) return text; // Already fits: returned unchanged, with no ellipsis.
+  // Sentence boundary characters: period, exclamation, question (Latin + CJK)
+  // Also treat newline as a boundary
+  const boundaries = /[.!?。！？\n]/;
+  // Search backwards from maxLength for a boundary, going no further back than BOUNDARY_SEARCH_RATIO of the limit so that a boundary cut never discards more than the tail portion of the allowed text
+  const searchEnd = Math.min(maxLength, text.length); // text.length > maxLength at this point, so this evaluates to maxLength
+  for (let i = searchEnd - 1; i >= Math.floor(searchEnd * BOUNDARY_SEARCH_RATIO); i--) {
+    if (boundaries.test(text[i])) {
+      return text.slice(0, i + 1).trimEnd() + "…"; // keep the boundary character, strip trailing whitespace (including a newline boundary), then mark the cut
+    }
+  }
+  let truncated = text.slice(0, maxLength); // no boundary found in the search window: fall back to a hard cut
+  const lastCode = truncated.charCodeAt(truncated.length - 1);
+  if (lastCode >= 0xD800 && lastCode <= 0xDBFF) truncated = truncated.slice(0, -1); // the cut landed on a high surrogate: drop it rather than emit half of a surrogate pair
+  return truncated + "…";
 }
 function categorize(results: SearchResult[]): Map<string, SearchResult[]> {
@@ -230,9 +251,10 @@ function buildClusteredContextBlock(clustered: import("./client.js").ClusteredRe
 }
 export function autoRecallHook(client: CerebroClient, containerTags: string[], tui: any, config: Partial<OmemPluginConfig> = {}) {
-  const similarityThreshold = config.recall?.similarityThreshold ?? 0.6;
+  const similarityThreshold = config.recall?.similarityThreshold ?? 0.4;
   const maxRecallResults = config.recall?.maxRecallResults ?? 10;
-  const maxContentLength = config.content?.maxContentLength ?? 500;
+  const maxContentLength = Math.max(MIN_CONTENT_LENGTH, config.content?.maxContentLength ?? 500);
+  const maxContentChars = Math.max(MIN_CONTENT_CHARS, config.content?.maxContentChars ?? 30000);
   const toastDelayMs = config.ui?.toastDelayMs ?? 7000;
   return async (
@@ -266,10 +288,11 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
       const profile = await client.getProfile();
       let profileInjected = false;
       let profileCountText = "";
+      let profileBlock = "";
       if (profile && !profileInjectedSessions.has(input.sessionID)) {
-        const profileBlock = [
+        profileBlock = [
           "<cerebro-profile>",
-          JSON.stringify(profile, null, 2),
+          JSON.stringify(profile),
           "</cerebro-profile>",
         ].join("\n");
         output.system.push(profileBlock);
@@ -302,9 +325,26 @@ export function autoRecallHook(client: CerebroClient, containerTags: string[], t
         return;
       }
+      // --- Token Budget Calculation ---
+      const profileChars = profileInjected ? profileBlock.length : 0;
+      const budgetRemaining = maxContentChars - profileChars;
+      if (budgetRemaining < 0) {
+        logDebug("autoRecallHook budget overflow", { profileChars, maxContentChars, deficit: -budgetRemaining });
+      }
+      const itemCount = clustered
+        ? (clustered.cluster_summaries.length + clustered.standalone_memories.length)
+        : newResults.length;
+      const dynamicMaxContentLength = itemCount > 0
+        ? Math.min(maxContentLength, Math.max(MIN_ITEM_CONTENT_CHARS, Math.floor(budgetRemaining / itemCount)))
+        : maxContentLength;
+      logDebug("autoRecallHook budget", {
+        maxContentChars, profileChars, budgetRemaining, itemCount,
+        configuredMax: maxContentLength, dynamicMax: dynamicMaxContentLength
+      });
       const block = clustered
-        ? buildClusteredContextBlock(clustered, maxContentLength)
-        : buildContextBlock(newResults, maxContentLength);
+        ? buildClusteredContextBlock(clustered, dynamicMaxContentLength)
+        : buildContextBlock(newResults, dynamicMaxContentLength);
       if (block) {
         output.system.push(block);
       }
@@ -442,6 +482,15 @@ export function compactingHook(client: CerebroClient, containerTags: string[], t
     } catch {
     }
+    // Main session gate: sub-agents must not write memories via compacting
+    if (getMainSessionId) {
+      const mainId = getMainSessionId();
+      if (mainId && input.sessionID && input.sessionID !== mainId) {
+        logInfo("compactingHook: non-main session skipped", { sessionID: input.sessionID, mainSessionId: mainId });
+        return;
+      }
+    }
     // Policy gate: only readwrite agents can write memories
     const policy = resolveAgentPolicy(effectiveAgentId, config);
     if (policy !== "readwrite") {
@@ -475,12 +524,13 @@ export function compactingHook(client: CerebroClient, containerTags: string[], t
           }
           try {
-            logInfo("compactingHook ingestMessages called", { msgCount: messages.length, sessionId: effectiveSessionId });
+            logInfo("compactingHook ingestMessages called", { msgCount: messages.length, sessionId: effectiveSessionId, agentId: effectiveAgentId });
             const result = await client.ingestMessages(messages, {
               mode: ingestMode,
               tags: [...containerTags, "auto-capture"],
               sessionId: effectiveSessionId,
               projectName: projectName,
+              agentId: effectiveAgentId,
             });
             logInfo("compactingHook ingestMessages result", { result: result === null ? "null(blocked)" : "ok" });
             if (result === null) {
@@ -513,6 +563,7 @@ export function sessionIdleHook(
   isAutoStoreEnabled?: (sessionId: string | undefined) => boolean,
   agentId?: string,
   config: Partial<OmemPluginConfig> = {},
+  onAgentResolved?: (name: string) => void,
 ) {
   let idleTimeout: ReturnType<typeof setTimeout> | null = null;
   let isCapturing = false;
@@ -520,6 +571,8 @@ export function sessionIdleHook(
   return async (input: { event: { type: string; properties?: any } }) => {
     if (input.event.type !== "session.idle") return;
+    logDebug("sessionIdleHook event.properties dump", { keys: Object.keys(input.event.properties || {}), raw: JSON.stringify(input.event.properties).substring(0, 2000) });
     const sessionID = input.event.properties?.sessionID;
     if (!sessionID) return;
@@ -527,7 +580,10 @@ export function sessionIdleHook(
     if (getMainSessionId) {
       const mainId = getMainSessionId();
-      if (mainId && sessionID !== mainId) return;
+      if (mainId && sessionID !== mainId) {
+        logInfo("sessionIdleHook: non-main session skipped", { sessionID, mainSessionId: mainId });
+        return;
+      }
     }
     if (idleTimeout) clearTimeout(idleTimeout);
@@ -549,8 +605,6 @@ export function sessionIdleHook(
           const msgId = msg.info?.id;
           if (!msgId || processedMessageIds.has(msgId)) continue;
-          // Skip messages created before this plugin instance started
-          // (prevents replaying entire session history on restart)
           const msgTime = msg.info?.createdAt ? new Date(msg.info.createdAt).getTime() : 0;
           if (msgTime > 0 && msgTime < pluginStartTime) continue;
@@ -574,18 +628,15 @@ export function sessionIdleHook(
           return;
         }
-        // Policy gate: only readwrite agents can write memories
-        const policy = resolveAgentPolicy(agentId || "", config);
-        if (policy !== "readwrite") {
-          logInfo("sessionIdleHook blocked by policy", { agentId: agentId || "", policy });
-          return;
-        }
         let sessionTitle: string | undefined;
         let projectName: string | undefined;
+        let effectiveAgentId = agentId || "opencode";
         try {
           const sessionInfo = await sdkClient.session.get({ path: { id: sessionID } });
-          logDebug("sessionIdleHook project.rootPath", { rootPath: sessionInfo?.data?.directory });
+          if ((sessionInfo?.data as any)?.agent) {
+            effectiveAgentId = (sessionInfo.data as any).agent;
+            onAgentResolved?.(effectiveAgentId);
+          }
           sessionTitle = sessionInfo?.data?.title;
           projectName = sessionInfo?.data?.directory
             ? await detectProjectName(sessionInfo.data.directory)
@@ -594,9 +645,17 @@ export function sessionIdleHook(
           logErr("sessionIdleHook detectProjectName failed", { error: String(e) });
         }
+        logDebug("sessionIdleHook resolved agentId", { effectiveAgentId, fallbackAgentId: agentId });
+        const policy = resolveAgentPolicy(effectiveAgentId, config);
+        if (policy !== "readwrite") {
+          logInfo("sessionIdleHook blocked by policy", { agentId: effectiveAgentId, policy, defaultPolicy: String(config.defaultPolicy ?? "undefined") });
+          return;
+        }
         try {
-          logInfo("sessionIdleHook sessionIngest called", { msgCount: conversationMessages.length, sessionId: sessionID, title: String(sessionTitle) });
-          await cerebroClient.sessionIngest(conversationMessages, sessionID, agentId, sessionTitle, projectName);
+          logInfo("sessionIdleHook sessionIngest called", { msgCount: conversationMessages.length, sessionId: sessionID, agentId: effectiveAgentId, title: String(sessionTitle) });
+          await cerebroClient.sessionIngest(conversationMessages, sessionID, effectiveAgentId, sessionTitle, projectName);
           logInfo("sessionIdleHook sessionIngest ok");
           for (const id of newMessageIds) {
             processedMessageIds.add(id);

package/src/index.ts CHANGED Viewed

@@ -7,7 +7,7 @@ import { CerebroClient } from "./client.js";
 import { autoRecallHook, compactingHook, keywordDetectionHook, sessionIdleHook } from "./hooks.js";
 import { getUserTag, getProjectTag } from "./tags.js";
 import { buildTools } from "./tools.js";
-import { logInfo, logError } from "./logger.js";
+import { logInfo, logDebug, logError } from "./logger.js";
 import { loadPluginConfig } from "./config.js";
 const __filename = fileURLToPath(import.meta.url);
@@ -115,7 +115,9 @@ const OmemPlugin: Plugin = async (input) => {
   const containerTags = [getUserTag(email), getProjectTag(cwd)];
   const agentId = process.env.OMEM_AGENT_ID || "opencode";
-  let currentSessionId: string | undefined;
+  let mainSessionId: string | undefined;
+  let mainSessionLocked = false;
+  let cachedAgentName: string | undefined;
   const recallHook = autoRecallHook(cerebroClient, containerTags, tui, config);
@@ -128,13 +130,18 @@ const OmemPlugin: Plugin = async (input) => {
       };
     },
     "experimental.chat.system.transform": async (input: any, output: any) => {
-      if (input.sessionID) currentSessionId = input.sessionID;
+      logDebug("transform input", { sessionID: input.sessionID });
+      if (input.sessionID && !mainSessionLocked) {
+        mainSessionId = input.sessionID;
+        mainSessionLocked = true;
+        logInfo("mainSessionId locked", { sessionId: input.sessionID });
+      }
       return recallHook(input, output);
     },
     "chat.message": keywordDetectionHook(cerebroClient, containerTags, config.ingest.autoCaptureThreshold, tui, config.ingest.ingestMode, config, agentId),
-    "experimental.session.compacting": compactingHook(cerebroClient, containerTags, tui, config.ingest.ingestMode, isAutoStoreEnabled, () => currentSessionId, client, config, agentId),
-    tool: buildTools(cerebroClient, containerTags, { agentId, getSessionId: () => currentSessionId }),
-    event: sessionIdleHook(cerebroClient, containerTags, tui, client, config.ingest.ingestMode, config.ingest.autoCaptureThreshold, () => currentSessionId, isAutoStoreEnabled, agentId, config),
+    "experimental.session.compacting": compactingHook(cerebroClient, containerTags, tui, config.ingest.ingestMode, isAutoStoreEnabled, () => mainSessionId, client, config, agentId),
+    tool: buildTools(cerebroClient, containerTags, { agentId, getSessionId: () => mainSessionId, getAgentName: () => cachedAgentName || agentId }),
+    event: sessionIdleHook(cerebroClient, containerTags, tui, client, config.ingest.ingestMode, config.ingest.autoCaptureThreshold, () => mainSessionId, isAutoStoreEnabled, agentId, config, (name: string) => { cachedAgentName = name; }),
     "shell.env": async (_input: any, output: any) => {
       if (directory) {
         output.env.OMEM_PROJECT_DIR = directory;

package/src/tools.ts CHANGED Viewed

@@ -24,6 +24,7 @@ function extractMemoryIds(result: unknown): string[] {
 export interface ToolContext { // Context object passed to buildTools() alongside the client and container tags.
   agentId?: string; // Static agent identifier; used as the fallback when getAgentName is absent or returns an empty value.
   getSessionId: () => string | undefined; // Returns the session ID to attach to memories created by the tools, or undefined when none is known.
+  getAgentName?: () => string; // Optional agent-name resolver; when it returns a non-empty string, the tools use that value instead of agentId.
 }
 export function buildTools(client: CerebroClient, containerTags: string[], context: ToolContext) {
@@ -85,12 +86,13 @@ export function buildTools(client: CerebroClient, containerTags: string[], conte
       },
       async execute(args) {
         const allTags = [...containerTags, ...(args.tags ?? [])];
+        const effectiveAgentId = context.getAgentName?.() || context.agentId;
         const result = await client.createMemory(
           args.content,
           allTags,
           args.source,
           args.scope ?? "project",
-          context.agentId,
+          effectiveAgentId,
           context.getSessionId(),
           args.visibility,
           args.category,
@@ -241,10 +243,12 @@ export function buildTools(client: CerebroClient, containerTags: string[], conte
           .describe("Session ID to associate with the ingestion"),
       },
       async execute(args) {
+        const effectiveAgentId = context.getAgentName?.() || context.agentId;
         const result = await client.ingestMessages(args.messages, {
           mode: args.mode ?? "smart",
           tags: args.tags,
           sessionId: args.session_id,
+          agentId: effectiveAgentId,
         });
         if (result === null) return JSON.stringify({ ok: false, error: "Ingestion failed" });
         if (args.session_id) {