npm - ex-brain - Versions diffs - 0.1.0 → 0.1.1 - Mend

ex-brain 0.1.0 → 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (22) hide show

package/README.md +39 -37
package/package.json +5 -5
package/src/ai/compiler.ts +529 -0
package/src/ai/embed-factory.ts +116 -0
package/src/ai/entity-link.ts +226 -0
package/src/ai/hash-embed.ts +30 -0
package/src/ai/timeline-extractor.ts +436 -0
package/src/cli.ts +16 -0
package/src/commands/compile-cmd.ts +208 -0
package/src/commands/graph-cmd.ts +1070 -0
package/src/commands/index.ts +1447 -0
package/src/config.ts +80 -0
package/src/db/client.ts +101 -0
package/src/db/schema.ts +49 -0
package/src/markdown/io.ts +61 -0
package/src/markdown/parser.ts +72 -0
package/src/mcp/server.ts +540 -0
package/src/repositories/brain-repo.ts +772 -0
package/src/settings.ts +214 -0
package/src/types/index.ts +55 -0
package/src/utils/progress.ts +171 -0
package/dist/cli.js +0 -93543

package/README.md CHANGED Viewed

@@ -1,81 +1,83 @@
 # ex-brain
-CLI 个人知识库，基于 [seekdb](https://docs.seekdb.ai/) 构建，支持页面管理、混合检索、时间线、标签、导入导出与 MCP Server。
+CLI personal knowledge base built on [seekdb](https://docs.seekdb.ai/), featuring page management, hybrid search, timelines, tags, import/export, and MCP Server.
-## 核心功能
+## Core Features
-- **知识图谱可视化** - 交互式图谱，展示实体关联关系
-- **智能编译** - 语义分析，智能更新 Compiled Truth
-- **时间线管理** - 自动提取事件，记录历史演变
-- **混合检索** - 全文搜索 + 向量语义查询
-- **实体链接** - 自动识别实体，创建关联页面
+- **Knowledge Graph Visualization** - Interactive graph showing entity relationships
+- **Intelligent Compilation** - Semantic analysis with smart Compiled Truth updates
+- **Timeline Management** - Automatic event extraction and history tracking
+- **Hybrid Search** - Full-text search + vector semantic queries
+- **Entity Linking** - Auto-detect entities and create linked pages
-## 数据采集
+<img src="https://mdn.alipayobjects.com/huamei_ytl0i7/afts/img/A*TqdfTZ-yCPwAAAAAgBAAAAgAejCYAQ/original" width="800">
-推荐使用 [MarkSnip](https://chromewebstore.google.com/detail/kcbaglhfgbkjdnpeokaamjjkddempipm) 作为数据采集工具：
+## Data Collection
-- 一键剪藏网页为 Markdown 格式
-- 支持代码块、表格、数学公式
-- 本地处理，隐私友好
-- 支持 Obsidian 集成
+We recommend [MarkSnip](https://chromewebstore.google.com/detail/kcbaglhfgbkjdnpeokaamjjkddempipm) for data collection:
-配合 ex-brain 使用：
+- One-click web clipping to Markdown format
+- Supports code blocks, tables, math formulas
+- Local processing, privacy-friendly
+- Obsidian integration support
+Use with ex-brain:
 ```bash
-# MarkSnip 剪藏后，导入到知识库
+# After clipping with MarkSnip, import to knowledge base
 cat article.md | ebrain put articles/slug --stdin
-# 或智能编译
+# Or intelligent compilation
 ebrain compile companies/river-ai --file article.md --source web_clip
 ```
-## 安装
+## Installation
 ```bash
-# 全局安装（需要 Bun 或 Node.js）
+# Global installation (requires Bun or Node.js)
 bun install -g ex-brain
-# 或
+# or
 npm install -g ex-brain
 ebrain --help
 ```
-## 快速开始
+## Quick Start
 ```bash
-# 初始化（自动创建 ~/.ebrain/data/ebrain.db）
+# Initialize (creates ~/.ebrain/data/ebrain.db automatically)
 ebrain init
-# 写入页面
+# Write a page
 ebrain put my/note --file note.md
-# 知识图谱可视化
-ebrain graph                    # 启动图谱 Web UI (http://localhost:3000)
-ebrain graph --port 8080 --open # 指定端口并自动打开浏览器
+# Knowledge graph visualization
+ebrain graph                    # Start graph Web UI (http://localhost:3000)
+ebrain graph --port 8080 --open # Custom port and auto-open browser
-# 智能编译新信息
+# Intelligently compile new information
 ebrain compile companies/river-ai "River AI completed Series A funding" --source meeting_notes
-# 从页面提取时间线事件
+# Extract timeline events from a page
 ebrain timeline extract companies/river-ai
-# 检索
-ebrain search "某主题"
-ebrain query "某问题"
+# Search
+ebrain search "some topic"
+ebrain query "some question"
-# 启动 MCP Server（供 AI 工具调用）
+# Start MCP Server (for AI tool integration)
 ebrain serve
 ```
-## 配置
+## Configuration
-编辑 `~/.ebrain/settings.json`：
+Edit `~/.ebrain/settings.json`:
 ```jsonc
 {
   "db": { "path": "~/.ebrain/data/ebrain.db" },
   "embed": {
-    "provider": "hash",          // 或 "openai_compatible"
+    "provider": "hash",          // or "openai_compatible"
     "baseURL": "...",
     "model": "...",
     "dimensions": 1024,
@@ -84,12 +86,12 @@ ebrain serve
 }
 ```
-运行 `ebrain config` 查看当前生效配置。详见 [docs/ebrain-cli.md](docs/ebrain-cli.md)。
+Run `ebrain config` to view active configuration. See [docs/ebrain-cli.md](docs/ebrain-cli.md) for details.
-## 开发
+## Development
 ```bash
 bun install
 bun run src/cli.ts --help
 bun test
-```
+```

package/package.json CHANGED Viewed

@@ -1,15 +1,15 @@
 {
   "name": "ex-brain",
-  "version": "0.1.0",
+  "version": "0.1.1",
   "description": "CLI personal knowledge base powered by seekdb",
-  "main": "dist/cli.js",
+  "module": "src/cli.ts",
   "type": "module",
   "bin": {
-    "ebrain": "dist/cli.js"
+    "ebrain": "src/cli.ts"
   },
   "files": [
-    "dist",
-    "README.md"
+    "src",
+    "!src/**/*.test.ts"
   ],
   "scripts": {
     "dev": "bun run src/cli.ts",

package/src/ai/compiler.ts ADDED Viewed

@@ -0,0 +1,529 @@
+import type { ResolvedLLM } from "../settings";
+import type { TimelineEntry } from "../types";
+// ---------------------------------------------------------------------------
+// Types
+// ---------------------------------------------------------------------------
+/**
+ * Everything `compileTruth` needs to fold one piece of new information
+ * into a page's compiled truth.
+ */
+export interface CompileInput {
+  /** Current compiled truth content; when empty the prompts render it as "(empty)" */
+  currentTruth: string;
+  /** Timeline entries for context; only the first 10 are rendered into the analysis prompt */
+  timeline: TimelineEntry[];
+  /** New information to process */
+  newInfo: string;
+  /** Source of the new information; echoed into prompts and into "(Source: ...)" attributions */
+  source: string;
+  /** Date of the new information (ISO or YYYY-MM-DD) */
+  date: string;
+  /**
+   * Page metadata for context. When omitted, the analysis prompt falls back to
+   * "Unknown" / "unknown" for title / type, and extracted timeline entries get
+   * an empty page slug.
+   */
+  pageContext?: {
+    slug: string;
+    type: string;
+    title: string;
+  };
+}
+/**
+ * Outcome of one `compileTruth` run.
+ */
+export interface CompileResult {
+  /** Updated compiled truth */
+  compiledTruth: string;
+  /** Whether any update was made */
+  changed: boolean;
+  /** Type of change; "none" is also what the merge parser reports when the LLM reply cannot be parsed */
+  changeType: "append" | "update" | "replace" | "none" | "conflict";
+  /** Human-readable summary of what changed */
+  changeSummary: string;
+  /** Timeline entries to add (extracted from new info) */
+  timelineEntries: TimelineEntry[];
+  /**
+   * Confidence score: the mean of the extracted facts' confidences (0 when no
+   * facts were extracted), or a fixed 0.5 on the no-LLM fallback path.
+   */
+  confidence: number;
+}
+/**
+ * Structured reading of the new information, as parsed from the analysis
+ * prompt's JSON reply.
+ */
+export interface FactAnalysis {
+  /** Key facts extracted */
+  facts: ExtractedFact[];
+  /**
+   * Information type classification. Drives the update strategy:
+   * "status_update" / "correction" are merged by the LLM, "new_event" /
+   * "new_entity" are appended as structured facts, anything else is appended
+   * as raw text. Unrecognised values are normalised to "new_entity".
+   */
+  infoType: "status_update" | "new_event" | "correction" | "confirmation" | "new_entity";
+  /** Entities mentioned */
+  entities: string[];
+  /** Temporal context (free text: when this happened or is valid for) */
+  temporalContext: string;
+}
+/**
+ * One fact pulled out of the new information by the analysis step.
+ */
+export interface ExtractedFact {
+  /** Fact category (e.g., "funding_stage", "valuation", "ceo"); the parser defaults it to "other" */
+  category: string;
+  /** Previous value (if this is an update); left undefined when the LLM gives none */
+  oldValue?: string;
+  /** New value */
+  newValue: string;
+  /** Whether this replaces or adds; anything other than "replace" is parsed as "add" */
+  action: "replace" | "add";
+  /** Source sentence (the prompt asks for the exact sentence from the new info) */
+  sourceSentence: string;
+  /** Confidence; the prompt asks for 0.0-1.0 and the parser defaults to 0.8 when it is not a number */
+  confidence: number;
+}
+// ---------------------------------------------------------------------------
+// Compile Logic
+// ---------------------------------------------------------------------------
+/**
+ * Fold a piece of new information into a page's compiled truth.
+ *
+ * With a usable API key this runs three LLM-backed steps in order: analyse the
+ * new information, produce the updated compiled truth, and extract timeline
+ * entries. Without one it skips the LLM entirely and appends the raw text as
+ * a plain fact with a fixed confidence of 0.5.
+ *
+ * @param input Current truth, timeline context and the new information.
+ * @param llm Resolved LLM settings (endpoint, model, credentials).
+ * @returns The updated truth plus change metadata; `confidence` is the mean of
+ *   the extracted facts' confidences (0 when none were extracted).
+ */
+export async function compileTruth(
+  input: CompileInput,
+  llm: ResolvedLLM,
+): Promise<CompileResult> {
+  // No credentials: record the raw text as a simple attributed fact.
+  if (!resolveApiKey(llm)) {
+    const fallbackTruth = appendFact(input.currentTruth, input.newInfo, input.source);
+    return {
+      compiledTruth: fallbackTruth,
+      changed: true,
+      changeType: "append",
+      changeSummary: "LLM not configured, appended as simple fact",
+      timelineEntries: [],
+      confidence: 0.5,
+    };
+  }
+  // Step 1: understand what the new information says.
+  const analysis = await analyzeNewInfo(input, llm);
+  // Step 2: rewrite or extend the compiled truth accordingly.
+  const merged = await generateUpdatedTruth(input, analysis, llm);
+  // Step 3: derive timeline entries from the same information.
+  const timelineEntries = await extractTimelineFromInfo(input, analysis, llm);
+  // Average the per-fact confidences; the divisor is floored at 1 so an empty
+  // fact list yields 0 rather than NaN.
+  let confidenceTotal = 0;
+  for (const fact of analysis.facts) {
+    confidenceTotal += fact.confidence;
+  }
+  const divisor = Math.max(analysis.facts.length, 1);
+  return {
+    compiledTruth: merged.compiledTruth,
+    changed: merged.changed,
+    changeType: merged.changeType,
+    changeSummary: merged.changeSummary,
+    timelineEntries,
+    confidence: confidenceTotal / divisor,
+  };
+}
+/**
+ * Step 1: ask the LLM to classify the new information and extract its facts.
+ *
+ * Builds the analysis prompt, sends it with a 2048-token completion budget and
+ * parses the reply into a `FactAnalysis`.
+ */
+async function analyzeNewInfo(
+  input: CompileInput,
+  llm: ResolvedLLM,
+): Promise<FactAnalysis> {
+  const reply = await callLLM(llm, buildAnalysisPrompt(input), 2048);
+  return parseAnalysisResponse(reply);
+}
+/**
+ * Step 2: choose an update strategy from the analysis and apply it.
+ *
+ * - no facts: return the current truth unchanged ("none")
+ * - "status_update" / "correction": let the LLM rewrite the truth
+ * - "new_event" / "new_entity": append the extracted facts as structured bullets
+ * - anything else: append the raw new information with source attribution
+ */
+async function generateUpdatedTruth(
+  input: CompileInput,
+  analysis: FactAnalysis,
+  llm: ResolvedLLM,
+): Promise<{ compiledTruth: string; changed: boolean; changeType: CompileResult["changeType"]; changeSummary: string }> {
+  const { facts, infoType } = analysis;
+  // Nothing actionable was extracted, so leave the page as it is.
+  if (facts.length === 0) {
+    return {
+      compiledTruth: input.currentTruth,
+      changed: false,
+      changeType: "none",
+      changeSummary: "No actionable facts extracted",
+    };
+  }
+  switch (infoType) {
+    // Existing state is changing: needs a semantic merge, not a blind append.
+    case "status_update":
+    case "correction":
+      return smartMergeTruth(input, analysis, llm);
+    // Purely additive information: list the facts under the Facts section.
+    case "new_event":
+    case "new_entity":
+      return {
+        compiledTruth: appendStructuredFacts(input.currentTruth, facts, input.source),
+        changed: true,
+        changeType: "append",
+        changeSummary: `Added ${facts.length} new facts`,
+      };
+    // Of the declared info types only "confirmation" reaches this branch.
+    default:
+      return {
+        compiledTruth: appendFact(input.currentTruth, input.newInfo, input.source),
+        changed: true,
+        changeType: "append",
+        changeSummary: "Appended new information with source attribution",
+      };
+  }
+}
+/**
+ * Smart merge: the LLM rewrites the compiled truth to incorporate the
+ * analysed changes.
+ *
+ * The merge reply is parsed into a new compiled truth. If the call fails or
+ * the reply cannot be parsed, the parsed result carries an empty
+ * `compiledTruth`; returning that as-is would let a caller that persists the
+ * result wipe the page. In that case the current truth is returned unchanged
+ * with `changed: false` / `changeType: "none"`.
+ *
+ * @param input Current truth and the new information being merged.
+ * @param analysis Facts and classification produced by the analysis step.
+ * @param llm Resolved LLM settings.
+ * @returns The rewritten truth and change metadata, or the untouched current
+ *   truth when the merge produced no content.
+ */
+async function smartMergeTruth(
+  input: CompileInput,
+  analysis: FactAnalysis,
+  llm: ResolvedLLM,
+): Promise<{ compiledTruth: string; changed: boolean; changeType: CompileResult["changeType"]; changeSummary: string }> {
+  const prompt = buildMergePrompt(input, analysis);
+  const resp = await callLLM(llm, prompt, 4096);
+  const result = parseMergeResponse(resp);
+  // An empty rewrite means the merge failed (or the model returned nothing
+  // usable); never replace existing content with an empty string.
+  if (!result.compiledTruth.trim()) {
+    return {
+      compiledTruth: input.currentTruth,
+      changed: false,
+      changeType: "none",
+      changeSummary: result.changeSummary || "LLM merge returned no content; compiled truth left unchanged",
+    };
+  }
+  return result;
+}
+/**
+ * Step 3: derive timeline entries from the new information.
+ *
+ * Only "status_update" and "new_event" information is considered significant
+ * enough for the timeline; every other type yields an empty list without
+ * calling the LLM. Entries are tagged with the page slug, or "" when no page
+ * context was supplied.
+ */
+async function extractTimelineFromInfo(
+  input: CompileInput,
+  analysis: FactAnalysis,
+  llm: ResolvedLLM,
+): Promise<TimelineEntry[]> {
+  const isTimelineWorthy =
+    analysis.infoType === "status_update" || analysis.infoType === "new_event";
+  if (!isTimelineWorthy) {
+    return [];
+  }
+  const reply = await callLLM(llm, buildTimelinePrompt(input, analysis), 1024);
+  const pageSlug = input.pageContext?.slug ?? "";
+  return parseTimelineResponse(reply, pageSlug);
+}
+// ---------------------------------------------------------------------------
+// Prompt Building
+// ---------------------------------------------------------------------------
+/**
+ * Build the Step 1 (analysis) prompt.
+ *
+ * The prompt embeds the page title and type (falling back to "Unknown" /
+ * "unknown"), the current compiled truth (or "(empty)"), up to the first 10
+ * timeline entries (or "(no timeline)"), and the new information with its
+ * source and date. It asks for a JSON object with `facts`, `infoType`,
+ * `entities` and `temporalContext`, which is what `parseAnalysisResponse`
+ * reads back.
+ *
+ * NOTE(review): the trailing "/no_think" is presumably a model-specific
+ * directive to suppress reasoning output — confirm against the target model.
+ */
+function buildAnalysisPrompt(input: CompileInput): string {
+  return `Analyze the new information and classify what type of update this represents.
+## Context
+Page: ${input.pageContext?.title ?? "Unknown"} (${input.pageContext?.type ?? "unknown"})
+Current Compiled Truth:
+${input.currentTruth || "(empty)"}
+Recent Timeline (for temporal context):
+${input.timeline.slice(0, 10).map(t => `- ${t.date} | ${t.source}: ${t.summary}`).join("\n") || "(no timeline)"}
+## New Information
+Source: ${input.source}
+Date: ${input.date}
+Content: ${input.newInfo}
+## Task
+Classify this information and extract key facts. Output ONLY JSON.
+Schema:
+{
+  "facts": [
+    {
+      "category": "funding_stage|valuation|ceo|employee_count|product_status|partnership|...",
+      "oldValue": "previous value if this updates something (null if new)",
+      "newValue": "the new value",
+      "action": "replace|add",
+      "sourceSentence": "exact sentence from new info",
+      "confidence": 0.0-1.0
+    }
+  ],
+  "infoType": "status_update|new_event|correction|confirmation|new_entity",
+  "entities": ["list of entities mentioned"],
+  "temporalContext": "when this happened or is valid for"
+}
+Rules:
+1. "status_update" = information that changes/updates existing state (e.g., funding stage change)
+2. "new_event" = discrete event that happened (e.g., product launch)
+3. "correction" = explicitly correcting previous information
+4. "confirmation" = confirming existing information without change
+5. "new_entity" = introducing new entity/aspect not previously tracked
+6. Extract ALL actionable facts, not just the most prominent one
+7. Use high confidence (0.8+) for clear, explicit statements; lower for ambiguous ones
+/no_think`;
+}
+/**
+ * Build the smart-merge prompt that asks the LLM to rewrite the compiled truth.
+ *
+ * Each analysed fact is rendered as one bullet: `category: "old" → "new"` when
+ * an old value is known, otherwise just `category: "new"`, followed by the
+ * action and confidence. The prompt also carries the current truth (or
+ * "(empty)"), the source and date for attribution, and the info type. It asks
+ * for a JSON object with `compiledTruth`, `changed`, `changeType` and
+ * `changeSummary`, which is what `parseMergeResponse` reads back.
+ *
+ * NOTE(review): the trailing "/no_think" is presumably a model-specific
+ * directive to suppress reasoning output — confirm against the target model.
+ */
+function buildMergePrompt(input: CompileInput, analysis: FactAnalysis): string {
+  const factSummaries = analysis.facts.map(f =>
+    `- ${f.category}: ${f.oldValue ? `"${f.oldValue}" → "${f.newValue}"` : `"${f.newValue}"`} (${f.action}, confidence: ${f.confidence})`
+  ).join("\n");
+  return `Rewrite the compiled truth to incorporate the analyzed changes.
+## Current Compiled Truth
+${input.currentTruth || "(empty)"}
+## Changes to Apply
+${factSummaries}
+## Source Attribution
+Source: ${input.source}
+Date: ${input.date}
+## Change Type
+${analysis.infoType}
+## Task
+Rewrite the compiled truth. Output ONLY JSON with this schema:
+{
+  "compiledTruth": "the full rewritten compiled truth content (markdown format)",
+  "changed": true|false,
+  "changeType": "update|replace|conflict|none",
+  "changeSummary": "human-readable summary of what changed"
+}
+Rules:
+1. For "replace" actions: remove the old value, add the new value
+2. For "add" actions: append the new fact in appropriate section
+3. Preserve the overall structure and style of existing content
+4. Add source attribution: append " (Source: ${input.source}, ${input.date})" to updated facts
+5. If structure doesn't exist, create appropriate sections (## Status, ## Facts, etc.)
+6. "update" = modified existing content; "replace" = replaced entire section; "conflict" = contradictory info (keep both with notes)
+7. Do NOT remove historical context - keep timeline references
+8. Format as clean markdown
+Example output for funding stage update:
+{
+  "compiledTruth": "## Status\n\n- **Funding Stage**: Series A (Source: meeting_notes, 2024-05-20)\n- **Valuation**: ~$50M (estimated)\n\n## History\n\n- Previously: Seed stage (until 2024-05-20)\n\n## Facts\n\n- ...",
+  "changed": true,
+  "changeType": "update",
+  "changeSummary": "Updated funding stage from Seed to Series A"
+}
+/no_think`;
+}
+/**
+ * Build the Step 3 (timeline extraction) prompt.
+ *
+ * The prompt carries the new information with its date and source, the info
+ * type, and a comma-joined list of the analysed facts' new values. It asks for
+ * a JSON array of `{ date, source, summary, detail }` objects, which is what
+ * `parseTimelineResponse` reads back. The limits stated in the prompt (80-char
+ * summary, at most 2 entries) are instructions to the model only.
+ *
+ * NOTE(review): the trailing "/no_think" is presumably a model-specific
+ * directive to suppress reasoning output — confirm against the target model.
+ */
+function buildTimelinePrompt(input: CompileInput, analysis: FactAnalysis): string {
+  return `Extract timeline entries from this information.
+## New Information
+Date: ${input.date}
+Source: ${input.source}
+Content: ${input.newInfo}
+## Analysis
+Type: ${analysis.infoType}
+Key Facts: ${analysis.facts.map(f => f.newValue).join(", ")}
+## Task
+Create timeline entries. Output ONLY JSON array:
+[
+  {
+    "date": "YYYY-MM-DD",
+    "source": "${input.source}",
+    "summary": "one-line summary (max 80 chars)",
+    "detail": "optional additional detail (markdown)"
+  }
+]
+Rules:
+1. Use the provided date, or extract exact date from content if mentioned
+2. Summary should be concise and factual
+3. Only create entries for significant events worth tracking
+4. Max 2 entries per input
+5. Empty array if nothing significant
+/no_think`;
+}
+// ---------------------------------------------------------------------------
+// LLM Call
+// ---------------------------------------------------------------------------
+/**
+ * Send one system + user exchange to the configured chat-completions endpoint
+ * and return the trimmed text of the first choice.
+ *
+ * This function never throws: a missing API key, a non-2xx response or any
+ * thrown error yields "" (the latter two after a console warning).
+ *
+ * @param llm Resolved LLM settings (base URL, model, credentials).
+ * @param prompt User-message content.
+ * @param maxTokens Completion token budget sent as `max_tokens`.
+ */
+async function callLLM(llm: ResolvedLLM, prompt: string, maxTokens: number): Promise<string> {
+  const apiKey = resolveApiKey(llm);
+  if (!apiKey) return "";
+  const systemMessage = {
+    role: "system",
+    content: "You are a knowledge compilation assistant. You analyze information, extract facts, and maintain structured compiled truth. Always output valid JSON. Be precise and factual.",
+  };
+  const payload = {
+    model: llm.model,
+    messages: [systemMessage, { role: "user", content: prompt }],
+    temperature: 0.1,
+    max_tokens: maxTokens,
+    enable_thinking: false,
+  };
+  try {
+    // Join base URL and path with exactly one slash between them.
+    const separator = llm.baseURL.endsWith("/") ? "" : "/";
+    const endpoint = `${llm.baseURL}${separator}chat/completions`;
+    const response = await fetch(endpoint, {
+      method: "POST",
+      headers: { "Content-Type": "application/json", Authorization: `Bearer ${apiKey}` },
+      body: JSON.stringify(payload),
+    });
+    if (response.ok) {
+      const data = await response.json();
+      return data.choices?.[0]?.message?.content?.trim() ?? "";
+    }
+    // Log only the first 200 characters of the error body.
+    const errorText = await response.text();
+    console.warn(`[compiler] LLM call failed (${response.status}): ${errorText.slice(0, 200)}`);
+    return "";
+  } catch (error) {
+    const reason = error instanceof Error ? error.message : String(error);
+    console.warn(`[compiler] LLM call error: ${reason}`);
+    return "";
+  }
+}
+// ---------------------------------------------------------------------------
+// Response Parsing
+// ---------------------------------------------------------------------------
+/**
+ * Parse the analysis reply into a `FactAnalysis`.
+ *
+ * The outermost `{...}` span is pulled out of the reply (so surrounding prose
+ * or code fences are tolerated) and parsed as JSON. Missing or malformed
+ * fields fall back to defaults instead of failing the whole analysis:
+ * - `facts` / `entities` that are not arrays are treated as empty, so a
+ *   malformed `entities` value no longer discards otherwise valid facts
+ * - non-object fact items are skipped
+ * - `confidence` defaults to 0.8 when it is not a finite number and is
+ *   clamped to [0, 1]
+ * - an unknown `infoType` is normalised by `normalizeInfoType`
+ *
+ * @param resp Raw LLM reply text ("" when the call failed).
+ * @returns The parsed analysis, or an empty "new_entity" analysis when no JSON
+ *   object can be found or parsed.
+ */
+function parseAnalysisResponse(resp: string): FactAnalysis {
+  const emptyAnalysis = (): FactAnalysis => ({ facts: [], infoType: "new_entity", entities: [], temporalContext: "" });
+  const match = resp.match(/\{[\s\S]*\}/);
+  if (!match) {
+    return emptyAnalysis();
+  }
+  try {
+    const parsed = JSON.parse(match[0]) as Record<string, unknown>;
+    // Guard the array-typed fields: the reply is untrusted model output.
+    const rawFacts: unknown[] = Array.isArray(parsed.facts) ? parsed.facts : [];
+    const rawEntities: unknown[] = Array.isArray(parsed.entities) ? parsed.entities : [];
+    const facts: ExtractedFact[] = [];
+    for (const f of rawFacts) {
+      if (typeof f !== "object" || f === null) continue;
+      const fact = f as Record<string, unknown>;
+      const rawConfidence = fact.confidence;
+      const confidence =
+        typeof rawConfidence === "number" && Number.isFinite(rawConfidence)
+          ? Math.min(1, Math.max(0, rawConfidence))
+          : 0.8;
+      facts.push({
+        category: String(fact.category ?? "other"),
+        oldValue: fact.oldValue ? String(fact.oldValue) : undefined,
+        newValue: String(fact.newValue ?? ""),
+        action: fact.action === "replace" ? "replace" : "add",
+        sourceSentence: String(fact.sourceSentence ?? ""),
+        confidence,
+      });
+    }
+    return {
+      facts,
+      infoType: normalizeInfoType(String(parsed.infoType ?? "new_entity")),
+      entities: rawEntities.map(String),
+      temporalContext: String(parsed.temporalContext ?? ""),
+    };
+  } catch {
+    return emptyAnalysis();
+  }
+}
+/**
+ * Parse the smart-merge reply into the rewritten truth and its change metadata.
+ *
+ * The outermost `{...}` span is pulled out of the reply and parsed as JSON.
+ * - When no JSON object can be found or parsed, a "none" result with an empty
+ *   `compiledTruth` and the summary "Failed to parse LLM response" is returned.
+ * - `compiledTruth` is only accepted when it is a string. If it is missing or
+ *   blank the result is forced to `changed: false` / `changeType: "none"`, so
+ *   an incomplete reply can never be reported as a change to an empty page.
+ * - `changed` given as a string is compared against "true" (a plain
+ *   `Boolean("false")` would be `true`); other values use normal truthiness.
+ *
+ * @param resp Raw LLM reply text ("" when the call failed).
+ */
+function parseMergeResponse(resp: string): { compiledTruth: string; changed: boolean; changeType: CompileResult["changeType"]; changeSummary: string } {
+  const parseFailure = {
+    compiledTruth: "",
+    changed: false,
+    changeType: "none" as const,
+    changeSummary: "Failed to parse LLM response",
+  };
+  const match = resp.match(/\{[\s\S]*\}/);
+  if (!match) {
+    return { ...parseFailure };
+  }
+  try {
+    const parsed = JSON.parse(match[0]) as Record<string, unknown>;
+    const changeSummary = String(parsed.changeSummary ?? "");
+    const compiledTruth = typeof parsed.compiledTruth === "string" ? parsed.compiledTruth : "";
+    if (!compiledTruth.trim()) {
+      // No usable rewrite: report "no change" regardless of what the flags say.
+      return {
+        compiledTruth: "",
+        changed: false,
+        changeType: "none",
+        changeSummary: changeSummary || "LLM response did not include a compiled truth",
+      };
+    }
+    const rawChanged = parsed.changed;
+    const changed =
+      typeof rawChanged === "string"
+        ? rawChanged.trim().toLowerCase() === "true"
+        : Boolean(rawChanged);
+    return {
+      compiledTruth,
+      changed,
+      changeType: normalizeChangeType(String(parsed.changeType ?? "none")),
+      changeSummary,
+    };
+  } catch {
+    return { ...parseFailure };
+  }
+}
+/**
+ * Parse the timeline-extraction reply into timeline entries for one page.
+ *
+ * The outermost `[...]` span is pulled out of the reply and parsed as JSON.
+ * Non-object items are skipped, and so are items whose summary is missing or
+ * blank, since an entry without a summary records nothing. Summaries are
+ * trimmed and capped at 120 characters; `source` defaults to "manual" and
+ * `date` / `detail` default to "".
+ *
+ * @param resp Raw LLM reply text ("" when the call failed).
+ * @param pageSlug Slug stamped onto every returned entry.
+ * @returns The parsed entries, or [] when no JSON array can be found or parsed.
+ */
+function parseTimelineResponse(resp: string, pageSlug: string): TimelineEntry[] {
+  const match = resp.match(/\[[\s\S]*\]/);
+  if (!match) return [];
+  try {
+    const parsed: unknown = JSON.parse(match[0]);
+    if (!Array.isArray(parsed)) return [];
+    const entries: TimelineEntry[] = [];
+    for (const e of parsed as unknown[]) {
+      if (typeof e !== "object" || e === null) continue;
+      const entry = e as Record<string, unknown>;
+      const summary = String(entry.summary ?? "").trim().slice(0, 120);
+      // Skip placeholder rows the model emitted without any content.
+      if (!summary) continue;
+      entries.push({
+        pageSlug,
+        date: String(entry.date ?? ""),
+        source: String(entry.source ?? "manual"),
+        summary,
+        detail: String(entry.detail ?? ""),
+      });
+    }
+    return entries;
+  } catch {
+    return [];
+  }
+}
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Map a raw info-type string from the LLM onto the `FactAnalysis["infoType"]`
+ * union. Matching ignores case and surrounding whitespace; anything
+ * unrecognised becomes "new_entity".
+ */
+function normalizeInfoType(raw: string): FactAnalysis["infoType"] {
+  const knownTypes = ["status_update", "new_event", "correction", "confirmation", "new_entity"] as const;
+  const candidate = raw.toLowerCase().trim();
+  const recognised = knownTypes.find(known => known === candidate);
+  return recognised ?? "new_entity";
+}
+/**
+ * Map a raw change-type string from the LLM onto the
+ * `CompileResult["changeType"]` union. Matching ignores case and surrounding
+ * whitespace; anything unrecognised becomes "none".
+ */
+function normalizeChangeType(raw: string): CompileResult["changeType"] {
+  const knownTypes = ["append", "update", "replace", "none", "conflict"] as const;
+  const candidate = raw.toLowerCase().trim();
+  const recognised = knownTypes.find(known => known === candidate);
+  return recognised ?? "none";
+}
+/**
+ * Resolve the API key for an LLM configuration.
+ *
+ * An inline `apiKey` wins; otherwise the environment variable named by
+ * `apiKeyEnv` is read. Returns "" when neither yields a value.
+ */
+function resolveApiKey(llm: ResolvedLLM): string {
+  const { apiKey, apiKeyEnv } = llm;
+  if (apiKey) {
+    return apiKey;
+  }
+  return apiKeyEnv ? process.env[apiKeyEnv] ?? "" : "";
+}
+/**
+ * Insert already-formatted bullet lines into the `## Facts` section of a
+ * compiled-truth document. Shared by `appendFact` and `appendStructuredFacts`.
+ *
+ * - empty document: the result is a new `## Facts` section holding the bullets
+ * - no `## Facts` heading line: a new section is appended at the end
+ * - `## Facts` is the last section: the bullets are appended at the end
+ * - other sections follow `## Facts`: the bullets are inserted at the end of
+ *   the Facts section, before the next `#` / `##` heading, so they do not end
+ *   up under an unrelated heading
+ *
+ * The heading is matched as a whole line, so "### Facts" or "## Facts and
+ * Figures" do not count as the Facts section.
+ */
+function appendToFactsSection(current: string, newLines: string): string {
+  if (!current.trim()) {
+    return `## Facts\n\n${newLines}`;
+  }
+  const heading = /^## Facts[ \t]*\r?$/m.exec(current);
+  if (!heading) {
+    return `${current}\n\n## Facts\n\n${newLines}`;
+  }
+  const sectionStart = heading.index + heading[0].length;
+  // The Facts section ends at the next top- or second-level heading, if any.
+  const nextHeading = /^#{1,2} /m.exec(current.slice(sectionStart));
+  if (!nextHeading) {
+    return `${current}\n${newLines}`;
+  }
+  const splitAt = sectionStart + nextHeading.index;
+  const factsAndBefore = current.slice(0, splitAt).trimEnd();
+  return `${factsAndBefore}\n${newLines}\n\n${current.slice(splitAt)}`;
+}
+/**
+ * Append one free-text fact to the compiled truth as a bullet with source
+ * attribution, e.g. `- text (Source: web_clip, 2024-05-20)`.
+ *
+ * The date in the attribution is today's date (UTC, YYYY-MM-DD), not the date
+ * of the information itself.
+ *
+ * @param current Existing compiled truth (may be empty).
+ * @param newInfo Fact text; surrounding whitespace is trimmed.
+ * @param source Source label for the attribution.
+ * @returns The compiled truth with the bullet added to its `## Facts` section.
+ */
+function appendFact(current: string, newInfo: string, source: string): string {
+  const timestamp = new Date().toISOString().slice(0, 10);
+  const newLine = `- ${newInfo.trim()} (Source: ${source}, ${timestamp})`;
+  return appendToFactsSection(current, newLine);
+}
+/**
+ * Append extracted facts to the compiled truth, one bullet per fact, in the
+ * form `- **category**: value (Source: source, YYYY-MM-DD)`.
+ *
+ * The date in the attribution is today's date (UTC). An empty fact list leaves
+ * the document unchanged.
+ *
+ * @param current Existing compiled truth (may be empty).
+ * @param facts Facts to record; `category` and `newValue` are used.
+ * @param source Source label for the attribution.
+ * @returns The compiled truth with the bullets added to its `## Facts` section.
+ */
+function appendStructuredFacts(current: string, facts: ExtractedFact[], source: string): string {
+  if (facts.length === 0) {
+    return current;
+  }
+  const timestamp = new Date().toISOString().slice(0, 10);
+  const newLines = facts.map(f =>
+    `- **${f.category}**: ${f.newValue} (Source: ${source}, ${timestamp})`
+  ).join("\n");
+  return appendToFactsSection(current, newLines);
+}