ultra-memory 3.1.0 → 4.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,182 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ ultra-memory: PDF 文本提取 (Multimodal Phase 5)
4
+ 从 PDF 文件中提取文本内容,写入 session 的 multimodal/ 目录,
5
+ 并触发事实提取。
6
+
7
+ 依赖: pdfminer.six
8
+ 安装: pip install pdfminer.six
9
+ """
10
+
11
+ import os
12
+ import sys
13
+ import json
14
+ import argparse
15
+ import hashlib
16
+ import subprocess
17
+ from datetime import datetime, timezone
18
+ from pathlib import Path
19
+
20
+ if sys.stdout.encoding != "utf-8":
21
+ sys.stdout.reconfigure(encoding="utf-8")
22
+ if sys.stderr.encoding != "utf-8":
23
+ sys.stderr.reconfigure(encoding="utf-8")
24
+
25
+ ULTRA_MEMORY_HOME = Path(os.environ.get("ULTRA_MEMORY_HOME", Path.home() / ".ultra-memory"))
26
+
27
+ CHUNK_SIZE = 500 # 每块字符数
28
+
29
+
30
+ def _now_iso() -> str:
31
+ return datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")
32
+
33
+
34
def _chunk_text(text: str, chunk_size: int = CHUNK_SIZE) -> list[tuple[int, str]]:
    """Split *text* into paragraph-aligned chunks of roughly *chunk_size* chars.

    Paragraphs (separated by blank lines) are accumulated until adding the
    next one would exceed *chunk_size*; a single oversized paragraph still
    becomes its own chunk. Returns ``[(chunk_index, chunk_text), ...]``.
    """
    chunks: list[tuple[int, str]] = []
    buffer: list[str] = []
    buffered_len = 0

    for paragraph in text.split("\n\n"):
        # Flush before appending, but never flush an empty buffer — this lets
        # an oversized paragraph occupy a chunk by itself.
        if buffer and buffered_len + len(paragraph) > chunk_size:
            chunks.append((len(chunks), "\n".join(buffer).strip()))
            buffer = []
            buffered_len = 0
        buffer.append(paragraph)
        buffered_len += len(paragraph)

    if buffer:
        chunks.append((len(chunks), "\n".join(buffer).strip()))

    return chunks
56
+
57
+
58
def extract_text_from_pdf(pdf_path: str) -> str:
    """Extract the text of a PDF via pdfminer.six, preserving layout.

    Returns "" when pdfminer.six is not installed or extraction fails;
    the reason is printed instead of raised.
    """
    try:
        from pdfminer.high_level import extract_text
        from pdfminer.layout import LAParams

        return extract_text(pdf_path, laparams=LAParams())
    except ImportError:
        print("[ultra-memory] ⚠️ pdfminer.six 未安装: pip install pdfminer.six")
        return ""
    except Exception as e:
        print(f"[ultra-memory] ⚠️ PDF 提取失败: {e}")
        return ""
74
+
75
+
76
def save_extracted_text(
    session_id: str,
    media_path: str,
    text: str,
    media_id: str,
) -> Path:
    """Persist extracted PDF text into the session's multimodal/ directory.

    Writes a small metadata header followed by the raw text and returns the
    path of the file written.
    """
    target_dir = ULTRA_MEMORY_HOME / "sessions" / session_id / "multimodal"
    target_dir.mkdir(parents=True, exist_ok=True)

    output_file = target_dir / f"{Path(media_path).name}.txt"
    header = (
        f"# Extracted from: {media_path}\n"
        f"# Media ID: {media_id}\n"
        f"# Extracted at: {_now_iso()}\n"
        f"# Chars: {len(text)}\n"
        "---\n"
    )
    output_file.write_text(header + text, encoding="utf-8")
    return output_file
99
+
100
+
101
def trigger_fact_extraction(session_id: str, text_chunk: str, media_id: str):
    """Fire-and-forget launch of extract_facts.py to mine facts from *text_chunk*.

    The text is delivered via the child's stdin to avoid command-line escaping
    issues. Failures are deliberately swallowed: fact extraction is best-effort
    and must never break the main extraction pipeline.

    Args:
        session_id: Session whose facts are being extracted.
        text_chunk: Text to feed to the extractor's stdin.
        media_id: Media identifier (currently unused, kept for the call contract).
    """
    try:
        scripts_dir = Path(__file__).parent.parent
        python = sys.executable

        # Platform-specific detachment options. The previous code built a
        # STARTUPINFO unconditionally, which raises AttributeError on POSIX
        # (silently killing the launch inside the blanket except), and it
        # combined the Windows-only startupinfo with the POSIX-only
        # start_new_session flag.
        popen_kwargs = {}
        if os.name == "nt":
            startupinfo = subprocess.STARTUPINFO()
            startupinfo.dwFlags |= subprocess.STARTF_USESHOWWINDOW
            popen_kwargs["startupinfo"] = startupinfo
        else:
            popen_kwargs["start_new_session"] = True

        proc = subprocess.Popen(
            [python, str(scripts_dir / "extract_facts.py"),
             "--session", session_id, "--batch"],
            stdin=subprocess.PIPE,
            stdout=subprocess.DEVNULL,
            stderr=subprocess.DEVNULL,
            **popen_kwargs,
        )
        # Actually deliver the chunk: the previous code opened a stdin pipe
        # but never wrote to it nor closed it, leaving the child blocked on
        # an open pipe.
        if proc.stdin is not None:
            try:
                proc.stdin.write(text_chunk.encode("utf-8"))
            finally:
                proc.stdin.close()
    except Exception:
        # Best-effort: never propagate failures from the background trigger.
        pass
125
+
126
+
127
def process_pdf(session_id: str, pdf_path: str) -> dict:
    """Process one PDF: extract its text, persist it, and report a summary.

    Returns ``{"success": False, "error": ...}`` on failure, otherwise a
    summary dict with media id, output path, character and chunk counts.
    """
    if not Path(pdf_path).exists():
        print(f"[ultra-memory] ⚠️ PDF 文件不存在: {pdf_path}")
        return {"success": False, "error": "file not found"}

    # Pull the raw text out of the PDF; bail if nothing usable came back.
    text = extract_text_from_pdf(pdf_path)
    if not text.strip():
        return {"success": False, "error": "no text extracted"}

    # Stable media id derived from the source path.
    digest = hashlib.sha1(pdf_path.encode()).hexdigest()
    media_id = f"media_{digest[:12]}"

    # Persist, then chunk for downstream processing.
    output_file = save_extracted_text(session_id, pdf_path, text, media_id)
    chunks = _chunk_text(text)
    char_count = len(text)

    print(f"[ultra-memory] ✅ PDF 提取完成: {pdf_path}")
    print(f" 文件: {output_file.name}")
    print(f" 字符数: {char_count}")
    print(f" 文本块: {len(chunks)} 块")

    return {
        "success": True,
        "media_id": media_id,
        "session_id": session_id,
        "source_path": pdf_path,
        "output_file": str(output_file),
        "char_count": char_count,
        "chunk_count": len(chunks),
        "processed_at": _now_iso(),
    }
166
+
167
+
168
+ # ── CLI ─────────────────────────────────────────────────────────────────────
169
+
170
+
171
if __name__ == "__main__":
    # CLI entry: extract text from a single PDF into the given session.
    parser = argparse.ArgumentParser(description="从 PDF 文件提取文本")
    parser.add_argument("--path", required=True, help="PDF 文件路径")
    parser.add_argument("--session", required=True, help="会话 ID")
    cli_args = parser.parse_args()

    outcome = process_pdf(cli_args.session, cli_args.path)
    if not outcome["success"]:
        print(f"[ultra-memory] ❌ PDF 处理失败: {outcome.get('error')}")
        sys.exit(1)
    sys.exit(0)
@@ -0,0 +1,157 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ ultra-memory: 视频转录 (Multimodal Phase 5)
4
+ 从视频文件中提取音频并转录为文字,写入 session 的 multimodal/ 目录。
5
+
6
+ 依赖: whisper (OpenAI 本地转录,无需 API)
7
+ 安装: pip install openai-whisper
8
+ 或: pip install whisper
9
+
10
+ 注意: whisper 模型较大(base≈1.5GB, small≈3GB, medium≈5GB, large≈10GB)
11
+ 首次运行会自动下载模型。建议从 base 开始测试。
12
+ """
13
+
14
+ import os
15
+ import sys
16
+ import json
17
+ import argparse
18
+ import hashlib
19
+ import subprocess
20
+ import tempfile
21
+ import shutil
22
+ from datetime import datetime, timezone
23
+ from pathlib import Path
24
+
25
+ if sys.stdout.encoding != "utf-8":
26
+ sys.stdout.reconfigure(encoding="utf-8")
27
+ if sys.stderr.encoding != "utf-8":
28
+ sys.stderr.reconfigure(encoding="utf-8")
29
+
30
+ ULTRA_MEMORY_HOME = Path(os.environ.get("ULTRA_MEMORY_HOME", Path.home() / ".ultra-memory"))
31
+
32
+ # whisper 模型大小映射
33
+ MODEL_SIZES = ["tiny", "base", "small", "medium", "large"]
34
+
35
+
36
+ def _now_iso() -> str:
37
+ return datetime.now(timezone.utc).isoformat().replace("+00:00", "Z")
38
+
39
+
40
def transcribe_video(video_path: str, model_size: str = "base") -> str:
    """Transcribe a video locally with Whisper (language auto-detected).

    Returns the stripped transcript, or "" when whisper is unavailable or
    transcription fails; the reason is printed instead of raised.
    """
    try:
        import whisper
    except ImportError:
        print("[ultra-memory] ⚠️ whisper 未安装: pip install openai-whisper")
        print("[ultra-memory] ⚠️ 首次运行会自动下载模型(约 1.5GB for base)")
        return ""

    # Fall back to the default model on unrecognized sizes.
    size = model_size if model_size in MODEL_SIZES else "base"

    try:
        print(f"[ultra-memory] 加载 Whisper {size} 模型...")
        model = whisper.load_model(size)
        print(f"[ultra-memory] 开始转录: {video_path}")
        # language=None lets Whisper auto-detect the spoken language.
        outcome = model.transcribe(video_path, language=None, verbose=False)
        return outcome.get("text", "").strip()
    except Exception as e:
        print(f"[ultra-memory] ⚠️ 转录失败: {e}")
        return ""
64
+
65
+
66
def save_extracted_text(
    session_id: str,
    media_path: str,
    text: str,
    media_id: str,
    model_size: str,
) -> Path:
    """Persist a video transcript into the session's multimodal/ directory.

    Writes a small metadata header (including the Whisper model size used)
    followed by the transcript, and returns the path of the file written.
    """
    target_dir = ULTRA_MEMORY_HOME / "sessions" / session_id / "multimodal"
    target_dir.mkdir(parents=True, exist_ok=True)

    output_file = target_dir / f"{Path(media_path).name}.transcript.txt"
    header = (
        f"# Transcribed from: {media_path}\n"
        f"# Media ID: {media_id}\n"
        f"# Type: video (Whisper {model_size})\n"
        f"# Transcribed at: {_now_iso()}\n"
        f"# Chars: {len(text)}\n"
        "---\n"
    )
    output_file.write_text(header + text, encoding="utf-8")
    return output_file
91
+
92
+
93
def process_video(
    session_id: str,
    video_path: str,
    model_size: str = "base",
) -> dict:
    """Process one video: transcribe it, persist the transcript, report a summary.

    Returns ``{"success": False, "error": ...}`` on failure, otherwise a
    summary dict with media id, output path, character count and model size.
    """
    if not Path(video_path).exists():
        print(f"[ultra-memory] ⚠️ 视频文件不存在: {video_path}")
        return {"success": False, "error": "file not found"}

    # Run the local Whisper transcription; bail on an empty result.
    transcript = transcribe_video(video_path, model_size)
    if not transcript.strip():
        return {"success": False, "error": "transcription failed"}

    # Stable media id derived from the source path.
    digest = hashlib.sha1(video_path.encode()).hexdigest()
    media_id = f"media_{digest[:12]}"

    output_file = save_extracted_text(
        session_id, video_path, transcript, media_id, model_size
    )
    char_count = len(transcript)

    print(f"[ultra-memory] ✅ 视频转录完成: {video_path}")
    print(f" 文件: {output_file.name}")
    print(f" 字符数: {char_count}")

    return {
        "success": True,
        "media_id": media_id,
        "session_id": session_id,
        "source_path": video_path,
        "output_file": str(output_file),
        "char_count": char_count,
        "model_size": model_size,
        "processed_at": _now_iso(),
    }
135
+
136
+
137
+ # ── CLI ─────────────────────────────────────────────────────────────────────
138
+
139
+
140
if __name__ == "__main__":
    # CLI entry: transcribe a single video into the given session.
    parser = argparse.ArgumentParser(description="从视频提取文字转录")
    parser.add_argument("--path", required=True, help="视频文件路径")
    parser.add_argument("--session", required=True, help="会话 ID")
    parser.add_argument(
        "--model",
        default="base",
        choices=MODEL_SIZES,
        help="Whisper 模型大小 (默认: base)",
    )
    cli_args = parser.parse_args()

    outcome = process_video(cli_args.session, cli_args.path, cli_args.model)
    if not outcome["success"]:
        print(f"[ultra-memory] ❌ 视频处理失败: {outcome.get('error')}")
        sys.exit(1)
    sys.exit(0)
package/scripts/recall.py CHANGED
@@ -289,6 +289,9 @@ def search_semantic(query_tokens: set, top_k: int) -> list[dict]:
289
289
  entry = json.loads(line)
290
290
  except json.JSONDecodeError:
291
291
  continue
292
+ # 过滤已失效条目
293
+ if entry.get("superseded"):
294
+ continue
292
295
  text = entry.get("content", "") + " " + entry.get("title", "")
293
296
  ts = entry.get("ts", "")
294
297
  score = score_relevance(query_tokens, text, ts)
@@ -309,6 +312,36 @@ def search_semantic(query_tokens: set, top_k: int) -> list[dict]:
309
312
  return results[:top_k]
310
313
 
311
314
 
315
def search_profile(query_tokens: set, home: Path) -> list[dict]:
    """Search user_profile.json for fields relevant to the query tokens.

    Skips fields whose key carries the ``_superseded`` suffix, scores each
    remaining ``"key value"`` string against *query_tokens*, and returns at
    most the 3 best matches as recall-result dicts (source="profile").
    Returns [] when the profile file is missing or unreadable.
    """
    # Profile lives under <home>/semantic/user_profile.json.
    profile_file = home / "semantic" / "user_profile.json"
    if not profile_file.exists():
        return []

    try:
        with open(profile_file, encoding="utf-8") as f:
            profile = json.load(f)
    except (json.JSONDecodeError, IOError):
        # Corrupt or unreadable profile: degrade to "no profile hits".
        return []

    results = []
    for key, value in profile.items():
        # Skip fields explicitly marked as superseded.
        if key.endswith("_superseded"):
            continue
        text = f"{key} {value}"
        # NOTE(review): search_semantic calls score_relevance(tokens, text, ts)
        # with a timestamp argument — confirm the ts parameter has a default,
        # otherwise this two-argument call raises TypeError.
        score = score_relevance(query_tokens, str(text))
        if score > 0.1:  # minimum relevance threshold for profile fields
            results.append({
                "score": score,
                "source": "profile",
                "data": {"field": key, "value": value},
            })

    # Highest score first; cap at 3 so profile hits don't crowd out
    # the other recall layers.
    results.sort(key=lambda x: -x["score"])
    return results[:3]
343
+
344
+
312
345
  # ── TF-IDF 向量语义搜索层(第四层召回的增强)───────────────────────────
313
346
 
314
347
  def is_sklearn_available() -> bool:
@@ -628,6 +661,10 @@ def format_result(result: dict, show_context: bool = True) -> str:
628
661
  for k, v in list(detail.items())[:2]:
629
662
  lines.append(f" [{k}] {str(v)[:60]}")
630
663
 
664
+ elif source == "profile":
665
+ d = result["data"]
666
+ lines.append(f"[用户画像] {d['field']}: {d['value']}")
667
+
631
668
  return "\n".join(lines) if lines else str(result)
632
669
 
633
670
 
@@ -650,6 +687,10 @@ def recall(session_id: str, query: str, top_k: int = 5):
650
687
  semantic_results = search_semantic(query_tokens, top_k)
651
688
  found.extend(semantic_results)
652
689
 
690
+ # 画像检索(从 user_profile.json 搜索相关字段)
691
+ profile_results = search_profile(query_tokens, ULTRA_MEMORY_HOME)
692
+ found.extend(profile_results)
693
+
653
694
  # Layer 4: 实体索引(结构化精确检索)
654
695
  entity_results = search_entities(query_tokens, top_k)
655
696
  found.extend(entity_results)