PyPI - mem1 - Versions diffs - 0.0.9__tar.gz → 0.1.1__tar.gz - Mend

mem1 0.0.9 tar.gz → 0.1.1 tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

{mem1-0.0.9 → mem1-0.1.1}/.env.example RENAMED Viewed

@@ -19,7 +19,7 @@
 MEM1_LLM_API_KEY=your-api-key
 MEM1_LLM_BASE_URL=https://api.deepseek.com
 MEM1_LLM_MODEL=deepseek-chat
-MEM1_LLM_TEMPERATURE=0.7
+MEM1_LLM_TEMPERATURE=0.2
 # ES 配置（必填）
 MEM1_ES_HOSTS=http://localhost:9200

{mem1-0.0.9 → mem1-0.1.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: mem1
-Version: 0.0.9
+Version: 0.1.1
 Summary: 基于云服务的用户记忆系统
 Project-URL: Homepage, https://github.com/sougannkyou/mem1
 Project-URL: Repository, https://github.com/sougannkyou/mem1
@@ -239,14 +239,24 @@ def search_memory(start_days: int, end_days: int) -> str:
 使用 `get_context()` 获取上下文后，建议在 system prompt 中加入以下规则，避免 LLM 编造信息：
 ```
-## 重要规则
-1. 回答必须基于上述对话记录中的实际内容，严禁编造任何信息
-2. 涉及数字（金额、数量、百分比、日期等）时，必须从对话记录中原样提取，不得估算或编造
-3. 需要汇总累加时，必须列出计算过程（如：23+31+18+25=97）
-4. 涉及人名、公司名、账号名等实体时，必须使用对话中的原始名称
-5. 如果对话记录中没有相关信息，请明确说"对话记录中未提及"，不要猜测
+## 严格规则（违反将被标记为错误）
+1. 禁止编造任何未在对话记录中出现的信息
+2. 涉及时间/日期时，必须从对话记录中原样引用，不得推测
+3. 如果对话记录中没有明确的时间信息，回答"对话记录中未提及具体时间"
+4. 需要引用数据时，必须标注来源（如：根据 [对话-003] 的记录）
+5. 涉及数字（金额、数量、百分比等）时，必须从对话记录中原样提取，不得估算
+6. 需要汇总累加时，必须列出计算过程（如：23+31+18+25=97）
+7. 涉及人名、公司名、账号名等实体时，必须使用对话中的原始名称
 ```
+**对话记录格式说明**：
+- 每条对话都有唯一 ID，格式为 `[对话-001]`、`[对话-002]` 等
+- 回答时引用对话 ID 可提高可信度，如："根据 [对话-003] 的记录，本月处理了97起舆情"
+**推荐配置**：
+- `MEM1_LLM_TEMPERATURE=0.2`（降低创造性，减少编造）
+- `MEM1_CONTEXT_DAYS_LIMIT=7`（缩小检索范围，提高精准度）
 ## 设计决策：为什么不用向量数据库
 mem1 选择 ES 时间范围检索而非 Milvus/Pinecone 等向量数据库，核心原因是**对话记忆需要上下文连续性**：

{mem1-0.0.9 → mem1-0.1.1}/README.md RENAMED Viewed

@@ -214,14 +214,24 @@ def search_memory(start_days: int, end_days: int) -> str:
 使用 `get_context()` 获取上下文后，建议在 system prompt 中加入以下规则，避免 LLM 编造信息：
 ```
-## 重要规则
-1. 回答必须基于上述对话记录中的实际内容，严禁编造任何信息
-2. 涉及数字（金额、数量、百分比、日期等）时，必须从对话记录中原样提取，不得估算或编造
-3. 需要汇总累加时，必须列出计算过程（如：23+31+18+25=97）
-4. 涉及人名、公司名、账号名等实体时，必须使用对话中的原始名称
-5. 如果对话记录中没有相关信息，请明确说"对话记录中未提及"，不要猜测
+## 严格规则（违反将被标记为错误）
+1. 禁止编造任何未在对话记录中出现的信息
+2. 涉及时间/日期时，必须从对话记录中原样引用，不得推测
+3. 如果对话记录中没有明确的时间信息，回答"对话记录中未提及具体时间"
+4. 需要引用数据时，必须标注来源（如：根据 [对话-003] 的记录）
+5. 涉及数字（金额、数量、百分比等）时，必须从对话记录中原样提取，不得估算
+6. 需要汇总累加时，必须列出计算过程（如：23+31+18+25=97）
+7. 涉及人名、公司名、账号名等实体时，必须使用对话中的原始名称
 ```
+**对话记录格式说明**：
+- 每条对话都有唯一 ID，格式为 `[对话-001]`、`[对话-002]` 等
+- 回答时引用对话 ID 可提高可信度，如："根据 [对话-003] 的记录，本月处理了97起舆情"
+**推荐配置**：
+- `MEM1_LLM_TEMPERATURE=0.2`（降低创造性，减少编造）
+- `MEM1_CONTEXT_DAYS_LIMIT=7`（缩小检索范围，提高精准度）
 ## 设计决策：为什么不用向量数据库
 mem1 选择 ES 时间范围检索而非 Milvus/Pinecone 等向量数据库，核心原因是**对话记忆需要上下文连续性**：

{mem1-0.0.9 → mem1-0.1.1}/mem1/__init__.py RENAMED Viewed

@@ -3,7 +3,7 @@ Mem1 - 用户记忆系统（支持可插拔存储后端）
 """
 import logging
-__version__ = "0.0.9"
+__version__ = "0.1.1"
 # 屏蔽第三方库的详细日志（必须在导入前设置）
 logging.getLogger("elastic_transport").setLevel(logging.WARNING)

{mem1-0.0.9 → mem1-0.1.1}/mem1/memory.py RENAMED Viewed

@@ -546,13 +546,14 @@ class Mem1Memory:
         return summary
     def _format_conversations_for_llm(self, conversations: List[Dict[str, Any]]) -> str:
-        """格式化对话记录为文本"""
+        """格式化对话记录为文本（带引用 ID）"""
         output = []
-        for conv in conversations:
+        for idx, conv in enumerate(conversations, start=1):
+            conv_id = f"对话-{idx:03d}"  # 001, 002, 003...
             timestamp = conv.get("timestamp", "未知时间")
             metadata = conv.get("metadata", {})
-            title = f"### {timestamp}"
+            title = f"### [{conv_id}] {timestamp}"
             if metadata:
                 tags = " ".join([f"[{k}:{v}]" for k, v in metadata.items()])
                 title += f" {tags}"

{mem1-0.0.9 → mem1-0.1.1}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "hatchling.build"
 [project]
 name = "mem1"
-version = "0.0.9"
+version = "0.1.1"
 description = "基于云服务的用户记忆系统"
 authors = [
     { name = "Song" }