@chainlesschain/personal-data-hub 0.4.29 → 0.4.31

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (199):
  1. package/lib/forensics/qq-nt-collect.js +190 -0
  2. package/lib/prompt-builder.js +15 -1
  3. package/package.json +8 -3
  4. package/__tests__/adapter-guide.test.js +0 -47
  5. package/__tests__/adapter-spec.test.js +0 -78
  6. package/__tests__/adapters/ai-chat-cookie-capture-spec.test.js +0 -211
  7. package/__tests__/adapters/ai-chat-health-checker.test.js +0 -262
  8. package/__tests__/adapters/ai-chat-history.test.js +0 -396
  9. package/__tests__/adapters/ai-chat-http-client.test.js +0 -242
  10. package/__tests__/adapters/ai-chat-vendors.test.js +0 -874
  11. package/__tests__/adapters/alipay-bill-adapter.test.js +0 -538
  12. package/__tests__/adapters/apple-health.test.js +0 -95
  13. package/__tests__/adapters/bank-family.test.js +0 -125
  14. package/__tests__/adapters/biz-tianyancha.test.js +0 -159
  15. package/__tests__/adapters/browser-history-chrome.test.js +0 -377
  16. package/__tests__/adapters/browser-history-edge.test.js +0 -159
  17. package/__tests__/adapters/car-mercedesme.test.js +0 -74
  18. package/__tests__/adapters/doc-baidu-netdisk.test.js +0 -102
  19. package/__tests__/adapters/doc-camscanner.test.js +0 -147
  20. package/__tests__/adapters/doc-platforms.test.js +0 -177
  21. package/__tests__/adapters/edu-huawei-learning-live.test.js +0 -198
  22. package/__tests__/adapters/edu-zuoyebang-live.test.js +0 -226
  23. package/__tests__/adapters/email-adapter-snapshot.test.js +0 -237
  24. package/__tests__/adapters/email-adapter.test.js +0 -742
  25. package/__tests__/adapters/email-classifier.test.js +0 -347
  26. package/__tests__/adapters/email-imap-session.test.js +0 -334
  27. package/__tests__/adapters/email-parser.test.js +0 -244
  28. package/__tests__/adapters/email-pdf-extractor.test.js +0 -529
  29. package/__tests__/adapters/email-providers.test.js +0 -84
  30. package/__tests__/adapters/email-retry-progress.test.js +0 -294
  31. package/__tests__/adapters/email-templates.test.js +0 -822
  32. package/__tests__/adapters/family-23-collectors-scaffold.test.js +0 -182
  33. package/__tests__/adapters/finance-alipay-live.test.js +0 -258
  34. package/__tests__/adapters/finance-dcep.test.js +0 -74
  35. package/__tests__/adapters/fitness-joyrun.test.js +0 -82
  36. package/__tests__/adapters/game-genshin-live.test.js +0 -238
  37. package/__tests__/adapters/game-genshin-scaffold.test.js +0 -108
  38. package/__tests__/adapters/game-honor-of-kings-live.test.js +0 -230
  39. package/__tests__/adapters/git-activity.test.js +0 -222
  40. package/__tests__/adapters/gov-12123.test.js +0 -103
  41. package/__tests__/adapters/gov-ixiamen.test.js +0 -150
  42. package/__tests__/adapters/gov-tax.test.js +0 -135
  43. package/__tests__/adapters/health-meiyou.test.js +0 -125
  44. package/__tests__/adapters/local-files.test.js +0 -264
  45. package/__tests__/adapters/local-im-pc.test.js +0 -154
  46. package/__tests__/adapters/messaging-whatsapp.test.js +0 -289
  47. package/__tests__/adapters/music-kugou.test.js +0 -187
  48. package/__tests__/adapters/music-qq.test.js +0 -112
  49. package/__tests__/adapters/netease-music-live.test.js +0 -244
  50. package/__tests__/adapters/netease-music.test.js +0 -74
  51. package/__tests__/adapters/pc-local-discovery.test.js +0 -141
  52. package/__tests__/adapters/qq-pc-direct-read.test.js +0 -227
  53. package/__tests__/adapters/reading-family.test.js +0 -108
  54. package/__tests__/adapters/recruit-boss.test.js +0 -180
  55. package/__tests__/adapters/shell-history.test.js +0 -180
  56. package/__tests__/adapters/shopping-base.test.js +0 -179
  57. package/__tests__/adapters/shopping-dianping.test.js +0 -239
  58. package/__tests__/adapters/social-bilibili-adb-api-client.test.js +0 -721
  59. package/__tests__/adapters/social-bilibili-adb-chromium-cookies-reader.test.js +0 -346
  60. package/__tests__/adapters/social-bilibili-adb-collector.test.js +0 -284
  61. package/__tests__/adapters/social-bilibili-adb-cookies-extension.test.js +0 -343
  62. package/__tests__/adapters/social-bilibili-adb-snapshot-builder.test.js +0 -296
  63. package/__tests__/adapters/social-csdn.test.js +0 -175
  64. package/__tests__/adapters/social-dongchedi.test.js +0 -165
  65. package/__tests__/adapters/social-douyin-adb-aweme-detail.test.js +0 -165
  66. package/__tests__/adapters/social-douyin-adb-collector.test.js +0 -254
  67. package/__tests__/adapters/social-douyin-adb-db-extension.test.js +0 -114
  68. package/__tests__/adapters/social-douyin-adb-im-db-parser.test.js +0 -304
  69. package/__tests__/adapters/social-douyin-adb-snapshot-builder.test.js +0 -216
  70. package/__tests__/adapters/social-douyin-adb-usage-profile.test.js +0 -229
  71. package/__tests__/adapters/social-douyin-adb-watch-history.test.js +0 -269
  72. package/__tests__/adapters/social-kuaishou-adb-api-client.test.js +0 -496
  73. package/__tests__/adapters/social-kuaishou-adb-collector.test.js +0 -276
  74. package/__tests__/adapters/social-kuaishou-adb-cookies-extension.test.js +0 -152
  75. package/__tests__/adapters/social-kuaishou-adb-snapshot-builder.test.js +0 -178
  76. package/__tests__/adapters/social-toutiao-adb-account-reader.test.js +0 -135
  77. package/__tests__/adapters/social-toutiao-adb-api-client.test.js +0 -626
  78. package/__tests__/adapters/social-toutiao-adb-article.test.js +0 -155
  79. package/__tests__/adapters/social-toutiao-adb-collector.test.js +0 -378
  80. package/__tests__/adapters/social-toutiao-adb-cookies-extension.test.js +0 -193
  81. package/__tests__/adapters/social-toutiao-adb-snapshot-builder.test.js +0 -196
  82. package/__tests__/adapters/social-toutiao-kuaishou-scaffold.test.js +0 -311
  83. package/__tests__/adapters/social-weibo-adb-api-client.test.js +0 -362
  84. package/__tests__/adapters/social-weibo-adb-collector.test.js +0 -201
  85. package/__tests__/adapters/social-weibo-adb-cookies-extension.test.js +0 -167
  86. package/__tests__/adapters/social-weibo-adb-snapshot-builder.test.js +0 -189
  87. package/__tests__/adapters/social-xiaohongshu-adb-api-client.test.js +0 -431
  88. package/__tests__/adapters/social-xiaohongshu-adb-collector.test.js +0 -207
  89. package/__tests__/adapters/social-xiaohongshu-adb-cookies-extension.test.js +0 -0
  90. package/__tests__/adapters/social-xiaohongshu-adb-sign-provider-injection.test.js +0 -351
  91. package/__tests__/adapters/social-xiaohongshu-adb-sign.test.js +0 -130
  92. package/__tests__/adapters/social-xiaohongshu-adb-snapshot-builder.test.js +0 -200
  93. package/__tests__/adapters/social-zhihu.test.js +0 -246
  94. package/__tests__/adapters/system-data-adapter.test.js +0 -443
  95. package/__tests__/adapters/system-data-android-ingest.test.js +0 -144
  96. package/__tests__/adapters/system-data-android.test.js +0 -519
  97. package/__tests__/adapters/system-data-disclosure.test.js +0 -153
  98. package/__tests__/adapters/travel-12306.test.js +0 -512
  99. package/__tests__/adapters/travel-amap.test.js +0 -219
  100. package/__tests__/adapters/travel-baidu-map.test.js +0 -305
  101. package/__tests__/adapters/travel-base.test.js +0 -205
  102. package/__tests__/adapters/travel-ctrip.test.js +0 -377
  103. package/__tests__/adapters/travel-didi-consumer.test.js +0 -66
  104. package/__tests__/adapters/travel-didi.test.js +0 -204
  105. package/__tests__/adapters/travel-tencent-map.test.js +0 -207
  106. package/__tests__/adapters/travel-tongcheng.test.js +0 -289
  107. package/__tests__/adapters/video-platforms.test.js +0 -152
  108. package/__tests__/adapters/video-xigua.test.js +0 -106
  109. package/__tests__/adapters/vscode.test.js +0 -299
  110. package/__tests__/adapters/wechat-bootstrap.test.js +0 -240
  111. package/__tests__/adapters/wechat-env-probe.test.js +0 -162
  112. package/__tests__/adapters/wechat-frida-agent.test.js +0 -322
  113. package/__tests__/adapters/wechat-frida-integration.test.js +0 -149
  114. package/__tests__/adapters/wechat-frida-key-provider.test.js +0 -188
  115. package/__tests__/adapters/wechat-md5-key-provider.test.js +0 -101
  116. package/__tests__/adapters/wechat-pc-direct-read.test.js +0 -365
  117. package/__tests__/adapters/wechat-pc-group-topic.test.js +0 -63
  118. package/__tests__/adapters/wechat-pc-v4-sidecar.test.js +0 -72
  119. package/__tests__/adapters/weread.test.js +0 -123
  120. package/__tests__/adapters/wework-pc.test.js +0 -124
  121. package/__tests__/adapters/win-recent.test.js +0 -192
  122. package/__tests__/analysis-skills.test.js +0 -754
  123. package/__tests__/analysis.test.js +0 -1845
  124. package/__tests__/audio-ximalaya-snapshot.test.js +0 -279
  125. package/__tests__/batch.test.js +0 -133
  126. package/__tests__/bridges-cc-kg.test.js +0 -231
  127. package/__tests__/bridges-cc-llm.test.js +0 -191
  128. package/__tests__/bridges-cc-rag.test.js +0 -162
  129. package/__tests__/categories.test.js +0 -92
  130. package/__tests__/e2e/ai-chat-cross-source-journey.test.js +0 -213
  131. package/__tests__/e2e/full-user-journey.test.js +0 -188
  132. package/__tests__/e2e/local-data-adapters-cli.e2e.test.js +0 -146
  133. package/__tests__/entity-resolver-ingest-hook.test.js +0 -177
  134. package/__tests__/entity-resolver-stages.test.js +0 -411
  135. package/__tests__/entity-resolver-vault.test.js +0 -249
  136. package/__tests__/entity-resolver.test.js +0 -526
  137. package/__tests__/fitness-keep-snapshot.test.js +0 -224
  138. package/__tests__/fixtures/entity-resolver-200-mock.json +0 -96
  139. package/__tests__/ids.test.js +0 -45
  140. package/__tests__/integration/ai-chat-history-registry.test.js +0 -228
  141. package/__tests__/integration/aichat-wizard-end-to-end.test.js +0 -282
  142. package/__tests__/integration/cross-adapter-pipelines.test.js +0 -396
  143. package/__tests__/integration/local-data-adapters-pipeline.test.js +0 -373
  144. package/__tests__/integration/social-bilibili-pipeline.test.js +0 -261
  145. package/__tests__/integration/wechat-bootstrap-end-to-end.test.js +0 -390
  146. package/__tests__/key-providers.test.js +0 -126
  147. package/__tests__/kg-derive.test.js +0 -219
  148. package/__tests__/llm-client.test.js +0 -122
  149. package/__tests__/longtail-adapters.test.js +0 -281
  150. package/__tests__/messaging-qq-snapshot.test.js +0 -294
  151. package/__tests__/mobile-extractor-encrypted.test.js +0 -460
  152. package/__tests__/mobile-extractor.test.js +0 -288
  153. package/__tests__/mock-adapter.test.js +0 -93
  154. package/__tests__/prompt-builder.test.js +0 -249
  155. package/__tests__/query-parser.test.js +0 -365
  156. package/__tests__/rag-derive.test.js +0 -169
  157. package/__tests__/registry-readiness.test.js +0 -292
  158. package/__tests__/registry.test.js +0 -420
  159. package/__tests__/salvage-ingest.test.js +0 -97
  160. package/__tests__/schemas.test.js +0 -331
  161. package/__tests__/shopping-adapters.test.js +0 -392
  162. package/__tests__/shopping-eleme-snapshot.test.js +0 -454
  163. package/__tests__/shopping-pinduoduo-snapshot.test.js +0 -484
  164. package/__tests__/shopping-snapshot.test.js +0 -438
  165. package/__tests__/shopping-vipshop-snapshot.test.js +0 -425
  166. package/__tests__/shopping-xianyu-snapshot.test.js +0 -451
  167. package/__tests__/sidecar-contacts-cross-validate.test.js +0 -186
  168. package/__tests__/sidecar-supervisor.test.js +0 -128
  169. package/__tests__/sign-providers.test.js +0 -62
  170. package/__tests__/social-adapters.test.js +0 -280
  171. package/__tests__/social-bilibili-snapshot.test.js +0 -278
  172. package/__tests__/social-douban-snapshot.test.js +0 -351
  173. package/__tests__/social-douyin-im-direct-read.test.js +0 -377
  174. package/__tests__/social-douyin-salvage-collector.test.js +0 -98
  175. package/__tests__/social-douyin-salvage-mapper.test.js +0 -90
  176. package/__tests__/social-douyin-snapshot.test.js +0 -256
  177. package/__tests__/social-kuaishou-snapshot.test.js +0 -362
  178. package/__tests__/social-toutiao-snapshot.test.js +0 -366
  179. package/__tests__/social-weibo-snapshot.test.js +0 -234
  180. package/__tests__/social-weibo-sqlite-device.test.js +0 -174
  181. package/__tests__/social-xiaohongshu-snapshot.test.js +0 -232
  182. package/__tests__/sqlite-leaf-salvage.test.js +0 -97
  183. package/__tests__/travel-adapters.test.js +0 -483
  184. package/__tests__/travel-maps-snapshot.test.js +0 -426
  185. package/__tests__/vault-driver-error.test.js +0 -74
  186. package/__tests__/vault-search-helpers.test.js +0 -104
  187. package/__tests__/vault-search.test.js +0 -423
  188. package/__tests__/vault.test.js +0 -767
  189. package/__tests__/wechat-adapter.test.js +0 -594
  190. package/__tests__/whatsapp-adapter.test.js +0 -138
  191. package/scripts/_make-fixture-all.js +0 -126
  192. package/scripts/_make-fixture-contacts.js +0 -84
  193. package/scripts/evaluate-entity-resolver.js +0 -213
  194. package/scripts/run-native-tests-sandbox.sh +0 -55
  195. package/scripts/smoke-phase-5-5.js +0 -196
  196. package/scripts/smoke-phase-5-7.js +0 -181
  197. package/scripts/smoke-system-data-contacts.js +0 -309
  198. package/scripts/smoke-system-data.js +0 -312
  199. package/vitest.config.js +0 -88
@@ -1,191 +0,0 @@
1
- "use strict";
2
-
3
- import { describe, it, expect } from "vitest";
4
-
5
- const { CcLLMAdapter, LOCAL_PROVIDERS } = require("../lib/bridges/cc-llm-adapter");
6
- const { AnalysisEngine } = require("../lib/analysis");
7
-
8
- describe("CcLLMAdapter construction", () => {
9
- it("requires chat function", () => {
10
- expect(() => new CcLLMAdapter()).toThrow();
11
- expect(() => new CcLLMAdapter({})).toThrow(/chat/);
12
- });
13
-
14
- it("constructs with just chat", () => {
15
- const a = new CcLLMAdapter({ chat: async () => ({}) });
16
- expect(a.name).toBe("cc-llm"); // no provider/model getters → default name
17
- });
18
- });
19
-
20
- describe("CcLLMAdapter.isLocal", () => {
21
- it("returns true for ollama / llama-cpp / lm-studio / vllm-local", () => {
22
- for (const p of ["ollama", "llama-cpp", "llamacpp", "vllm-local", "lm-studio", "lmstudio"]) {
23
- const a = new CcLLMAdapter({
24
- chat: async () => ({}),
25
- getActiveProvider: () => p,
26
- });
27
- expect(a.isLocal).toBe(true);
28
- }
29
- });
30
-
31
- it("returns false for openai / anthropic / volcengine / etc.", () => {
32
- for (const p of ["openai", "anthropic", "volcengine", "gemini", "deepseek"]) {
33
- const a = new CcLLMAdapter({
34
- chat: async () => ({}),
35
- getActiveProvider: () => p,
36
- });
37
- expect(a.isLocal).toBe(false);
38
- }
39
- });
40
-
41
- it("returns false (conservative) when no provider getter is wired", () => {
42
- const a = new CcLLMAdapter({ chat: async () => ({}) });
43
- expect(a.isLocal).toBe(false);
44
- });
45
-
46
- it("getActiveProvider throws → fall through to false (defensive)", () => {
47
- const a = new CcLLMAdapter({
48
- chat: async () => ({}),
49
- getActiveProvider: () => { throw new Error("oops"); },
50
- });
51
- expect(a.isLocal).toBe(false);
52
- });
53
-
54
- it("custom localProviders override the default whitelist", () => {
55
- const a = new CcLLMAdapter({
56
- chat: async () => ({}),
57
- getActiveProvider: () => "my-private-cluster",
58
- localProviders: ["my-private-cluster"],
59
- });
60
- expect(a.isLocal).toBe(true);
61
- });
62
-
63
- it("LOCAL_PROVIDERS contains the documented set", () => {
64
- expect(LOCAL_PROVIDERS.has("ollama")).toBe(true);
65
- expect(LOCAL_PROVIDERS.has("llama-cpp")).toBe(true);
66
- expect(LOCAL_PROVIDERS.has("vllm-local")).toBe(true);
67
- expect(LOCAL_PROVIDERS.has("openai")).toBe(false);
68
- });
69
- });
70
-
71
- describe("CcLLMAdapter.name", () => {
72
- it("uses opts.name override when provided", () => {
73
- const a = new CcLLMAdapter({ chat: async () => ({}), name: "my-name" });
74
- expect(a.name).toBe("my-name");
75
- });
76
-
77
- it("composes provider:model when both getters available", () => {
78
- const a = new CcLLMAdapter({
79
- chat: async () => ({}),
80
- getActiveProvider: () => "ollama",
81
- getActiveModel: () => "qwen2.5:7b",
82
- });
83
- expect(a.name).toBe("ollama:qwen2.5:7b");
84
- });
85
-
86
- it("falls back to model only when no provider", () => {
87
- const a = new CcLLMAdapter({
88
- chat: async () => ({}),
89
- getActiveModel: () => "qwen",
90
- });
91
- expect(a.name).toBe("qwen");
92
- });
93
- });
94
-
95
- describe("CcLLMAdapter.chat response normalization", () => {
96
- it("extracts text from .content (cc llm-manager shape)", async () => {
97
- const a = new CcLLMAdapter({
98
- chat: async () => ({ content: "hi from cc", model: "qwen", usage: { promptTokens: 5, completionTokens: 3 } }),
99
- getActiveModel: () => "qwen",
100
- });
101
- const r = await a.chat([{ role: "user", content: "x" }]);
102
- expect(r.text).toBe("hi from cc");
103
- expect(r.model).toBe("qwen");
104
- expect(r.usage.promptTokens).toBe(5);
105
- expect(r.usage.completionTokens).toBe(3);
106
- expect(r.usage.totalTokens).toBe(8);
107
- });
108
-
109
- it("extracts text from .message.content (raw provider)", async () => {
110
- const a = new CcLLMAdapter({
111
- chat: async () => ({ message: { role: "assistant", content: "from msg" } }),
112
- });
113
- const r = await a.chat([]);
114
- expect(r.text).toBe("from msg");
115
- });
116
-
117
- it("extracts text from .text (alt shape)", async () => {
118
- const a = new CcLLMAdapter({ chat: async () => ({ text: "alt shape" }) });
119
- const r = await a.chat([]);
120
- expect(r.text).toBe("alt shape");
121
- });
122
-
123
- it("extracts text from OpenAI-style .choices[0].message.content", async () => {
124
- const a = new CcLLMAdapter({
125
- chat: async () => ({
126
- choices: [{ message: { content: "openai-like" } }],
127
- }),
128
- });
129
- const r = await a.chat([]);
130
- expect(r.text).toBe("openai-like");
131
- });
132
-
133
- it("returns empty text for unknown shape (doesn't throw)", async () => {
134
- const a = new CcLLMAdapter({ chat: async () => ({ random: "blob" }) });
135
- const r = await a.chat([]);
136
- expect(r.text).toBe("");
137
- });
138
-
139
- it("normalizes snake_case usage (prompt_tokens) to camelCase", async () => {
140
- const a = new CcLLMAdapter({
141
- chat: async () => ({
142
- content: "x",
143
- usage: { prompt_tokens: 10, completion_tokens: 20, total_tokens: 30 },
144
- }),
145
- });
146
- const r = await a.chat([]);
147
- expect(r.usage).toEqual({ promptTokens: 10, completionTokens: 20, totalTokens: 30 });
148
- });
149
-
150
- it("wraps underlying chat errors with cause preserved", async () => {
151
- const a = new CcLLMAdapter({
152
- chat: async () => { throw new Error("upstream Ollama died"); },
153
- });
154
- await expect(a.chat([])).rejects.toThrow(/underlying client failed/);
155
- });
156
-
157
- it("validates messages is an array", async () => {
158
- const a = new CcLLMAdapter({ chat: async () => ({}) });
159
- await expect(a.chat("not an array")).rejects.toThrow(/array/);
160
- });
161
- });
162
-
163
- describe("CcLLMAdapter ↔ AnalysisEngine integration", () => {
164
- it("AnalysisEngine accepts CcLLMAdapter (local-provider path)", () => {
165
- const a = new CcLLMAdapter({
166
- chat: async () => ({ content: "ok" }),
167
- getActiveProvider: () => "ollama",
168
- });
169
- // Construction shouldn't throw — isLocal:true means engine accepts.
170
- const fakeVault = {
171
- audit: () => {},
172
- queryEvents: () => [],
173
- getWatermark: () => null,
174
- };
175
- expect(() => new AnalysisEngine({ vault: fakeVault, llm: a })).not.toThrow();
176
- });
177
-
178
- it("AnalysisEngine refuses CcLLMAdapter when provider is non-local without opt-in", async () => {
179
- const a = new CcLLMAdapter({
180
- chat: async () => ({ content: "ok" }),
181
- getActiveProvider: () => "anthropic",
182
- });
183
- const fakeVault = {
184
- audit: () => {},
185
- queryEvents: () => [],
186
- getWatermark: () => null,
187
- };
188
- const e = new AnalysisEngine({ vault: fakeVault, llm: a });
189
- await expect(e.ask("test")).rejects.toThrow(/non-local/);
190
- });
191
- });
@@ -1,162 +0,0 @@
1
- "use strict";
2
-
3
- import { describe, it, expect } from "vitest";
4
-
5
- const { CcRagSink } = require("../lib/bridges/cc-rag-sink");
6
-
7
- // Mirror BM25.addDocument shape — captures everything for assertion
8
- function makeFakeBm25() {
9
- const docs = [];
10
- return {
11
- docs,
12
- addDocument(doc) {
13
- docs.push({ ...doc });
14
- },
15
- };
16
- }
17
-
18
- const doc = (id, text, type = "event", metadata = {}) => ({
19
- id,
20
- type,
21
- text,
22
- metadata,
23
- });
24
-
25
- // ─── Tests ──────────────────────────────────────────────────────────────
26
-
27
- describe("CcRagSink construction", () => {
28
- it("requires bm25 with addDocument", () => {
29
- expect(() => new CcRagSink()).toThrow();
30
- expect(() => new CcRagSink({})).toThrow(/bm25/);
31
- expect(() => new CcRagSink({ bm25: {} })).toThrow(/addDocument/);
32
- });
33
-
34
- it("accepts bm25 with addDocument; optional vector + logger + transformDoc", () => {
35
- const bm25 = makeFakeBm25();
36
- const s = new CcRagSink({
37
- bm25,
38
- vector: { index: async () => {} },
39
- logger: () => {},
40
- transformDoc: (d) => d,
41
- });
42
- expect(s).toBeDefined();
43
- });
44
- });
45
-
46
- describe("CcRagSink.write", () => {
47
- it("indexes docs to BM25 in cc-expected shape", async () => {
48
- const bm25 = makeFakeBm25();
49
- const sink = new CcRagSink({ bm25 });
50
- const r = await sink.write([
51
- doc("evt-1", "妈妈生日蛋白粉 +288.50 CNY", "event", { subtype: "order", adapter: "taobao" }),
52
- doc("evt-2", "按摩仪 给妈妈", "event", { subtype: "order", adapter: "taobao" }),
53
- ]);
54
- expect(r.indexed).toBe(2);
55
- expect(r.skipped).toBe(0);
56
- expect(bm25.docs.length).toBe(2);
57
- expect(bm25.docs[0].id).toBe("evt-1");
58
- expect(bm25.docs[0].content).toContain("妈妈生日蛋白粉");
59
- expect(bm25.docs[0].title).toBe("order"); // metadata.subtype used as title
60
- expect(bm25.docs[0].meta.adapter).toBe("taobao");
61
- expect(bm25.docs[0].hubType).toBe("event");
62
- });
63
-
64
- it("falls back to hub type as title when no metadata.title/.subtype", async () => {
65
- const bm25 = makeFakeBm25();
66
- const sink = new CcRagSink({ bm25 });
67
- await sink.write([doc("p-1", "妈妈 陈某某", "person", {})]);
68
- expect(bm25.docs[0].title).toBe("person");
69
- });
70
-
71
- it("metadata.title overrides subtype/type", async () => {
72
- const bm25 = makeFakeBm25();
73
- const sink = new CcRagSink({ bm25 });
74
- await sink.write([doc("x", "body", "event", { title: "custom title", subtype: "order" })]);
75
- expect(bm25.docs[0].title).toBe("custom title");
76
- });
77
-
78
- it("dedupes by id within the sink lifetime", async () => {
79
- const bm25 = makeFakeBm25();
80
- const sink = new CcRagSink({ bm25 });
81
- await sink.write([doc("evt-1", "text v1")]);
82
- const r = await sink.write([doc("evt-1", "text v2")]);
83
- expect(r.indexed).toBe(0);
84
- expect(r.skipped).toBe(1);
85
- expect(bm25.docs.length).toBe(1);
86
- expect(bm25.docs[0].content).toBe("text v1"); // first write wins
87
- });
88
-
89
- it("skips empty / malformed docs", async () => {
90
- const bm25 = makeFakeBm25();
91
- const sink = new CcRagSink({ bm25 });
92
- const r = await sink.write([
93
- doc("a", ""), // empty text
94
- doc("b", "real text"),
95
- { id: "c" /* missing text */ },
96
- null,
97
- { /* missing id */ text: "orphan" },
98
- ]);
99
- expect(r.indexed).toBe(1);
100
- expect(r.skipped).toBe(4);
101
- expect(bm25.docs.length).toBe(1);
102
- });
103
-
104
- it("collects upstream BM25 errors without aborting batch", async () => {
105
- let failOn = "evt-2";
106
- const sink = new CcRagSink({
107
- bm25: {
108
- addDocument(d) {
109
- if (d.id === failOn) throw new Error("BM25 backend full");
110
- },
111
- },
112
- });
113
- const r = await sink.write([doc("evt-1", "a"), doc("evt-2", "b"), doc("evt-3", "c")]);
114
- expect(r.indexed).toBe(2);
115
- expect(r.errors.length).toBe(1);
116
- expect(r.errors[0].id).toBe("evt-2");
117
- });
118
-
119
- it("forwards to vector store when wired", async () => {
120
- const bm25 = makeFakeBm25();
121
- const vectorCalls = [];
122
- const sink = new CcRagSink({
123
- bm25,
124
- vector: { index: async (docs) => { vectorCalls.push(docs); } },
125
- });
126
- const r = await sink.write([doc("a", "alpha"), doc("b", "beta")]);
127
- expect(r.indexed).toBe(2);
128
- expect(vectorCalls.length).toBe(1);
129
- expect(vectorCalls[0].length).toBe(2);
130
- });
131
-
132
- it("vector failure is captured but BM25 indexing still succeeds", async () => {
133
- const bm25 = makeFakeBm25();
134
- const sink = new CcRagSink({
135
- bm25,
136
- vector: { index: async () => { throw new Error("qdrant down"); } },
137
- });
138
- const r = await sink.write([doc("a", "alpha")]);
139
- expect(r.indexed).toBe(1);
140
- expect(bm25.docs.length).toBe(1);
141
- expect(r.errors.length).toBe(1);
142
- expect(r.errors[0].phase).toBe("vector");
143
- });
144
-
145
- it("transformDoc hook lets caller rewrite the doc shape", async () => {
146
- const bm25 = makeFakeBm25();
147
- const sink = new CcRagSink({
148
- bm25,
149
- transformDoc: (d) => ({ id: d.id, title: "OVERRIDE", content: d.text.toUpperCase() }),
150
- });
151
- await sink.write([doc("a", "hello")]);
152
- expect(bm25.docs[0].title).toBe("OVERRIDE");
153
- expect(bm25.docs[0].content).toBe("HELLO");
154
- });
155
-
156
- it("returns zeros for empty input", async () => {
157
- const bm25 = makeFakeBm25();
158
- const sink = new CcRagSink({ bm25 });
159
- const r = await sink.write([]);
160
- expect(r).toEqual({ indexed: 0, skipped: 0, errors: [] });
161
- });
162
- });
@@ -1,92 +0,0 @@
1
- "use strict";
2
-
3
- import { describe, it, expect } from "vitest";
4
-
5
- const {
6
- CATEGORIES,
7
- CATEGORY_LABELS,
8
- getCategory,
9
- groupByCategory,
10
- } = require("../lib/categories");
11
-
12
- describe("PDH categories taxonomy", () => {
13
- it("CATEGORIES covers the 8 known buckets and is frozen", () => {
14
- expect(CATEGORIES).toEqual([
15
- "chat", "social", "email", "shopping", "travel", "system", "ai-chat", "other",
16
- ]);
17
- expect(Object.isFrozen(CATEGORIES)).toBe(true);
18
- });
19
-
20
- it("CATEGORY_LABELS has Chinese label for every category", () => {
21
- for (const c of CATEGORIES) {
22
- expect(typeof CATEGORY_LABELS[c]).toBe("string");
23
- expect(CATEGORY_LABELS[c].length).toBeGreaterThan(0);
24
- }
25
- });
26
-
27
- it.each([
28
- ["wechat", "chat"],
29
- ["messaging-qq", "chat"],
30
- ["messaging-telegram", "chat"],
31
- ["messaging-whatsapp", "chat"],
32
- ["social-bilibili", "social"],
33
- ["social-weibo", "social"],
34
- ["social-douyin", "social"],
35
- ["social-xiaohongshu", "social"],
36
- ["social-toutiao", "social"],
37
- ["social-kuaishou", "social"],
38
- ["email-imap", "email"],
39
- ["email-imap-qq", "email"],
40
- ["email-imap-gmail", "email"],
41
- ["alipay-bill", "shopping"],
42
- ["shopping-taobao", "shopping"],
43
- ["shopping-jd", "shopping"],
44
- ["shopping-meituan", "shopping"],
45
- ["shopping-pinduoduo", "shopping"],
46
- ["travel-12306", "travel"],
47
- ["travel-ctrip", "travel"],
48
- ["travel-amap", "travel"],
49
- ["travel-baidu-map", "travel"],
50
- ["travel-tencent-map", "travel"],
51
- ["system-data", "system"],
52
- ["system-data-android", "system"],
53
- ["browser-history-chrome", "system"],
54
- ["ai-chat-history", "ai-chat"],
55
- ["ai-chat-deepseek", "ai-chat"],
56
- ])("getCategory(%s) → %s", (adapter, cat) => {
57
- expect(getCategory(adapter)).toBe(cat);
58
- });
59
-
60
- it.each([
61
- ["unknown-adapter", "other"],
62
- ["", "other"],
63
- [null, "other"],
64
- [undefined, "other"],
65
- [123, "other"],
66
- ])("getCategory(%p) falls back to other", (adapter, expected) => {
67
- expect(getCategory(adapter)).toBe(expected);
68
- });
69
-
70
- it("groupByCategory groups multiple adapters and omits empty buckets", () => {
71
- const groups = groupByCategory([
72
- "wechat",
73
- "messaging-qq",
74
- "social-bilibili",
75
- "email-imap-qq",
76
- "unknown-x",
77
- ]);
78
- expect(groups).toEqual({
79
- chat: ["wechat", "messaging-qq"],
80
- social: ["social-bilibili"],
81
- email: ["email-imap-qq"],
82
- other: ["unknown-x"],
83
- });
84
- expect(groups.travel).toBeUndefined();
85
- });
86
-
87
- it("groupByCategory tolerates empty / nullish input", () => {
88
- expect(groupByCategory(null)).toEqual({});
89
- expect(groupByCategory(undefined)).toEqual({});
90
- expect(groupByCategory([])).toEqual({});
91
- });
92
- });
@@ -1,213 +0,0 @@
1
- "use strict";
2
-
3
- // E2E — Personal Data Hub cross-source journey including Phase 10.2 AIChat.
4
- //
5
- // User has:
6
- // 1. Two AI vendors with chat history (DeepSeek + Kimi)
7
- // 2. EntityResolver wires up vendor Persons as ai-agents
8
- // 3. Timeline + Relations skills weave AI conversations into the same
9
- // chronological story as other data sources (RAG-ready surface).
10
- //
11
- // Verifies the Phase 10.2 wiring through the entire stack — sync → vault
12
- // → KG/RAG sinks → analysis skills — using fixture HTTP (no live cookies).
13
-
14
- import { describe, it, expect, beforeEach, afterEach } from "vitest";
15
-
16
- const fs = require("node:fs");
17
- const path = require("node:path");
18
- const os = require("node:os");
19
-
20
- const {
21
- LocalVault, generateKeyHex, AdapterRegistry,
22
- EntityResolver,
23
- TimelineSkill, RelationsSkill,
24
- } = require("../../lib");
25
- const {
26
- AIChatHistoryAdapter, CookieAuthSession,
27
- } = require("../../lib/adapters/ai-chat-history");
28
-
29
/**
 * Build a minimal stand-in for a fetch response.
 *
 * @param {object} [options]
 * @param {number} [options.status=200] - Status code to report.
 * @param {*} [options.body={}] - Value that `json()` resolves with.
 * @returns {{status: number, ok: boolean, headers: {get: Function}, json: Function}}
 *   `ok` is true only for statuses in [200, 300); `headers.get()` always
 *   returns null; `json()` is async and resolves with `body`.
 */
function makeResponse(options = {}) {
  const { status = 200, body = {} } = options;
  const isSuccess = status >= 200 && status < 300;

  return {
    status,
    ok: isSuccess,
    headers: {
      get() {
        return null;
      },
    },
    async json() {
      return body;
    },
  };
}
37
-
38
/**
 * Build a fake `fetch` that answers from an ordered route table.
 *
 * @param {Array<[string|RegExp, object|Function]>} routes - `[pattern, response]`
 *   pairs, tried in order. A string pattern matches when the URL contains
 *   it; a RegExp pattern matches when it tests true against the URL. The
 *   response is returned as-is, or — when it is a function — called with the
 *   original `(url, init)` arguments and its result returned.
 * @returns {(url: string|URL, init?: object) => Promise<*>} Async fetch
 *   replacement. When no route matches it resolves with
 *   `makeResponse({ status: 404 })`.
 */
function makeRoutedFetch(routes) {
  return async (url, init) => {
    // Callers may pass a URL object instead of a string. Regex patterns
    // coerce it implicitly, but string patterns need `.includes`, so
    // normalize once and match both pattern kinds against the same text.
    const target = typeof url === "string" ? url : String(url);

    for (const [pattern, response] of routes) {
      let isMatch;
      if (typeof pattern === "string") {
        isMatch = target.includes(pattern);
      } else {
        // A /g or /y regex remembers `lastIndex` between `.test()` calls,
        // which would make the same URL miss on a later request. Reset it so
        // every request is matched from the start of the URL.
        if (pattern instanceof RegExp) pattern.lastIndex = 0;
        isMatch = pattern.test(target);
      }
      if (!isMatch) continue;

      // Handlers receive the caller's original arguments, not the normalized URL.
      return typeof response === "function" ? response(url, init) : response;
    }

    return makeResponse({ status: 404 });
  };
}
49
-
50
/**
 * Create a deterministic fake clock for tests.
 *
 * @returns {{now: () => number, sleep: (ms: number) => Promise<void>}}
 *   `now()` reports the current fake time, which starts at 1700000000000.
 *   `sleep(ms)` does not wait: it advances the fake time by `ms` and returns
 *   a promise.
 */
function makeClock() {
  let currentMs = 1700000000_000;

  const now = () => currentMs;
  const sleep = async (ms) => {
    currentMs += ms;
  };

  return { now, sleep };
}
54
-
55
// End-to-end suite: every test gets a fresh vault in its own temp directory,
// syncs the "ai-chat-history" adapter against canned HTTP routes, and then
// inspects the vault and the Timeline / Relations skills.
describe("E2E — Personal Data Hub cross-source journey with AIChat", () => {
  let workDir;
  let vault;
  let registry;
  let entityResolver;

  beforeEach(() => {
    workDir = fs.mkdtempSync(path.join(os.tmpdir(), "pdh-aichat-e2e-"));

    const dbPath = path.join(workDir, "v.db");
    vault = new LocalVault({ path: dbPath, key: generateKeyHex() });
    vault.open();

    entityResolver = new EntityResolver({ vault });
    registry = new AdapterRegistry({ vault, entityResolver });
  });

  afterEach(() => {
    // Best-effort cleanup: a failure to close or delete must not fail the test.
    try {
      vault.close();
    } catch (_e) {}
    try {
      fs.rmSync(workDir, { recursive: true, force: true });
    } catch (_e) {}
  });

  it("two AIChat vendors land in vault; TimelineSkill returns interleaved events", async () => {
    const clock = makeClock();

    // DeepSeek fixtures: one session holding a user/assistant exchange.
    const deepseekSessions = [
      { id: "ds-c1", title: "DeepSeek code review", model: "deepseek-r1", inserted_at: 1700000100, updated_at: 1700000200 },
    ];
    const deepseekMessages = [
      { id: "ds-m1", role: "USER", content: "explain this Go race condition", inserted_at: 1700000100 },
      { id: "ds-m2", role: "ASSISTANT", content: "The issue is the unlocked mutex...", inserted_at: 1700000150, model: "deepseek-r1" },
    ];
    // Route order matters (first match wins): the `before=` page route must
    // precede the plain fetch_page route.
    const deepseekRoutes = [
      ["/get_user_info", makeResponse({ body: { code: 0, data: { biz_data: { user_id: "ds-u1" } } } })],
      [/fetch_page.*before=/, makeResponse({ body: { data: { biz_data: { chat_sessions: [] } } } })],
      ["/chat_session/fetch_page", makeResponse({ body: { data: { biz_data: { chat_sessions: deepseekSessions } } } })],
      ["/chat/history_messages", makeResponse({ body: { data: { biz_data: { chat_messages: deepseekMessages } } } })],
    ];

    // Kimi fixtures: one conversation; messages are served only when the
    // scroll request body carries last === "0".
    const kimiConversations = [
      { id: "km-c1", name: "Kimi 200k context Q", created_at: 1700000300, updated_at: 1700000400 },
    ];
    const kimiMessages = [
      { id: "km-msg-1", role: "user", content: "summarize this paper", created_at: 1700000300 },
      { id: "km-msg-2", role: "assistant", content: "The paper proposes...", created_at: 1700000350 },
    ];
    const kimiRoutes = [
      ["/api/user", makeResponse({ body: { id: "km-u1" } })],
      [/list\?offset=30/, makeResponse({ body: { items: [], total: 1 } })],
      [/list\?offset=0/, makeResponse({ body: { items: kimiConversations, total: 1 } })],
      [/segment\/scroll/, async (_url, init) => {
        const isFirstPage = JSON.parse(init.body).last === "0";
        const items = isFirstPage ? kimiMessages : [];
        return makeResponse({ body: { items, has_more: false } });
      }],
    ];

    const routedFetch = makeRoutedFetch([...deepseekRoutes, ...kimiRoutes]);
    const adapter = new AIChatHistoryAdapter({ fetch: routedFetch, sleep: clock.sleep, now: clock.now });

    const vendorCookies = [
      ["deepseek", { name: "userToken", value: "ds-cookie" }],
      ["kimi", { name: "access_token", value: "km-cookie" }],
    ];
    for (const [vendor, cookie] of vendorCookies) {
      adapter.setSession(vendor, new CookieAuthSession({ vendor, cookies: [cookie] }));
    }
    registry.register(adapter);

    // ─── Sync ──────────────────────────────────────────────
    const report = await registry.syncAdapter("ai-chat-history");
    expect(report.status).toBe("ok");
    expect(report.invalidCount).toBe(0);
    expect(report.rawCount).toBeGreaterThanOrEqual(6); // 2 convs + 4 msgs

    // ─── Vault inspection ──────────────────────────────────
    const events = vault.queryEvents({ adapter: "ai-chat-history", limit: 100 });
    expect(events.length).toBe(4); // 2 deepseek msgs + 2 kimi msgs

    // Both vendors present
    const vendors = new Set();
    for (const event of events) {
      const vendor = event.extra && event.extra.vendor;
      if (vendor) vendors.add(vendor);
    }
    expect(vendors.has("deepseek")).toBe(true);
    expect(vendors.has("kimi")).toBe(true);

    // Vendor AI-agent Persons deduped
    const countRow = vault.db
      .prepare("SELECT COUNT(*) AS n FROM persons WHERE subtype = 'ai-agent'")
      .get();
    expect(countRow.n).toBe(2);

    // ─── TimelineSkill: events interleaved by time ─────────
    const timeline = new TimelineSkill({ vault });
    const window = { since: 1700000000_000, until: 1700001000_000, limit: 100 };
    const result = await timeline.run(window);
    expect(result.entries.length).toBeGreaterThanOrEqual(4);

    // Both vendors appear via the timeline entries (each entry references an event)
    const serializedEntries = result.entries.map((entry) => JSON.stringify(entry));
    const allText = serializedEntries.join(" ");
    expect(allText).toMatch(/Go race|race condition/);
    expect(allText).toMatch(/summarize this paper|paper proposes/);
  });

  it("RelationsSkill aggregates AI-agent interactions across vendors", async () => {
    const clock = makeClock();

    // Only DeepSeek is routed here: one session with three messages.
    const sessions = [
      { id: "ds-c1", title: "ds chat", model: "deepseek-r1", inserted_at: 1700000100, updated_at: 1700000200 },
    ];
    const messages = [
      { id: "ds-m1", role: "USER", content: "hi", inserted_at: 1700000100 },
      { id: "ds-m2", role: "ASSISTANT", content: "hi back", inserted_at: 1700000110 },
      { id: "ds-m3", role: "USER", content: "more questions", inserted_at: 1700000120 },
    ];
    const routedFetch = makeRoutedFetch([
      ["/get_user_info", makeResponse({ body: { code: 0, data: { biz_data: { user_id: "ds-u1" } } } })],
      [/fetch_page.*before=/, makeResponse({ body: { data: { biz_data: { chat_sessions: [] } } } })],
      ["/chat_session/fetch_page", makeResponse({ body: { data: { biz_data: { chat_sessions: sessions } } } })],
      ["/chat/history_messages", makeResponse({ body: { data: { biz_data: { chat_messages: messages } } } })],
    ]);

    const adapter = new AIChatHistoryAdapter({ fetch: routedFetch, sleep: clock.sleep, now: clock.now });
    const deepseekSession = new CookieAuthSession({ vendor: "deepseek", cookies: [] });
    adapter.setSession("deepseek", deepseekSession);
    registry.register(adapter);

    await registry.syncAdapter("ai-chat-history");

    const relations = new RelationsSkill({ vault });
    const outcome = await relations.run({ personId: "person-ai-deepseek" });
    expect(outcome.profile.totalInteractions).toBeGreaterThan(0);
  });

  it("AIChat + cookie-expired sentinel: partial success, journey continues", async () => {
    const clock = makeClock();

    // DeepSeek returns 401 (expired); Kimi works.
    const kimiConversations = [
      { id: "km-c1", name: "still works", created_at: 1700000300, updated_at: 1700000400 },
    ];
    const kimiMessages = [
      { id: "km-msg-1", role: "user", content: "hi kimi", created_at: 1700000300 },
    ];
    const routedFetch = makeRoutedFetch([
      [/chat_session\/fetch_page/, makeResponse({ status: 401 })],
      ["/api/user", makeResponse({ body: { id: "km-u1" } })],
      [/list\?offset=30/, makeResponse({ body: { items: [], total: 1 } })],
      [/list\?offset=0/, makeResponse({ body: { items: kimiConversations, total: 1 } })],
      [/segment\/scroll/, async (_url, init) => {
        const isFirstPage = JSON.parse(init.body).last === "0";
        const items = isFirstPage ? kimiMessages : [];
        return makeResponse({ body: { items, has_more: false } });
      }],
    ]);

    const adapter = new AIChatHistoryAdapter({ fetch: routedFetch, sleep: clock.sleep, now: clock.now });
    for (const vendor of ["deepseek", "kimi"]) {
      adapter.setSession(vendor, new CookieAuthSession({ vendor, cookies: [] }));
    }
    registry.register(adapter);

    const report = await registry.syncAdapter("ai-chat-history");
    expect(report.status).toBe("ok");

    // Kimi events landed even though DeepSeek failed.
    const allEvents = vault.queryEvents({ adapter: "ai-chat-history", limit: 100 });
    const kimiEvents = allEvents.filter((event) => event.extra && event.extra.vendor === "kimi");
    expect(kimiEvents.length).toBeGreaterThan(0);

    // Timeline still returns kimi event despite deepseek failure.
    const timeline = new TimelineSkill({ vault });
    const window = { since: 1700000000_000, until: 1700001000_000, limit: 100 };
    const result = await timeline.run(window);
    expect(result.entries.length).toBeGreaterThan(0);
  });
});