@chainlesschain/personal-data-hub 0.4.28 → 0.4.30

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (204)
  1. package/README.md +13 -5
  2. package/lib/adapters/social-douyin-adb/usage-profile-reader.js +253 -0
  3. package/lib/adapters/social-douyin-adb/watch-history-reader.js +104 -31
  4. package/lib/adapters/social-toutiao-adb/article-reader.js +202 -0
  5. package/lib/analysis-skills/overview.js +24 -4
  6. package/lib/analysis-skills/spending.js +63 -2
  7. package/lib/analysis-skills/timeline.js +11 -6
  8. package/lib/prompt-builder.js +15 -1
  9. package/lib/query-parser.js +38 -8
  10. package/package.json +4 -1
  11. package/__tests__/adapter-guide.test.js +0 -47
  12. package/__tests__/adapter-spec.test.js +0 -78
  13. package/__tests__/adapters/ai-chat-cookie-capture-spec.test.js +0 -211
  14. package/__tests__/adapters/ai-chat-health-checker.test.js +0 -262
  15. package/__tests__/adapters/ai-chat-history.test.js +0 -396
  16. package/__tests__/adapters/ai-chat-http-client.test.js +0 -242
  17. package/__tests__/adapters/ai-chat-vendors.test.js +0 -874
  18. package/__tests__/adapters/alipay-bill-adapter.test.js +0 -538
  19. package/__tests__/adapters/apple-health.test.js +0 -95
  20. package/__tests__/adapters/bank-family.test.js +0 -125
  21. package/__tests__/adapters/biz-tianyancha.test.js +0 -159
  22. package/__tests__/adapters/browser-history-chrome.test.js +0 -377
  23. package/__tests__/adapters/browser-history-edge.test.js +0 -159
  24. package/__tests__/adapters/car-mercedesme.test.js +0 -74
  25. package/__tests__/adapters/doc-baidu-netdisk.test.js +0 -102
  26. package/__tests__/adapters/doc-camscanner.test.js +0 -147
  27. package/__tests__/adapters/doc-platforms.test.js +0 -177
  28. package/__tests__/adapters/edu-huawei-learning-live.test.js +0 -198
  29. package/__tests__/adapters/edu-zuoyebang-live.test.js +0 -226
  30. package/__tests__/adapters/email-adapter-snapshot.test.js +0 -237
  31. package/__tests__/adapters/email-adapter.test.js +0 -742
  32. package/__tests__/adapters/email-classifier.test.js +0 -347
  33. package/__tests__/adapters/email-imap-session.test.js +0 -334
  34. package/__tests__/adapters/email-parser.test.js +0 -244
  35. package/__tests__/adapters/email-pdf-extractor.test.js +0 -529
  36. package/__tests__/adapters/email-providers.test.js +0 -84
  37. package/__tests__/adapters/email-retry-progress.test.js +0 -294
  38. package/__tests__/adapters/email-templates.test.js +0 -822
  39. package/__tests__/adapters/family-23-collectors-scaffold.test.js +0 -182
  40. package/__tests__/adapters/finance-alipay-live.test.js +0 -258
  41. package/__tests__/adapters/finance-dcep.test.js +0 -74
  42. package/__tests__/adapters/fitness-joyrun.test.js +0 -82
  43. package/__tests__/adapters/game-genshin-live.test.js +0 -238
  44. package/__tests__/adapters/game-genshin-scaffold.test.js +0 -108
  45. package/__tests__/adapters/game-honor-of-kings-live.test.js +0 -230
  46. package/__tests__/adapters/git-activity.test.js +0 -222
  47. package/__tests__/adapters/gov-12123.test.js +0 -103
  48. package/__tests__/adapters/gov-ixiamen.test.js +0 -150
  49. package/__tests__/adapters/gov-tax.test.js +0 -135
  50. package/__tests__/adapters/health-meiyou.test.js +0 -125
  51. package/__tests__/adapters/local-files.test.js +0 -264
  52. package/__tests__/adapters/local-im-pc.test.js +0 -154
  53. package/__tests__/adapters/messaging-whatsapp.test.js +0 -289
  54. package/__tests__/adapters/music-kugou.test.js +0 -187
  55. package/__tests__/adapters/music-qq.test.js +0 -112
  56. package/__tests__/adapters/netease-music-live.test.js +0 -244
  57. package/__tests__/adapters/netease-music.test.js +0 -74
  58. package/__tests__/adapters/pc-local-discovery.test.js +0 -141
  59. package/__tests__/adapters/qq-pc-direct-read.test.js +0 -227
  60. package/__tests__/adapters/reading-family.test.js +0 -108
  61. package/__tests__/adapters/recruit-boss.test.js +0 -180
  62. package/__tests__/adapters/shell-history.test.js +0 -180
  63. package/__tests__/adapters/shopping-base.test.js +0 -179
  64. package/__tests__/adapters/shopping-dianping.test.js +0 -239
  65. package/__tests__/adapters/social-bilibili-adb-api-client.test.js +0 -721
  66. package/__tests__/adapters/social-bilibili-adb-chromium-cookies-reader.test.js +0 -346
  67. package/__tests__/adapters/social-bilibili-adb-collector.test.js +0 -284
  68. package/__tests__/adapters/social-bilibili-adb-cookies-extension.test.js +0 -343
  69. package/__tests__/adapters/social-bilibili-adb-snapshot-builder.test.js +0 -296
  70. package/__tests__/adapters/social-csdn.test.js +0 -175
  71. package/__tests__/adapters/social-dongchedi.test.js +0 -165
  72. package/__tests__/adapters/social-douyin-adb-aweme-detail.test.js +0 -165
  73. package/__tests__/adapters/social-douyin-adb-collector.test.js +0 -254
  74. package/__tests__/adapters/social-douyin-adb-db-extension.test.js +0 -114
  75. package/__tests__/adapters/social-douyin-adb-im-db-parser.test.js +0 -304
  76. package/__tests__/adapters/social-douyin-adb-snapshot-builder.test.js +0 -216
  77. package/__tests__/adapters/social-douyin-adb-watch-history.test.js +0 -192
  78. package/__tests__/adapters/social-kuaishou-adb-api-client.test.js +0 -496
  79. package/__tests__/adapters/social-kuaishou-adb-collector.test.js +0 -276
  80. package/__tests__/adapters/social-kuaishou-adb-cookies-extension.test.js +0 -152
  81. package/__tests__/adapters/social-kuaishou-adb-snapshot-builder.test.js +0 -178
  82. package/__tests__/adapters/social-toutiao-adb-account-reader.test.js +0 -135
  83. package/__tests__/adapters/social-toutiao-adb-api-client.test.js +0 -626
  84. package/__tests__/adapters/social-toutiao-adb-collector.test.js +0 -378
  85. package/__tests__/adapters/social-toutiao-adb-cookies-extension.test.js +0 -193
  86. package/__tests__/adapters/social-toutiao-adb-snapshot-builder.test.js +0 -196
  87. package/__tests__/adapters/social-toutiao-kuaishou-scaffold.test.js +0 -311
  88. package/__tests__/adapters/social-weibo-adb-api-client.test.js +0 -362
  89. package/__tests__/adapters/social-weibo-adb-collector.test.js +0 -201
  90. package/__tests__/adapters/social-weibo-adb-cookies-extension.test.js +0 -167
  91. package/__tests__/adapters/social-weibo-adb-snapshot-builder.test.js +0 -189
  92. package/__tests__/adapters/social-xiaohongshu-adb-api-client.test.js +0 -431
  93. package/__tests__/adapters/social-xiaohongshu-adb-collector.test.js +0 -207
  94. package/__tests__/adapters/social-xiaohongshu-adb-cookies-extension.test.js +0 -0
  95. package/__tests__/adapters/social-xiaohongshu-adb-sign-provider-injection.test.js +0 -351
  96. package/__tests__/adapters/social-xiaohongshu-adb-sign.test.js +0 -130
  97. package/__tests__/adapters/social-xiaohongshu-adb-snapshot-builder.test.js +0 -200
  98. package/__tests__/adapters/social-zhihu.test.js +0 -246
  99. package/__tests__/adapters/system-data-adapter.test.js +0 -443
  100. package/__tests__/adapters/system-data-android-ingest.test.js +0 -144
  101. package/__tests__/adapters/system-data-android.test.js +0 -519
  102. package/__tests__/adapters/system-data-disclosure.test.js +0 -153
  103. package/__tests__/adapters/travel-12306.test.js +0 -512
  104. package/__tests__/adapters/travel-amap.test.js +0 -219
  105. package/__tests__/adapters/travel-baidu-map.test.js +0 -305
  106. package/__tests__/adapters/travel-base.test.js +0 -205
  107. package/__tests__/adapters/travel-ctrip.test.js +0 -377
  108. package/__tests__/adapters/travel-didi-consumer.test.js +0 -66
  109. package/__tests__/adapters/travel-didi.test.js +0 -204
  110. package/__tests__/adapters/travel-tencent-map.test.js +0 -207
  111. package/__tests__/adapters/travel-tongcheng.test.js +0 -289
  112. package/__tests__/adapters/video-platforms.test.js +0 -152
  113. package/__tests__/adapters/video-xigua.test.js +0 -106
  114. package/__tests__/adapters/vscode.test.js +0 -299
  115. package/__tests__/adapters/wechat-bootstrap.test.js +0 -240
  116. package/__tests__/adapters/wechat-env-probe.test.js +0 -162
  117. package/__tests__/adapters/wechat-frida-agent.test.js +0 -322
  118. package/__tests__/adapters/wechat-frida-integration.test.js +0 -149
  119. package/__tests__/adapters/wechat-frida-key-provider.test.js +0 -188
  120. package/__tests__/adapters/wechat-md5-key-provider.test.js +0 -101
  121. package/__tests__/adapters/wechat-pc-direct-read.test.js +0 -365
  122. package/__tests__/adapters/wechat-pc-group-topic.test.js +0 -63
  123. package/__tests__/adapters/wechat-pc-v4-sidecar.test.js +0 -72
  124. package/__tests__/adapters/weread.test.js +0 -123
  125. package/__tests__/adapters/wework-pc.test.js +0 -124
  126. package/__tests__/adapters/win-recent.test.js +0 -192
  127. package/__tests__/analysis-skills.test.js +0 -679
  128. package/__tests__/analysis.test.js +0 -1845
  129. package/__tests__/audio-ximalaya-snapshot.test.js +0 -279
  130. package/__tests__/batch.test.js +0 -133
  131. package/__tests__/bridges-cc-kg.test.js +0 -231
  132. package/__tests__/bridges-cc-llm.test.js +0 -191
  133. package/__tests__/bridges-cc-rag.test.js +0 -162
  134. package/__tests__/categories.test.js +0 -92
  135. package/__tests__/e2e/ai-chat-cross-source-journey.test.js +0 -213
  136. package/__tests__/e2e/full-user-journey.test.js +0 -188
  137. package/__tests__/e2e/local-data-adapters-cli.e2e.test.js +0 -146
  138. package/__tests__/entity-resolver-ingest-hook.test.js +0 -177
  139. package/__tests__/entity-resolver-stages.test.js +0 -411
  140. package/__tests__/entity-resolver-vault.test.js +0 -249
  141. package/__tests__/entity-resolver.test.js +0 -526
  142. package/__tests__/fitness-keep-snapshot.test.js +0 -224
  143. package/__tests__/fixtures/entity-resolver-200-mock.json +0 -96
  144. package/__tests__/ids.test.js +0 -45
  145. package/__tests__/integration/ai-chat-history-registry.test.js +0 -228
  146. package/__tests__/integration/aichat-wizard-end-to-end.test.js +0 -282
  147. package/__tests__/integration/cross-adapter-pipelines.test.js +0 -396
  148. package/__tests__/integration/local-data-adapters-pipeline.test.js +0 -373
  149. package/__tests__/integration/social-bilibili-pipeline.test.js +0 -261
  150. package/__tests__/integration/wechat-bootstrap-end-to-end.test.js +0 -390
  151. package/__tests__/key-providers.test.js +0 -126
  152. package/__tests__/kg-derive.test.js +0 -219
  153. package/__tests__/llm-client.test.js +0 -122
  154. package/__tests__/longtail-adapters.test.js +0 -281
  155. package/__tests__/messaging-qq-snapshot.test.js +0 -294
  156. package/__tests__/mobile-extractor-encrypted.test.js +0 -460
  157. package/__tests__/mobile-extractor.test.js +0 -288
  158. package/__tests__/mock-adapter.test.js +0 -93
  159. package/__tests__/prompt-builder.test.js +0 -249
  160. package/__tests__/query-parser.test.js +0 -302
  161. package/__tests__/rag-derive.test.js +0 -169
  162. package/__tests__/registry-readiness.test.js +0 -292
  163. package/__tests__/registry.test.js +0 -420
  164. package/__tests__/salvage-ingest.test.js +0 -97
  165. package/__tests__/schemas.test.js +0 -331
  166. package/__tests__/shopping-adapters.test.js +0 -392
  167. package/__tests__/shopping-eleme-snapshot.test.js +0 -454
  168. package/__tests__/shopping-pinduoduo-snapshot.test.js +0 -484
  169. package/__tests__/shopping-snapshot.test.js +0 -438
  170. package/__tests__/shopping-vipshop-snapshot.test.js +0 -425
  171. package/__tests__/shopping-xianyu-snapshot.test.js +0 -451
  172. package/__tests__/sidecar-contacts-cross-validate.test.js +0 -186
  173. package/__tests__/sidecar-supervisor.test.js +0 -128
  174. package/__tests__/sign-providers.test.js +0 -62
  175. package/__tests__/social-adapters.test.js +0 -280
  176. package/__tests__/social-bilibili-snapshot.test.js +0 -278
  177. package/__tests__/social-douban-snapshot.test.js +0 -351
  178. package/__tests__/social-douyin-im-direct-read.test.js +0 -377
  179. package/__tests__/social-douyin-salvage-collector.test.js +0 -98
  180. package/__tests__/social-douyin-salvage-mapper.test.js +0 -90
  181. package/__tests__/social-douyin-snapshot.test.js +0 -256
  182. package/__tests__/social-kuaishou-snapshot.test.js +0 -362
  183. package/__tests__/social-toutiao-snapshot.test.js +0 -366
  184. package/__tests__/social-weibo-snapshot.test.js +0 -234
  185. package/__tests__/social-weibo-sqlite-device.test.js +0 -174
  186. package/__tests__/social-xiaohongshu-snapshot.test.js +0 -232
  187. package/__tests__/sqlite-leaf-salvage.test.js +0 -97
  188. package/__tests__/travel-adapters.test.js +0 -483
  189. package/__tests__/travel-maps-snapshot.test.js +0 -426
  190. package/__tests__/vault-driver-error.test.js +0 -74
  191. package/__tests__/vault-search-helpers.test.js +0 -104
  192. package/__tests__/vault-search.test.js +0 -423
  193. package/__tests__/vault.test.js +0 -767
  194. package/__tests__/wechat-adapter.test.js +0 -594
  195. package/__tests__/whatsapp-adapter.test.js +0 -138
  196. package/scripts/_make-fixture-all.js +0 -126
  197. package/scripts/_make-fixture-contacts.js +0 -84
  198. package/scripts/evaluate-entity-resolver.js +0 -213
  199. package/scripts/run-native-tests-sandbox.sh +0 -55
  200. package/scripts/smoke-phase-5-5.js +0 -196
  201. package/scripts/smoke-phase-5-7.js +0 -181
  202. package/scripts/smoke-system-data-contacts.js +0 -309
  203. package/scripts/smoke-system-data.js +0 -312
  204. package/vitest.config.js +0 -88
@@ -1,302 +0,0 @@
1
- "use strict";
2
-
3
- import { describe, it, expect } from "vitest";
4
-
5
- const {
6
- parseQuery,
7
- parseTimeWindow,
8
- parseFilters,
9
- parseIntent,
10
- parseEntityFocus,
11
- extractEntityTerm,
12
- extractPersonNameCandidate,
13
- } = require("../lib/query-parser");
14
-
15
- // Pin "now" to 2026-05-19 12:00:00 UTC for deterministic windows
16
- const NOW = new Date("2026-05-19T12:00:00Z").getTime();
17
-
18
- describe("parseTimeWindow", () => {
19
- it("今天 → start of today through end of today", () => {
20
- const w = parseTimeWindow("我今天花了多少?", NOW);
21
- expect(w).not.toBeNull();
22
- const startOfDay = new Date(NOW);
23
- startOfDay.setHours(0, 0, 0, 0);
24
- expect(w.since).toBe(startOfDay.getTime());
25
- expect(w.until).toBe(startOfDay.getTime() + 86_400_000 - 1);
26
- });
27
-
28
- it("昨天 → start of yesterday through end of yesterday", () => {
29
- const w = parseTimeWindow("昨天的订单", NOW);
30
- expect(w).not.toBeNull();
31
- expect(w.until - w.since).toBe(86_400_000 - 1);
32
- });
33
-
34
- it("上个月 → full previous calendar month", () => {
35
- const w = parseTimeWindow("上个月支出", NOW);
36
- expect(w).not.toBeNull();
37
- // NOW is 2026-05-19; previous month = 2026-04
38
- const apr1 = new Date(2026, 3, 1).getTime();
39
- const may1 = new Date(2026, 4, 1).getTime();
40
- expect(w.since).toBe(apr1);
41
- expect(w.until).toBe(may1 - 1);
42
- });
43
-
44
- it("本月 → current calendar month", () => {
45
- const w = parseTimeWindow("本月开销", NOW);
46
- expect(w).not.toBeNull();
47
- expect(w.since).toBe(new Date(2026, 4, 1).getTime());
48
- expect(w.until).toBe(new Date(2026, 5, 1).getTime() - 1);
49
- });
50
-
51
- it("去年 → full previous calendar year", () => {
52
- const w = parseTimeWindow("去年我去过哪些地方", NOW);
53
- expect(w.since).toBe(new Date(2025, 0, 1).getTime());
54
- expect(w.until).toBe(new Date(2025, 11, 1).getTime() + 31 * 86_400_000 - 1);
55
- });
56
-
57
- it("最近 30 天 → past 30-day window ending now", () => {
58
- const w = parseTimeWindow("最近 30 天聊过什么", NOW);
59
- expect(w.until).toBe(NOW);
60
- expect(NOW - w.since).toBe(30 * 86_400_000);
61
- });
62
-
63
- it("最近 N 周 / 最近 N 个月 patterns work", () => {
64
- const week = parseTimeWindow("最近 2 周", NOW);
65
- expect(NOW - week.since).toBe(14 * 86_400_000);
66
-
67
- const months = parseTimeWindow("最近 3 个月", NOW);
68
- expect(months.until).toBe(NOW);
69
- expect(months.since).toBeLessThan(NOW);
70
- });
71
-
72
- it("YYYY 年 M 月 → that calendar month", () => {
73
- const w = parseTimeWindow("2024 年 7 月在淘宝下过几单", NOW);
74
- expect(w.since).toBe(new Date(2024, 6, 1).getTime());
75
- expect(w.until).toBe(new Date(2024, 7, 1).getTime() - 1);
76
- });
77
-
78
- it("returns null for question without time clue", () => {
79
- expect(parseTimeWindow("妈妈手机号是多少", NOW)).toBeNull();
80
- });
81
-
82
- it("returns null for non-string input", () => {
83
- expect(parseTimeWindow(null)).toBeNull();
84
- expect(parseTimeWindow(undefined)).toBeNull();
85
- });
86
- });
87
-
88
- describe("parseFilters", () => {
89
- it("identifies subtype via keywords (Chinese + English)", () => {
90
- expect(parseFilters("今年在淘宝下了多少单").subtype).toBe("order");
91
- expect(parseFilters("上个月总共花了多少").subtype).toBe("payment");
92
- expect(parseFilters("转给妈妈多少钱").subtype).toBe("transfer");
93
- expect(parseFilters("我今年的收入").subtype).toBe("income");
94
- expect(parseFilters("我跟妈妈聊了什么").subtype).toBe("message");
95
- expect(parseFilters("我朋友圈发了啥").subtype).toBe("post");
96
- });
97
-
98
- it("identifies adapter via keywords (Chinese + English)", () => {
99
- expect(parseFilters("淘宝今年下了多少单").adapter).toBe("taobao");
100
- expect(parseFilters("支付宝账单").adapter).toBe("alipay-bill");
101
- expect(parseFilters("微信里我跟谁聊最多").adapter).toBe("wechat");
102
- expect(parseFilters("高德历史足迹").adapter).toBe("amap");
103
- expect(parseFilters("DeepSeek 我之前问过啥").adapter).toBe("ai-chat-history");
104
- });
105
-
106
- it("returns empty object when no clue", () => {
107
- expect(parseFilters("hello world")).toEqual({});
108
- });
109
- });
110
-
111
- describe("parseIntent", () => {
112
- it("sum-amount when 'total ... money' phrasing", () => {
113
- expect(parseIntent("上个月总共花了多少")).toBe("sum-amount");
114
- expect(parseIntent("我今年开销加起来")).toBe("sum-amount");
115
- });
116
-
117
- it("count when 'how many' phrasing", () => {
118
- expect(parseIntent("最近多少次跟妈妈聊过")).toBe("count");
119
- expect(parseIntent("我下了几单")).toBe("count");
120
- });
121
-
122
- it("latest when 'recent / latest'", () => {
123
- expect(parseIntent("最近一次转账")).toBe("latest");
124
- });
125
-
126
- it("list as default", () => {
127
- expect(parseIntent("妈妈的手机号")).toBe("list");
128
- });
129
- });
130
-
131
- describe("parseEntityFocus", () => {
132
- it("returns 'persons' for 联系人 / 通讯录 phrasing", () => {
133
- expect(parseEntityFocus("我有哪些联系人")).toBe("persons");
134
- expect(parseEntityFocus("通讯录里有多少人")).toBe("persons");
135
- expect(parseEntityFocus("好友列表谁是张三")).toBe("persons");
136
- });
137
-
138
- it("returns 'persons' for phone-number phrasing", () => {
139
- expect(parseEntityFocus("妈手机号是多少")).toBe("persons");
140
- expect(parseEntityFocus("王医生的电话号码")).toBe("persons");
141
- expect(parseEntityFocus("show me my contacts")).toBe("persons");
142
- });
143
-
144
- it("returns 'items' for installed-app phrasing", () => {
145
- expect(parseEntityFocus("我装了哪些 app")).toBe("items");
146
- expect(parseEntityFocus("有哪些游戏")).toBe("items");
147
- expect(parseEntityFocus("installed apps")).toBe("items");
148
- });
149
-
150
- it("returns null when no focus signal", () => {
151
- expect(parseEntityFocus("上个月在淘宝花了多少")).toBeNull();
152
- expect(parseEntityFocus("最近的订单")).toBeNull();
153
- expect(parseEntityFocus("hello")).toBeNull();
154
- });
155
-
156
- it("returns null for non-string / empty input", () => {
157
- expect(parseEntityFocus("")).toBeNull();
158
- expect(parseEntityFocus(null)).toBeNull();
159
- expect(parseEntityFocus(undefined)).toBeNull();
160
- });
161
- });
162
-
163
- describe("parseQuery (integration)", () => {
164
- it("full parse for spending question", () => {
165
- const r = parseQuery("上个月在淘宝总共花了多少钱?", { now: NOW });
166
- expect(r.timeWindow.since).toBe(new Date(2026, 3, 1).getTime());
167
- expect(r.filters.subtype).toBe("payment");
168
- expect(r.filters.adapter).toBe("taobao");
169
- expect(r.intent).toBe("sum-amount");
170
- expect(r.entityFocus).toBeNull();
171
- });
172
-
173
- it("contact question carries entityFocus=persons", () => {
174
- const r = parseQuery("我有哪些联系人", { now: NOW });
175
- expect(r.entityFocus).toBe("persons");
176
- expect(r.intent).toBe("list");
177
- });
178
-
179
- it("full parse for footprint question", () => {
180
- const r = parseQuery("去年我在高德上去过哪些地方", { now: NOW });
181
- expect(r.timeWindow.since).toBe(new Date(2025, 0, 1).getTime());
182
- expect(r.filters.adapter).toBe("amap");
183
- expect(r.intent).toBe("list");
184
- });
185
-
186
- it("non-string question returns empty raw + nulls", () => {
187
- const r = parseQuery(undefined);
188
- expect(r.raw).toBe("");
189
- expect(r.timeWindow).toBeNull();
190
- expect(r.filters).toEqual({});
191
- });
192
- });
193
-
194
- // ─── extractEntityTerm — FTS5 fulltext routing helper ───────────────────
195
- //
196
- // 2026-05-24 — Powers AnalysisEngine._gatherFacts intent=list augmentation:
197
- // when the parser pulls a probable entity-name out of the question, the
198
- // engine appends vault.searchEvents(q=term) hits to the FACTS pool. Wrong
199
- // extractions are intentionally non-fatal — they waste a few rows of
200
- // budget at worst, never lose existing events. Memory:
201
- // pdh_analysis_engine_intent_routing.md.
202
-
203
- describe("extractEntityTerm", () => {
204
- it("extracts named entity from '提到 X 的消息' phrasing", () => {
205
- expect(extractEntityTerm("提到王老板的消息")).toBe("王老板");
206
- });
207
-
208
- it("returns null when only stop-words remain (no entity hint)", () => {
209
- expect(extractEntityTerm("上个月在淘宝总共花了多少?")).toBeNull();
210
- expect(extractEntityTerm("在淘宝买了什么")).toBeNull();
211
- });
212
-
213
- it("picks the longest remaining chunk when several survive cleaning", () => {
214
- // 苹果(2) vs 订单(stop) — only 苹果 left.
215
- expect(extractEntityTerm("苹果的订单")).toBe("苹果");
216
- });
217
-
218
- it("strips list/search trigger words ('提到', '查找', '看一下')", () => {
219
- expect(extractEntityTerm("查找王医生的订单")).toBe("王医生");
220
- expect(extractEntityTerm("看一下王医生的最新消息")).toBe("王医生");
221
- });
222
-
223
- it("strips compound subtype keywords before shorter intent forms", () => {
224
- // "多少钱" must clear before "多少" leaves stranded "钱". With clean
225
- // stripping there is no leftover ≥2 char chunk → null.
226
- expect(extractEntityTerm("我总共花了多少钱")).toBeNull();
227
- });
228
-
229
- it("ignores single-character residues (verbs leak through; 1-char names skipped first-pass)", () => {
230
- // "我妈" → "我" stripped (pronoun), "妈" left as single char → filtered.
231
- // Documented limitation; first-pass tradeoff for higher precision.
232
- expect(extractEntityTerm("我妈最近发的微信")).toBeNull();
233
- });
234
-
235
- it("handles ASCII entity tokens (≥2 chars)", () => {
236
- expect(extractEntityTerm("提到 GitHub 的消息")).toBe("GitHub");
237
- });
238
-
239
- it("returns null for non-string / empty input", () => {
240
- expect(extractEntityTerm("")).toBeNull();
241
- expect(extractEntityTerm(null)).toBeNull();
242
- expect(extractEntityTerm(undefined)).toBeNull();
243
- expect(extractEntityTerm(123)).toBeNull();
244
- });
245
-
246
- it("does not pick adapter keywords as the entity (handled by filters)", () => {
247
- // "淘宝" 是 adapter,会被 parseFilters 抽走当 q.adapter;不该再被
248
- // 当实体名重复 FTS 搜。
249
- expect(extractEntityTerm("看下淘宝的订单")).toBeNull();
250
- });
251
-
252
- it("> 10 char tokens are dropped (probable concatenated noise)", () => {
253
- // 拼出一个 12 char ASCII token,期望被 length 上限过滤掉
254
- const r = extractEntityTerm("提到 abcdefghijkl 的消息");
255
- expect(r).toBeNull();
256
- });
257
- });
258
-
259
- // ─── extractPersonNameCandidate — persons-branch name search ─────────────
260
- //
261
- // 2026-05-27 — Powers AnalysisEngine entityFocus=persons name-search
262
- // short-circuit. Differs from extractEntityTerm in two ways: strips
263
- // person-FOCUS framing words first (联系人/手机号/etc.) and allows
264
- // single-char Chinese names from a relation whitelist (妈/爸/姐/...).
265
-
266
- describe("extractPersonNameCandidate", () => {
267
- it("extracts multi-char name when present", () => {
268
- expect(extractPersonNameCandidate("张三的电话号码")).toBe("张三");
269
- expect(extractPersonNameCandidate("王医生手机号是多少")).toBe("王医生");
270
- });
271
-
272
- it("falls back to single-char relation word ('妈', '爸', '姐')", () => {
273
- expect(extractPersonNameCandidate("妈手机号是多少")).toBe("妈");
274
- expect(extractPersonNameCandidate("爸的电话")).toBe("爸");
275
- expect(extractPersonNameCandidate("姐姐的号码")).toBe("姐姐");
276
- });
277
-
278
- it("multi-char wins over single-char fallback", () => {
279
- // "王医生" (3 char) preferred over leaked single "医" / "生".
280
- expect(extractPersonNameCandidate("王医生的手机号")).toBe("王医生");
281
- });
282
-
283
- it("returns null when no name candidate (pure framing)", () => {
284
- expect(extractPersonNameCandidate("我有哪些联系人")).toBeNull();
285
- expect(extractPersonNameCandidate("通讯录里有多少人")).toBeNull();
286
- });
287
-
288
- it("ignores single-char Chinese outside the relation whitelist", () => {
289
- // "说" / "看" are not relation chars — should NOT slip through as names.
290
- expect(extractPersonNameCandidate("说手机号")).toBeNull();
291
- });
292
-
293
- it("returns null for non-string / empty input", () => {
294
- expect(extractPersonNameCandidate("")).toBeNull();
295
- expect(extractPersonNameCandidate(null)).toBeNull();
296
- expect(extractPersonNameCandidate(undefined)).toBeNull();
297
- });
298
-
299
- it("handles ASCII names ≥2 chars", () => {
300
- expect(extractPersonNameCandidate("Alice 的电话号码")).toBe("Alice");
301
- });
302
- });
@@ -1,169 +0,0 @@
1
- "use strict";
2
-
3
- import { describe, it, expect } from "vitest";
4
-
5
- const {
6
- eventToRagDoc,
7
- personToRagDoc,
8
- placeToRagDoc,
9
- itemToRagDoc,
10
- topicToRagDoc,
11
- entityToRagDoc,
12
- deriveBatchDocs,
13
- } = require("../lib/rag-derive");
14
-
15
- const sourceOk = (adapter = "test") => ({
16
- adapter,
17
- adapterVersion: "0.1.0",
18
- capturedAt: 1700000000000,
19
- capturedBy: "api",
20
- originalId: "ord-42",
21
- });
22
-
23
- describe("eventToRagDoc", () => {
24
- it("includes title + text + amount + subtype + adapter prose", () => {
25
- const doc = eventToRagDoc({
26
- id: "e1",
27
- type: "event",
28
- subtype: "order",
29
- occurredAt: 1700000000000,
30
- ingestedAt: 1700000000001,
31
- content: {
32
- title: "妈妈生日蛋白粉",
33
- text: "送到妈妈家",
34
- amount: { value: 288.5, currency: "CNY", direction: "out" },
35
- },
36
- source: sourceOk("taobao"),
37
- });
38
- expect(doc.id).toBe("e1");
39
- expect(doc.type).toBe("event");
40
- expect(doc.text).toContain("妈妈生日蛋白粉");
41
- expect(doc.text).toContain("送到妈妈家");
42
- expect(doc.text).toContain("-288.5 CNY");
43
- expect(doc.text).toContain("type: order");
44
- expect(doc.text).toContain("from: taobao");
45
- expect(doc.metadata.subtype).toBe("order");
46
- expect(doc.metadata.adapter).toBe("taobao");
47
- expect(doc.metadata.originalId).toBe("ord-42");
48
- expect(doc.metadata.occurredAt).toBe(1700000000000);
49
- });
50
-
51
- it("'in' direction renders with '+' sign", () => {
52
- const doc = eventToRagDoc({
53
- id: "e",
54
- type: "event",
55
- subtype: "income",
56
- occurredAt: 1,
57
- ingestedAt: 1,
58
- content: { amount: { value: 5000, currency: "CNY", direction: "in" } },
59
- source: sourceOk(),
60
- });
61
- expect(doc.text).toContain("+5000 CNY");
62
- });
63
-
64
- it("propagates topics into metadata", () => {
65
- const doc = eventToRagDoc({
66
- id: "e",
67
- type: "event",
68
- subtype: "message",
69
- occurredAt: 1,
70
- ingestedAt: 1,
71
- content: { text: "hi" },
72
- source: sourceOk(),
73
- topics: ["topic-fam"],
74
- });
75
- expect(doc.metadata.topics).toEqual(["topic-fam"]);
76
- });
77
- });
78
-
79
- describe("personToRagDoc", () => {
80
- it("packs names + relation + identifiers into searchable text", () => {
81
- const doc = personToRagDoc({
82
- id: "p1",
83
- type: "person",
84
- subtype: "contact",
85
- names: ["妈妈", "陈某某"],
86
- relation: "母亲",
87
- identifiers: { phone: ["13800001111"], wechatId: "wxid_xyz" },
88
- ingestedAt: 1,
89
- source: sourceOk(),
90
- });
91
- expect(doc.text).toContain("妈妈");
92
- expect(doc.text).toContain("陈某某");
93
- expect(doc.text).toContain("relation: 母亲");
94
- expect(doc.text).toContain("13800001111");
95
- expect(doc.text).toContain("wechatId: wxid_xyz");
96
- expect(doc.metadata.subtype).toBe("contact");
97
- });
98
- });
99
-
100
- describe("placeToRagDoc", () => {
101
- it("emits name + alias dedup + address + category", () => {
102
- const doc = placeToRagDoc({
103
- id: "pl",
104
- type: "place",
105
- name: "妈妈家",
106
- aliases: ["妈妈家", "妈家"],
107
- address: "厦门思明区",
108
- category: "home",
109
- coordinates: { lat: 24.5, lng: 118.1 },
110
- ingestedAt: 1,
111
- source: sourceOk(),
112
- });
113
- expect(doc.text).toContain("妈妈家");
114
- expect(doc.text).toContain("妈家");
115
- expect(doc.text).toContain("厦门思明区");
116
- expect(doc.text).toContain("category: home");
117
- expect(doc.metadata.coordinates).toEqual({ lat: 24.5, lng: 118.1 });
118
- });
119
- });
120
-
121
- describe("itemToRagDoc", () => {
122
- it("includes price + category", () => {
123
- const doc = itemToRagDoc({
124
- id: "i",
125
- type: "item",
126
- subtype: "product",
127
- name: "蛋白粉",
128
- category: "保健品",
129
- price: { value: 288, currency: "CNY" },
130
- ingestedAt: 1,
131
- source: sourceOk(),
132
- });
133
- expect(doc.text).toContain("蛋白粉");
134
- expect(doc.text).toContain("category: 保健品");
135
- expect(doc.text).toContain("288 CNY");
136
- });
137
- });
138
-
139
- describe("topicToRagDoc + entityToRagDoc + deriveBatchDocs", () => {
140
- it("topic doc is its name", () => {
141
- const doc = topicToRagDoc({
142
- id: "t",
143
- type: "topic",
144
- name: "母亲健康",
145
- ingestedAt: 1,
146
- source: sourceOk(),
147
- });
148
- expect(doc.text).toBe("母亲健康");
149
- });
150
-
151
- it("entityToRagDoc returns null for unknown types", () => {
152
- expect(entityToRagDoc(null)).toBeNull();
153
- expect(entityToRagDoc({ type: "alien" })).toBeNull();
154
- });
155
-
156
- it("deriveBatchDocs filters empty-text entities", () => {
157
- const docs = deriveBatchDocs({
158
- events: [
159
- // empty text — should be filtered
160
- { id: "empty", type: "event", subtype: "message", occurredAt: 1, ingestedAt: 1, content: {}, source: { adapter: "x", adapterVersion: "0.1.0", capturedAt: 1, capturedBy: "api" } },
161
- // has text
162
- { id: "kept", type: "event", subtype: "message", occurredAt: 1, ingestedAt: 1, content: { text: "hi" }, source: { adapter: "x", adapterVersion: "0.1.0", capturedAt: 1, capturedBy: "api" } },
163
- ],
164
- });
165
- expect(docs.length).toBe(2); // 'empty' includes 'type: message' + 'from: x' so text is non-empty
166
- // Both have text because structural prose is added — verify text is non-empty for both
167
- expect(docs.every((d) => d.text.length > 0)).toBe(true);
168
- });
169
- });