@jackwener/opencli 1.6.1 → 1.6.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CONTRIBUTING.md +1 -1
- package/README.md +27 -45
- package/README.zh-CN.md +32 -34
- package/autoresearch/browse-tasks.json +18 -20
- package/autoresearch/commands/debug.ts +163 -0
- package/autoresearch/commands/fix.ts +145 -0
- package/autoresearch/commands/plan.ts +88 -0
- package/autoresearch/commands/run.ts +138 -0
- package/autoresearch/config.ts +82 -0
- package/autoresearch/engine.ts +359 -0
- package/autoresearch/eval-all.ts +127 -0
- package/autoresearch/eval-browse.ts +1 -1
- package/autoresearch/eval-publish.ts +238 -0
- package/autoresearch/eval-save.ts +249 -0
- package/autoresearch/eval-skill.ts +14 -8
- package/autoresearch/eval-v2ex.ts +220 -0
- package/autoresearch/eval-zhihu.ts +230 -0
- package/autoresearch/logger.ts +69 -0
- package/autoresearch/presets/combined-reliability.ts +27 -0
- package/autoresearch/presets/index.ts +23 -0
- package/autoresearch/presets/operate-reliability.ts +24 -0
- package/autoresearch/presets/save-reliability.ts +26 -0
- package/autoresearch/presets/skill-quality.ts +20 -0
- package/autoresearch/presets/v2ex-reliability.ts +24 -0
- package/autoresearch/presets/zhihu-reliability.ts +25 -0
- package/autoresearch/publish-tasks.json +345 -0
- package/autoresearch/run-save.sh +11 -0
- package/autoresearch/save-adapters/xhs-explore-deep.ts +64 -0
- package/autoresearch/save-adapters/xhs-note-comments.ts +61 -0
- package/autoresearch/save-adapters/xhs-search-full.ts +62 -0
- package/autoresearch/save-adapters/zhihu-hot-detail.ts +52 -0
- package/autoresearch/save-adapters/zhihu-question-full.ts +57 -0
- package/autoresearch/save-adapters/zhihu-search-detail.ts +53 -0
- package/autoresearch/save-tasks.json +281 -0
- package/autoresearch/v2ex-tasks.json +899 -0
- package/autoresearch/zhihu-tasks.json +848 -0
- package/dist/browser/base-page.d.ts +4 -2
- package/dist/browser/base-page.js +37 -4
- package/dist/browser/bridge.js +10 -8
- package/dist/browser/cdp.js +2 -6
- package/dist/browser/daemon-client.d.ts +11 -1
- package/dist/browser/daemon-client.js +3 -0
- package/dist/browser/dom-helpers.d.ts +4 -2
- package/dist/browser/dom-helpers.js +42 -31
- package/dist/browser/dom-snapshot.js +23 -1
- package/dist/browser/page.d.ts +7 -2
- package/dist/browser/page.js +112 -30
- package/dist/browser.test.js +1 -1
- package/dist/build-manifest.d.ts +1 -0
- package/dist/build-manifest.js +1 -0
- package/dist/cli-manifest.json +1135 -184
- package/dist/cli.d.ts +2 -0
- package/dist/cli.js +48 -7
- package/dist/cli.test.d.ts +1 -0
- package/dist/cli.test.js +88 -0
- package/dist/clis/1688/item.d.ts +70 -0
- package/dist/clis/1688/item.js +187 -0
- package/dist/clis/1688/item.test.d.ts +1 -0
- package/dist/clis/1688/item.test.js +67 -0
- package/dist/clis/1688/search.d.ts +56 -0
- package/dist/clis/1688/search.js +309 -0
- package/dist/clis/1688/search.test.d.ts +1 -0
- package/dist/clis/1688/search.test.js +75 -0
- package/dist/clis/1688/shared.d.ts +112 -0
- package/dist/clis/1688/shared.js +514 -0
- package/dist/clis/1688/shared.test.d.ts +1 -0
- package/dist/clis/1688/shared.test.js +57 -0
- package/dist/clis/1688/store.d.ts +45 -0
- package/dist/clis/1688/store.js +226 -0
- package/dist/clis/1688/store.test.d.ts +1 -0
- package/dist/clis/1688/store.test.js +62 -0
- package/dist/clis/amazon/bestsellers.d.ts +0 -20
- package/dist/clis/amazon/bestsellers.js +6 -129
- package/dist/clis/amazon/bestsellers.test.js +12 -3
- package/dist/clis/amazon/movers-shakers.d.ts +1 -0
- package/dist/clis/amazon/movers-shakers.js +7 -0
- package/dist/clis/amazon/new-releases.d.ts +1 -0
- package/dist/clis/amazon/new-releases.js +7 -0
- package/dist/clis/amazon/rankings.d.ts +59 -0
- package/dist/clis/amazon/rankings.js +226 -0
- package/dist/clis/amazon/rankings.test.d.ts +1 -0
- package/dist/clis/amazon/rankings.test.js +41 -0
- package/dist/clis/amazon/shared.d.ts +11 -0
- package/dist/clis/amazon/shared.js +121 -11
- package/dist/clis/amazon/shared.test.js +11 -0
- package/dist/clis/bilibili/comments.js +2 -2
- package/dist/clis/bilibili/comments.test.js +3 -2
- package/dist/clis/bilibili/download.js +2 -1
- package/dist/clis/bilibili/subtitle.js +4 -3
- package/dist/clis/bilibili/subtitle.test.js +2 -1
- package/dist/clis/bilibili/utils.d.ts +5 -0
- package/dist/clis/bilibili/utils.js +30 -0
- package/dist/clis/bilibili/utils.test.d.ts +1 -0
- package/dist/clis/bilibili/utils.test.js +17 -0
- package/dist/clis/douban/marks.js +1 -1
- package/dist/clis/douban/subject.yaml +50 -19
- package/dist/clis/doubao/utils.js +32 -12
- package/dist/clis/douyin/_shared/browser-fetch.test.js +0 -1
- package/dist/clis/douyin/_shared/transcode.test.js +0 -2
- package/dist/clis/douyin/draft.test.js +0 -2
- package/dist/clis/facebook/search.test.js +0 -2
- package/dist/clis/gemini/ask.js +9 -3
- package/dist/clis/gemini/ask.test.d.ts +1 -0
- package/dist/clis/gemini/ask.test.js +100 -0
- package/dist/clis/gemini/reply-state.test.d.ts +1 -0
- package/dist/clis/gemini/reply-state.test.js +641 -0
- package/dist/clis/gemini/utils.d.ts +44 -1
- package/dist/clis/gemini/utils.js +528 -61
- package/dist/clis/gemini/utils.test.js +149 -2
- package/dist/clis/hupu/detail.d.ts +1 -0
- package/dist/clis/hupu/detail.js +72 -0
- package/dist/clis/hupu/hot.yaml +43 -0
- package/dist/clis/hupu/like.d.ts +1 -0
- package/dist/clis/hupu/like.js +75 -0
- package/dist/clis/hupu/reply.d.ts +1 -0
- package/dist/clis/hupu/reply.js +71 -0
- package/dist/clis/hupu/search.d.ts +1 -0
- package/dist/clis/hupu/search.js +59 -0
- package/dist/clis/hupu/unlike.d.ts +1 -0
- package/dist/clis/hupu/unlike.js +75 -0
- package/dist/clis/hupu/utils.d.ts +20 -0
- package/dist/clis/hupu/utils.js +319 -0
- package/dist/clis/instagram/_shared/private-publish.d.ts +138 -0
- package/dist/clis/instagram/_shared/private-publish.js +1030 -0
- package/dist/clis/instagram/_shared/private-publish.test.d.ts +1 -0
- package/dist/clis/instagram/_shared/private-publish.test.js +705 -0
- package/dist/clis/instagram/_shared/protocol-capture.d.ts +26 -0
- package/dist/clis/instagram/_shared/protocol-capture.js +282 -0
- package/dist/clis/instagram/_shared/protocol-capture.test.d.ts +1 -0
- package/dist/clis/instagram/_shared/protocol-capture.test.js +114 -0
- package/dist/clis/instagram/_shared/runtime-info.d.ts +9 -0
- package/dist/clis/instagram/_shared/runtime-info.js +81 -0
- package/dist/clis/instagram/note.d.ts +1 -0
- package/dist/clis/instagram/note.js +222 -0
- package/dist/clis/instagram/note.test.d.ts +1 -0
- package/dist/clis/instagram/note.test.js +81 -0
- package/dist/clis/instagram/post.d.ts +4 -0
- package/dist/clis/instagram/post.js +1496 -0
- package/dist/clis/instagram/post.test.d.ts +1 -0
- package/dist/clis/instagram/post.test.js +1647 -0
- package/dist/clis/instagram/reel.d.ts +1 -0
- package/dist/clis/instagram/reel.js +826 -0
- package/dist/clis/instagram/reel.test.d.ts +1 -0
- package/dist/clis/instagram/reel.test.js +167 -0
- package/dist/clis/instagram/story.d.ts +1 -0
- package/dist/clis/instagram/story.js +115 -0
- package/dist/clis/instagram/story.test.d.ts +1 -0
- package/dist/clis/instagram/story.test.js +167 -0
- package/dist/clis/sinafinance/stock-rank.d.ts +4 -0
- package/dist/clis/sinafinance/stock-rank.js +65 -0
- package/dist/clis/substack/utils.test.js +0 -2
- package/dist/clis/twitter/post.js +72 -45
- package/dist/clis/twitter/post.test.d.ts +1 -0
- package/dist/clis/twitter/post.test.js +116 -0
- package/dist/clis/twitter/reply.d.ts +12 -0
- package/dist/clis/twitter/reply.js +257 -35
- package/dist/clis/twitter/reply.test.d.ts +1 -0
- package/dist/clis/twitter/reply.test.js +151 -0
- package/dist/clis/xianyu/chat.d.ts +7 -0
- package/dist/clis/xianyu/chat.js +146 -0
- package/dist/clis/xianyu/chat.test.d.ts +1 -0
- package/dist/clis/xianyu/chat.test.js +15 -0
- package/dist/clis/xianyu/item.d.ts +7 -0
- package/dist/clis/xianyu/item.js +152 -0
- package/dist/clis/xianyu/item.test.d.ts +1 -0
- package/dist/clis/xianyu/item.test.js +56 -0
- package/dist/clis/xianyu/search.d.ts +10 -0
- package/dist/clis/xianyu/search.js +134 -0
- package/dist/clis/xianyu/search.test.d.ts +1 -0
- package/dist/clis/xianyu/search.test.js +17 -0
- package/dist/clis/xianyu/utils.d.ts +1 -0
- package/dist/clis/xianyu/utils.js +8 -0
- package/dist/clis/xiaoe/catalog.yaml +129 -0
- package/dist/clis/xiaoe/content.yaml +43 -0
- package/dist/clis/xiaoe/courses.yaml +73 -0
- package/dist/clis/xiaoe/detail.yaml +39 -0
- package/dist/clis/xiaoe/play-url.yaml +124 -0
- package/dist/clis/xiaohongshu/comments.test.js +0 -2
- package/dist/clis/xiaohongshu/creator-note-detail.test.js +0 -2
- package/dist/clis/xiaohongshu/creator-notes.test.js +0 -2
- package/dist/clis/xiaohongshu/download.test.js +0 -2
- package/dist/clis/xiaohongshu/note.test.js +0 -2
- package/dist/clis/xiaohongshu/publish.test.js +0 -2
- package/dist/clis/xiaohongshu/search.js +29 -20
- package/dist/clis/xiaohongshu/search.test.js +56 -48
- package/dist/clis/yuanbao/ask.d.ts +21 -0
- package/dist/clis/yuanbao/ask.js +427 -0
- package/dist/clis/yuanbao/ask.test.d.ts +1 -0
- package/dist/clis/yuanbao/ask.test.js +124 -0
- package/dist/clis/yuanbao/new.d.ts +1 -0
- package/dist/clis/yuanbao/new.js +70 -0
- package/dist/clis/yuanbao/new.test.d.ts +1 -0
- package/dist/clis/yuanbao/new.test.js +30 -0
- package/dist/clis/yuanbao/shared.d.ts +13 -0
- package/dist/clis/yuanbao/shared.js +49 -0
- package/dist/clis/zhihu/question.js +30 -19
- package/dist/clis/zhihu/question.test.js +34 -16
- package/dist/commanderAdapter.js +8 -4
- package/dist/commanderAdapter.test.js +42 -0
- package/dist/completion.js +3 -1
- package/dist/completion.test.d.ts +1 -0
- package/dist/completion.test.js +23 -0
- package/dist/doctor.js +1 -1
- package/dist/electron-apps.d.ts +2 -0
- package/dist/electron-apps.js +7 -1
- package/dist/errors.js +1 -1
- package/dist/execution.js +25 -35
- package/dist/explore.js +1 -1
- package/dist/launcher.d.ts +4 -0
- package/dist/launcher.js +64 -8
- package/dist/launcher.test.js +88 -7
- package/dist/output.d.ts +2 -0
- package/dist/output.js +10 -1
- package/dist/output.test.d.ts +0 -3
- package/dist/output.test.js +59 -92
- package/dist/pipeline/executor.test.js +0 -2
- package/dist/pipeline/steps/download.test.js +0 -2
- package/dist/registry.d.ts +2 -0
- package/dist/serialization.d.ts +1 -0
- package/dist/serialization.js +1 -0
- package/dist/types.d.ts +9 -2
- package/docs/.vitepress/config.mts +4 -0
- package/docs/adapters/browser/1688.md +52 -0
- package/docs/adapters/browser/36kr.md +2 -1
- package/docs/adapters/browser/doubao.md +5 -1
- package/docs/adapters/browser/hupu.md +53 -0
- package/docs/adapters/browser/sinafinance.md +32 -2
- package/docs/adapters/browser/weibo.md +6 -1
- package/docs/adapters/browser/wikipedia.md +2 -0
- package/docs/adapters/browser/xianyu.md +42 -0
- package/docs/adapters/browser/xiaoe.md +44 -0
- package/docs/adapters/browser/yuanbao.md +64 -0
- package/docs/adapters/index.md +14 -5
- package/docs/comparison.md +1 -1
- package/docs/developer/ai-workflow.md +2 -2
- package/docs/developer/contributing.md +1 -1
- package/docs/developer/testing.md +2 -0
- package/docs/guide/plugins.md +1 -0
- package/docs/guide/troubleshooting.md +11 -0
- package/docs/superpowers/specs/2026-04-03-v2ex-autoresearch-design.md +41 -0
- package/docs/zh/guide/plugins.md +1 -0
- package/extension/dist/background.js +1127 -0
- package/extension/src/background.test.ts +39 -0
- package/extension/src/background.ts +223 -34
- package/extension/src/cdp.ts +194 -4
- package/extension/src/protocol.ts +22 -1
- package/package.json +3 -2
- package/scripts/postinstall.js +1 -1
- package/skills/opencli-explorer/SKILL.md +1 -1
- package/skills/opencli-oneshot/SKILL.md +2 -2
- package/skills/opencli-operate/SKILL.md +120 -27
- package/skills/opencli-usage/SKILL.md +31 -20
- package/skills/opencli-usage/browser.md +114 -16
- package/skills/opencli-usage/public-api.md +32 -3
- package/skills/smart-search/SKILL.md +156 -0
- package/skills/smart-search/references/sources-ai.md +74 -0
- package/skills/smart-search/references/sources-info.md +43 -0
- package/skills/smart-search/references/sources-media.md +50 -0
- package/skills/smart-search/references/sources-other.md +42 -0
- package/skills/smart-search/references/sources-shopping.md +31 -0
- package/skills/smart-search/references/sources-social.md +51 -0
- package/skills/smart-search/references/sources-tech.md +42 -0
- package/skills/smart-search/references/sources-travel.md +20 -0
- package/src/browser/base-page.ts +41 -6
- package/src/browser/bridge.ts +11 -8
- package/src/browser/cdp.ts +1 -8
- package/src/browser/daemon-client.ts +11 -1
- package/src/browser/dom-helpers.ts +43 -31
- package/src/browser/dom-snapshot.ts +23 -1
- package/src/browser/page.ts +115 -31
- package/src/browser.test.ts +1 -1
- package/src/build-manifest.ts +2 -0
- package/src/cli.test.ts +133 -0
- package/src/cli.ts +73 -11
- package/src/clis/1688/item.test.ts +69 -0
- package/src/clis/1688/item.ts +282 -0
- package/src/clis/1688/search.test.ts +81 -0
- package/src/clis/1688/search.ts +402 -0
- package/src/clis/1688/shared.test.ts +75 -0
- package/src/clis/1688/shared.ts +623 -0
- package/src/clis/1688/store.test.ts +69 -0
- package/src/clis/1688/store.ts +300 -0
- package/src/clis/amazon/bestsellers.test.ts +12 -3
- package/src/clis/amazon/bestsellers.ts +6 -178
- package/src/clis/amazon/movers-shakers.ts +8 -0
- package/src/clis/amazon/new-releases.ts +8 -0
- package/src/clis/amazon/rankings.test.ts +47 -0
- package/src/clis/amazon/rankings.ts +312 -0
- package/src/clis/amazon/shared.test.ts +16 -0
- package/src/clis/amazon/shared.ts +134 -12
- package/src/clis/bilibili/comments.test.ts +4 -3
- package/src/clis/bilibili/comments.ts +2 -2
- package/src/clis/bilibili/download.ts +2 -1
- package/src/clis/bilibili/subtitle.test.ts +2 -1
- package/src/clis/bilibili/subtitle.ts +4 -3
- package/src/clis/bilibili/utils.test.ts +21 -0
- package/src/clis/bilibili/utils.ts +27 -0
- package/src/clis/douban/marks.ts +1 -1
- package/src/clis/douban/subject.yaml +50 -19
- package/src/clis/doubao/utils.ts +32 -12
- package/src/clis/douyin/_shared/browser-fetch.test.ts +0 -1
- package/src/clis/douyin/_shared/transcode.test.ts +0 -2
- package/src/clis/douyin/draft.test.ts +0 -2
- package/src/clis/facebook/search.test.ts +0 -2
- package/src/clis/gemini/ask.test.ts +116 -0
- package/src/clis/gemini/ask.ts +10 -3
- package/src/clis/gemini/reply-state.test.ts +708 -0
- package/src/clis/gemini/utils.test.ts +184 -2
- package/src/clis/gemini/utils.ts +588 -60
- package/src/clis/hupu/detail.ts +126 -0
- package/src/clis/hupu/hot.yaml +43 -0
- package/src/clis/hupu/like.ts +76 -0
- package/src/clis/hupu/reply.ts +76 -0
- package/src/clis/hupu/search.ts +95 -0
- package/src/clis/hupu/unlike.ts +76 -0
- package/src/clis/hupu/utils.ts +381 -0
- package/src/clis/instagram/_shared/private-publish.test.ts +827 -0
- package/src/clis/instagram/_shared/private-publish.ts +1303 -0
- package/src/clis/instagram/_shared/protocol-capture.test.ts +148 -0
- package/src/clis/instagram/_shared/protocol-capture.ts +321 -0
- package/src/clis/instagram/_shared/runtime-info.ts +91 -0
- package/src/clis/instagram/note.test.ts +96 -0
- package/src/clis/instagram/note.ts +254 -0
- package/src/clis/instagram/post.test.ts +1716 -0
- package/src/clis/instagram/post.ts +1620 -0
- package/src/clis/instagram/reel.test.ts +191 -0
- package/src/clis/instagram/reel.ts +886 -0
- package/src/clis/instagram/story.test.ts +191 -0
- package/src/clis/instagram/story.ts +151 -0
- package/src/clis/sinafinance/stock-rank.ts +68 -0
- package/src/clis/substack/utils.test.ts +0 -2
- package/src/clis/twitter/post.test.ts +157 -0
- package/src/clis/twitter/post.ts +82 -48
- package/src/clis/twitter/reply.test.ts +177 -0
- package/src/clis/twitter/reply.ts +285 -39
- package/src/clis/xianyu/chat.test.ts +20 -0
- package/src/clis/xianyu/chat.ts +175 -0
- package/src/clis/xianyu/item.test.ts +67 -0
- package/src/clis/xianyu/item.ts +172 -0
- package/src/clis/xianyu/search.test.ts +22 -0
- package/src/clis/xianyu/search.ts +151 -0
- package/src/clis/xianyu/utils.ts +9 -0
- package/src/clis/xiaoe/catalog.yaml +129 -0
- package/src/clis/xiaoe/content.yaml +43 -0
- package/src/clis/xiaoe/courses.yaml +73 -0
- package/src/clis/xiaoe/detail.yaml +39 -0
- package/src/clis/xiaoe/play-url.yaml +124 -0
- package/src/clis/xiaohongshu/comments.test.ts +0 -2
- package/src/clis/xiaohongshu/creator-note-detail.test.ts +0 -2
- package/src/clis/xiaohongshu/creator-notes.test.ts +0 -2
- package/src/clis/xiaohongshu/download.test.ts +0 -2
- package/src/clis/xiaohongshu/note.test.ts +0 -2
- package/src/clis/xiaohongshu/publish.test.ts +0 -2
- package/src/clis/xiaohongshu/search.test.ts +59 -48
- package/src/clis/xiaohongshu/search.ts +31 -21
- package/src/clis/yuanbao/ask.test.ts +156 -0
- package/src/clis/yuanbao/ask.ts +522 -0
- package/src/clis/yuanbao/new.test.ts +36 -0
- package/src/clis/yuanbao/new.ts +81 -0
- package/src/clis/yuanbao/shared.ts +57 -0
- package/src/clis/zhihu/question.test.ts +42 -17
- package/src/clis/zhihu/question.ts +31 -26
- package/src/commanderAdapter.test.ts +51 -0
- package/src/commanderAdapter.ts +8 -4
- package/src/completion.test.ts +30 -0
- package/src/completion.ts +3 -1
- package/src/doctor.ts +1 -1
- package/src/electron-apps.ts +9 -1
- package/src/errors.ts +1 -1
- package/src/execution.ts +26 -30
- package/src/explore.ts +1 -1
- package/src/launcher.test.ts +121 -7
- package/src/launcher.ts +87 -9
- package/src/output.test.ts +50 -90
- package/src/output.ts +10 -1
- package/src/pipeline/executor.test.ts +0 -2
- package/src/pipeline/steps/download.test.ts +0 -2
- package/src/registry.ts +2 -0
- package/src/serialization.ts +2 -0
- package/src/types.ts +9 -2
- package/tests/e2e/browser-auth.test.ts +9 -0
- package/CLI-EXPLORER.md +0 -724
- package/CLI-ONESHOT.md +0 -216
- package/SKILL.md +0 -59
|
@@ -0,0 +1,300 @@
|
|
|
1
|
+
import { CommandExecutionError, EmptyResultError } from '../../errors.js';
|
|
2
|
+
import { cli, Strategy } from '../../registry.js';
|
|
3
|
+
import type { IPage } from '../../types.js';
|
|
4
|
+
import {
|
|
5
|
+
FACTORY_BADGE_PATTERNS,
|
|
6
|
+
SERVICE_BADGE_PATTERNS,
|
|
7
|
+
assertAuthenticatedState,
|
|
8
|
+
buildDetailUrl,
|
|
9
|
+
buildProvenance,
|
|
10
|
+
canonicalizeSellerUrl,
|
|
11
|
+
canonicalizeStoreUrl,
|
|
12
|
+
cleanMultilineText,
|
|
13
|
+
cleanText,
|
|
14
|
+
extractAddress,
|
|
15
|
+
extractBadges,
|
|
16
|
+
extractMemberId,
|
|
17
|
+
extractMetric,
|
|
18
|
+
extractOfferId,
|
|
19
|
+
extractShopId,
|
|
20
|
+
extractYearsOnPlatform,
|
|
21
|
+
gotoAndReadState,
|
|
22
|
+
guessTopCategories,
|
|
23
|
+
resolveStoreUrl,
|
|
24
|
+
uniqueNonEmpty,
|
|
25
|
+
} from './shared.js';
|
|
26
|
+
|
|
27
|
+
/**
 * Snapshot of a store-related page as collected in the browser by `readStorePayload`.
 * Every field is optional because the value is produced by an in-page script.
 */
interface StoreBrowserPayload {
  /** `window.location.href` at the time of capture. */
  href?: string;
  /** `document.title`, or an empty string when the page has none. */
  title?: string;
  /** `document.body.innerText`, or an empty string when there is no body. */
  bodyText?: string;
  /** `href` of anchors that match the offer-detail selectors (`detail.1688.com/offer/` or `offerId=`). */
  offerLinks?: string[];
  /** `href` of anchors whose link contains `contactinfo`. */
  contactLinks?: string[];
}
|
|
34
|
+
|
|
35
|
+
/**
 * Seller context read from an item detail page by `readItemSeed`.
 * Used as the highest-priority source for seller identity in `normalizeStorePayload`.
 */
interface StoreItemSeed {
  /** `window.location.href` of the item page. */
  href?: string;
  /** Visible text of the item page. */
  bodyText?: string;
  /** JSON copy of the page model's `sellerModel` (may be null when the model is absent). */
  seller?: {
    companyName?: string;
    memberId?: string;
    winportUrl?: string;
    /** Only the `defaultUrl` key is read in this file. */
    sellerWinportUrlMap?: Record<string, string>;
  };
  /** JSON copy of the page model's `shippingServices.fields.buyerProtectionModel`. */
  services?: Array<{ serviceName?: string }>;
}
|
|
46
|
+
|
|
47
|
+
/**
 * Merge the store page, contact page and optional item seed into one flat result row.
 *
 * @param input.resolvedUrl - URL the command navigated to; final fallback for every URL field.
 * @param input.storePayload - Capture of the store page, or null.
 * @param input.contactPayload - Capture of the contact-info page, or null.
 * @param input.seed - Seller context from an item page, or null.
 * @param input.explicitMemberId - Member ID parsed from the raw user input, or null.
 * @returns A record with identity, company, metric, badge and contact fields plus the
 *          provenance fields spread in from `buildProvenance`.
 */
function normalizeStorePayload(input: {
  resolvedUrl: string;
  storePayload: StoreBrowserPayload | null;
  contactPayload: StoreBrowserPayload | null;
  seed: StoreItemSeed | null;
  explicitMemberId: string | null;
}): Record<string, unknown> {
  const storePayload = input.storePayload;
  const contactPayload = input.contactPayload;
  const seed = input.seed;

  // Text sources are kept separate because some fields prefer the contact page,
  // while others search the concatenation of all three.
  const contactText = cleanMultilineText(contactPayload?.bodyText);
  const storeText = cleanMultilineText(storePayload?.bodyText);
  const seedText = cleanMultilineText(seed?.bodyText);
  const combinedText = [contactText, storeText, seedText].filter(Boolean).join('\n');

  // Seller URL precedence: seed winport URL, seed default winport URL,
  // the store page's own location, then the URL we navigated to.
  const sellerUrlRaw = cleanText(
    seed?.seller?.winportUrl
      ?? seed?.seller?.sellerWinportUrlMap?.defaultUrl
      ?? storePayload?.href
      ?? input.resolvedUrl,
  );
  // safeCanonicalStoreUrl returns null when canonicalization throws, hence the extra fallback.
  const storeUrl = safeCanonicalStoreUrl(sellerUrlRaw || input.resolvedUrl) ?? input.resolvedUrl;
  const sellerUrl = canonicalizeSellerUrl(sellerUrlRaw) ?? storeUrl;
  const companyUrl = pickCompanyUrl(contactPayload?.href, storeUrl);
  // Member ID precedence: seed, ID parsed from user input, resolved URL, store page URL.
  const memberId = cleanText(seed?.seller?.memberId)
    || input.explicitMemberId
    || extractMemberId(input.resolvedUrl)
    || extractMemberId(storePayload?.href ?? '')
    || null;
  const shopId = extractShopId(sellerUrl) ?? extractShopId(storeUrl);
  // Company name precedence: seed, then the first company-looking line of contact / store text.
  const companyName = cleanText(seed?.seller?.companyName)
    || firstNamedLine(contactText)
    || firstNamedLine(storeText)
    || null;
  // Service badges combine pattern hits in page text with service names from the seed.
  const serviceBadges = uniqueNonEmpty([
    ...extractBadges(combinedText, SERVICE_BADGE_PATTERNS),
    ...((seed?.services ?? []).map((service) => cleanText(service.serviceName))),
  ]);
  const factoryBadges = extractBadges(combinedText, FACTORY_BADGE_PATTERNS);

  return {
    member_id: memberId,
    shop_id: shopId,
    // store_name and company_name are both populated from the same resolved company name.
    store_name: companyName,
    store_url: storeUrl,
    company_name: companyName,
    company_url: companyUrl,
    business_model_text: firstMetric(combinedText, ['经营模式', '生产加工', '主营产品']),
    years_on_platform_text: extractYearsOnPlatform(combinedText),
    location: extractAddress(contactText) ?? extractAddress(storeText),
    staff_size_text: firstMetric(combinedText, ['员工人数', '员工总数']),
    factory_badges: factoryBadges,
    service_badges: serviceBadges,
    response_rate_text: firstMetric(combinedText, ['响应率', '回复率', '响应速度']),
    return_rate_text: extractReturnRate(combinedText),
    top_categories: guessTopCategories(combinedText),
    // Phone fields are read from the contact page text only.
    phone_text: extractMetric(contactText, '电话'),
    mobile_text: extractMetric(contactText, '手机'),
    // Provenance uses the most specific page that was actually read.
    ...buildProvenance(cleanText(contactPayload?.href) || cleanText(storePayload?.href) || input.resolvedUrl),
  };
}
|
|
109
|
+
|
|
110
|
+
/**
 * Non-throwing wrapper around `canonicalizeStoreUrl`.
 *
 * @param url - Candidate store URL.
 * @returns The canonical store URL, or null when canonicalization throws.
 */
function safeCanonicalStoreUrl(url: string): string | null {
  let canonical: string | null = null;
  try {
    canonical = canonicalizeStoreUrl(url);
  } catch {
    // Deliberate best-effort: callers fall back to the un-canonicalized URL.
    canonical = null;
  }
  return canonical;
}
|
|
117
|
+
|
|
118
|
+
/**
 * Choose the contact-info URL to report for the company.
 *
 * @param contactHref - Location of the contact page that was read, if any.
 * @param storeUrl - Canonical store URL, used when the contact page yields nothing usable.
 * @returns A contact-info URL built from the contact page when possible,
 *          otherwise one built from the store URL, or null if neither qualifies.
 */
function pickCompanyUrl(contactHref: string | undefined, storeUrl: string): string | null {
  const cleanedHref = cleanText(contactHref);
  const fromContactPage = cleanedHref ? buildContactUrl(cleanedHref) : null;
  return fromContactPage ? fromContactPage : buildContactUrl(storeUrl);
}
|
|
126
|
+
|
|
127
|
+
/**
 * Derive the contact-info page URL for a 1688 store host.
 *
 * @param storeUrl - Any URL on the store's host.
 * @returns `<protocol>//<hostname>/page/contactinfo.html` when the hostname ends with
 *          `.1688.com`; null for other hosts or when the input is not a parseable URL.
 */
function buildContactUrl(storeUrl: string): string | null {
  let target: URL;
  try {
    target = new URL(storeUrl);
  } catch {
    // Unparseable input is treated the same as a foreign host.
    return null;
  }

  const { protocol, hostname } = target;
  return hostname.endsWith('.1688.com')
    ? `${protocol}//${hostname}/page/contactinfo.html`
    : null;
}
|
|
136
|
+
|
|
137
|
+
/**
 * Find the first line that looks like a company name.
 *
 * @param text - Newline-separated page text.
 * @returns The first cleaned line containing '有限公司', '商行' or '工厂', or null if none does.
 */
function firstNamedLine(text: string): string | null {
  const companyMarkers = ['有限公司', '商行', '工厂'];
  for (const rawLine of text.split('\n')) {
    const candidate = cleanText(rawLine);
    if (companyMarkers.some((marker) => candidate.includes(marker))) {
      return candidate;
    }
  }
  return null;
}
|
|
144
|
+
|
|
145
|
+
/**
 * Try several labels in order and return the first metric found.
 *
 * @param text - Text to search.
 * @param labels - Labels passed to `extractMetric`, in priority order.
 * @returns The first truthy `extractMetric` result, or null when no label matches.
 */
function firstMetric(text: string, labels: string[]): string | null {
  // The `found ||` short-circuit stops calling extractMetric after the first hit.
  return labels.reduce<string | null>(
    (found, label) => found || extractMetric(text, label) || null,
    null,
  );
}
|
|
152
|
+
|
|
153
|
+
/**
 * Extract the repeat-purchase rate ("回头率") together with its percentage.
 *
 * The label and the percentage may be separated by any whitespace, including a
 * line break. `\s*` already matches newlines, so one pattern covers both the
 * inline and the multi-line layout. The earlier separate multi-line pattern
 * could never be reached and has been removed; the returned value is unchanged.
 *
 * @param text - Page text to search.
 * @returns The matched label-plus-percentage span passed through `cleanText`,
 *          or null when no rate is present.
 */
function extractReturnRate(text: string): string | null {
  const match = text.match(/回头率\s*([0-9.]+%)/);
  return match ? cleanText(match[0]) : null;
}
|
|
160
|
+
|
|
161
|
+
/**
 * Scan links in order and return the first offer ID that can be extracted.
 *
 * @param links - Candidate offer URLs.
 * @returns The first truthy `extractOfferId` result, or null when none of the links yields one.
 */
function firstOfferId(links: string[]): string | null {
  for (let index = 0; index < links.length; index += 1) {
    const candidate = extractOfferId(links[index]);
    if (candidate) {
      return candidate;
    }
  }
  return null;
}
|
|
168
|
+
|
|
169
|
+
/**
 * Scan links in order and return the first one that maps to a contact-info URL.
 *
 * @param links - Candidate contact-page links collected from the store page.
 * @returns The first non-null `buildContactUrl` result, or null when no link qualifies.
 */
function firstContactUrl(links: string[]): string | null {
  // The `resolved ||` short-circuit stops calling buildContactUrl after the first hit.
  return links.reduce<string | null>(
    (resolved, link) => resolved || buildContactUrl(link) || null,
    null,
  );
}
|
|
176
|
+
|
|
177
|
+
/**
 * Navigate to a store-related page and capture its location, title, visible text and
 * the offer / contact links found on it.
 *
 * @param page - Browser page used for navigation and in-page evaluation.
 * @param url - Page to open.
 * @param action - Label forwarded to `gotoAndReadState` and `assertAuthenticatedState`.
 * @returns The captured payload.
 * @throws Whatever `gotoAndReadState` or `assertAuthenticatedState` raise (e.g. when the
 *         state does not pass the authentication check).
 */
async function readStorePayload(page: IPage, url: string, action: string): Promise<StoreBrowserPayload> {
  // NOTE(review): 2500 is presumably a settle/wait time in ms; confirm against gotoAndReadState.
  const state = await gotoAndReadState(page, url, 2500, action);
  assertAuthenticatedState(state, action);

  return await page.evaluate(`
    (() => ({
      href: window.location.href,
      title: document.title || '',
      bodyText: document.body ? document.body.innerText || '' : '',
      offerLinks: Array.from(document.querySelectorAll('a[href*="detail.1688.com/offer/"], a[href*="offerId="]'))
        .map((anchor) => anchor.href)
        .filter(Boolean),
      contactLinks: Array.from(document.querySelectorAll('a[href*="contactinfo"]'))
        .map((anchor) => anchor.href)
        .filter(Boolean),
    }))()
  `) as StoreBrowserPayload;
}
|
|
195
|
+
|
|
196
|
+
/**
 * Open an item detail page and read seller context from its in-page model.
 *
 * @param page - Browser page used for navigation and in-page evaluation.
 * @param offerId - Offer whose detail page is opened (URL built by `buildDetailUrl`).
 * @returns The seed with page location, visible text, seller model and service list.
 * @throws CommandExecutionError when the page exposes neither a seller member ID nor a
 *         winport URL; also propagates errors from `gotoAndReadState` /
 *         `assertAuthenticatedState`.
 */
async function readItemSeed(page: IPage, offerId: string): Promise<StoreItemSeed> {
  const itemUrl = buildDetailUrl(offerId);
  // NOTE(review): 2500 is presumably a settle/wait time in ms; confirm against gotoAndReadState.
  const state = await gotoAndReadState(page, itemUrl, 2500, 'store seed item');
  assertAuthenticatedState(state, 'store seed item');

  // The in-page script round-trips model data through JSON so only plain,
  // serializable values are returned from the browser.
  const seed = await page.evaluate(`
    (() => {
      const model = window.context?.result?.global?.globalData?.model ?? null;
      const toJson = (value) => JSON.parse(JSON.stringify(value ?? null));
      return {
        href: window.location.href,
        bodyText: document.body ? document.body.innerText || '' : '',
        seller: toJson(model?.sellerModel),
        services: toJson(model?.shippingServices?.fields?.buyerProtectionModel ?? []),
      };
    })()
  `) as StoreItemSeed;

  // A seed without any seller identity is useless to the caller, so it is rejected.
  const hasSellerContext = !!cleanText(seed?.seller?.memberId) || !!cleanText(seed?.seller?.winportUrl);
  if (!hasSellerContext) {
    throw new CommandExecutionError(
      '1688 store seed item did not expose seller context',
      '当前 tab 非商品详情上下文,请切到 detail.1688.com 商品页并重试',
    );
  }

  return seed;
}
|
|
224
|
+
|
|
225
|
+
/**
 * Report whether at least one of the captured pages produced visible text.
 *
 * @param storePayload - Store page capture, or null.
 * @param contactPayload - Contact page capture, or null.
 * @param seed - Item seed, or null.
 * @returns true when any source has non-empty body text after `cleanText`.
 */
function hasAnyEvidence(
  storePayload: StoreBrowserPayload | null,
  contactPayload: StoreBrowserPayload | null,
  seed: StoreItemSeed | null,
): boolean {
  const bodies = [storePayload?.bodyText, contactPayload?.bodyText, seed?.bodyText];
  return bodies.some((body) => Boolean(cleanText(body)));
}
|
|
234
|
+
|
|
235
|
+
// Registers the `1688 store` command: reads the store page, its contact-info page and,
// when an offer can be found, one item page, then returns a single normalized row.
cli({
  site: '1688',
  name: 'store',
  description: '1688 店铺/供应商公开信息(联系方式、主营、入驻年限、公开服务信号)',
  domain: 'www.1688.com',
  strategy: Strategy.COOKIE,
  navigateBefore: false,
  args: [
    {
      name: 'input',
      required: true,
      positional: true,
      help: '1688 店铺 URL 或 member ID(如 b2b-22154705262941f196)',
    },
  ],
  columns: ['store_name', 'years_on_platform_text', 'location', 'return_rate_text'],
  func: async (page, kwargs) => {
    const rawInput = String(kwargs.input ?? '');
    const resolvedUrl = resolveStoreUrl(rawInput);
    const explicitMemberId = extractMemberId(rawInput);

    // Step 1: the store page itself.
    const storePayload = await readStorePayload(page, resolvedUrl, 'store');
    // Step 2: the contact page. Prefer a link found on the store page, otherwise derive it from the host.
    const contactUrl = firstContactUrl(storePayload.contactLinks ?? []) || buildContactUrl(storePayload.href || resolvedUrl);
    const contactPayload = contactUrl ? await readStorePayload(page, contactUrl, 'store contact') : null;
    // Step 3: pick an offer to use as a seed. The user input wins, then links seen on either page.
    const offerId = extractOfferId(rawInput)
      || firstOfferId(storePayload.offerLinks ?? [])
      || firstOfferId(contactPayload?.offerLinks ?? []);

    let seed: StoreItemSeed | null = null;
    if (offerId) {
      try {
        seed = await readItemSeed(page, offerId);
      } catch (error) {
        // The seed is optional: a CommandExecutionError leaves it null,
        // while any other error type is rethrown.
        if (!(error instanceof CommandExecutionError)) throw error;
      }
    }

    // Fail loudly when none of the pages produced any visible text.
    if (!hasAnyEvidence(storePayload, contactPayload, seed)) {
      throw new EmptyResultError(
        '1688 store',
        'Store page is reachable but no visible fields were extracted. Open the store page in Chrome and retry.',
      );
    }

    return [
      normalizeStorePayload({
        resolvedUrl,
        storePayload,
        contactPayload,
        seed,
        explicitMemberId,
      }),
    ];
  },
});
|
|
290
|
+
|
|
291
|
+
// Internal helpers exposed for unit tests only; not part of the command's public surface.
export const __test__ = {
  normalizeStorePayload,
  safeCanonicalStoreUrl,
  buildContactUrl,
  firstNamedLine,
  firstMetric,
  extractReturnRate,
  firstOfferId,
  firstContactUrl,
};
|
|
@@ -1,9 +1,9 @@
|
|
|
1
1
|
import { describe, expect, it } from 'vitest';
|
|
2
|
-
import { __test__ } from './
|
|
2
|
+
import { __test__ } from './rankings.js';
|
|
3
3
|
|
|
4
4
|
describe('amazon bestsellers normalization', () => {
|
|
5
5
|
it('normalizes bestseller cards and infers review counts from card text', () => {
|
|
6
|
-
const result = __test__.
|
|
6
|
+
const result = __test__.normalizeRankingCandidate({
|
|
7
7
|
asin: 'B0DR31GC3D',
|
|
8
8
|
title: '',
|
|
9
9
|
href: 'https://www.amazon.com/NUTIKAS-Shelves-Desktop-Orgnizer-Shlef/dp/B0DR31GC3D/ref=zg_bs',
|
|
@@ -11,7 +11,16 @@ describe('amazon bestsellers normalization', () => {
|
|
|
11
11
|
rating_text: '4.3 out of 5 stars',
|
|
12
12
|
review_count_text: '',
|
|
13
13
|
card_text: 'Desk Shelves Desktop Organizer Shlef\n4.3 out of 5 stars\n435\n$25.92',
|
|
14
|
-
},
|
|
14
|
+
}, {
|
|
15
|
+
listType: 'bestsellers',
|
|
16
|
+
rankFallback: 2,
|
|
17
|
+
listTitle: 'Amazon Best Sellers: Best Desktop & Off-Surface Shelves',
|
|
18
|
+
sourceUrl: 'https://www.amazon.com/example',
|
|
19
|
+
categoryTitle: null,
|
|
20
|
+
categoryUrl: 'https://www.amazon.com/example',
|
|
21
|
+
categoryPath: [],
|
|
22
|
+
visibleCategoryLinks: [],
|
|
23
|
+
});
|
|
15
24
|
|
|
16
25
|
expect(result.rank).toBe(2);
|
|
17
26
|
expect(result.asin).toBe('B0DR31GC3D');
|
|
@@ -1,180 +1,8 @@
|
|
|
1
|
-
import {
|
|
2
|
-
import {
|
|
3
|
-
import type { IPage } from '../../types.js';
|
|
4
|
-
import {
|
|
5
|
-
buildProvenance,
|
|
6
|
-
cleanText,
|
|
7
|
-
extractAsin,
|
|
8
|
-
extractReviewCountFromCardText,
|
|
9
|
-
firstMeaningfulLine,
|
|
10
|
-
normalizeProductUrl,
|
|
11
|
-
parsePriceText,
|
|
12
|
-
parseRatingValue,
|
|
13
|
-
parseReviewCount,
|
|
14
|
-
resolveBestsellersUrl,
|
|
15
|
-
uniqueNonEmpty,
|
|
16
|
-
assertUsableState,
|
|
17
|
-
gotoAndReadState,
|
|
18
|
-
} from './shared.js';
|
|
1
|
+
import { cli } from '../../registry.js';
|
|
2
|
+
import { createRankingCliOptions } from './rankings.js';
|
|
19
3
|
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
list_title?: string;
|
|
24
|
-
cards?: Array<{
|
|
25
|
-
rank_text?: string | null;
|
|
26
|
-
asin?: string | null;
|
|
27
|
-
title?: string | null;
|
|
28
|
-
href?: string | null;
|
|
29
|
-
price_text?: string | null;
|
|
30
|
-
rating_text?: string | null;
|
|
31
|
-
review_count_text?: string | null;
|
|
32
|
-
card_text?: string | null;
|
|
33
|
-
}>;
|
|
34
|
-
page_links?: string[];
|
|
35
|
-
}
|
|
36
|
-
|
|
37
|
-
function normalizeBestsellerCandidate(
|
|
38
|
-
candidate: NonNullable<BestsellersPagePayload['cards']>[number],
|
|
39
|
-
rank: number,
|
|
40
|
-
listTitle: string | null,
|
|
41
|
-
sourceUrl: string,
|
|
42
|
-
): Record<string, unknown> {
|
|
43
|
-
const productUrl = normalizeProductUrl(candidate.href);
|
|
44
|
-
const asin = extractAsin(candidate.asin ?? '') ?? extractAsin(productUrl ?? '') ?? null;
|
|
45
|
-
const title = cleanText(candidate.title) || firstMeaningfulLine(candidate.card_text);
|
|
46
|
-
const price = parsePriceText(cleanText(candidate.price_text) || candidate.card_text);
|
|
47
|
-
const ratingText = cleanText(candidate.rating_text) || null;
|
|
48
|
-
const reviewCountText = cleanText(candidate.review_count_text)
|
|
49
|
-
|| extractReviewCountFromCardText(candidate.card_text)
|
|
50
|
-
|| null;
|
|
51
|
-
const provenance = buildProvenance(sourceUrl);
|
|
52
|
-
|
|
53
|
-
return {
|
|
54
|
-
rank,
|
|
55
|
-
asin,
|
|
56
|
-
title: title || null,
|
|
57
|
-
product_url: productUrl,
|
|
58
|
-
list_title: listTitle,
|
|
59
|
-
...provenance,
|
|
60
|
-
price_text: price.price_text,
|
|
61
|
-
price_value: price.price_value,
|
|
62
|
-
currency: price.currency,
|
|
63
|
-
rating_text: ratingText,
|
|
64
|
-
rating_value: parseRatingValue(ratingText),
|
|
65
|
-
review_count_text: reviewCountText,
|
|
66
|
-
review_count: parseReviewCount(reviewCountText),
|
|
67
|
-
};
|
|
68
|
-
}
|
|
69
|
-
|
|
70
|
-
async function readBestsellersPage(page: IPage, url: string): Promise<BestsellersPagePayload> {
|
|
71
|
-
const state = await gotoAndReadState(page, url, 2500, 'bestsellers');
|
|
72
|
-
assertUsableState(state, 'bestsellers');
|
|
73
|
-
|
|
74
|
-
return await page.evaluate(`
|
|
75
|
-
(() => ({
|
|
76
|
-
href: window.location.href,
|
|
77
|
-
title: document.title || '',
|
|
78
|
-
list_title:
|
|
79
|
-
document.querySelector('#zg_banner_text')?.textContent
|
|
80
|
-
|| document.querySelector('h1')?.textContent
|
|
81
|
-
|| '',
|
|
82
|
-
cards: Array.from(document.querySelectorAll('.p13n-sc-uncoverable-faceout'))
|
|
83
|
-
.map((card) => ({
|
|
84
|
-
rank_text:
|
|
85
|
-
card.querySelector('.zg-bdg-text')?.textContent
|
|
86
|
-
|| card.querySelector('[class*="rank"]')?.textContent
|
|
87
|
-
|| '',
|
|
88
|
-
asin: card.id || '',
|
|
89
|
-
title:
|
|
90
|
-
card.querySelector('[class*="line-clamp"]')?.textContent
|
|
91
|
-
|| card.querySelector('img')?.getAttribute('alt')
|
|
92
|
-
|| '',
|
|
93
|
-
href: card.querySelector('a[href*="/dp/"]')?.href || '',
|
|
94
|
-
price_text: card.querySelector('.a-price .a-offscreen')?.textContent || '',
|
|
95
|
-
rating_text: card.querySelector('[aria-label*="out of 5 stars"]')?.getAttribute('aria-label') || '',
|
|
96
|
-
review_count_text:
|
|
97
|
-
card.querySelector('a[href*="#customerReviews"]')?.textContent
|
|
98
|
-
|| card.querySelector('.a-size-small')?.textContent
|
|
99
|
-
|| '',
|
|
100
|
-
card_text: card.innerText || '',
|
|
101
|
-
})),
|
|
102
|
-
page_links: Array.from(document.querySelectorAll('li.a-normal a, li.a-selected a'))
|
|
103
|
-
.map((anchor) => anchor.href || '')
|
|
104
|
-
.filter((href) => /\\/zgbs\\//.test(href) && /(?:[?&]pg=|ref=zg_bs_pg_)/.test(href)),
|
|
105
|
-
}))()
|
|
106
|
-
`) as BestsellersPagePayload;
|
|
107
|
-
}
|
|
108
|
-
|
|
109
|
-
cli({
|
|
110
|
-
site: 'amazon',
|
|
111
|
-
name: 'bestsellers',
|
|
4
|
+
cli(createRankingCliOptions({
|
|
5
|
+
commandName: 'bestsellers',
|
|
6
|
+
listType: 'bestsellers',
|
|
112
7
|
description: 'Amazon Best Sellers pages for category candidate discovery',
|
|
113
|
-
|
|
114
|
-
strategy: Strategy.COOKIE,
|
|
115
|
-
navigateBefore: false,
|
|
116
|
-
args: [
|
|
117
|
-
{
|
|
118
|
-
name: 'input',
|
|
119
|
-
positional: true,
|
|
120
|
-
help: 'Best sellers URL or /zgbs path. Omit to use the root Best Sellers page.',
|
|
121
|
-
},
|
|
122
|
-
{
|
|
123
|
-
name: 'limit',
|
|
124
|
-
type: 'int',
|
|
125
|
-
default: 100,
|
|
126
|
-
help: 'Maximum number of ranked items to return (default 100)',
|
|
127
|
-
},
|
|
128
|
-
],
|
|
129
|
-
columns: ['rank', 'asin', 'title', 'price_text', 'rating_value', 'review_count'],
|
|
130
|
-
func: async (page, kwargs) => {
|
|
131
|
-
const limit = Math.max(1, Number(kwargs.limit) || 100);
|
|
132
|
-
const initialUrl = resolveBestsellersUrl(typeof kwargs.input === 'string' ? kwargs.input : undefined);
|
|
133
|
-
|
|
134
|
-
const queue = [initialUrl];
|
|
135
|
-
const visited = new Set<string>();
|
|
136
|
-
const seenAsins = new Set<string>();
|
|
137
|
-
const results: Record<string, unknown>[] = [];
|
|
138
|
-
let listTitle: string | null = null;
|
|
139
|
-
|
|
140
|
-
while (queue.length > 0 && results.length < limit) {
|
|
141
|
-
const nextUrl = queue.shift()!;
|
|
142
|
-
if (visited.has(nextUrl)) continue;
|
|
143
|
-
visited.add(nextUrl);
|
|
144
|
-
|
|
145
|
-
const payload = await readBestsellersPage(page, nextUrl);
|
|
146
|
-
const sourceUrl = cleanText(payload.href) || nextUrl;
|
|
147
|
-
listTitle = cleanText(payload.list_title) || cleanText(payload.title) || listTitle;
|
|
148
|
-
const cards = payload.cards ?? [];
|
|
149
|
-
|
|
150
|
-
for (const card of cards) {
|
|
151
|
-
const normalized = normalizeBestsellerCandidate(card, results.length + 1, listTitle, sourceUrl);
|
|
152
|
-
const asin = cleanText(String(normalized.asin ?? ''));
|
|
153
|
-
if (!asin || seenAsins.has(asin)) continue;
|
|
154
|
-
seenAsins.add(asin);
|
|
155
|
-
results.push(normalized);
|
|
156
|
-
if (results.length >= limit) break;
|
|
157
|
-
}
|
|
158
|
-
|
|
159
|
-
const pageLinks = uniqueNonEmpty(payload.page_links ?? []);
|
|
160
|
-
for (const href of pageLinks) {
|
|
161
|
-
if (!visited.has(href) && !queue.includes(href)) {
|
|
162
|
-
queue.push(href);
|
|
163
|
-
}
|
|
164
|
-
}
|
|
165
|
-
}
|
|
166
|
-
|
|
167
|
-
if (results.length === 0) {
|
|
168
|
-
throw new CommandExecutionError(
|
|
169
|
-
'amazon bestsellers did not expose any ranked items',
|
|
170
|
-
'Open the same best sellers page in Chrome, verify it is a real Amazon ranking page, and retry.',
|
|
171
|
-
);
|
|
172
|
-
}
|
|
173
|
-
|
|
174
|
-
return results.slice(0, limit);
|
|
175
|
-
},
|
|
176
|
-
});
|
|
177
|
-
|
|
178
|
-
export const __test__ = {
|
|
179
|
-
normalizeBestsellerCandidate,
|
|
180
|
-
};
|
|
8
|
+
}));
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import { cli } from '../../registry.js';
|
|
2
|
+
import { createRankingCliOptions } from './rankings.js';
|
|
3
|
+
|
|
4
|
+
cli(createRankingCliOptions({
|
|
5
|
+
commandName: 'movers-shakers',
|
|
6
|
+
listType: 'movers_shakers',
|
|
7
|
+
description: 'Amazon Movers & Shakers pages for short-term growth signals',
|
|
8
|
+
}));
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import { cli } from '../../registry.js';
|
|
2
|
+
import { createRankingCliOptions } from './rankings.js';
|
|
3
|
+
|
|
4
|
+
cli(createRankingCliOptions({
|
|
5
|
+
commandName: 'new-releases',
|
|
6
|
+
listType: 'new_releases',
|
|
7
|
+
description: 'Amazon New Releases pages for early momentum discovery',
|
|
8
|
+
}));
|
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
import { describe, expect, it } from 'vitest';
|
|
2
|
+
import { __test__ } from './rankings.js';
|
|
3
|
+
|
|
4
|
+
describe('amazon rankings helpers', () => {
|
|
5
|
+
it('normalizes ranking candidates with unified schema', () => {
|
|
6
|
+
const result = __test__.normalizeRankingCandidate(
|
|
7
|
+
{
|
|
8
|
+
rank_text: '#3',
|
|
9
|
+
asin: 'B0DR31GC3D',
|
|
10
|
+
title: 'Desk Shelves Desktop Organizer',
|
|
11
|
+
href: 'https://www.amazon.com/dp/B0DR31GC3D/ref=zg_bs',
|
|
12
|
+
price_text: '$25.92',
|
|
13
|
+
rating_text: '4.3 out of 5 stars',
|
|
14
|
+
review_count_text: '435',
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
listType: 'new_releases',
|
|
18
|
+
rankFallback: 3,
|
|
19
|
+
listTitle: 'Amazon New Releases',
|
|
20
|
+
sourceUrl: 'https://www.amazon.com/gp/new-releases',
|
|
21
|
+
categoryTitle: 'Home & Kitchen',
|
|
22
|
+
categoryUrl: 'https://www.amazon.com/gp/new-releases/home-garden',
|
|
23
|
+
categoryPath: ['Home & Kitchen'],
|
|
24
|
+
visibleCategoryLinks: [{ title: 'Storage', url: 'https://www.amazon.com/gp/new-releases/storage', node_id: null }],
|
|
25
|
+
},
|
|
26
|
+
);
|
|
27
|
+
|
|
28
|
+
expect(result.list_type).toBe('new_releases');
|
|
29
|
+
expect(result.rank).toBe(3);
|
|
30
|
+
expect(result.asin).toBe('B0DR31GC3D');
|
|
31
|
+
expect(result.product_url).toBe('https://www.amazon.com/dp/B0DR31GC3D');
|
|
32
|
+
expect(result.category_title).toBe('Home & Kitchen');
|
|
33
|
+
expect(result.visible_category_links).toEqual([
|
|
34
|
+
{ title: 'Storage', url: 'https://www.amazon.com/gp/new-releases/storage', node_id: null },
|
|
35
|
+
]);
|
|
36
|
+
});
|
|
37
|
+
|
|
38
|
+
it('deduplicates category links and parses rank fallback', () => {
|
|
39
|
+
const links = __test__.normalizeVisibleCategoryLinks([
|
|
40
|
+
{ title: 'Kitchen', url: '/gp/new-releases/home-garden' },
|
|
41
|
+
{ title: 'Kitchen', url: 'https://www.amazon.com/gp/new-releases/home-garden' },
|
|
42
|
+
{ title: 'Storage', url: '/gp/new-releases/storage', node_id: '1064954' },
|
|
43
|
+
]);
|
|
44
|
+
expect(links.length).toBe(2);
|
|
45
|
+
expect(__test__.parseRank('N/A', 8)).toBe(8);
|
|
46
|
+
});
|
|
47
|
+
});
|