@web-auto/webauto 0.1.1 → 0.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (354) hide show
  1. package/apps/desktop-console/default-settings.json +1 -0
  2. package/apps/desktop-console/dist/main/index.mjs +1618 -0
  3. package/apps/desktop-console/{src → dist}/main/preload.mjs +10 -0
  4. package/apps/desktop-console/dist/renderer/index.js +3063 -0
  5. package/apps/desktop-console/entry/ui-console.mjs +299 -0
  6. package/apps/webauto/entry/account.mjs +356 -0
  7. package/apps/webauto/entry/lib/account-detect.mjs +160 -0
  8. package/apps/webauto/entry/lib/account-store.mjs +587 -0
  9. package/apps/webauto/entry/lib/profilepool.mjs +1 -1
  10. package/apps/webauto/entry/xhs-install.mjs +27 -3
  11. package/apps/webauto/entry/xhs-status.mjs +152 -0
  12. package/apps/webauto/entry/xhs-unified.mjs +595 -17
  13. package/bin/webauto.mjs +247 -12
  14. package/dist/apps/webauto/server.js +66 -0
  15. package/dist/modules/camo-backend/src/index.js +575 -0
  16. package/dist/modules/camo-backend/src/internal/BrowserSession.js +817 -0
  17. package/dist/modules/camo-backend/src/internal/ElementRegistry.js +61 -0
  18. package/dist/modules/camo-backend/src/internal/ProfileLock.js +85 -0
  19. package/dist/modules/camo-backend/src/internal/SessionManager.js +172 -0
  20. package/dist/modules/camo-backend/src/internal/container-matcher.js +852 -0
  21. package/dist/modules/camo-backend/src/internal/engine-manager.js +258 -0
  22. package/dist/modules/camo-backend/src/internal/fingerprint.js +203 -0
  23. package/dist/modules/camo-backend/src/internal/pageRuntime.js +29 -0
  24. package/dist/modules/camo-backend/src/internal/runtimeInjector.js +30 -0
  25. package/dist/modules/camo-backend/src/internal/state-bus.js +46 -0
  26. package/dist/modules/camo-backend/src/internal/storage-paths.js +36 -0
  27. package/dist/modules/camo-backend/src/internal/ws-server.js +1202 -0
  28. package/dist/modules/camo-runtime/src/utils/browser-service.mjs +423 -0
  29. package/dist/modules/camo-runtime/src/utils/config.mjs +77 -0
  30. package/dist/modules/container-registry/src/index.js +184 -0
  31. package/dist/modules/logging/src/index.js +92 -0
  32. package/dist/modules/operations/src/builtin.js +27 -0
  33. package/dist/modules/operations/src/container-binding.js +75 -0
  34. package/dist/modules/operations/src/executor.js +146 -0
  35. package/dist/modules/operations/src/operations/click.js +167 -0
  36. package/dist/modules/operations/src/operations/extract.js +204 -0
  37. package/dist/modules/operations/src/operations/find-child.js +17 -0
  38. package/dist/modules/operations/src/operations/highlight.js +138 -0
  39. package/dist/modules/operations/src/operations/key.js +61 -0
  40. package/dist/modules/operations/src/operations/navigate.js +148 -0
  41. package/dist/modules/operations/src/operations/scroll.js +126 -0
  42. package/dist/modules/operations/src/operations/type.js +190 -0
  43. package/dist/modules/operations/src/queue.js +100 -0
  44. package/dist/modules/operations/src/registry.js +11 -0
  45. package/dist/modules/operations/src/system/mouse.js +33 -0
  46. package/dist/modules/state/src/atomic-json.js +33 -0
  47. package/dist/modules/workflow/blocks/AnchorVerificationBlock.js +71 -0
  48. package/dist/modules/workflow/blocks/BehaviorRandomizer.js +26 -0
  49. package/dist/modules/workflow/blocks/CallWorkflowBlock.js +38 -0
  50. package/dist/modules/workflow/blocks/CloseDetailBlock.js +209 -0
  51. package/dist/modules/workflow/blocks/CollectBatch.js +137 -0
  52. package/dist/modules/workflow/blocks/CollectCommentsBlock.js +415 -0
  53. package/dist/modules/workflow/blocks/CollectSearchListBlock.js +599 -0
  54. package/dist/modules/workflow/blocks/CollectWeiboPosts.js +229 -0
  55. package/dist/modules/workflow/blocks/DetectPageStateBlock.js +259 -0
  56. package/dist/modules/workflow/blocks/EnsureLoginBlock.js +162 -0
  57. package/dist/modules/workflow/blocks/EnsureSession.js +426 -0
  58. package/dist/modules/workflow/blocks/ErrorClassifier.js +164 -0
  59. package/dist/modules/workflow/blocks/ErrorRecoveryBlock.js +319 -0
  60. package/dist/modules/workflow/blocks/ExpandCommentsBlock.js +1032 -0
  61. package/dist/modules/workflow/blocks/ExtractDetailBlock.js +310 -0
  62. package/dist/modules/workflow/blocks/ExtractPostFields.js +88 -0
  63. package/dist/modules/workflow/blocks/GenerateSmartReplyBlock.js +68 -0
  64. package/dist/modules/workflow/blocks/GoToSearchBlock.js +497 -0
  65. package/dist/modules/workflow/blocks/GracefulFallbackBlock.js +104 -0
  66. package/dist/modules/workflow/blocks/HighlightBlock.js +66 -0
  67. package/dist/modules/workflow/blocks/InitAutoScroll.js +65 -0
  68. package/dist/modules/workflow/blocks/LoadContainerDefinition.js +50 -0
  69. package/dist/modules/workflow/blocks/LoadContainerIndex.js +43 -0
  70. package/dist/modules/workflow/blocks/LocateAndGuardBlock.js +176 -0
  71. package/dist/modules/workflow/blocks/LoginRecoveryBlock.js +242 -0
  72. package/dist/modules/workflow/blocks/MatchContainers.js +64 -0
  73. package/dist/modules/workflow/blocks/MonitoringBlock.js +190 -0
  74. package/dist/modules/workflow/blocks/OpenDetailBlock.js +1240 -0
  75. package/dist/modules/workflow/blocks/OrganizeXhsNotesBlock.js +117 -0
  76. package/dist/modules/workflow/blocks/PersistXhsNoteBlock.js +270 -0
  77. package/dist/modules/workflow/blocks/PickSinglePost.js +69 -0
  78. package/dist/modules/workflow/blocks/ProgressTracker.js +125 -0
  79. package/dist/modules/workflow/blocks/RecordFixtureBlock.js +44 -0
  80. package/dist/modules/workflow/blocks/RenderMarkdown.js +48 -0
  81. package/dist/modules/workflow/blocks/SaveFile.js +54 -0
  82. package/dist/modules/workflow/blocks/ScrollNextBatch.js +72 -0
  83. package/dist/modules/workflow/blocks/SessionHealthBlock.js +73 -0
  84. package/dist/modules/workflow/blocks/StartBrowserService.js +45 -0
  85. package/dist/modules/workflow/blocks/ValidateContainerDefinition.js +67 -0
  86. package/dist/modules/workflow/blocks/ValidateExtract.js +35 -0
  87. package/dist/modules/workflow/blocks/WaitSearchPermitBlock.js +162 -0
  88. package/dist/modules/workflow/blocks/WaitStable.js +74 -0
  89. package/dist/modules/workflow/blocks/WarmupCommentsBlock.js +120 -0
  90. package/dist/modules/workflow/blocks/WorkflowExecutor.js +156 -0
  91. package/dist/modules/workflow/blocks/XiaohongshuCollectFromLinksBlock.js +1004 -0
  92. package/dist/modules/workflow/blocks/XiaohongshuCollectLinksBlock.js +1049 -0
  93. package/dist/modules/workflow/blocks/XiaohongshuFullCollectBlock.js +782 -0
  94. package/dist/modules/workflow/blocks/helpers/anchorVerify.js +198 -0
  95. package/dist/modules/workflow/blocks/helpers/asyncWorkQueue.js +53 -0
  96. package/dist/modules/workflow/blocks/helpers/commentScroller.js +334 -0
  97. package/dist/modules/workflow/blocks/helpers/commentSectionLocator.js +126 -0
  98. package/dist/modules/workflow/blocks/helpers/containerAnchors.js +301 -0
  99. package/dist/modules/workflow/blocks/helpers/debugArtifacts.js +6 -0
  100. package/dist/modules/workflow/blocks/helpers/downloadPaths.js +29 -0
  101. package/dist/modules/workflow/blocks/helpers/expandCommentsController.js +53 -0
  102. package/dist/modules/workflow/blocks/helpers/expandCommentsExtractor.js +129 -0
  103. package/dist/modules/workflow/blocks/helpers/macosVisionOcrPlugin.js +116 -0
  104. package/dist/modules/workflow/blocks/helpers/mergeXhsMarkdown.js +109 -0
  105. package/dist/modules/workflow/blocks/helpers/openDetailController.js +56 -0
  106. package/dist/modules/workflow/blocks/helpers/openDetailTypes.js +7 -0
  107. package/dist/modules/workflow/blocks/helpers/openDetailViewport.js +474 -0
  108. package/dist/modules/workflow/blocks/helpers/openDetailWaiter.js +104 -0
  109. package/dist/modules/workflow/blocks/helpers/operationLogger.js +195 -0
  110. package/dist/modules/workflow/blocks/helpers/persistedNotes.js +107 -0
  111. package/dist/modules/workflow/blocks/helpers/replyExpander.js +260 -0
  112. package/dist/modules/workflow/blocks/helpers/scrollIntoView.js +138 -0
  113. package/dist/modules/workflow/blocks/helpers/searchExecutor.js +328 -0
  114. package/dist/modules/workflow/blocks/helpers/searchGate.js +46 -0
  115. package/dist/modules/workflow/blocks/helpers/searchPageState.js +164 -0
  116. package/dist/modules/workflow/blocks/helpers/searchResultWaiter.js +64 -0
  117. package/dist/modules/workflow/blocks/helpers/simpleAnchor.js +134 -0
  118. package/dist/modules/workflow/blocks/helpers/smartReply.js +40 -0
  119. package/dist/modules/workflow/blocks/helpers/systemInput.js +635 -0
  120. package/dist/modules/workflow/blocks/helpers/targetCountMode.js +9 -0
  121. package/dist/modules/workflow/blocks/helpers/xhsCliArgs.js +80 -0
  122. package/dist/modules/workflow/blocks/helpers/xhsCommentDom.js +805 -0
  123. package/dist/modules/workflow/blocks/helpers/xhsNoteOrganizer.js +140 -0
  124. package/dist/modules/workflow/blocks/restore/RestorePhaseBlock.js +204 -0
  125. package/dist/modules/workflow/config/workflowRegistry.js +32 -0
  126. package/dist/modules/workflow/definitions/batch-collect-workflow.js +63 -0
  127. package/dist/modules/workflow/definitions/scroll-extract-workflow.js +74 -0
  128. package/dist/modules/workflow/definitions/xiaohongshu-collect-workflow-v2.js +81 -0
  129. package/dist/modules/workflow/definitions/xiaohongshu-collect-workflow.js +57 -0
  130. package/dist/modules/workflow/definitions/xiaohongshu-full-collect-workflow-v3.js +68 -0
  131. package/dist/modules/workflow/definitions/xiaohongshu-note-collect.js +49 -0
  132. package/dist/modules/workflow/definitions/xiaohongshu-phase1-workflow-v3.js +30 -0
  133. package/dist/modules/workflow/definitions/xiaohongshu-phase2-links-workflow-v3.js +40 -0
  134. package/dist/modules/workflow/definitions/xiaohongshu-phase3-collect-workflow-v1.js +54 -0
  135. package/dist/modules/workflow/definitions/xiaohongshu-phase34-from-links-workflow-v3.js +25 -0
  136. package/dist/modules/workflow/src/WeiboEventDrivenWorkflowRunner.js +308 -0
  137. package/dist/modules/workflow/src/context.js +70 -0
  138. package/dist/modules/workflow/src/index.js +5 -0
  139. package/dist/modules/workflow/src/orchestrator.js +230 -0
  140. package/dist/modules/workflow/src/runner.js +55 -0
  141. package/dist/modules/workflow/src/runtime.js +70 -0
  142. package/dist/modules/workflow/workflows/WeiboFeedExtractionWorkflow.js +359 -0
  143. package/dist/modules/workflow/workflows/XiaohongshuLoginWorkflow.js +110 -0
  144. package/dist/modules/xiaohongshu/app/src/blocks/MatchCommentsBlock.js +139 -0
  145. package/dist/modules/xiaohongshu/app/src/blocks/Phase1EnsureServicesBlock.js +36 -0
  146. package/dist/modules/xiaohongshu/app/src/blocks/Phase1MonitorCookieBlock.js +213 -0
  147. package/dist/modules/xiaohongshu/app/src/blocks/Phase1StartProfileBlock.js +121 -0
  148. package/dist/modules/xiaohongshu/app/src/blocks/Phase2CollectLinksBlock.js +1249 -0
  149. package/dist/modules/xiaohongshu/app/src/blocks/Phase2SearchBlock.js +703 -0
  150. package/dist/modules/xiaohongshu/app/src/blocks/Phase34CloseDetailBlock.js +41 -0
  151. package/dist/modules/xiaohongshu/app/src/blocks/Phase34CloseTabsBlock.js +44 -0
  152. package/dist/modules/xiaohongshu/app/src/blocks/Phase34CollectCommentsBlock.js +150 -0
  153. package/dist/modules/xiaohongshu/app/src/blocks/Phase34ExtractDetailBlock.js +117 -0
  154. package/dist/modules/xiaohongshu/app/src/blocks/Phase34OpenDetailBlock.js +102 -0
  155. package/dist/modules/xiaohongshu/app/src/blocks/Phase34OpenTabsBlock.js +109 -0
  156. package/dist/modules/xiaohongshu/app/src/blocks/Phase34PersistDetailBlock.js +117 -0
  157. package/dist/modules/xiaohongshu/app/src/blocks/Phase34ProcessSingleNoteBlock.js +114 -0
  158. package/dist/modules/xiaohongshu/app/src/blocks/Phase34ValidateLinksBlock.js +90 -0
  159. package/dist/modules/xiaohongshu/app/src/blocks/Phase3InteractBlock.js +1009 -0
  160. package/dist/modules/xiaohongshu/app/src/blocks/Phase4MultiTabHarvestBlock.js +233 -0
  161. package/dist/modules/xiaohongshu/app/src/blocks/ReplyInteractBlock.js +291 -0
  162. package/dist/modules/xiaohongshu/app/src/blocks/XhsDiscoverFallbackBlock.js +240 -0
  163. package/dist/modules/xiaohongshu/app/src/blocks/helpers/commentMatchDsl.js +126 -0
  164. package/dist/modules/xiaohongshu/app/src/blocks/helpers/commentMatcher.js +99 -0
  165. package/dist/modules/xiaohongshu/app/src/blocks/helpers/evidence.js +27 -0
  166. package/dist/modules/xiaohongshu/app/src/blocks/helpers/sharding.js +42 -0
  167. package/dist/modules/xiaohongshu/app/src/blocks/helpers/xhsComments.js +270 -0
  168. package/dist/modules/xiaohongshu/app/src/index.js +9 -0
  169. package/dist/modules/xiaohongshu/app/src/utils/checkpoints.js +222 -0
  170. package/dist/modules/xiaohongshu/app/src/utils/controllerAction.js +43 -0
  171. package/dist/services/controller/src/controller.js +1476 -0
  172. package/dist/services/controller/src/index.js +2 -0
  173. package/dist/services/controller/src/payload-normalizer.js +129 -0
  174. package/dist/services/shared/heartbeat.js +120 -0
  175. package/dist/services/shared/lib/errorHandler.js +2 -0
  176. package/dist/services/shared/serviceProcessLogger.js +139 -0
  177. package/dist/services/unified-api/RemoteBrowserSession.js +176 -0
  178. package/dist/services/unified-api/RemoteSessionManager.js +148 -0
  179. package/dist/services/unified-api/container-operations-handler.js +115 -0
  180. package/dist/services/unified-api/server.js +652 -0
  181. package/dist/services/unified-api/state-registry.js +274 -0
  182. package/dist/services/unified-api/task-persistence.js +66 -0
  183. package/dist/services/unified-api/task-state.js +130 -0
  184. package/modules/camo-runtime/src/autoscript/action-providers/xhs/search.mjs +12 -5
  185. package/modules/xiaohongshu/app/pnpm-lock.yaml +24 -0
  186. package/package.json +37 -9
  187. package/.beads/README.md +0 -81
  188. package/.beads/config.yaml +0 -67
  189. package/.beads/interactions.jsonl +0 -0
  190. package/.beads/issues.jsonl +0 -180
  191. package/.beads/metadata.json +0 -4
  192. package/.claude/settings.local.json +0 -10
  193. package/.github/workflows/ci.yml +0 -55
  194. package/AGENTS.md +0 -253
  195. package/apps/desktop-console/README.md +0 -27
  196. package/apps/desktop-console/package-lock.json +0 -897
  197. package/apps/desktop-console/package.json +0 -20
  198. package/apps/desktop-console/scripts/build-and-install.mjs +0 -19
  199. package/apps/desktop-console/scripts/build.mjs +0 -45
  200. package/apps/desktop-console/scripts/test-preload.mjs +0 -13
  201. package/apps/desktop-console/src/main/config.mts +0 -26
  202. package/apps/desktop-console/src/main/core-daemon-manager.mts +0 -131
  203. package/apps/desktop-console/src/main/desktop-settings.mts +0 -267
  204. package/apps/desktop-console/src/main/heartbeat-watchdog.mts +0 -50
  205. package/apps/desktop-console/src/main/heartbeat-watchdog.test.mts +0 -68
  206. package/apps/desktop-console/src/main/index-streaming.test.mts +0 -20
  207. package/apps/desktop-console/src/main/index.mts +0 -980
  208. package/apps/desktop-console/src/main/profile-store.mts +0 -239
  209. package/apps/desktop-console/src/main/profile-store.test.mts +0 -54
  210. package/apps/desktop-console/src/main/state-bridge.mts +0 -114
  211. package/apps/desktop-console/src/main/task-state-types.ts +0 -32
  212. package/apps/desktop-console/src/renderer/hooks/use-task-state.mts +0 -120
  213. package/apps/desktop-console/src/renderer/index.mts +0 -133
  214. package/apps/desktop-console/src/renderer/index.test.mts +0 -34
  215. package/apps/desktop-console/src/renderer/path-helpers.mts +0 -46
  216. package/apps/desktop-console/src/renderer/path-helpers.test.mts +0 -14
  217. package/apps/desktop-console/src/renderer/tabs/debug.mts +0 -48
  218. package/apps/desktop-console/src/renderer/tabs/debug.test.mts +0 -22
  219. package/apps/desktop-console/src/renderer/tabs/logs.mts +0 -421
  220. package/apps/desktop-console/src/renderer/tabs/logs.test.mts +0 -27
  221. package/apps/desktop-console/src/renderer/tabs/preflight.mts +0 -486
  222. package/apps/desktop-console/src/renderer/tabs/preflight.test.mts +0 -33
  223. package/apps/desktop-console/src/renderer/tabs/profile-pool.mts +0 -213
  224. package/apps/desktop-console/src/renderer/tabs/results.mts +0 -171
  225. package/apps/desktop-console/src/renderer/tabs/run.test.mts +0 -63
  226. package/apps/desktop-console/src/renderer/tabs/runtime.mts +0 -151
  227. package/apps/desktop-console/src/renderer/tabs/settings.mts +0 -146
  228. package/apps/desktop-console/src/renderer/tabs/xiaohongshu/account-flow.mts +0 -486
  229. package/apps/desktop-console/src/renderer/tabs/xiaohongshu/guide-browser-check.mts +0 -56
  230. package/apps/desktop-console/src/renderer/tabs/xiaohongshu/helpers.mts +0 -262
  231. package/apps/desktop-console/src/renderer/tabs/xiaohongshu/layout-block.mts +0 -430
  232. package/apps/desktop-console/src/renderer/tabs/xiaohongshu/live-stats.mts +0 -847
  233. package/apps/desktop-console/src/renderer/tabs/xiaohongshu/run-flow.mts +0 -443
  234. package/apps/desktop-console/src/renderer/tabs/xiaohongshu-state.mts +0 -425
  235. package/apps/desktop-console/src/renderer/tabs/xiaohongshu.mts +0 -497
  236. package/apps/desktop-console/src/renderer/tabs/xiaohongshu.test.mts +0 -291
  237. package/apps/desktop-console/src/renderer/ui-components.mts +0 -31
  238. package/docs/README_camoufox_chinese.md +0 -141
  239. package/docs/USAGE_V3.md +0 -163
  240. package/docs/arch/OCR_MACOS_PLUGIN.md +0 -39
  241. package/docs/arch/PORTS.md +0 -40
  242. package/docs/arch/REGRESSION_CHECKLIST.md +0 -121
  243. package/docs/arch/SEARCH_GATE.md +0 -224
  244. package/docs/arch/VIEWPORT_SAFETY.md +0 -182
  245. package/docs/arch/XIAOHONGSHU_OFFLINE_MOCK_DESIGN.md +0 -267
  246. package/docs/xiaohongshu-container-driven-summary.md +0 -221
  247. package/docs/xiaohongshu-full-collect-runbook.md +0 -134
  248. package/docs/xiaohongshu-next-steps.md +0 -228
  249. package/docs/xiaohongshu-quickstart.md +0 -73
  250. package/docs/xiaohongshu-workflow-summary.md +0 -227
  251. package/modules/container-registry/tests/container-registry.test.ts +0 -16
  252. package/modules/logging/tests/logging.test.ts +0 -38
  253. package/modules/operations/tests/operations.test.ts +0 -22
  254. package/modules/operations/tests/viewport-filter.test.ts +0 -161
  255. package/modules/operations/tests/visible-only.test.ts +0 -250
  256. package/modules/session-manager/tests/session-manager.test.ts +0 -23
  257. package/modules/state/src/atomic-json.test.ts +0 -30
  258. package/modules/state/src/paths.test.ts +0 -59
  259. package/modules/state/src/xiaohongshu-collect-state.test.ts +0 -259
  260. package/modules/workflow/blocks/AnchorVerificationBlock.d.ts.map +0 -1
  261. package/modules/workflow/blocks/AnchorVerificationBlock.js.map +0 -1
  262. package/modules/workflow/blocks/DetectPageStateBlock.d.ts.map +0 -1
  263. package/modules/workflow/blocks/DetectPageStateBlock.js.map +0 -1
  264. package/modules/workflow/blocks/ErrorRecoveryBlock.d.ts.map +0 -1
  265. package/modules/workflow/blocks/ErrorRecoveryBlock.js.map +0 -1
  266. package/modules/workflow/blocks/WaitSearchPermitBlock.d.ts.map +0 -1
  267. package/modules/workflow/blocks/WaitSearchPermitBlock.js.map +0 -1
  268. package/modules/workflow/blocks/helpers/containerAnchors.d.ts.map +0 -1
  269. package/modules/workflow/blocks/helpers/containerAnchors.js.map +0 -1
  270. package/modules/workflow/blocks/helpers/downloadPaths.test.ts +0 -62
  271. package/modules/workflow/blocks/helpers/mergeXhsMarkdown.test.ts +0 -121
  272. package/modules/workflow/blocks/helpers/operationLogger.d.ts.map +0 -1
  273. package/modules/workflow/blocks/helpers/operationLogger.js.map +0 -1
  274. package/modules/workflow/blocks/helpers/persistedNotes.test.ts +0 -268
  275. package/modules/workflow/blocks/helpers/searchPageState.d.ts.map +0 -1
  276. package/modules/workflow/blocks/helpers/searchPageState.js.map +0 -1
  277. package/modules/workflow/blocks/helpers/targetCountMode.test.ts +0 -29
  278. package/modules/workflow/blocks/helpers/xhsCliArgs.test.ts +0 -75
  279. package/modules/workflow/tests/smartReply.test.ts +0 -32
  280. package/modules/xiaohongshu/app/src/blocks/Phase3Interact.matcher.test.ts +0 -33
  281. package/modules/xiaohongshu/app/src/utils/__tests__/checkpoints.test.ts +0 -141
  282. package/modules/xiaohongshu/app/tests/commentMatchDsl.test.ts +0 -50
  283. package/modules/xiaohongshu/app/tests/commentMatcher.test.ts +0 -46
  284. package/modules/xiaohongshu/app/tests/sharding.test.ts +0 -31
  285. package/package-scripts.json +0 -8
  286. package/runtime/infra/utils/README.md +0 -13
  287. package/runtime/infra/utils/scripts/README.md +0 -0
  288. package/runtime/infra/utils/scripts/development/eval-in-session.mjs +0 -40
  289. package/runtime/infra/utils/scripts/development/highlight-search-containers.mjs +0 -35
  290. package/runtime/infra/utils/scripts/service/kill-port.mjs +0 -24
  291. package/runtime/infra/utils/scripts/service/start-api.mjs +0 -39
  292. package/runtime/infra/utils/scripts/service/start-browser-service.mjs +0 -106
  293. package/runtime/infra/utils/scripts/service/stop-api.mjs +0 -18
  294. package/runtime/infra/utils/scripts/service/stop-browser-service.mjs +0 -104
  295. package/runtime/infra/utils/scripts/test-services.mjs +0 -94
  296. package/services/shared/heartbeat.test.ts +0 -102
  297. package/services/unified-api/__tests__/task-state.test.ts +0 -95
  298. package/sitecustomize.py +0 -19
  299. package/tests/README.md +0 -194
  300. package/tests/e2e/workflows/weibo-feed-extraction.test.ts +0 -171
  301. package/tests/fixtures/data/container-definitions.json +0 -67
  302. package/tests/fixtures/pages/simple-page.html +0 -69
  303. package/tests/integration/01-test-container-match.mjs +0 -188
  304. package/tests/integration/02-test-dom-branch.mjs +0 -161
  305. package/tests/integration/03-test-container-operation-system.mjs +0 -91
  306. package/tests/integration/05-test-container-lifecycle-events.mjs +0 -224
  307. package/tests/integration/05-test-container-lifecycle-with-events.mjs +0 -250
  308. package/tests/integration/06-test-container-dom-tree-drawing.mjs +0 -256
  309. package/tests/integration/07-test-weibo-container-lifecycle.mjs +0 -355
  310. package/tests/integration/08-test-weibo-feed-workflow.test.mjs +0 -164
  311. package/tests/integration/10-test-visual-analyzer.mjs +0 -312
  312. package/tests/integration/11-test-visual-loop.mjs +0 -284
  313. package/tests/integration/12-test-simple-visual-loop.mjs +0 -242
  314. package/tests/integration/13-test-visual-robust.mjs +0 -185
  315. package/tests/integration/14-test-visual-highlight-loop.mjs +0 -271
  316. package/tests/integration/inspect-page.mjs +0 -50
  317. package/tests/integration/run-all-tests.mjs +0 -95
  318. package/tests/patch_verification/CODEX_PATCH_TEST.md +0 -103
  319. package/tests/patch_verification/PHASE2_ANALYSIS.md +0 -179
  320. package/tests/patch_verification/PHASE2_OPTIMIZATION_REPORT.md +0 -55
  321. package/tests/patch_verification/PHASE2_TO_PHASE4_SUMMARY.md +0 -126
  322. package/tests/patch_verification/QUICK_TEST_SEQUENCE.md +0 -262
  323. package/tests/patch_verification/README.md +0 -143
  324. package/tests/patch_verification/RUN_TESTS.md +0 -60
  325. package/tests/patch_verification/TEST_EXECUTION.md +0 -99
  326. package/tests/patch_verification/TEST_PLAN.md +0 -328
  327. package/tests/patch_verification/TEST_RESULTS.md +0 -34
  328. package/tests/patch_verification/TOOL_TEST_PLAN.md +0 -48
  329. package/tests/patch_verification/run-tool-test.mjs +0 -121
  330. package/tests/patch_verification/temp_test_files/test01.txt +0 -1
  331. package/tests/patch_verification/temp_test_files/test02.txt +0 -3
  332. package/tests/patch_verification/temp_test_files/test02_gnu.txt +0 -3
  333. package/tests/patch_verification/temp_test_files/test03.txt +0 -1
  334. package/tests/patch_verification/temp_test_files/test03_multiline.txt +0 -5
  335. package/tests/patch_verification/temp_test_files/test04_function.ts +0 -5
  336. package/tests/patch_verification/temp_test_files/test05_import.ts +0 -4
  337. package/tests/patch_verification/temp_test_files/test06_special_chars.txt +0 -4
  338. package/tests/patch_verification/temp_test_files/test07_indentation.ts +0 -5
  339. package/tests/patch_verification/temp_test_files/test08_mismatch.txt +0 -1
  340. package/tests/patch_verification/temp_test_files/test_add_02.txt +0 -3
  341. package/tests/patch_verification/temp_test_files/test_simple.txt +0 -1
  342. package/tests/runner/TestReporter.mjs +0 -57
  343. package/tests/runner/TestRunner.mjs +0 -244
  344. package/tests/unit/commands/profile.test.mjs +0 -10
  345. package/tests/unit/container/change-notifier.test.mjs +0 -181
  346. package/tests/unit/lifecycle/session-registry.test.mjs +0 -135
  347. package/tests/unit/operations/registry.test.ts +0 -73
  348. package/tests/unit/utils/browser-service.test.mjs +0 -153
  349. package/tests/unit/utils/config.test.mjs +0 -166
  350. package/tests/unit/utils/fingerprint.test.mjs +0 -166
  351. package/tsconfig.json +0 -31
  352. package/tsconfig.services.json +0 -26
  353. /package/apps/desktop-console/{src → dist}/renderer/index.html +0 -0
  354. /package/apps/desktop-console/{src/renderer/tabs → dist/renderer}/run.mts +0 -0
@@ -0,0 +1,140 @@
1
+ import path from 'node:path';
2
+ import { promises as fs } from 'node:fs';
3
+ import { isImageFile, ocrImagesWithMacPlugin, pickMacOcrLanguages } from './macosVisionOcrPlugin.js';
4
+ function readLineValue(md, prefix) {
5
+ const re = new RegExp(`^${prefix}\\s*(.+)$`, 'm');
6
+ const m = md.match(re);
7
+ return m ? String(m[1] ?? '').trim() : null;
8
+ }
9
+ export async function organizeOneNote(options) {
10
+ const noteDir = options.noteDir;
11
+ const noteId = options.noteId;
12
+ const keyword = options.keyword;
13
+ const contentPath = path.join(noteDir, 'content.md');
14
+ const commentsPath = path.join(noteDir, 'comments.md');
15
+ const imagesDir = path.join(noteDir, 'images');
16
+ const ocrPath = path.join(noteDir, 'ocr.md');
17
+ const mergedPath = path.join(noteDir, 'merged.md');
18
+ const content = await fs.readFile(contentPath, 'utf-8');
19
+ const comments = await fs.readFile(commentsPath, 'utf-8');
20
+ const link = readLineValue(content, '- 链接:') || undefined;
21
+ let imageFiles = [];
22
+ try {
23
+ const ents = await fs.readdir(imagesDir, { withFileTypes: true });
24
+ imageFiles = ents
25
+ .filter((e) => e.isFile())
26
+ .map((e) => e.name)
27
+ .filter((n) => isImageFile(n))
28
+ .sort();
29
+ }
30
+ catch {
31
+ imageFiles = [];
32
+ }
33
+ const picked = pickMacOcrLanguages(options.ocrLanguages);
34
+ const ocrLanguagesUsed = picked.languages;
35
+ let ocrErrors = 0;
36
+ let ocrMd = null;
37
+ const runOcr = options.runOcr !== false;
38
+ if (runOcr) {
39
+ const absImages = imageFiles.map((img) => path.join(imagesDir, img));
40
+ const ocr = imageFiles.length
41
+ ? await ocrImagesWithMacPlugin(absImages, { languages: ocrLanguagesUsed, timeoutMs: 120_000 })
42
+ : { languagesUsed: ocrLanguagesUsed, results: [], binPath: '' };
43
+ const byImage = new Map();
44
+ for (const r of ocr.results) {
45
+ byImage.set(String(r.image || '').trim(), { text: r.text, error: r.error });
46
+ }
47
+ const lines = [];
48
+ lines.push(`# OCR(${imageFiles.length})`);
49
+ lines.push('');
50
+ lines.push(`- Note ID: ${noteId}`);
51
+ lines.push(`- 关键词: ${keyword}`);
52
+ if (link)
53
+ lines.push(`- 链接: ${link}`);
54
+ lines.push(`- OCR 语言: ${ocrLanguagesUsed}`);
55
+ lines.push('');
56
+ if (imageFiles.length === 0) {
57
+ lines.push('(无图片或 images/ 目录不存在)');
58
+ lines.push('');
59
+ }
60
+ else {
61
+ for (const img of imageFiles) {
62
+ const imgPath = path.join(imagesDir, img);
63
+ const rel = `images/${img}`;
64
+ const res = byImage.get(imgPath) || {};
65
+ lines.push(`## ${rel}`);
66
+ lines.push('');
67
+ if (res.error) {
68
+ ocrErrors += 1;
69
+ lines.push(`> OCR 失败: ${res.error}`);
70
+ lines.push('');
71
+ }
72
+ const text = String(res.text || '').trim();
73
+ if (text) {
74
+ lines.push('```');
75
+ lines.push(text);
76
+ lines.push('```');
77
+ }
78
+ else {
79
+ lines.push('(无可识别文字)');
80
+ }
81
+ lines.push('');
82
+ }
83
+ }
84
+ ocrMd = `${lines.join('\n')}\n`;
85
+ await fs.writeFile(ocrPath, ocrMd, 'utf-8');
86
+ }
87
+ else {
88
+ try {
89
+ ocrMd = await fs.readFile(ocrPath, 'utf-8');
90
+ }
91
+ catch {
92
+ if (options.requireExistingOcr) {
93
+ throw new Error(`missing ocr.md (requireExistingOcr=true): ${ocrPath}`);
94
+ }
95
+ const lines = [];
96
+ lines.push(`# OCR(${imageFiles.length})`);
97
+ lines.push('');
98
+ lines.push(`- Note ID: ${noteId}`);
99
+ lines.push(`- 关键词: ${keyword}`);
100
+ if (link)
101
+ lines.push(`- 链接: ${link}`);
102
+ lines.push(`- OCR 语言: ${ocrLanguagesUsed}`);
103
+ lines.push(`- OCR: skipped`);
104
+ lines.push('');
105
+ ocrMd = `${lines.join('\n')}\n`;
106
+ await fs.writeFile(ocrPath, ocrMd, 'utf-8');
107
+ }
108
+ }
109
+ const mergedLines = [];
110
+ mergedLines.push(`# 合并(${noteId})`);
111
+ mergedLines.push('');
112
+ mergedLines.push(`- Note ID: ${noteId}`);
113
+ mergedLines.push(`- 关键词: ${keyword}`);
114
+ if (link)
115
+ mergedLines.push(`- 链接: ${link}`);
116
+ mergedLines.push('');
117
+ mergedLines.push('## 正文');
118
+ mergedLines.push('');
119
+ mergedLines.push(content.trim());
120
+ mergedLines.push('');
121
+ mergedLines.push('## OCR');
122
+ mergedLines.push('');
123
+ mergedLines.push(String(ocrMd || '').trim());
124
+ mergedLines.push('');
125
+ mergedLines.push('## 评论');
126
+ mergedLines.push('');
127
+ mergedLines.push(comments.trim());
128
+ mergedLines.push('');
129
+ await fs.writeFile(mergedPath, `${mergedLines.join('\n')}\n`, 'utf-8');
130
+ return {
131
+ noteId,
132
+ ocrPath,
133
+ mergedPath,
134
+ imageCount: imageFiles.length,
135
+ ocrErrors,
136
+ ocrLanguagesUsed,
137
+ ...(link ? { link } : {}),
138
+ };
139
+ }
140
+ //# sourceMappingURL=xhsNoteOrganizer.js.map
@@ -0,0 +1,204 @@
1
+ /**
2
+ * RestorePhaseBlock
3
+ *
4
+ * 基于 URL + 容器匹配恢复到指定阶段(Phase 入口锚点),用于 Phase1–4 的“回归锚点”能力。
5
+ *
6
+ * 约定:
7
+ * - phase=1: 期望在 home/login(交给 Phase1 自己处理)
8
+ * - phase=2: 期望在搜索入口阶段(home 或 search_result)
9
+ * - phase=3: 期望在搜索结果阶段(search_result)
10
+ * - phase=4: 期望在详情页阶段(detail)
11
+ *
12
+ * 恢复策略(小红书):
13
+ * - 当前在 detail:优先使用 ErrorRecoveryBlock(ESC) 关闭模态框,回到 search_result/home
14
+ * - 当前在风控/未知页面:优先点击“发现页” sidebar 容器按钮(home/search.discover_button),回到首页
15
+ * - 当前在 login:交给上层 Phase1 处理,不在此处强行导航
16
+ */
17
+ import { execute as detectPageState } from '../DetectPageStateBlock.js';
18
+ import { execute as errorRecovery } from '../ErrorRecoveryBlock.js';
19
+ import { logControllerActionError, logControllerActionResult, logControllerActionStart, } from '../helpers/operationLogger.js';
20
+ function expectedStageForPhase(phase) {
21
+ switch (phase) {
22
+ case 1:
23
+ return ['home', 'login', 'unknown'];
24
+ case 2:
25
+ return ['home', 'search'];
26
+ case 3:
27
+ return ['search'];
28
+ case 4:
29
+ return ['detail'];
30
+ default:
31
+ return ['unknown'];
32
+ }
33
+ }
34
+ function choosePhaseFromStage(stage) {
35
+ if (stage === 'detail')
36
+ return 4;
37
+ if (stage === 'search')
38
+ return 3;
39
+ if (stage === 'home')
40
+ return 2;
41
+ if (stage === 'login')
42
+ return 1;
43
+ return 1;
44
+ }
45
+ export async function execute(input) {
46
+ const { sessionId, phase, serviceUrl = 'http://127.0.0.1:7701' } = input;
47
+ const controllerUrl = `${serviceUrl}/v1/controller/action`;
48
+ async function controllerAction(action, payload = {}) {
49
+ const opId = logControllerActionStart(action, payload, { source: 'RestorePhaseBlock' });
50
+ try {
51
+ const res = await fetch(controllerUrl, {
52
+ method: 'POST',
53
+ headers: { 'Content-Type': 'application/json' },
54
+ body: JSON.stringify({ action, payload }),
55
+ });
56
+ if (!res.ok) {
57
+ throw new Error(`HTTP ${res.status}: ${await res.text()}`);
58
+ }
59
+ const data = await res.json();
60
+ const result = data.data || data;
61
+ logControllerActionResult(opId, action, result, { source: 'RestorePhaseBlock' });
62
+ return result;
63
+ }
64
+ catch (error) {
65
+ logControllerActionError(opId, action, error, payload, { source: 'RestorePhaseBlock' });
66
+ throw error;
67
+ }
68
+ }
69
+ async function clickDiscoverButton() {
70
+ const candidates = [
71
+ 'xiaohongshu_home.discover_button',
72
+ 'xiaohongshu_search.discover_button',
73
+ ];
74
+ for (const containerId of candidates) {
75
+ try {
76
+ await controllerAction('container:operation', {
77
+ containerId,
78
+ operationId: 'click',
79
+ config: { useSystemMouse: true },
80
+ sessionId,
81
+ });
82
+ // 给页面一点时间完成导航
83
+ await new Promise((resolve) => setTimeout(resolve, 1500));
84
+ return { success: true, method: `discover:${containerId}` };
85
+ }
86
+ catch {
87
+ // 尝试下一个候选
88
+ }
89
+ }
90
+ return { success: false };
91
+ }
92
+ try {
93
+ // 1) 检测当前阶段(入口锚点)
94
+ const state = await detectPageState({
95
+ sessionId,
96
+ platform: 'xiaohongshu',
97
+ serviceUrl,
98
+ });
99
+ const expectedStages = expectedStageForPhase(phase);
100
+ if (state.success && expectedStages.includes(state.stage)) {
101
+ // 已经在本 Phase 允许的阶段,不做任何操作
102
+ return {
103
+ success: true,
104
+ restored: false,
105
+ finalPhase: phase,
106
+ finalStage: state.stage,
107
+ url: state.url,
108
+ method: 'already-at-expected-stage',
109
+ error: state.error,
110
+ };
111
+ }
112
+ let currentStage = state.stage;
113
+ let currentUrl = state.url;
114
+ let method;
115
+ // 2) 针对不同阶段执行恢复策略
116
+ if (currentStage === 'detail') {
117
+ // 使用 ErrorRecoveryBlock 的 ESC 模式关闭详情模态框
118
+ const rec = await errorRecovery({
119
+ sessionId,
120
+ fromStage: 'detail',
121
+ targetStage: 'search',
122
+ serviceUrl,
123
+ recoveryMode: 'esc',
124
+ maxRetries: 2,
125
+ });
126
+ if (!rec.success) {
127
+ return {
128
+ success: false,
129
+ restored: false,
130
+ finalPhase: phase,
131
+ finalStage: currentStage,
132
+ url: rec.currentUrl || currentUrl,
133
+ method: rec.method,
134
+ error: rec.error || 'ErrorRecoveryBlock failed',
135
+ };
136
+ }
137
+ method = `errorRecovery:${rec.method || 'esc'}`;
138
+ currentUrl = rec.currentUrl || currentUrl;
139
+ const after = await detectPageState({
140
+ sessionId,
141
+ platform: 'xiaohongshu',
142
+ serviceUrl,
143
+ });
144
+ currentStage = after.stage;
145
+ currentUrl = after.url;
146
+ }
147
+ else if (currentStage === 'login') {
148
+ // 登录页交给 Phase1 处理,不在此处强行导航
149
+ return {
150
+ success: false,
151
+ restored: false,
152
+ finalPhase: 1,
153
+ finalStage: 'login',
154
+ url: state.url,
155
+ method: 'login-delegate-phase1',
156
+ error: 'Current stage is login, please run Phase1 to complete login',
157
+ };
158
+ }
159
+ else {
160
+ // 风控/未知/其他页面:尝试点击发现页 sidebar 容器按钮
161
+ const clickRes = await clickDiscoverButton();
162
+ if (!clickRes.success) {
163
+ return {
164
+ success: false,
165
+ restored: false,
166
+ finalPhase: phase,
167
+ finalStage: currentStage,
168
+ url: currentUrl,
169
+ method: 'discover-button-failed',
170
+ error: 'Failed to click discover button to return home',
171
+ };
172
+ }
173
+ method = clickRes.method;
174
+ const after = await detectPageState({
175
+ sessionId,
176
+ platform: 'xiaohongshu',
177
+ serviceUrl,
178
+ });
179
+ currentStage = after.stage;
180
+ currentUrl = after.url;
181
+ }
182
+ const finalPhase = choosePhaseFromStage(currentStage);
183
+ return {
184
+ success: true,
185
+ restored: true,
186
+ finalPhase,
187
+ finalStage: currentStage,
188
+ url: currentUrl,
189
+ method,
190
+ error: state.error,
191
+ };
192
+ }
193
+ catch (error) {
194
+ return {
195
+ success: false,
196
+ restored: false,
197
+ finalPhase: phase,
198
+ finalStage: 'unknown',
199
+ url: '',
200
+ error: error?.message || String(error),
201
+ };
202
+ }
203
+ }
204
+ //# sourceMappingURL=RestorePhaseBlock.js.map
@@ -0,0 +1,32 @@
1
+ import { xiaohongshuCollectWorkflowV2 } from '../definitions/xiaohongshu-collect-workflow-v2.js';
2
+ import { xiaohongshuCollectWorkflow } from '../definitions/xiaohongshu-collect-workflow.js';
3
+ import { xiaohongshuNoteCollectWorkflow } from '../definitions/xiaohongshu-note-collect.js';
4
+ import { xiaohongshuFullCollectWorkflowV3 } from '../definitions/xiaohongshu-full-collect-workflow-v3.js';
5
+ import { xiaohongshuPhase3CollectWorkflowV1 } from '../definitions/xiaohongshu-phase3-collect-workflow-v1.js';
6
+ import { xiaohongshuPhase1WorkflowV3 } from '../definitions/xiaohongshu-phase1-workflow-v3.js';
7
+ import { xiaohongshuPhase2LinksWorkflowV3 } from '../definitions/xiaohongshu-phase2-links-workflow-v3.js';
8
+ import { xiaohongshuPhase34FromLinksWorkflowV3 } from '../definitions/xiaohongshu-phase34-from-links-workflow-v3.js';
9
+ const registry = new Map();
10
+ function register(def, idOverride) {
11
+ const id = idOverride || def.id;
12
+ if (!id) {
13
+ throw new Error('Workflow definition missing id');
14
+ }
15
+ registry.set(id, { ...def, id });
16
+ }
17
+ // 注册已有的小红书相关 workflow 定义
18
+ register(xiaohongshuCollectWorkflowV2, 'xiaohongshu-collect-v2');
19
+ register(xiaohongshuCollectWorkflow, 'xiaohongshu-collect-v1');
20
+ register(xiaohongshuNoteCollectWorkflow, 'xiaohongshu-note-collect');
21
+ register(xiaohongshuFullCollectWorkflowV3, 'xiaohongshu-collect-full-v3');
22
+ register(xiaohongshuPhase3CollectWorkflowV1, 'xiaohongshu-collect-phase3-v1');
23
+ register(xiaohongshuPhase1WorkflowV3, 'xiaohongshu-phase1-v3');
24
+ register(xiaohongshuPhase2LinksWorkflowV3, 'xiaohongshu-phase2-links-v3');
25
+ register(xiaohongshuPhase34FromLinksWorkflowV3, 'xiaohongshu-phase34-from-links-v3');
26
+ export function getWorkflowDefinition(id) {
27
+ return registry.get(id);
28
+ }
29
+ export function listWorkflowIds() {
30
+ return Array.from(registry.keys());
31
+ }
32
+ //# sourceMappingURL=workflowRegistry.js.map
@@ -0,0 +1,63 @@
1
+ /**
2
+ * 批量采集 Workflow 定义
3
+ *
4
+ * 采集150条微博并生成 Markdown
5
+ */
6
+ export const batchCollectWorkflow = {
7
+ id: 'weibo-batch-collect-150',
8
+ name: '微博批量采集150条',
9
+ config: {
10
+ targetCount: 150,
11
+ scrollDistance: 800,
12
+ stableWait: 10000,
13
+ outputPath: 'output/weibo/collect-150.md'
14
+ },
15
+ steps: [
16
+ {
17
+ blockName: 'StartBrowserService',
18
+ input: {
19
+ host: '127.0.0.1',
20
+ port: 7704
21
+ }
22
+ },
23
+ {
24
+ blockName: 'EnsureSession',
25
+ input: {
26
+ profileId: 'weibo_fresh',
27
+ url: 'https://weibo.com'
28
+ }
29
+ },
30
+ {
31
+ blockName: 'InitAutoScroll',
32
+ input: {
33
+ sessionId: '$sessionId',
34
+ scrollDistance: 800
35
+ }
36
+ },
37
+ {
38
+ blockName: 'CollectBatch',
39
+ input: {
40
+ sessionId: '$sessionId',
41
+ targetCount: 150,
42
+ containerSelector: '[class*="Feed_retweated"]',
43
+ scrollDistance: 800,
44
+ stableWait: 10000
45
+ }
46
+ },
47
+ {
48
+ blockName: 'RenderMarkdown',
49
+ input: {
50
+ posts: '$collectedPosts',
51
+ template: 'default'
52
+ }
53
+ },
54
+ {
55
+ blockName: 'SaveFile',
56
+ input: {
57
+ content: '$markdown',
58
+ path: 'output/weibo/collect-150.md'
59
+ }
60
+ }
61
+ ]
62
+ };
63
+ //# sourceMappingURL=batch-collect-workflow.js.map
@@ -0,0 +1,74 @@
1
+ /**
2
+ * 完整滚动+提取测试 Workflow 定义
3
+ *
4
+ * 组合 blocks 实现端到端数据采集
5
+ */
6
+ export const scrollExtractWorkflow = {
7
+ id: 'weibo-scroll-extract',
8
+ name: '微博滚动+提取完整流程',
9
+ steps: [
10
+ {
11
+ blockName: 'StartBrowserService',
12
+ input: {
13
+ host: '127.0.0.1',
14
+ port: 7704,
15
+ wsPort: 8765
16
+ }
17
+ },
18
+ {
19
+ blockName: 'EnsureSession',
20
+ input: {
21
+ profileId: 'weibo_fresh',
22
+ url: 'https://weibo.com',
23
+ serviceUrl: 'http://127.0.0.1:7704'
24
+ }
25
+ },
26
+ {
27
+ blockName: 'InitAutoScroll',
28
+ input: {
29
+ sessionId: '$sessionId',
30
+ scrollStrategy: 'smooth',
31
+ scrollDistance: 800
32
+ }
33
+ },
34
+ {
35
+ blockName: 'ScrollNextBatch',
36
+ input: {
37
+ sessionId: '$sessionId',
38
+ distance: 800,
39
+ behavior: 'smooth'
40
+ }
41
+ },
42
+ {
43
+ blockName: 'WaitStable',
44
+ input: {
45
+ sessionId: '$sessionId',
46
+ checkInterval: 500,
47
+ maxWait: 10000
48
+ }
49
+ },
50
+ {
51
+ blockName: 'MatchContainers',
52
+ input: {
53
+ sessionId: '$sessionId',
54
+ rootSelector: 'body'
55
+ }
56
+ },
57
+ {
58
+ blockName: 'ExtractPostFields',
59
+ input: {
60
+ sessionId: '$sessionId',
61
+ containerSelector: '[class*="Feed_retweeted"]',
62
+ index: 0
63
+ }
64
+ },
65
+ {
66
+ blockName: 'ValidateExtract',
67
+ input: {
68
+ fields: '$fields',
69
+ requiredFields: ['author', 'content']
70
+ }
71
+ }
72
+ ]
73
+ };
74
+ //# sourceMappingURL=scroll-extract-workflow.js.map
@@ -0,0 +1,81 @@
1
+ /**
2
+ * 小红书关键词采集 Workflow v2(容器驱动版)
3
+ *
4
+ * 新增:
5
+ * - WaitSearchPermitBlock:在执行搜索前先向 SearchGate 申请许可
6
+ */
7
+ export const xiaohongshuCollectWorkflowV2 = {
8
+ id: 'xiaohongshu-collect-v2',
9
+ name: '小红书关键词采集(容器驱动版)',
10
+ steps: [
11
+ {
12
+ blockName: 'EnsureSession',
13
+ input: {
14
+ profileId: '$sessionId',
15
+ url: 'https://www.xiaohongshu.com'
16
+ }
17
+ },
18
+ {
19
+ blockName: 'EnsureLoginBlock',
20
+ input: {
21
+ sessionId: '$sessionId',
22
+ maxWaitMs: 180000,
23
+ checkIntervalMs: 5000
24
+ }
25
+ },
26
+ {
27
+ blockName: 'WaitSearchPermitBlock',
28
+ input: {
29
+ sessionId: '$sessionId',
30
+ keyword: '$keyword',
31
+ }
32
+ },
33
+ {
34
+ blockName: 'GoToSearchBlock',
35
+ input: {
36
+ sessionId: '$sessionId',
37
+ keyword: '$keyword'
38
+ }
39
+ },
40
+ {
41
+ blockName: 'CollectSearchListBlock',
42
+ input: {
43
+ sessionId: '$sessionId',
44
+ targetCount: '$targetCount'
45
+ }
46
+ },
47
+ {
48
+ blockName: 'OpenDetailBlock',
49
+ input: {
50
+ sessionId: '$sessionId',
51
+ containerId: '$firstItemContainerId'
52
+ }
53
+ },
54
+ {
55
+ blockName: 'ExtractDetailBlock',
56
+ input: {
57
+ sessionId: '$sessionId'
58
+ }
59
+ },
60
+ {
61
+ blockName: 'WarmupCommentsBlock',
62
+ input: {
63
+ sessionId: '$sessionId',
64
+ maxRounds: 8
65
+ }
66
+ },
67
+ {
68
+ blockName: 'ExpandCommentsBlock',
69
+ input: {
70
+ sessionId: '$sessionId'
71
+ }
72
+ },
73
+ {
74
+ blockName: 'CloseDetailBlock',
75
+ input: {
76
+ sessionId: '$sessionId'
77
+ }
78
+ }
79
+ ]
80
+ };
81
+ //# sourceMappingURL=xiaohongshu-collect-workflow-v2.js.map
@@ -0,0 +1,57 @@
1
+ /**
2
+ * 小红书采集 Workflow 定义
3
+ */
4
+ export const xiaohongshuCollectWorkflow = {
5
+ id: 'xiaohongshu-collect',
6
+ name: '小红书关键词采集(已迁移到 v3 安全链路)',
7
+ steps: [
8
+ {
9
+ blockName: 'StartBrowserService',
10
+ input: {
11
+ host: '127.0.0.1',
12
+ port: 7704
13
+ }
14
+ },
15
+ {
16
+ blockName: 'EnsureSession',
17
+ input: {
18
+ profileId: '$sessionId',
19
+ url: 'https://www.xiaohongshu.com'
20
+ }
21
+ },
22
+ {
23
+ blockName: 'EnsureLoginBlock',
24
+ input: {
25
+ sessionId: '$sessionId',
26
+ maxWaitMs: 180000,
27
+ checkIntervalMs: 5000,
28
+ },
29
+ },
30
+ {
31
+ blockName: 'WaitSearchPermitBlock',
32
+ input: {
33
+ sessionId: '$sessionId',
34
+ keyword: '$keyword',
35
+ },
36
+ },
37
+ {
38
+ blockName: 'GoToSearchBlock',
39
+ input: {
40
+ sessionId: '$sessionId',
41
+ keyword: '$keyword',
42
+ },
43
+ },
44
+ {
45
+ blockName: 'XiaohongshuFullCollectBlock',
46
+ input: {
47
+ sessionId: '$sessionId',
48
+ keyword: '$keyword',
49
+ env: '$env',
50
+ targetCount: '$targetCount',
51
+ maxWarmupRounds: '$maxWarmupRounds',
52
+ allowClickCommentButton: '$allowClickCommentButton',
53
+ },
54
+ },
55
+ ]
56
+ };
57
+ //# sourceMappingURL=xiaohongshu-collect-workflow.js.map