@dyyz1993/agent-browser 0.9.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (187) hide show
  1. package/LICENSE +202 -0
  2. package/README.md +907 -0
  3. package/bin/agent-browser-darwin-arm64 +0 -0
  4. package/bin/agent-browser.js +120 -0
  5. package/dist/__tests__/e2e/utils/test-helpers.d.ts +5 -0
  6. package/dist/__tests__/e2e/utils/test-helpers.d.ts.map +1 -0
  7. package/dist/__tests__/e2e/utils/test-helpers.js +22 -0
  8. package/dist/__tests__/e2e/utils/test-helpers.js.map +1 -0
  9. package/dist/__tests__/test-iframe.d.ts +2 -0
  10. package/dist/__tests__/test-iframe.d.ts.map +1 -0
  11. package/dist/__tests__/test-iframe.js +52 -0
  12. package/dist/__tests__/test-iframe.js.map +1 -0
  13. package/dist/__tests__/utils/parseCli.d.ts +20 -0
  14. package/dist/__tests__/utils/parseCli.d.ts.map +1 -0
  15. package/dist/__tests__/utils/parseCli.js +1086 -0
  16. package/dist/__tests__/utils/parseCli.js.map +1 -0
  17. package/dist/actions.d.ts +50 -0
  18. package/dist/actions.d.ts.map +1 -0
  19. package/dist/actions.js +2164 -0
  20. package/dist/actions.js.map +1 -0
  21. package/dist/browser.d.ts +556 -0
  22. package/dist/browser.d.ts.map +1 -0
  23. package/dist/browser.js +2599 -0
  24. package/dist/browser.js.map +1 -0
  25. package/dist/cli/commands.d.ts +8 -0
  26. package/dist/cli/commands.d.ts.map +1 -0
  27. package/dist/cli/commands.js +1038 -0
  28. package/dist/cli/commands.js.map +1 -0
  29. package/dist/cli/connection.d.ts +50 -0
  30. package/dist/cli/connection.d.ts.map +1 -0
  31. package/dist/cli/connection.js +595 -0
  32. package/dist/cli/connection.js.map +1 -0
  33. package/dist/cli/flags.d.ts +36 -0
  34. package/dist/cli/flags.d.ts.map +1 -0
  35. package/dist/cli/flags.js +206 -0
  36. package/dist/cli/flags.js.map +1 -0
  37. package/dist/cli/help.d.ts +4 -0
  38. package/dist/cli/help.d.ts.map +1 -0
  39. package/dist/cli/help.js +1024 -0
  40. package/dist/cli/help.js.map +1 -0
  41. package/dist/cli/output.d.ts +14 -0
  42. package/dist/cli/output.d.ts.map +1 -0
  43. package/dist/cli/output.js +456 -0
  44. package/dist/cli/output.js.map +1 -0
  45. package/dist/cli-new.d.ts +3 -0
  46. package/dist/cli-new.d.ts.map +1 -0
  47. package/dist/cli-new.js +308 -0
  48. package/dist/cli-new.js.map +1 -0
  49. package/dist/cli-old.d.ts +3 -0
  50. package/dist/cli-old.d.ts.map +1 -0
  51. package/dist/cli-old.js +1101 -0
  52. package/dist/cli-old.js.map +1 -0
  53. package/dist/cli.d.ts +3 -0
  54. package/dist/cli.d.ts.map +1 -0
  55. package/dist/cli.js +403 -0
  56. package/dist/cli.js.map +1 -0
  57. package/dist/content-detection.d.ts +18 -0
  58. package/dist/content-detection.d.ts.map +1 -0
  59. package/dist/content-detection.js +68 -0
  60. package/dist/content-detection.js.map +1 -0
  61. package/dist/daemon.d.ts +55 -0
  62. package/dist/daemon.d.ts.map +1 -0
  63. package/dist/daemon.js +426 -0
  64. package/dist/daemon.js.map +1 -0
  65. package/dist/diff.d.ts +42 -0
  66. package/dist/diff.d.ts.map +1 -0
  67. package/dist/diff.js +166 -0
  68. package/dist/diff.js.map +1 -0
  69. package/dist/human-mouse.d.ts +31 -0
  70. package/dist/human-mouse.d.ts.map +1 -0
  71. package/dist/human-mouse.js +184 -0
  72. package/dist/human-mouse.js.map +1 -0
  73. package/dist/ios-actions.d.ts +11 -0
  74. package/dist/ios-actions.d.ts.map +1 -0
  75. package/dist/ios-actions.js +228 -0
  76. package/dist/ios-actions.js.map +1 -0
  77. package/dist/ios-manager.d.ts +266 -0
  78. package/dist/ios-manager.d.ts.map +1 -0
  79. package/dist/ios-manager.js +1076 -0
  80. package/dist/ios-manager.js.map +1 -0
  81. package/dist/message-bridge.d.ts +10 -0
  82. package/dist/message-bridge.d.ts.map +1 -0
  83. package/dist/message-bridge.js +60 -0
  84. package/dist/message-bridge.js.map +1 -0
  85. package/dist/protocol.d.ts +26 -0
  86. package/dist/protocol.d.ts.map +1 -0
  87. package/dist/protocol.js +912 -0
  88. package/dist/protocol.js.map +1 -0
  89. package/dist/recorder/binding.d.ts +24 -0
  90. package/dist/recorder/binding.d.ts.map +1 -0
  91. package/dist/recorder/binding.js +215 -0
  92. package/dist/recorder/binding.js.map +1 -0
  93. package/dist/recorder/index.d.ts +4 -0
  94. package/dist/recorder/index.d.ts.map +1 -0
  95. package/dist/recorder/index.js +4 -0
  96. package/dist/recorder/index.js.map +1 -0
  97. package/dist/recorder/inject.js +1913 -0
  98. package/dist/recorder/recorder.d.ts +19 -0
  99. package/dist/recorder/recorder.d.ts.map +1 -0
  100. package/dist/recorder/recorder.js +101 -0
  101. package/dist/recorder/recorder.js.map +1 -0
  102. package/dist/recorder/store.d.ts +22 -0
  103. package/dist/recorder/store.d.ts.map +1 -0
  104. package/dist/recorder/store.js +150 -0
  105. package/dist/recorder/store.js.map +1 -0
  106. package/dist/recorder/types.d.ts +73 -0
  107. package/dist/recorder/types.d.ts.map +1 -0
  108. package/dist/recorder/types.js +5 -0
  109. package/dist/recorder/types.js.map +1 -0
  110. package/dist/snapshot.d.ts +81 -0
  111. package/dist/snapshot.d.ts.map +1 -0
  112. package/dist/snapshot.js +1348 -0
  113. package/dist/snapshot.js.map +1 -0
  114. package/dist/stream-server-standalone.d.ts +38 -0
  115. package/dist/stream-server-standalone.d.ts.map +1 -0
  116. package/dist/stream-server-standalone.js +494 -0
  117. package/dist/stream-server-standalone.js.map +1 -0
  118. package/dist/stream-server.d.ts +214 -0
  119. package/dist/stream-server.d.ts.map +1 -0
  120. package/dist/stream-server.js +811 -0
  121. package/dist/stream-server.js.map +1 -0
  122. package/dist/types.d.ts +914 -0
  123. package/dist/types.d.ts.map +1 -0
  124. package/dist/types.js +4 -0
  125. package/dist/types.js.map +1 -0
  126. package/dist/viewer-html.d.ts +2 -0
  127. package/dist/viewer-html.d.ts.map +1 -0
  128. package/dist/viewer-html.js +185 -0
  129. package/dist/viewer-html.js.map +1 -0
  130. package/dist/viewer-script.d.ts +47 -0
  131. package/dist/viewer-script.d.ts.map +1 -0
  132. package/dist/viewer-script.js +586 -0
  133. package/dist/viewer-script.js.map +1 -0
  134. package/package.json +86 -0
  135. package/scripts/build-all-platforms.sh +68 -0
  136. package/scripts/check-version-sync.js +39 -0
  137. package/scripts/check_goods_container.js +35 -0
  138. package/scripts/check_page_content.js +36 -0
  139. package/scripts/click_applause_rate.js +30 -0
  140. package/scripts/copy-native.js +36 -0
  141. package/scripts/copy-recorder.js +21 -0
  142. package/scripts/e2e-test-recorder.ts +584 -0
  143. package/scripts/explore_jd_page.js +31 -0
  144. package/scripts/extract_all_jd_data.js +80 -0
  145. package/scripts/extract_jd_product_detail.js +62 -0
  146. package/scripts/extract_jd_products_correct_links.js +78 -0
  147. package/scripts/extract_jd_products_final.js +80 -0
  148. package/scripts/extract_jd_reviews.js +48 -0
  149. package/scripts/extract_jd_seafood_final.js +78 -0
  150. package/scripts/extract_multiple_products.js +77 -0
  151. package/scripts/extract_products_no_scroll.js +68 -0
  152. package/scripts/extract_products_simple.js +68 -0
  153. package/scripts/find_applause_rate.js +26 -0
  154. package/scripts/find_jd_links.js +28 -0
  155. package/scripts/find_main_content.js +20 -0
  156. package/scripts/find_product_cards.js +38 -0
  157. package/scripts/find_root_content.js +26 -0
  158. package/scripts/find_unique_products.js +55 -0
  159. package/scripts/get_jd_product_detail.js +16 -0
  160. package/scripts/get_jd_products.js +23 -0
  161. package/scripts/get_jd_seafood_products.js +44 -0
  162. package/scripts/get_product_details_from_images.js +54 -0
  163. package/scripts/postinstall.js +235 -0
  164. package/scripts/scroll_and_get_products.js +47 -0
  165. package/scripts/scroll_deep_and_find.js +45 -0
  166. package/scripts/sync-version.js +69 -0
  167. package/scripts/verify-baidu-enter.ts +116 -0
  168. package/skills/agent-browser/SKILL.md +310 -0
  169. package/skills/agent-browser/references/authentication.md +198 -0
  170. package/skills/agent-browser/references/commands.md +471 -0
  171. package/skills/agent-browser/references/data-extraction.md +377 -0
  172. package/skills/agent-browser/references/proxy-support.md +188 -0
  173. package/skills/agent-browser/references/session-management.md +197 -0
  174. package/skills/agent-browser/references/snapshot-refs.md +379 -0
  175. package/skills/agent-browser/references/video-recording.md +173 -0
  176. package/skills/agent-browser/templates/api-interception.sh +53 -0
  177. package/skills/agent-browser/templates/authenticated-session.sh +97 -0
  178. package/skills/agent-browser/templates/capture-workflow.sh +69 -0
  179. package/skills/agent-browser/templates/data-extraction.sh +210 -0
  180. package/skills/agent-browser/templates/form-automation.sh +62 -0
  181. package/skills/skill-creator/LICENSE.txt +202 -0
  182. package/skills/skill-creator/SKILL.md +356 -0
  183. package/skills/skill-creator/references/output-patterns.md +82 -0
  184. package/skills/skill-creator/references/workflows.md +28 -0
  185. package/skills/skill-creator/scripts/init_skill.py +303 -0
  186. package/skills/skill-creator/scripts/package_skill.py +113 -0
  187. package/skills/skill-creator/scripts/quick_validate.py +95 -0
@@ -0,0 +1,173 @@
1
+ # Video Recording
2
+
3
+ Capture browser automation as video for debugging, documentation, or verification.
4
+
5
+ **Related**: [commands.md](commands.md) for full command reference, [SKILL.md](../SKILL.md) for quick start.
6
+
7
+ ## Contents
8
+
9
+ - [Basic Recording](#basic-recording)
10
+ - [Recording Commands](#recording-commands)
11
+ - [Use Cases](#use-cases)
12
+ - [Best Practices](#best-practices)
13
+ - [Output Format](#output-format)
14
+ - [Limitations](#limitations)
15
+
16
+ ## Basic Recording
17
+
18
+ ```bash
19
+ # Start recording
20
+ agent-browser record start ./demo.webm
21
+
22
+ # Perform actions
23
+ agent-browser open https://example.com
24
+ agent-browser snapshot -i
25
+ agent-browser click @e1
26
+ agent-browser fill @e2 "test input"
27
+
28
+ # Stop and save
29
+ agent-browser record stop
30
+ ```
31
+
32
+ ## Recording Commands
33
+
34
+ ```bash
35
+ # Start recording to file
36
+ agent-browser record start ./output.webm
37
+
38
+ # Stop current recording
39
+ agent-browser record stop
40
+
41
+ # Restart with new file (stops current + starts new)
42
+ agent-browser record restart ./take2.webm
43
+ ```
44
+
45
+ ## Use Cases
46
+
47
+ ### Debugging Failed Automation
48
+
49
+ ```bash
50
+ #!/bin/bash
51
+ # Record automation for debugging
52
+
53
+ agent-browser record start ./debug-$(date +%Y%m%d-%H%M%S).webm
54
+
55
+ # Run your automation
56
+ agent-browser open https://app.example.com
57
+ agent-browser snapshot -i
58
+ agent-browser click @e1 || {
59
+ echo "Click failed - check recording"
60
+ agent-browser record stop
61
+ exit 1
62
+ }
63
+
64
+ agent-browser record stop
65
+ ```
66
+
67
+ ### Documentation Generation
68
+
69
+ ```bash
70
+ #!/bin/bash
71
+ # Record workflow for documentation
72
+
73
+ agent-browser record start ./docs/how-to-login.webm
74
+
75
+ agent-browser open https://app.example.com/login
76
+ agent-browser wait 1000 # Pause for visibility
77
+
78
+ agent-browser snapshot -i
79
+ agent-browser fill @e1 "demo@example.com"
80
+ agent-browser wait 500
81
+
82
+ agent-browser fill @e2 "password"
83
+ agent-browser wait 500
84
+
85
+ agent-browser click @e3
86
+ agent-browser wait --load networkidle
87
+ agent-browser wait 1000 # Show result
88
+
89
+ agent-browser record stop
90
+ ```
91
+
92
+ ### CI/CD Test Evidence
93
+
94
+ ```bash
95
+ #!/bin/bash
96
+ # Record E2E test runs for CI artifacts
97
+
98
+ TEST_NAME="${1:-e2e-test}"
99
+ RECORDING_DIR="./test-recordings"
100
+ mkdir -p "$RECORDING_DIR"
101
+
102
+ agent-browser record start "$RECORDING_DIR/$TEST_NAME-$(date +%s).webm"
103
+
104
+ # Run test
105
+ if run_e2e_test; then
106
+ echo "Test passed"
107
+ else
108
+ echo "Test failed - recording saved"
109
+ fi
110
+
111
+ agent-browser record stop
112
+ ```
113
+
114
+ ## Best Practices
115
+
116
+ ### 1. Add Pauses for Clarity
117
+
118
+ ```bash
119
+ # Slow down for human viewing
120
+ agent-browser click @e1
121
+ agent-browser wait 500 # Let viewer see result
122
+ ```
123
+
124
+ ### 2. Use Descriptive Filenames
125
+
126
+ ```bash
127
+ # Include context in filename
128
+ agent-browser record start ./recordings/login-flow-2024-01-15.webm
129
+ agent-browser record start ./recordings/checkout-test-run-42.webm
130
+ ```
131
+
132
+ ### 3. Handle Recording in Error Cases
133
+
134
+ ```bash
135
+ #!/bin/bash
136
+ set -e
137
+
138
+ cleanup() {
139
+ agent-browser record stop 2>/dev/null || true
140
+ agent-browser close 2>/dev/null || true
141
+ }
142
+ trap cleanup EXIT
143
+
144
+ agent-browser record start ./automation.webm
145
+ # ... automation steps ...
146
+ ```
147
+
148
+ ### 4. Combine with Screenshots
149
+
150
+ ```bash
151
+ # Record video AND capture key frames
152
+ agent-browser record start ./flow.webm
153
+
154
+ agent-browser open https://example.com
155
+ agent-browser screenshot ./screenshots/step1-homepage.png
156
+
157
+ agent-browser click @e1
158
+ agent-browser screenshot ./screenshots/step2-after-click.png
159
+
160
+ agent-browser record stop
161
+ ```
162
+
163
+ ## Output Format
164
+
165
+ - Default format: WebM (VP8/VP9 codec)
166
+ - Compatible with all modern browsers and video players
167
+ - Compressed but high quality
168
+
169
+ ## Limitations
170
+
171
+ - Recording adds slight overhead to automation
172
+ - Large recordings can consume significant disk space
173
+ - Some headless environments may have codec limitations
@@ -0,0 +1,53 @@
#!/bin/bash
# API Interception Template - Passively capture API responses
# Usage: ./api-interception.sh [target_url] [output_file] [request_pattern]
#
# Arguments (all optional):
#   target_url       Page to open once the request listener is armed
#                    (default: https://example.com/user/profile)
#   output_file      File that receives the `.body` field of the captured
#                    response (default: /tmp/api-response.json)
#   request_pattern  Value passed to `agent-browser wait --request`
#                    (default: api/)
#
# Requires: agent-browser, jq
#
# Proxy: this template does not force a proxy on the caller. If your network
# needs one, export it before running, e.g.
#   https_proxy=http://127.0.0.1:7890 ./api-interception.sh <url>
# NOTE(review): assumes agent-browser honours https_proxy - confirm.

set -u

TARGET_URL="${1:-https://example.com/user/profile}"
OUTPUT_FILE="${2:-/tmp/api-response.json}"
REQUEST_PATTERN="${3:-api/}"

# Private scratch file for the listener output. A unique name avoids clashes
# between concurrent runs and predictable-path problems in /tmp.
CAPTURE_FILE=$(mktemp "${TMPDIR:-/tmp}/api-captured.XXXXXX") || {
  echo "Error: could not create temporary file" >&2
  exit 1
}
trap 'rm -f -- "$CAPTURE_FILE"' EXIT

echo "=== 1. Close old session ==="
# Best effort: there may be no session to close.
agent-browser close 2>/dev/null
sleep 1

echo ""
echo "=== 2. Open blank page ==="
agent-browser open "about:blank"
sleep 1

echo ""
echo "=== 3. Start request listener in background ==="
# Only stdout goes into the capture file; diagnostics stay on stderr so an
# error message can never be mistaken for a captured response.
agent-browser wait --request "$REQUEST_PATTERN" --timeout 30000 > "$CAPTURE_FILE" &
WAIT_PID=$!
sleep 1

echo ""
echo "=== 4. Navigate to target page ==="
agent-browser open "$TARGET_URL"

echo ""
echo "=== 5. Wait for API response ==="
if ! wait "$WAIT_PID"; then
  echo "Warning: request listener exited with an error" >&2
fi

echo ""
echo "=== 6. Process captured data ==="
# Success requires both a non-empty capture and a successful jq extraction.
if [[ -s "$CAPTURE_FILE" ]] && jq '.body' "$CAPTURE_FILE" > "$OUTPUT_FILE"; then
  echo "Response saved to: $OUTPUT_FILE"
  echo ""
  echo "=== Preview ==="
  jq '.' "$OUTPUT_FILE" | head -50
else
  echo "Error: No response captured" >&2
  # Do not leave the browser running when bailing out.
  agent-browser close 2>/dev/null
  exit 1
fi

echo ""
echo "=== 7. Close browser ==="
agent-browser close

echo ""
echo "=== Done ==="
@@ -0,0 +1,97 @@
#!/bin/bash
# Template: Authenticated Session Workflow
# Purpose: Login once, save state, reuse for subsequent runs
# Usage: ./authenticated-session.sh <login-url> [state-file]
#
# Arguments:
#   login-url   URL of the login page (required)
#   state-file  Where browser state is stored (default: ./auth-state.json)
#
# Environment variables:
#   APP_USERNAME - Login username/email
#   APP_PASSWORD - Login password
#
# Two modes:
#   1. Discovery mode (default): Shows form structure so you can identify refs
#   2. Login mode: Performs actual login after you update the refs
#
# Setup steps:
#   1. Run once to see form structure (discovery mode)
#   2. Update refs in LOGIN FLOW section below
#   3. Set APP_USERNAME and APP_PASSWORD
#   4. Delete the DISCOVERY section

set -euo pipefail

LOGIN_URL="${1:?Usage: $0 <login-url> [state-file]}"
STATE_FILE="${2:-./auth-state.json}"

echo "Authentication workflow: $LOGIN_URL"

# ================================================================
# SAVED STATE: Skip login if valid saved state exists
# ================================================================
if [[ -f "$STATE_FILE" ]]; then
  echo "Loading saved state from $STATE_FILE..."
  # Test the load explicitly: under `set -e` an unreadable or stale state
  # file would otherwise abort the script instead of falling back to a
  # fresh login.
  if agent-browser state load "$STATE_FILE"; then
    agent-browser open "$LOGIN_URL"
    agent-browser wait --load networkidle

    # Heuristic: a restored session is expected to be redirected away from
    # any URL containing "login" or "signin".
    CURRENT_URL=$(agent-browser get url)
    if [[ "$CURRENT_URL" != *"login"* && "$CURRENT_URL" != *"signin"* ]]; then
      echo "Session restored successfully"
      agent-browser snapshot -i
      # The browser is left open here so the restored session can be used.
      exit 0
    fi
    echo "Session expired, performing fresh login..."
  else
    echo "Could not load $STATE_FILE, performing fresh login..." >&2
  fi
  rm -f -- "$STATE_FILE"
fi

# ================================================================
# DISCOVERY MODE: Shows form structure (delete after setup)
# ================================================================
echo "Opening login page..."
agent-browser open "$LOGIN_URL"
agent-browser wait --load networkidle

echo ""
echo "Login form structure:"
echo "---"
agent-browser snapshot -i
echo "---"
echo ""
echo "Next steps:"
echo "  1. Note the refs: username=@e?, password=@e?, submit=@e?"
echo "  2. Update the LOGIN FLOW section below with your refs"
echo "  3. Set: export APP_USERNAME='...' APP_PASSWORD='...'"
echo "  4. Delete this DISCOVERY MODE section"
echo ""
agent-browser close
# Everything below is unreachable until this section is deleted.
exit 0

# ================================================================
# LOGIN FLOW: Uncomment and customize after discovery
# ================================================================
# : "${APP_USERNAME:?Set APP_USERNAME environment variable}"
# : "${APP_PASSWORD:?Set APP_PASSWORD environment variable}"
#
# agent-browser open "$LOGIN_URL"
# agent-browser wait --load networkidle
# agent-browser snapshot -i
#
# # Fill credentials (update refs to match your form)
# agent-browser fill @e1 "$APP_USERNAME"
# agent-browser fill @e2 "$APP_PASSWORD"
# agent-browser click @e3
# agent-browser wait --load networkidle
#
# # Verify login succeeded
# FINAL_URL=$(agent-browser get url)
# if [[ "$FINAL_URL" == *"login"* ]] || [[ "$FINAL_URL" == *"signin"* ]]; then
#   echo "Login failed - still on login page"
#   agent-browser screenshot /tmp/login-failed.png
#   agent-browser close
#   exit 1
# fi
#
# # Save state for future runs
# echo "Saving state to $STATE_FILE"
# agent-browser state save "$STATE_FILE"
# echo "Login successful"
# agent-browser snapshot -i
@@ -0,0 +1,69 @@
#!/bin/bash
# Template: Content Capture Workflow
# Purpose: Extract content from web pages (text, screenshots, PDF)
# Usage: ./capture-workflow.sh <url> [output-dir]
#
# Arguments:
#   url         Page to capture (required)
#   output-dir  Directory for the outputs, created if missing (default: .)
#
# Outputs:
#   - page-full.png: Full page screenshot
#   - page-structure.txt: Page element structure with refs
#   - page-text.txt: All text content
#   - page.pdf: PDF version
#
# Optional: Load auth state for protected pages

set -euo pipefail

TARGET_URL="${1:?Usage: $0 <url> [output-dir]}"
OUTPUT_DIR="${2:-.}"

# With `set -e` any failing step ends the script immediately; this trap makes
# sure the browser is not left running in that case.
cleanup() {
  agent-browser close >/dev/null 2>&1 || true
}
trap cleanup EXIT

echo "Capturing: $TARGET_URL"
mkdir -p -- "$OUTPUT_DIR"

# Optional: Load authentication state
# if [[ -f "./auth-state.json" ]]; then
#   echo "Loading authentication state..."
#   agent-browser state load "./auth-state.json"
# fi

# Navigate to target
agent-browser open "$TARGET_URL"
agent-browser wait --load networkidle

# Get metadata
TITLE=$(agent-browser get title)
URL=$(agent-browser get url)
echo "Title: $TITLE"
echo "URL: $URL"

# Capture full page screenshot
agent-browser screenshot --full "$OUTPUT_DIR/page-full.png"
echo "Saved: $OUTPUT_DIR/page-full.png"

# Get page structure with refs
agent-browser snapshot -i > "$OUTPUT_DIR/page-structure.txt"
echo "Saved: $OUTPUT_DIR/page-structure.txt"

# Extract all text content
agent-browser get text body > "$OUTPUT_DIR/page-text.txt"
echo "Saved: $OUTPUT_DIR/page-text.txt"

# Save as PDF
agent-browser pdf "$OUTPUT_DIR/page.pdf"
echo "Saved: $OUTPUT_DIR/page.pdf"

# Optional: Extract specific elements using refs from structure
# agent-browser get text @e5 > "$OUTPUT_DIR/main-content.txt"

# Optional: Handle infinite scroll pages
# for i in {1..5}; do
#   agent-browser scroll down 1000
#   agent-browser wait 1000
# done
# agent-browser screenshot --full "$OUTPUT_DIR/page-scrolled.png"

# Cleanup: close explicitly on the success path, then disarm the trap so the
# browser is not closed a second time on exit.
agent-browser close
trap - EXIT

echo ""
echo "Capture complete:"
ls -la -- "$OUTPUT_DIR"
@@ -0,0 +1,210 @@
#!/bin/bash
# Data Extraction Template - Universal pattern for web scraping
# Usage: ./data-extraction.sh <url> [output_file] [mode] [request_pattern]
#
# Arguments:
#   url              Page to extract from (required)
#   output_file      Destination file (default: /tmp/extracted-data.json)
#   mode             One of the modes below (default: dom)
#   request_pattern  api mode only: value passed to
#                    `agent-browser wait --request` (default: api/)
#
# Modes:
#   dom    - Extract from DOM elements (default)
#   js     - Extract from JavaScript global variables
#   api    - Intercept API responses
#   scroll - Infinite scroll collection
#
# Examples:
#   ./data-extraction.sh https://example.com/products
#   ./data-extraction.sh https://example.com/api/data output.json api
#   ./data-extraction.sh https://example.com/list items.json scroll
#
# Requires: agent-browser; jq (api mode); python3 (scroll mode)
#
# Proxy: this template does not force a proxy on the caller. If your network
# needs one, export https_proxy before running the script.
# NOTE(review): assumes agent-browser honours https_proxy - confirm.

set -euo pipefail

TARGET_URL="${1:?Usage: $0 <url> [output_file] [mode] [request_pattern]}"
OUTPUT_FILE="${2:-/tmp/extracted-data.json}"
MODE="${3:-dom}"
REQUEST_PATTERN="${4:-api/}"

# Scratch file used by api mode; created lazily, removed on exit.
API_CAPTURE_FILE=""

# Remove the scratch file and, when the script is failing, close the browser
# so an aborted run does not leave it open.
cleanup() {
  local status=$?
  if [[ -n "$API_CAPTURE_FILE" ]]; then
    rm -f -- "$API_CAPTURE_FILE"
  fi
  if (( status != 0 )); then
    agent-browser close >/dev/null 2>&1 || true
  fi
}
trap cleanup EXIT

#######################################
# Merge two JSON arrays of {text, href} objects and drop duplicates.
# Duplicates are detected by href, or by the first 50 characters of text
# when href is empty. Input order is preserved.
# Arguments: $1 - accumulated JSON array, $2 - newly collected JSON array
# Outputs:   merged JSON array on stdout (single line)
#######################################
merge_unique() {
  # One document per line: printf emits each argument on its own line.
  # (`echo "$1" "$2"` would join them with a space on ONE line, which is not
  # valid JSON and silently discards every item.)
  printf '%s\n' "$1" "$2" | python3 -c '
import json
import sys

items = []
for line in sys.stdin:
    line = line.strip()
    if not line:
        continue
    try:
        doc = json.loads(line)
        # Tolerate a result that arrives as a JSON-encoded string.
        if isinstance(doc, str):
            doc = json.loads(doc)
    except ValueError:
        continue
    if isinstance(doc, list):
        items.extend(doc)

seen = set()
unique = []
for item in items:
    if not isinstance(item, dict):
        continue
    key = item.get("href") or (item.get("text") or "")[:50]
    if key not in seen:
        seen.add(key)
        unique.append(item)
print(json.dumps(unique, ensure_ascii=False))
'
}

echo "=== Data Extraction Template ==="
echo "URL: $TARGET_URL"
echo "Mode: $MODE"
echo "Output: $OUTPUT_FILE"
echo ""

echo "=== 1. Close old session ==="
# Best effort: there may be no session to close, and that must not trip set -e.
agent-browser close 2>/dev/null || true
sleep 1

case "$MODE" in
  api)
    echo ""
    echo "=== 2. API Interception Mode ==="
    agent-browser open "about:blank"
    sleep 1

    echo ""
    echo "=== 3. Start request listener ==="
    API_CAPTURE_FILE=$(mktemp "${TMPDIR:-/tmp}/api-response.XXXXXX")
    # Only stdout is captured so diagnostics cannot end up in the JSON file.
    agent-browser wait --request "$REQUEST_PATTERN" --timeout 30000 > "$API_CAPTURE_FILE" &
    WAIT_PID=$!
    sleep 1

    echo ""
    echo "=== 4. Navigate to trigger API ==="
    agent-browser open "$TARGET_URL"

    echo ""
    echo "=== 5. Wait for response ==="
    wait "$WAIT_PID" 2>/dev/null || true

    # Fall back to page text when nothing usable was captured.
    if [[ -s "$API_CAPTURE_FILE" ]] && jq '.' "$API_CAPTURE_FILE" > "$OUTPUT_FILE"; then
      echo "API response saved to: $OUTPUT_FILE"
    else
      echo "Warning: No API response captured, falling back to DOM extraction"
      agent-browser eval 'document.body.innerText' > "$OUTPUT_FILE"
    fi
    ;;

  scroll)
    echo ""
    echo "=== 2. Infinite Scroll Mode ==="
    agent-browser open "$TARGET_URL"
    sleep 2

    ALL_DATA="[]"
    PREV_COUNT=0
    MAX_ITERATIONS=50

    for (( i = 1; i <= MAX_ITERATIONS; i++ )); do
      CURRENT=$(agent-browser eval '
        JSON.stringify(
          Array.from(document.querySelectorAll("a, .item, .card"))
            .slice(0, 100)
            .map(el => ({
              text: el.textContent?.trim()?.substring(0, 200),
              href: el.href || null
            }))
            .filter(item => item.text && item.text.length > 0)
        )
      ')

      # Keep what was already collected if a merge fails.
      if MERGED=$(merge_unique "$ALL_DATA" "$CURRENT" 2>/dev/null); then
        ALL_DATA=$MERGED
      fi

      COUNT=$(printf '%s' "$ALL_DATA" \
        | python3 -c 'import sys, json; print(len(json.load(sys.stdin)))' 2>/dev/null \
        || echo "0")
      echo "[$i] Collected: $COUNT items"

      # Stop once a scroll step adds nothing new.
      if (( COUNT == PREV_COUNT && COUNT > 0 )); then
        echo "No new items, reached end"
        break
      fi
      PREV_COUNT=$COUNT

      agent-browser scroll down 500
      sleep 0.5
    done

    # Pretty-print when possible; otherwise store the raw JSON.
    if ! printf '%s\n' "$ALL_DATA" | python3 -m json.tool > "$OUTPUT_FILE" 2>/dev/null; then
      printf '%s\n' "$ALL_DATA" > "$OUTPUT_FILE"
    fi
    echo "Scroll data saved to: $OUTPUT_FILE"
    ;;

  js)
    echo ""
    echo "=== 2. JS Variable Extraction Mode ==="
    agent-browser open "$TARGET_URL"
    sleep 3

    agent-browser eval '
      const result = {
        url: window.location.href,
        title: document.title,

        __INITIAL_STATE__: window.__INITIAL_STATE__ || null,
        __NEXT_DATA__: window.__NEXT_DATA__ || null,
        __NUXT__: window.__NUXT__ || null,
        dataLayer: window.dataLayer || null,

        custom: {}
      };

      JSON.stringify(result, (k, v) => {
        if (typeof v === "function") return "[Function]";
        return v;
      }, 2);
    ' > "$OUTPUT_FILE"
    echo "JS variables saved to: $OUTPUT_FILE"
    ;;

  dom | *)
    echo ""
    echo "=== 2. DOM Extraction Mode ==="
    agent-browser open "$TARGET_URL"
    sleep 2

    agent-browser eval '
      // <meta> elements carry their value in the content attribute; their
      // textContent is always empty.
      const extractAttr = (sel, attr) => {
        const el = document.querySelector(sel);
        return el?.getAttribute(attr)?.trim() || null;
      };

      const extractAll = (sel, mapFn) => {
        return Array.from(document.querySelectorAll(sel))
          .map(mapFn)
          .filter(Boolean);
      };

      const data = {
        url: window.location.href,
        title: document.title,
        meta: {
          description: extractAttr("meta[name=\"description\"]", "content"),
          keywords: extractAttr("meta[name=\"keywords\"]", "content")
        },
        headings: extractAll("h1, h2, h3", el => ({
          level: el.tagName,
          text: el.textContent?.trim()
        })),
        links: extractAll("a[href]", el => ({
          text: el.textContent?.trim()?.substring(0, 100),
          href: el.href
        })).slice(0, 50),
        images: extractAll("img[src]", el => ({
          alt: el.alt,
          src: el.src
        })).slice(0, 20),
        bodyText: document.body.innerText.substring(0, 5000)
      };

      JSON.stringify(data, null, 2);
    ' > "$OUTPUT_FILE"
    echo "DOM data saved to: $OUTPUT_FILE"
    ;;
esac

echo ""
echo "=== 6. Preview results ==="
head -100 "$OUTPUT_FILE"

echo ""
echo "=== 7. Close browser ==="
agent-browser close

echo ""
echo "=== Extraction Complete ==="
echo "Total items: $(wc -l < "$OUTPUT_FILE") lines"
@@ -0,0 +1,62 @@
#!/bin/bash
# Template: Form Automation Workflow
# Purpose: Fill and submit web forms with validation
# Usage: ./form-automation.sh <form-url> [screenshot-file]
#
# Arguments:
#   form-url         URL of the page containing the form (required)
#   screenshot-file  Where the result screenshot is written
#                    (default: /tmp/form-result.png)
#
# This template demonstrates the snapshot-interact-verify pattern:
#   1. Navigate to form
#   2. Snapshot to get element refs
#   3. Fill fields using refs
#   4. Submit and verify result
#
# Customize: Update the refs (@e1, @e2, etc.) based on your form's snapshot output

set -euo pipefail

FORM_URL="${1:?Usage: $0 <form-url> [screenshot-file]}"
SCREENSHOT_FILE="${2:-/tmp/form-result.png}"

# With `set -e` any failing step ends the script immediately; this trap makes
# sure the browser is not left running in that case.
cleanup() {
  agent-browser close >/dev/null 2>&1 || true
}
trap cleanup EXIT

echo "Form automation: $FORM_URL"

# Step 1: Navigate to form
agent-browser open "$FORM_URL"
agent-browser wait --load networkidle

# Step 2: Snapshot to discover form elements
echo ""
echo "Form structure:"
agent-browser snapshot -i

# Step 3: Fill form fields (customize these refs based on snapshot output)
#
# Common field types:
#   agent-browser fill @e1 "John Doe"           # Text input
#   agent-browser fill @e2 "user@example.com"   # Email input
#   agent-browser fill @e3 "SecureP@ss123"      # Password input
#   agent-browser select @e4 "Option Value"     # Dropdown
#   agent-browser check @e5                     # Checkbox
#   agent-browser click @e6                     # Radio button
#   agent-browser fill @e7 "Multi-line text"    # Textarea
#   agent-browser upload @e8 /path/to/file.pdf  # File upload
#
# Uncomment and modify:
# agent-browser fill @e1 "Test User"
# agent-browser fill @e2 "test@example.com"
# agent-browser click @e3  # Submit button

# Step 4: Wait for submission
# agent-browser wait --load networkidle
# agent-browser wait --url "**/success"  # Or wait for redirect

# Step 5: Verify result
echo ""
echo "Result:"
agent-browser get url
agent-browser snapshot -i

# Optional: Capture evidence
agent-browser screenshot "$SCREENSHOT_FILE"
echo "Screenshot saved: $SCREENSHOT_FILE"

# Cleanup: close explicitly on the success path, then disarm the trap so the
# browser is not closed a second time on exit.
agent-browser close
trap - EXIT
echo "Done"