agent-web-interface 4.2.0 → 4.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (265) hide show
  1. package/dist/src/browser/connection-utils.d.ts +48 -0
  2. package/dist/src/browser/connection-utils.d.ts.map +1 -0
  3. package/dist/src/browser/connection-utils.js +129 -0
  4. package/dist/src/browser/connection-utils.js.map +1 -0
  5. package/dist/src/browser/index.d.ts +3 -1
  6. package/dist/src/browser/index.d.ts.map +1 -1
  7. package/dist/src/browser/index.js +2 -1
  8. package/dist/src/browser/index.js.map +1 -1
  9. package/dist/src/browser/session-manager.d.ts +1 -89
  10. package/dist/src/browser/session-manager.d.ts.map +1 -1
  11. package/dist/src/browser/session-manager.js +1 -116
  12. package/dist/src/browser/session-manager.js.map +1 -1
  13. package/dist/src/browser/session-manager.types.d.ts +90 -0
  14. package/dist/src/browser/session-manager.types.d.ts.map +1 -0
  15. package/dist/src/browser/session-manager.types.js +7 -0
  16. package/dist/src/browser/session-manager.types.js.map +1 -0
  17. package/dist/src/form/constraint-extraction.d.ts +31 -0
  18. package/dist/src/form/constraint-extraction.d.ts.map +1 -0
  19. package/dist/src/form/constraint-extraction.js +110 -0
  20. package/dist/src/form/constraint-extraction.js.map +1 -0
  21. package/dist/src/form/field-extractor.d.ts.map +1 -1
  22. package/dist/src/form/field-extractor.js +3 -444
  23. package/dist/src/form/field-extractor.js.map +1 -1
  24. package/dist/src/form/field-state-extractor.d.ts +22 -0
  25. package/dist/src/form/field-state-extractor.d.ts.map +1 -0
  26. package/dist/src/form/field-state-extractor.js +55 -0
  27. package/dist/src/form/field-state-extractor.js.map +1 -0
  28. package/dist/src/form/form-actions.d.ts +45 -0
  29. package/dist/src/form/form-actions.d.ts.map +1 -0
  30. package/dist/src/form/form-actions.js +108 -0
  31. package/dist/src/form/form-actions.js.map +1 -0
  32. package/dist/src/form/form-detector.d.ts +0 -36
  33. package/dist/src/form/form-detector.d.ts.map +1 -1
  34. package/dist/src/form/form-detector.js +11 -376
  35. package/dist/src/form/form-detector.js.map +1 -1
  36. package/dist/src/form/input-clustering.d.ts +15 -0
  37. package/dist/src/form/input-clustering.d.ts.map +1 -0
  38. package/dist/src/form/input-clustering.js +61 -0
  39. package/dist/src/form/input-clustering.js.map +1 -0
  40. package/dist/src/form/intent-inference.d.ts +28 -0
  41. package/dist/src/form/intent-inference.d.ts.map +1 -0
  42. package/dist/src/form/intent-inference.js +137 -0
  43. package/dist/src/form/intent-inference.js.map +1 -0
  44. package/dist/src/form/purpose-inference.d.ts +50 -0
  45. package/dist/src/form/purpose-inference.d.ts.map +1 -0
  46. package/dist/src/form/purpose-inference.js +313 -0
  47. package/dist/src/form/purpose-inference.js.map +1 -0
  48. package/dist/src/form/submit-detection.d.ts +36 -0
  49. package/dist/src/form/submit-detection.d.ts.map +1 -0
  50. package/dist/src/form/submit-detection.js +101 -0
  51. package/dist/src/form/submit-detection.js.map +1 -0
  52. package/dist/src/form/types.d.ts +2 -2
  53. package/dist/src/index.js +65 -48
  54. package/dist/src/index.js.map +1 -1
  55. package/dist/src/observation/observation-accumulator.d.ts +1 -1
  56. package/dist/src/observation/observation-accumulator.js +1 -1
  57. package/dist/src/observation/observer-script.d.ts +1 -1
  58. package/dist/src/observation/observer-script.d.ts.map +1 -1
  59. package/dist/src/observation/observer-script.js +129 -7
  60. package/dist/src/observation/observer-script.js.map +1 -1
  61. package/dist/src/query/disambiguation.d.ts +18 -0
  62. package/dist/src/query/disambiguation.d.ts.map +1 -0
  63. package/dist/src/query/disambiguation.js +123 -0
  64. package/dist/src/query/disambiguation.js.map +1 -0
  65. package/dist/src/query/fuzzy-match.d.ts +17 -0
  66. package/dist/src/query/fuzzy-match.d.ts.map +1 -0
  67. package/dist/src/query/fuzzy-match.js +34 -0
  68. package/dist/src/query/fuzzy-match.js.map +1 -0
  69. package/dist/src/query/index.d.ts +3 -0
  70. package/dist/src/query/index.d.ts.map +1 -1
  71. package/dist/src/query/index.js +6 -0
  72. package/dist/src/query/index.js.map +1 -1
  73. package/dist/src/query/query-engine.d.ts +0 -35
  74. package/dist/src/query/query-engine.d.ts.map +1 -1
  75. package/dist/src/query/query-engine.js +9 -309
  76. package/dist/src/query/query-engine.js.map +1 -1
  77. package/dist/src/query/scoring.d.ts +52 -0
  78. package/dist/src/query/scoring.d.ts.map +1 -0
  79. package/dist/src/query/scoring.js +162 -0
  80. package/dist/src/query/scoring.js.map +1 -0
  81. package/dist/src/server/mcp-server.d.ts.map +1 -1
  82. package/dist/src/server/mcp-server.js +29 -1
  83. package/dist/src/server/mcp-server.js.map +1 -1
  84. package/dist/src/snapshot/element-resolver.d.ts +50 -18
  85. package/dist/src/snapshot/element-resolver.d.ts.map +1 -1
  86. package/dist/src/snapshot/element-resolver.js +180 -101
  87. package/dist/src/snapshot/element-resolver.js.map +1 -1
  88. package/dist/src/snapshot/extractors/ax-extractor.d.ts +1 -1
  89. package/dist/src/snapshot/extractors/ax-extractor.d.ts.map +1 -1
  90. package/dist/src/snapshot/extractors/ax-extractor.js +4 -1
  91. package/dist/src/snapshot/extractors/ax-extractor.js.map +1 -1
  92. package/dist/src/snapshot/extractors/index.d.ts +1 -1
  93. package/dist/src/snapshot/extractors/index.d.ts.map +1 -1
  94. package/dist/src/snapshot/extractors/index.js +1 -1
  95. package/dist/src/snapshot/extractors/index.js.map +1 -1
  96. package/dist/src/snapshot/extractors/region-resolver.d.ts.map +1 -1
  97. package/dist/src/snapshot/extractors/region-resolver.js +8 -0
  98. package/dist/src/snapshot/extractors/region-resolver.js.map +1 -1
  99. package/dist/src/snapshot/extractors/types.d.ts +8 -0
  100. package/dist/src/snapshot/extractors/types.d.ts.map +1 -1
  101. package/dist/src/snapshot/extractors/types.js +16 -0
  102. package/dist/src/snapshot/extractors/types.js.map +1 -1
  103. package/dist/src/snapshot/frame-context.d.ts +68 -0
  104. package/dist/src/snapshot/frame-context.d.ts.map +1 -0
  105. package/dist/src/snapshot/frame-context.js +131 -0
  106. package/dist/src/snapshot/frame-context.js.map +1 -0
  107. package/dist/src/snapshot/heading-index.d.ts +28 -0
  108. package/dist/src/snapshot/heading-index.d.ts.map +1 -0
  109. package/dist/src/snapshot/heading-index.js +108 -0
  110. package/dist/src/snapshot/heading-index.js.map +1 -0
  111. package/dist/src/snapshot/index.d.ts +5 -3
  112. package/dist/src/snapshot/index.d.ts.map +1 -1
  113. package/dist/src/snapshot/index.js +3 -2
  114. package/dist/src/snapshot/index.js.map +1 -1
  115. package/dist/src/snapshot/kind-mapping.d.ts +30 -0
  116. package/dist/src/snapshot/kind-mapping.d.ts.map +1 -0
  117. package/dist/src/snapshot/kind-mapping.js +114 -0
  118. package/dist/src/snapshot/kind-mapping.js.map +1 -0
  119. package/dist/src/snapshot/node-filter.d.ts +31 -0
  120. package/dist/src/snapshot/node-filter.d.ts.map +1 -0
  121. package/dist/src/snapshot/node-filter.js +137 -0
  122. package/dist/src/snapshot/node-filter.js.map +1 -0
  123. package/dist/src/snapshot/node-synthesizer.d.ts +62 -0
  124. package/dist/src/snapshot/node-synthesizer.d.ts.map +1 -0
  125. package/dist/src/snapshot/node-synthesizer.js +185 -0
  126. package/dist/src/snapshot/node-synthesizer.js.map +1 -0
  127. package/dist/src/snapshot/snapshot-compiler.d.ts +2 -36
  128. package/dist/src/snapshot/snapshot-compiler.d.ts.map +1 -1
  129. package/dist/src/snapshot/snapshot-compiler.js +28 -520
  130. package/dist/src/snapshot/snapshot-compiler.js.map +1 -1
  131. package/dist/src/snapshot/snapshot.types.d.ts +7 -2
  132. package/dist/src/snapshot/snapshot.types.d.ts.map +1 -1
  133. package/dist/src/snapshot/snapshot.types.js +9 -0
  134. package/dist/src/snapshot/snapshot.types.js.map +1 -1
  135. package/dist/src/state/actionables-filter.d.ts +5 -0
  136. package/dist/src/state/actionables-filter.d.ts.map +1 -1
  137. package/dist/src/state/actionables-filter.js +22 -3
  138. package/dist/src/state/actionables-filter.js.map +1 -1
  139. package/dist/src/state/diff-engine.js +3 -3
  140. package/dist/src/state/diff-engine.js.map +1 -1
  141. package/dist/src/state/element-registry.d.ts.map +1 -1
  142. package/dist/src/state/element-registry.js +6 -4
  143. package/dist/src/state/element-registry.js.map +1 -1
  144. package/dist/src/state/hash-utils.d.ts +24 -0
  145. package/dist/src/state/hash-utils.d.ts.map +1 -0
  146. package/dist/src/state/hash-utils.js +41 -0
  147. package/dist/src/state/hash-utils.js.map +1 -0
  148. package/dist/src/state/layer-detector.d.ts.map +1 -1
  149. package/dist/src/state/layer-detector.js +15 -286
  150. package/dist/src/state/layer-detector.js.map +1 -1
  151. package/dist/src/state/layer-detectors/drawer-detector.d.ts +32 -0
  152. package/dist/src/state/layer-detectors/drawer-detector.d.ts.map +1 -0
  153. package/dist/src/state/layer-detectors/drawer-detector.js +96 -0
  154. package/dist/src/state/layer-detectors/drawer-detector.js.map +1 -0
  155. package/dist/src/state/layer-detectors/index.d.ts +10 -0
  156. package/dist/src/state/layer-detectors/index.d.ts.map +1 -0
  157. package/dist/src/state/layer-detectors/index.js +10 -0
  158. package/dist/src/state/layer-detectors/index.js.map +1 -0
  159. package/dist/src/state/layer-detectors/modal-detector.d.ts +30 -0
  160. package/dist/src/state/layer-detectors/modal-detector.d.ts.map +1 -0
  161. package/dist/src/state/layer-detectors/modal-detector.js +127 -0
  162. package/dist/src/state/layer-detectors/modal-detector.js.map +1 -0
  163. package/dist/src/state/layer-detectors/popover-detector.d.ts +20 -0
  164. package/dist/src/state/layer-detectors/popover-detector.d.ts.map +1 -0
  165. package/dist/src/state/layer-detectors/popover-detector.js +76 -0
  166. package/dist/src/state/layer-detectors/popover-detector.js.map +1 -0
  167. package/dist/src/state/layer-detectors/toast-detector.d.ts +24 -0
  168. package/dist/src/state/layer-detectors/toast-detector.d.ts.map +1 -0
  169. package/dist/src/state/layer-detectors/toast-detector.js +48 -0
  170. package/dist/src/state/layer-detectors/toast-detector.js.map +1 -0
  171. package/dist/src/state/region-mapping.d.ts +13 -0
  172. package/dist/src/state/region-mapping.d.ts.map +1 -0
  173. package/dist/src/state/region-mapping.js +25 -0
  174. package/dist/src/state/region-mapping.js.map +1 -0
  175. package/dist/src/state/state-manager.d.ts.map +1 -1
  176. package/dist/src/state/state-manager.js +8 -192
  177. package/dist/src/state/state-manager.js.map +1 -1
  178. package/dist/src/state/state-renderer.d.ts.map +1 -1
  179. package/dist/src/state/state-renderer.js +16 -2
  180. package/dist/src/state/state-renderer.js.map +1 -1
  181. package/dist/src/state/types.d.ts +8 -4
  182. package/dist/src/state/types.d.ts.map +1 -1
  183. package/dist/src/state/url-sanitization.d.ts +22 -0
  184. package/dist/src/state/url-sanitization.d.ts.map +1 -0
  185. package/dist/src/state/url-sanitization.js +60 -0
  186. package/dist/src/state/url-sanitization.js.map +1 -0
  187. package/dist/src/state/value-masking.d.ts +36 -0
  188. package/dist/src/state/value-masking.d.ts.map +1 -0
  189. package/dist/src/state/value-masking.js +86 -0
  190. package/dist/src/state/value-masking.js.map +1 -0
  191. package/dist/src/tools/action-context.d.ts +60 -0
  192. package/dist/src/tools/action-context.d.ts.map +1 -0
  193. package/dist/src/tools/action-context.js +78 -0
  194. package/dist/src/tools/action-context.js.map +1 -0
  195. package/dist/src/tools/action-stabilization.d.ts +48 -0
  196. package/dist/src/tools/action-stabilization.d.ts.map +1 -0
  197. package/dist/src/tools/action-stabilization.js +87 -0
  198. package/dist/src/tools/action-stabilization.js.map +1 -0
  199. package/dist/src/tools/browser-tools.d.ts +8 -146
  200. package/dist/src/tools/browser-tools.d.ts.map +1 -1
  201. package/dist/src/tools/browser-tools.js +13 -689
  202. package/dist/src/tools/browser-tools.js.map +1 -1
  203. package/dist/src/tools/canvas-tools.d.ts +32 -0
  204. package/dist/src/tools/canvas-tools.d.ts.map +1 -0
  205. package/dist/src/tools/canvas-tools.js +370 -0
  206. package/dist/src/tools/canvas-tools.js.map +1 -0
  207. package/dist/src/tools/effect-tracker.d.ts +25 -0
  208. package/dist/src/tools/effect-tracker.d.ts.map +1 -0
  209. package/dist/src/tools/effect-tracker.js +69 -0
  210. package/dist/src/tools/effect-tracker.js.map +1 -0
  211. package/dist/src/tools/execute-action.d.ts +1 -31
  212. package/dist/src/tools/execute-action.d.ts.map +1 -1
  213. package/dist/src/tools/execute-action.js +7 -276
  214. package/dist/src/tools/execute-action.js.map +1 -1
  215. package/dist/src/tools/form-tools.d.ts +4 -6
  216. package/dist/src/tools/form-tools.d.ts.map +1 -1
  217. package/dist/src/tools/form-tools.js +10 -42
  218. package/dist/src/tools/form-tools.js.map +1 -1
  219. package/dist/src/tools/index.d.ts +6 -4
  220. package/dist/src/tools/index.d.ts.map +1 -1
  221. package/dist/src/tools/index.js +21 -10
  222. package/dist/src/tools/index.js.map +1 -1
  223. package/dist/src/tools/interaction-tools.d.ts +46 -0
  224. package/dist/src/tools/interaction-tools.d.ts.map +1 -0
  225. package/dist/src/tools/interaction-tools.js +138 -0
  226. package/dist/src/tools/interaction-tools.js.map +1 -0
  227. package/dist/src/tools/navigation-detection.d.ts +31 -0
  228. package/dist/src/tools/navigation-detection.d.ts.map +1 -0
  229. package/dist/src/tools/navigation-detection.js +46 -0
  230. package/dist/src/tools/navigation-detection.js.map +1 -0
  231. package/dist/src/tools/navigation-tools.d.ts +57 -0
  232. package/dist/src/tools/navigation-tools.d.ts.map +1 -0
  233. package/dist/src/tools/navigation-tools.js +178 -0
  234. package/dist/src/tools/navigation-tools.js.map +1 -0
  235. package/dist/src/tools/observation-tools.d.ts +53 -0
  236. package/dist/src/tools/observation-tools.d.ts.map +1 -0
  237. package/dist/src/tools/observation-tools.js +247 -0
  238. package/dist/src/tools/observation-tools.js.map +1 -0
  239. package/dist/src/tools/response-builder.js +2 -2
  240. package/dist/src/tools/response-builder.js.map +1 -1
  241. package/dist/src/tools/stale-element-retry.d.ts +37 -0
  242. package/dist/src/tools/stale-element-retry.d.ts.map +1 -0
  243. package/dist/src/tools/stale-element-retry.js +68 -0
  244. package/dist/src/tools/stale-element-retry.js.map +1 -0
  245. package/dist/src/tools/state-manager-registry.d.ts +26 -0
  246. package/dist/src/tools/state-manager-registry.d.ts.map +1 -0
  247. package/dist/src/tools/state-manager-registry.js +39 -0
  248. package/dist/src/tools/state-manager-registry.js.map +1 -0
  249. package/dist/src/tools/tool-context.d.ts +53 -0
  250. package/dist/src/tools/tool-context.d.ts.map +1 -0
  251. package/dist/src/tools/tool-context.js +119 -0
  252. package/dist/src/tools/tool-context.js.map +1 -0
  253. package/dist/src/tools/tool-result.types.d.ts +16 -1
  254. package/dist/src/tools/tool-result.types.d.ts.map +1 -1
  255. package/dist/src/tools/tool-result.types.js +11 -0
  256. package/dist/src/tools/tool-result.types.js.map +1 -1
  257. package/dist/src/tools/tool-schemas.d.ts +358 -146
  258. package/dist/src/tools/tool-schemas.d.ts.map +1 -1
  259. package/dist/src/tools/tool-schemas.js +142 -19
  260. package/dist/src/tools/tool-schemas.js.map +1 -1
  261. package/dist/src/tools/viewport-tools.d.ts +36 -0
  262. package/dist/src/tools/viewport-tools.d.ts.map +1 -0
  263. package/dist/src/tools/viewport-tools.js +105 -0
  264. package/dist/src/tools/viewport-tools.js.map +1 -0
  265. package/package.json +1 -1
@@ -10,293 +10,14 @@
10
10
  * - Accessibility: Semantic information
11
11
  * - CSS: Computed styles (optional, for layout)
12
12
  */
13
- import { createExtractorContext, extractDom, extractAx, extractLayout, extractState, resolveLabel, resolveRegion, buildLocators, resolveGrouping, classifyAxRole, extractAttributes, } from './extractors/index.js';
13
+ import { createExtractorContext, extractDom, extractAx, extractLayout, extractState, resolveLabel, resolveRegion, buildLocators, resolveGrouping, classifyAxRole, extractAttributes, LIVE_REGION_AX_ROLES, } from './extractors/index.js';
14
14
  import { detectInteractivity } from './extractors/interactivity-detector.js';
15
15
  import { getTextContent } from '../lib/text-utils.js';
16
- const ROOT_CONTEXT = 'root';
17
- const LIGHT_DOM_CONTEXT = 'light';
18
- /**
19
- * Build a context key based on iframe and shadow ancestry.
20
- */
21
- function buildContextKey(node) {
22
- const frameKey = node.framePath?.length ? node.framePath.join('/') : ROOT_CONTEXT;
23
- const shadowKey = node.shadowPath?.length ? node.shadowPath.join('/') : LIGHT_DOM_CONTEXT;
24
- return `${frameKey}|${shadowKey}`;
25
- }
26
- /**
27
- * Build context-scoped ID maps to avoid cross-frame/shadow collisions.
28
- */
29
- function buildIdMapsByContext(domResult) {
30
- const idMaps = new Map();
31
- for (const node of domResult.nodes.values()) {
32
- const id = node.attributes?.id;
33
- if (!id)
34
- continue;
35
- const contextKey = buildContextKey(node);
36
- let map = idMaps.get(contextKey);
37
- if (!map) {
38
- map = new Map();
39
- idMaps.set(contextKey, map);
40
- }
41
- map.set(id, node);
42
- }
43
- return idMaps;
44
- }
45
- /**
46
- * Get the ID map scoped to a node's frame/shadow context.
47
- */
48
- function getIdMapForNode(node, idMapsByContext) {
49
- if (!node)
50
- return undefined;
51
- return idMapsByContext.get(buildContextKey(node));
52
- }
53
- /**
54
- * Build adjacency maps for shadow roots and iframe content documents.
55
- * Single O(n) pass through all nodes.
56
- *
57
- * @param domResult - DOM extraction result
58
- * @returns Adjacency maps for shadow roots and content documents
59
- */
60
- function buildAdjacencyMaps(domResult) {
61
- const shadowRootsByHost = new Map();
62
- const contentDocsByFrame = new Map();
63
- for (const [nodeId, node] of domResult.nodes) {
64
- if (node.parentId === undefined)
65
- continue;
66
- if (node.nodeName === '#document-fragment') {
67
- // This is a shadow root - add to shadow host's children
68
- const existing = shadowRootsByHost.get(node.parentId) ?? [];
69
- existing.push(nodeId);
70
- shadowRootsByHost.set(node.parentId, existing);
71
- }
72
- else if (node.nodeName === '#document') {
73
- // This is a content document - add to iframe's children
74
- const existing = contentDocsByFrame.get(node.parentId) ?? [];
75
- existing.push(nodeId);
76
- contentDocsByFrame.set(node.parentId, existing);
77
- }
78
- }
79
- return { shadowRootsByHost, contentDocsByFrame };
80
- }
81
- /**
82
- * Build DOM pre-order index by traversing the DOM tree.
83
- * Also traverses into shadow roots and iframe content documents.
84
- *
85
- * @param domResult - DOM extraction result with nodes and rootId
86
- * @param adjacencyMaps - Precomputed maps for shadow roots and content documents
87
- * @returns Map of backendNodeId -> DOM order index
88
- */
89
- function buildDomOrderIndex(domResult, adjacencyMaps) {
90
- const orderIndex = new Map();
91
- const shadowHostSet = new Set(domResult.shadowRoots);
92
- let index = 0;
93
- function traverse(nodeId) {
94
- const node = domResult.nodes.get(nodeId);
95
- if (!node)
96
- return;
97
- orderIndex.set(nodeId, index++);
98
- // 1. Process light DOM children first (pre-order DFS)
99
- if (node.childNodeIds) {
100
- for (const childId of node.childNodeIds) {
101
- traverse(childId);
102
- }
103
- }
104
- // 2. If this node hosts a shadow root, traverse shadow content (O(1) lookup)
105
- if (shadowHostSet.has(nodeId)) {
106
- const shadowRoots = adjacencyMaps.shadowRootsByHost.get(nodeId) ?? [];
107
- for (const shadowRootId of shadowRoots) {
108
- traverse(shadowRootId);
109
- }
110
- }
111
- // 3. If this node is an iframe, traverse content document (O(1) lookup)
112
- if (node.frameId || node.nodeName.toUpperCase() === 'IFRAME') {
113
- const contentDocs = adjacencyMaps.contentDocsByFrame.get(nodeId) ?? [];
114
- for (const contentDocId of contentDocs) {
115
- traverse(contentDocId);
116
- }
117
- }
118
- }
119
- traverse(domResult.rootId);
120
- return orderIndex;
121
- }
122
- /**
123
- * Build heading index mapping each backendNodeId to its heading context.
124
- * Uses DOM order to determine the most recent preceding heading.
125
- * Also traverses into shadow roots and iframe content documents.
126
- *
127
- * Heading context is isolated at iframe boundaries:
128
- * - Heading from parent document does NOT propagate into iframe
129
- * - Heading from iframe does NOT propagate back to parent document
130
- * - Shadow DOM shares heading context with its host document
131
- *
132
- * @param domResult - DOM extraction result
133
- * @param axResult - AX extraction result for heading names
134
- * @param idMap - Map of DOM ID to RawDomNode for aria-labelledby resolution
135
- * @param adjacencyMaps - Precomputed maps for shadow roots and content documents
136
- * @returns Map of backendNodeId -> heading context string
137
- */
138
- function buildHeadingIndex(domResult, axResult, idMapsByContext, adjacencyMaps) {
139
- const headingIndex = new Map();
140
- const shadowHostSet = new Set(domResult.shadowRoots);
141
- // Helper to check if a node is a heading and resolve its name
142
- function isHeading(backendNodeId) {
143
- const domNode = domResult.nodes.get(backendNodeId);
144
- const axNode = axResult?.nodes.get(backendNodeId);
145
- // Check AX role first
146
- const scopedIdMap = domNode ? getIdMapForNode(domNode, idMapsByContext) : undefined;
147
- if (axNode?.role === 'heading') {
148
- // Priority: AX name -> resolveLabel -> DOM text content
149
- let name = axNode.name;
150
- if (!name && domNode) {
151
- const labelResult = resolveLabel(domNode, axNode, scopedIdMap);
152
- if (labelResult.source !== 'none') {
153
- name = labelResult.label;
154
- }
155
- }
156
- name ??= getTextContent(backendNodeId, domResult.nodes);
157
- return { isHeading: true, name };
158
- }
159
- // Check DOM tag (H1-H6)
160
- if (domNode?.nodeName?.match(/^H[1-6]$/i)) {
161
- // Priority: AX name -> resolveLabel -> DOM text content
162
- let name = axNode?.name;
163
- if (!name) {
164
- const labelResult = resolveLabel(domNode, axNode, scopedIdMap);
165
- if (labelResult.source !== 'none') {
166
- name = labelResult.label;
167
- }
168
- }
169
- name ??= getTextContent(backendNodeId, domResult.nodes);
170
- return { isHeading: true, name };
171
- }
172
- return { isHeading: false };
173
- }
174
- // Traverse DOM in pre-order, passing and returning heading context
175
- function traverse(nodeId, currentHeading) {
176
- const node = domResult.nodes.get(nodeId);
177
- if (!node)
178
- return currentHeading;
179
- // Check if this node is a heading
180
- const headingInfo = isHeading(nodeId);
181
- if (headingInfo.isHeading && headingInfo.name) {
182
- currentHeading = headingInfo.name;
183
- }
184
- // Record the current heading context for this node
185
- if (currentHeading) {
186
- headingIndex.set(nodeId, currentHeading);
187
- }
188
- // 1. Process light DOM children first (pre-order DFS)
189
- // Heading context propagates and updates through light DOM
190
- if (node.childNodeIds) {
191
- for (const childId of node.childNodeIds) {
192
- currentHeading = traverse(childId, currentHeading) ?? currentHeading;
193
- }
194
- }
195
- // 2. If this node hosts a shadow root, traverse shadow content (O(1) lookup)
196
- // Shadow DOM shares heading context with host document (same logical document)
197
- if (shadowHostSet.has(nodeId)) {
198
- const shadowRoots = adjacencyMaps.shadowRootsByHost.get(nodeId) ?? [];
199
- for (const shadowRootId of shadowRoots) {
200
- currentHeading = traverse(shadowRootId, currentHeading) ?? currentHeading;
201
- }
202
- }
203
- // 3. If this node is an iframe, traverse content document (O(1) lookup)
204
- // IMPORTANT: Heading context resets at iframe boundary (separate document)
205
- // - Pass undefined to reset context inside iframe
206
- // - Discard returned heading (iframe headings don't affect parent)
207
- if (node.frameId || node.nodeName.toUpperCase() === 'IFRAME') {
208
- const contentDocs = adjacencyMaps.contentDocsByFrame.get(nodeId) ?? [];
209
- for (const contentDocId of contentDocs) {
210
- traverse(contentDocId, undefined);
211
- }
212
- }
213
- return currentHeading;
214
- }
215
- traverse(domResult.rootId, undefined);
216
- return headingIndex;
217
- }
218
- /**
219
- * Recursively collect frame loaderIds from frame tree.
220
- */
221
- function collectFrameLoaderIds(frameTree, frameLoaderIds, _isMainFrame = true) {
222
- const frame = frameTree.frame;
223
- frameLoaderIds.set(frame.id, {
224
- frameId: frame.id,
225
- loaderId: frame.loaderId,
226
- isMainFrame: !frame.parentId,
227
- });
228
- if (frameTree.childFrames) {
229
- for (const child of frameTree.childFrames) {
230
- collectFrameLoaderIds(child, frameLoaderIds, false);
231
- }
232
- }
233
- }
234
- /**
235
- * Default compile options
236
- */
237
- const DEFAULT_OPTIONS = {
238
- include_hidden: false,
239
- max_nodes: 2000,
240
- timeout: 30000,
241
- redact_sensitive: true,
242
- include_values: true, // Enable value extraction with password redaction
243
- includeReadable: true,
244
- includeLayout: true,
245
- };
246
- /**
247
- * Map AX role to NodeKind.
248
- */
249
- function mapRoleToKind(role) {
250
- if (!role)
251
- return undefined;
252
- const normalized = role.toLowerCase();
253
- const kindMap = {
254
- // Interactive
255
- button: 'button',
256
- link: 'link',
257
- textbox: 'input',
258
- searchbox: 'input',
259
- combobox: 'combobox',
260
- listbox: 'select',
261
- checkbox: 'checkbox',
262
- radio: 'radio',
263
- switch: 'switch',
264
- slider: 'slider',
265
- spinbutton: 'slider',
266
- tab: 'tab',
267
- menuitem: 'menuitem',
268
- menuitemcheckbox: 'menuitem',
269
- menuitemradio: 'menuitem',
270
- option: 'menuitem',
271
- // Readable
272
- heading: 'heading',
273
- paragraph: 'paragraph',
274
- text: 'text',
275
- statictext: 'text',
276
- list: 'list',
277
- listitem: 'listitem',
278
- tree: 'list',
279
- treeitem: 'listitem',
280
- image: 'image',
281
- img: 'image',
282
- figure: 'image',
283
- table: 'table',
284
- grid: 'table',
285
- treegrid: 'table',
286
- // Structural
287
- form: 'form',
288
- dialog: 'dialog',
289
- alertdialog: 'dialog',
290
- navigation: 'navigation',
291
- region: 'section',
292
- article: 'section',
293
- main: 'section',
294
- banner: 'section',
295
- complementary: 'section',
296
- contentinfo: 'section',
297
- };
298
- return kindMap[normalized];
299
- }
16
+ import { buildIdMapsByContext, getIdMapForNode, buildAdjacencyMaps, buildDomOrderIndex, collectFrameLoaderIds, } from './frame-context.js';
17
+ import { buildHeadingIndex } from './heading-index.js';
18
+ import { synthesizeOptionNodes, synthesizeCanvasNodes, promoteToastNodes, } from './node-synthesizer.js';
19
+ import { filterNoiseNodes, sliceWithOverlayPriority } from './node-filter.js';
20
+ import { mapRoleToKind, getKindFromTag, DEFAULT_OPTIONS, } from './kind-mapping.js';
300
21
  /**
301
22
  * SnapshotCompiler class
302
23
  *
@@ -426,7 +147,10 @@ export class SnapshotCompiler {
426
147
  const isReadable = classification === 'readable' && this.options.includeReadable;
427
148
  const isEssentialStructural = classification === 'structural' &&
428
149
  essentialStructuralRoles.has(axNode.role?.toLowerCase() ?? '');
429
- if (isInteractive || isReadable || isEssentialStructural) {
150
+ // Live region roles (alert, status, log, tooltip, progressbar, timer)
151
+ // are always included — they carry critical action feedback
152
+ const isLiveRegion = classification === 'live';
153
+ if (isInteractive || isReadable || isEssentialStructural || isLiveRegion) {
430
154
  const domNode = domResult?.nodes.get(backendNodeId);
431
155
  nodesToProcess.push({
432
156
  backendNodeId,
@@ -440,7 +164,7 @@ export class SnapshotCompiler {
440
164
  // Fallback: Use DOM-only for interactive tags and essential structural elements
441
165
  for (const [backendNodeId, domNode] of domResult.nodes) {
442
166
  const tagName = domNode.nodeName.toUpperCase();
443
- if (['BUTTON', 'A', 'INPUT', 'SELECT', 'TEXTAREA', 'FORM', 'DIALOG'].includes(tagName)) {
167
+ if (['BUTTON', 'A', 'INPUT', 'SELECT', 'TEXTAREA', 'FORM', 'DIALOG', 'CANVAS'].includes(tagName)) {
444
168
  nodesToProcess.push({
445
169
  backendNodeId,
446
170
  domNode,
@@ -448,65 +172,11 @@ export class SnapshotCompiler {
448
172
  }
449
173
  }
450
174
  }
451
- // Phase 2.1: Synthesize option nodes from <select> children.
452
- // Chrome's AX tree often marks <option> nodes as ignored when the select
453
- // is collapsed, and their bounding boxes are zero (OS-rendered).
454
- // We inject them from the DOM so AI agents can discover available options.
175
+ // Phase 2.1-2.3: Synthesize missing nodes from DOM
455
176
  if (domResult) {
456
- const alreadyInSet = new Set(nodesToProcess.map((n) => n.backendNodeId));
457
- for (const nodeData of [...nodesToProcess]) {
458
- const domNode = nodeData.domNode;
459
- if (domNode?.nodeName.toUpperCase() !== 'SELECT')
460
- continue;
461
- const collectOptions = (parentId) => {
462
- const parent = domResult.nodes.get(parentId);
463
- if (!parent?.childNodeIds)
464
- return;
465
- for (const childId of parent.childNodeIds) {
466
- const child = domResult.nodes.get(childId);
467
- if (!child)
468
- continue;
469
- const childTag = child.nodeName.toUpperCase();
470
- if (childTag === 'OPTGROUP') {
471
- // Recurse into optgroup to find nested options
472
- collectOptions(childId);
473
- }
474
- else if (childTag === 'OPTION' && !alreadyInSet.has(childId)) {
475
- // Extract text content from option's child text nodes
476
- const optionText = getTextContent(childId, domResult.nodes);
477
- // Build synthetic AX node so label resolution and state extraction work
478
- const syntheticAx = {
479
- nodeId: `synthetic-opt-${childId}`,
480
- backendDOMNodeId: childId,
481
- role: 'option',
482
- name: optionText ?? '',
483
- properties: [],
484
- };
485
- // Transfer selected attribute to AX property
486
- if (child.attributes?.selected !== undefined) {
487
- syntheticAx.properties.push({
488
- name: 'selected',
489
- value: { type: 'boolean', value: true },
490
- });
491
- }
492
- // Transfer disabled attribute to AX property
493
- if (child.attributes?.disabled !== undefined) {
494
- syntheticAx.properties.push({
495
- name: 'disabled',
496
- value: { type: 'boolean', value: true },
497
- });
498
- }
499
- nodesToProcess.push({
500
- backendNodeId: childId,
501
- domNode: child,
502
- axNode: syntheticAx,
503
- });
504
- alreadyInSet.add(childId);
505
- }
506
- }
507
- };
508
- collectOptions(domNode.backendNodeId);
509
- }
177
+ synthesizeOptionNodes(nodesToProcess, domResult);
178
+ synthesizeCanvasNodes(nodesToProcess, domResult);
179
+ promoteToastNodes(nodesToProcess, domResult);
510
180
  }
511
181
  // Sort by DOM order if available (before max_nodes slicing)
512
182
  if (domOrderAvailable && domOrderIndex) {
@@ -540,6 +210,7 @@ export class SnapshotCompiler {
540
210
  'slider',
541
211
  'tab',
542
212
  'menuitem',
213
+ 'canvas',
543
214
  ]);
544
215
  // Collect non-interactive nodes already in nodesToProcess (Case A)
545
216
  for (const nodeData of nodesToProcess) {
@@ -651,7 +322,7 @@ export class SnapshotCompiler {
651
322
  }
652
323
  }
653
324
  // Phase 4.5: Filter noise nodes (empty containers, duplicate text)
654
- const nodes = this.filterNoiseNodes(transformedNodes, domResult?.nodes ?? new Map(), axResult?.nodes ?? new Map());
325
+ const nodes = filterNoiseNodes(transformedNodes, domResult?.nodes ?? new Map(), axResult?.nodes ?? new Map());
655
326
  // Phase 5: Build BaseSnapshot
656
327
  const duration = Date.now() - startTime;
657
328
  const interactiveCount = nodes.filter((n) => [
@@ -667,6 +338,7 @@ export class SnapshotCompiler {
667
338
  'slider',
668
339
  'tab',
669
340
  'menuitem',
341
+ 'canvas',
670
342
  ].includes(n.kind) || n.implicitly_interactive).length;
671
343
  const meta = {
672
344
  node_count: nodes.length,
@@ -722,14 +394,22 @@ export class SnapshotCompiler {
722
394
  kind = mapRoleToKind(axNode.role) ?? 'generic';
723
395
  }
724
396
  else if (domNode) {
725
- const tagKind = this.getKindFromTag(domNode.nodeName);
397
+ const tagKind = getKindFromTag(domNode.nodeName);
726
398
  if (tagKind)
727
399
  kind = tagKind;
728
400
  }
729
401
  // Resolve label
730
402
  const scopedIdMap = getIdMapForNode(domNode, idMapsByContext);
731
403
  const labelResult = resolveLabel(domNode, axNode, scopedIdMap);
732
- const label = labelResult.label;
404
+ let label = labelResult.label;
405
+ // Fallback for live region containers (alert, status, etc.) with empty labels:
406
+ // Their text typically lives in child StaticText/text nodes, not in the AX name.
407
+ if (!label &&
408
+ axNode?.role &&
409
+ LIVE_REGION_AX_ROLES.has(axNode.role.toLowerCase()) &&
410
+ domTree.size > 0) {
411
+ label = getTextContent(backendNodeId, domTree, 3) ?? '';
412
+ }
733
413
  // Resolve region (pass axTree for ancestor AX role lookup)
734
414
  const region = resolveRegion(domNode, axNode, domTree, axTree);
735
415
  // Resolve grouping (for group_id and group_path only)
@@ -797,178 +477,6 @@ export class SnapshotCompiler {
797
477
  }
798
478
  return node;
799
479
  }
800
- /**
801
- * Get NodeKind from HTML tag name.
802
- */
803
- getKindFromTag(tagName) {
804
- const tag = tagName.toUpperCase();
805
- const tagMap = {
806
- BUTTON: 'button',
807
- A: 'link',
808
- INPUT: 'input',
809
- TEXTAREA: 'textarea',
810
- SELECT: 'select',
811
- H1: 'heading',
812
- H2: 'heading',
813
- H3: 'heading',
814
- H4: 'heading',
815
- H5: 'heading',
816
- H6: 'heading',
817
- P: 'paragraph',
818
- IMG: 'image',
819
- TABLE: 'table',
820
- UL: 'list',
821
- OL: 'list',
822
- LI: 'listitem',
823
- FORM: 'form',
824
- DIALOG: 'dialog',
825
- NAV: 'navigation',
826
- OPTION: 'menuitem',
827
- };
828
- return tagMap[tag];
829
- }
830
- /**
831
- * Filter out noise nodes to reduce snapshot size.
832
- *
833
- * Filters:
834
- * 1. Empty list/listitem containers with no semantic name AND no interactive descendants
835
- * 2. StaticText/text nodes that mirror their parent's label exactly
836
- */
837
- filterNoiseNodes(nodes, domTree, axTree) {
838
- // Build set of interactive node backend IDs for descendant checking
839
- const interactiveKinds = new Set([
840
- 'button',
841
- 'link',
842
- 'input',
843
- 'textarea',
844
- 'select',
845
- 'combobox',
846
- 'checkbox',
847
- 'radio',
848
- 'switch',
849
- 'slider',
850
- 'tab',
851
- 'menuitem',
852
- ]);
853
- const interactiveBackendIds = new Set(nodes.filter((n) => interactiveKinds.has(n.kind)).map((n) => n.backend_node_id));
854
- // Build parent-child relationship from DOM tree
855
- const childToParent = new Map();
856
- for (const [nodeId, domNode] of domTree) {
857
- if (domNode.parentId !== undefined) {
858
- childToParent.set(nodeId, domNode.parentId);
859
- }
860
- }
861
- // Check if a node has any interactive descendants in the DOM tree
862
- const hasInteractiveDescendant = (nodeId) => {
863
- const domNode = domTree.get(nodeId);
864
- if (!domNode)
865
- return false;
866
- // Check direct children
867
- if (domNode.childNodeIds) {
868
- for (const childId of domNode.childNodeIds) {
869
- if (interactiveBackendIds.has(childId)) {
870
- return true;
871
- }
872
- if (hasInteractiveDescendant(childId)) {
873
- return true;
874
- }
875
- }
876
- }
877
- return false;
878
- };
879
- // Get label of parent node in the node list
880
- const getParentLabel = (nodeId) => {
881
- const parentId = childToParent.get(nodeId);
882
- if (parentId === undefined)
883
- return undefined;
884
- // Look up parent in our node list
885
- const parentNode = nodes.find((n) => n.backend_node_id === parentId);
886
- if (parentNode) {
887
- return parentNode.label;
888
- }
889
- // Parent might be further up - check AX tree for parent's name
890
- const parentAx = axTree.get(parentId);
891
- return parentAx?.name;
892
- };
893
- // Container kinds that can be noisy when empty
894
- const containerKinds = new Set(['list', 'listitem']);
895
- // Text kinds that can duplicate parent labels
896
- const textKinds = new Set(['text']);
897
- return nodes.filter((node) => {
898
- // Rule 1: Filter empty container nodes without interactive descendants
899
- if (containerKinds.has(node.kind)) {
900
- const hasSemanticName = node.label && node.label.trim().length > 0;
901
- if (!hasSemanticName) {
902
- const hasInteractive = hasInteractiveDescendant(node.backend_node_id);
903
- if (!hasInteractive) {
904
- return false; // Filter out empty container without interactive content
905
- }
906
- }
907
- }
908
- // Rule 2: Filter text nodes that mirror parent's label
909
- if (textKinds.has(node.kind)) {
910
- const parentLabel = getParentLabel(node.backend_node_id);
911
- if (parentLabel && node.label) {
912
- // Normalize and compare
913
- const normalizedParent = parentLabel.trim().toLowerCase();
914
- const normalizedNode = node.label.trim().toLowerCase();
915
- if (normalizedNode === normalizedParent) {
916
- return false; // Filter out duplicate text
917
- }
918
- }
919
- }
920
- return true; // Keep the node
921
- });
922
- }
923
- }
924
- /**
925
- * Slice nodes to max_nodes budget while preserving high z-index overlay content.
926
- *
927
- * Portal-rendered content (dropdowns, popovers, modals) appears at the end of
928
- * DOM order. On heavy pages, a naive slice truncates it.
929
- *
930
- * Strategy:
931
- * 1. Partition nodes into overlay (z-index > threshold) and main
932
- * 2. Take all overlay nodes (up to 30% of budget)
933
- * 3. Fill remaining budget with main nodes (DOM order)
934
- * 4. Re-sort by original DOM order
935
- */
936
- export function sliceWithOverlayPriority(nodes, maxNodes) {
937
- if (nodes.length <= maxNodes) {
938
- return nodes;
939
- }
940
- const OVERLAY_Z_THRESHOLD = 100;
941
- const MAX_OVERLAY_RATIO = 0.3;
942
- const overlayNodes = [];
943
- const mainNodes = [];
944
- for (const node of nodes) {
945
- const zIndex = node.layout?.zIndex;
946
- if (zIndex !== undefined && zIndex > OVERLAY_Z_THRESHOLD) {
947
- overlayNodes.push(node);
948
- }
949
- else {
950
- mainNodes.push(node);
951
- }
952
- }
953
- // No overlay content → simple slice
954
- if (overlayNodes.length === 0) {
955
- return nodes.slice(0, maxNodes);
956
- }
957
- // Reserve budget for overlay (capped at 30% of total)
958
- const maxOverlay = Math.min(overlayNodes.length, Math.floor(maxNodes * MAX_OVERLAY_RATIO));
959
- const overlaySlice = overlayNodes.slice(0, maxOverlay);
960
- // Fill remaining budget with main content
961
- const mainBudget = maxNodes - overlaySlice.length;
962
- const mainSlice = mainNodes.slice(0, mainBudget);
963
- // Merge and re-sort by original DOM order
964
- const merged = [...mainSlice, ...overlaySlice];
965
- const indexMap = new Map(nodes.map((n, i) => [n.backendNodeId, i]));
966
- merged.sort((a, b) => {
967
- const ia = indexMap.get(a.backendNodeId) ?? Infinity;
968
- const ib = indexMap.get(b.backendNodeId) ?? Infinity;
969
- return ia - ib;
970
- });
971
- return merged;
972
480
  }
973
481
  /**
974
482
  * Export a compile function for simpler usage.