@rpascene/core 0.30.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (200) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +9 -0
  3. package/dist/es/agent/agent.mjs +636 -0
  4. package/dist/es/agent/agent.mjs.map +1 -0
  5. package/dist/es/agent/common.mjs +0 -0
  6. package/dist/es/agent/index.mjs +6 -0
  7. package/dist/es/agent/task-cache.mjs +184 -0
  8. package/dist/es/agent/task-cache.mjs.map +1 -0
  9. package/dist/es/agent/tasks.mjs +666 -0
  10. package/dist/es/agent/tasks.mjs.map +1 -0
  11. package/dist/es/agent/ui-utils.mjs +72 -0
  12. package/dist/es/agent/ui-utils.mjs.map +1 -0
  13. package/dist/es/agent/utils.mjs +162 -0
  14. package/dist/es/agent/utils.mjs.map +1 -0
  15. package/dist/es/ai-model/action-executor.mjs +129 -0
  16. package/dist/es/ai-model/action-executor.mjs.map +1 -0
  17. package/dist/es/ai-model/common.mjs +355 -0
  18. package/dist/es/ai-model/common.mjs.map +1 -0
  19. package/dist/es/ai-model/conversation-history.mjs +58 -0
  20. package/dist/es/ai-model/conversation-history.mjs.map +1 -0
  21. package/dist/es/ai-model/index.mjs +11 -0
  22. package/dist/es/ai-model/inspect.mjs +286 -0
  23. package/dist/es/ai-model/inspect.mjs.map +1 -0
  24. package/dist/es/ai-model/llm-planning.mjs +140 -0
  25. package/dist/es/ai-model/llm-planning.mjs.map +1 -0
  26. package/dist/es/ai-model/prompt/assertion.mjs +31 -0
  27. package/dist/es/ai-model/prompt/assertion.mjs.map +1 -0
  28. package/dist/es/ai-model/prompt/common.mjs +7 -0
  29. package/dist/es/ai-model/prompt/common.mjs.map +1 -0
  30. package/dist/es/ai-model/prompt/describe.mjs +44 -0
  31. package/dist/es/ai-model/prompt/describe.mjs.map +1 -0
  32. package/dist/es/ai-model/prompt/extraction.mjs +140 -0
  33. package/dist/es/ai-model/prompt/extraction.mjs.map +1 -0
  34. package/dist/es/ai-model/prompt/llm-locator.mjs +275 -0
  35. package/dist/es/ai-model/prompt/llm-locator.mjs.map +1 -0
  36. package/dist/es/ai-model/prompt/llm-planning.mjs +367 -0
  37. package/dist/es/ai-model/prompt/llm-planning.mjs.map +1 -0
  38. package/dist/es/ai-model/prompt/llm-section-locator.mjs +47 -0
  39. package/dist/es/ai-model/prompt/llm-section-locator.mjs.map +1 -0
  40. package/dist/es/ai-model/prompt/playwright-generator.mjs +117 -0
  41. package/dist/es/ai-model/prompt/playwright-generator.mjs.map +1 -0
  42. package/dist/es/ai-model/prompt/ui-tars-locator.mjs +34 -0
  43. package/dist/es/ai-model/prompt/ui-tars-locator.mjs.map +1 -0
  44. package/dist/es/ai-model/prompt/ui-tars-planning.mjs +36 -0
  45. package/dist/es/ai-model/prompt/ui-tars-planning.mjs.map +1 -0
  46. package/dist/es/ai-model/prompt/util.mjs +124 -0
  47. package/dist/es/ai-model/prompt/util.mjs.map +1 -0
  48. package/dist/es/ai-model/prompt/yaml-generator.mjs +219 -0
  49. package/dist/es/ai-model/prompt/yaml-generator.mjs.map +1 -0
  50. package/dist/es/ai-model/service-caller/index.mjs +537 -0
  51. package/dist/es/ai-model/service-caller/index.mjs.map +1 -0
  52. package/dist/es/ai-model/ui-tars-planning.mjs +201 -0
  53. package/dist/es/ai-model/ui-tars-planning.mjs.map +1 -0
  54. package/dist/es/device/index.mjs +152 -0
  55. package/dist/es/device/index.mjs.map +1 -0
  56. package/dist/es/image/index.mjs +2 -0
  57. package/dist/es/index.mjs +11 -0
  58. package/dist/es/index.mjs.map +1 -0
  59. package/dist/es/insight/index.mjs +233 -0
  60. package/dist/es/insight/index.mjs.map +1 -0
  61. package/dist/es/insight/utils.mjs +15 -0
  62. package/dist/es/insight/utils.mjs.map +1 -0
  63. package/dist/es/report.mjs +88 -0
  64. package/dist/es/report.mjs.map +1 -0
  65. package/dist/es/tree.mjs +2 -0
  66. package/dist/es/types.mjs +11 -0
  67. package/dist/es/types.mjs.map +1 -0
  68. package/dist/es/utils.mjs +204 -0
  69. package/dist/es/utils.mjs.map +1 -0
  70. package/dist/es/yaml/builder.mjs +13 -0
  71. package/dist/es/yaml/builder.mjs.map +1 -0
  72. package/dist/es/yaml/index.mjs +3 -0
  73. package/dist/es/yaml/player.mjs +372 -0
  74. package/dist/es/yaml/player.mjs.map +1 -0
  75. package/dist/es/yaml/utils.mjs +73 -0
  76. package/dist/es/yaml/utils.mjs.map +1 -0
  77. package/dist/es/yaml.mjs +0 -0
  78. package/dist/lib/agent/agent.js +683 -0
  79. package/dist/lib/agent/agent.js.map +1 -0
  80. package/dist/lib/agent/common.js +5 -0
  81. package/dist/lib/agent/index.js +81 -0
  82. package/dist/lib/agent/index.js.map +1 -0
  83. package/dist/lib/agent/task-cache.js +236 -0
  84. package/dist/lib/agent/task-cache.js.map +1 -0
  85. package/dist/lib/agent/tasks.js +703 -0
  86. package/dist/lib/agent/tasks.js.map +1 -0
  87. package/dist/lib/agent/ui-utils.js +121 -0
  88. package/dist/lib/agent/ui-utils.js.map +1 -0
  89. package/dist/lib/agent/utils.js +233 -0
  90. package/dist/lib/agent/utils.js.map +1 -0
  91. package/dist/lib/ai-model/action-executor.js +163 -0
  92. package/dist/lib/ai-model/action-executor.js.map +1 -0
  93. package/dist/lib/ai-model/common.js +461 -0
  94. package/dist/lib/ai-model/common.js.map +1 -0
  95. package/dist/lib/ai-model/conversation-history.js +92 -0
  96. package/dist/lib/ai-model/conversation-history.js.map +1 -0
  97. package/dist/lib/ai-model/index.js +131 -0
  98. package/dist/lib/ai-model/index.js.map +1 -0
  99. package/dist/lib/ai-model/inspect.js +326 -0
  100. package/dist/lib/ai-model/inspect.js.map +1 -0
  101. package/dist/lib/ai-model/llm-planning.js +174 -0
  102. package/dist/lib/ai-model/llm-planning.js.map +1 -0
  103. package/dist/lib/ai-model/prompt/assertion.js +65 -0
  104. package/dist/lib/ai-model/prompt/assertion.js.map +1 -0
  105. package/dist/lib/ai-model/prompt/common.js +41 -0
  106. package/dist/lib/ai-model/prompt/common.js.map +1 -0
  107. package/dist/lib/ai-model/prompt/describe.js +78 -0
  108. package/dist/lib/ai-model/prompt/describe.js.map +1 -0
  109. package/dist/lib/ai-model/prompt/extraction.js +180 -0
  110. package/dist/lib/ai-model/prompt/extraction.js.map +1 -0
  111. package/dist/lib/ai-model/prompt/llm-locator.js +315 -0
  112. package/dist/lib/ai-model/prompt/llm-locator.js.map +1 -0
  113. package/dist/lib/ai-model/prompt/llm-planning.js +407 -0
  114. package/dist/lib/ai-model/prompt/llm-planning.js.map +1 -0
  115. package/dist/lib/ai-model/prompt/llm-section-locator.js +84 -0
  116. package/dist/lib/ai-model/prompt/llm-section-locator.js.map +1 -0
  117. package/dist/lib/ai-model/prompt/playwright-generator.js +178 -0
  118. package/dist/lib/ai-model/prompt/playwright-generator.js.map +1 -0
  119. package/dist/lib/ai-model/prompt/ui-tars-locator.js +68 -0
  120. package/dist/lib/ai-model/prompt/ui-tars-locator.js.map +1 -0
  121. package/dist/lib/ai-model/prompt/ui-tars-planning.js +73 -0
  122. package/dist/lib/ai-model/prompt/ui-tars-planning.js.map +1 -0
  123. package/dist/lib/ai-model/prompt/util.js +176 -0
  124. package/dist/lib/ai-model/prompt/util.js.map +1 -0
  125. package/dist/lib/ai-model/prompt/yaml-generator.js +280 -0
  126. package/dist/lib/ai-model/prompt/yaml-generator.js.map +1 -0
  127. package/dist/lib/ai-model/service-caller/index.js +623 -0
  128. package/dist/lib/ai-model/service-caller/index.js.map +1 -0
  129. package/dist/lib/ai-model/ui-tars-planning.js +238 -0
  130. package/dist/lib/ai-model/ui-tars-planning.js.map +1 -0
  131. package/dist/lib/device/index.js +255 -0
  132. package/dist/lib/device/index.js.map +1 -0
  133. package/dist/lib/image/index.js +56 -0
  134. package/dist/lib/image/index.js.map +1 -0
  135. package/dist/lib/index.js +103 -0
  136. package/dist/lib/index.js.map +1 -0
  137. package/dist/lib/insight/index.js +267 -0
  138. package/dist/lib/insight/index.js.map +1 -0
  139. package/dist/lib/insight/utils.js +49 -0
  140. package/dist/lib/insight/utils.js.map +1 -0
  141. package/dist/lib/report.js +122 -0
  142. package/dist/lib/report.js.map +1 -0
  143. package/dist/lib/tree.js +44 -0
  144. package/dist/lib/tree.js.map +1 -0
  145. package/dist/lib/types.js +82 -0
  146. package/dist/lib/types.js.map +1 -0
  147. package/dist/lib/utils.js +283 -0
  148. package/dist/lib/utils.js.map +1 -0
  149. package/dist/lib/yaml/builder.js +57 -0
  150. package/dist/lib/yaml/builder.js.map +1 -0
  151. package/dist/lib/yaml/index.js +80 -0
  152. package/dist/lib/yaml/index.js.map +1 -0
  153. package/dist/lib/yaml/player.js +406 -0
  154. package/dist/lib/yaml/player.js.map +1 -0
  155. package/dist/lib/yaml/utils.js +126 -0
  156. package/dist/lib/yaml/utils.js.map +1 -0
  157. package/dist/lib/yaml.js +20 -0
  158. package/dist/lib/yaml.js.map +1 -0
  159. package/dist/types/agent/agent.d.ts +156 -0
  160. package/dist/types/agent/common.d.ts +0 -0
  161. package/dist/types/agent/index.d.ts +9 -0
  162. package/dist/types/agent/task-cache.d.ts +48 -0
  163. package/dist/types/agent/tasks.d.ts +48 -0
  164. package/dist/types/agent/ui-utils.d.ts +7 -0
  165. package/dist/types/agent/utils.d.ts +52 -0
  166. package/dist/types/ai-model/action-executor.d.ts +19 -0
  167. package/dist/types/ai-model/common.d.ts +569 -0
  168. package/dist/types/ai-model/conversation-history.d.ts +18 -0
  169. package/dist/types/ai-model/index.d.ts +13 -0
  170. package/dist/types/ai-model/inspect.d.ts +46 -0
  171. package/dist/types/ai-model/llm-planning.d.ts +11 -0
  172. package/dist/types/ai-model/prompt/assertion.d.ts +2 -0
  173. package/dist/types/ai-model/prompt/common.d.ts +2 -0
  174. package/dist/types/ai-model/prompt/describe.d.ts +1 -0
  175. package/dist/types/ai-model/prompt/extraction.d.ts +4 -0
  176. package/dist/types/ai-model/prompt/llm-locator.d.ts +9 -0
  177. package/dist/types/ai-model/prompt/llm-planning.d.ts +9 -0
  178. package/dist/types/ai-model/prompt/llm-section-locator.d.ts +6 -0
  179. package/dist/types/ai-model/prompt/playwright-generator.d.ts +26 -0
  180. package/dist/types/ai-model/prompt/ui-tars-locator.d.ts +1 -0
  181. package/dist/types/ai-model/prompt/ui-tars-planning.d.ts +2 -0
  182. package/dist/types/ai-model/prompt/util.d.ts +47 -0
  183. package/dist/types/ai-model/prompt/yaml-generator.d.ts +100 -0
  184. package/dist/types/ai-model/service-caller/index.d.ts +48 -0
  185. package/dist/types/ai-model/ui-tars-planning.d.ts +59 -0
  186. package/dist/types/device/index.d.ts +2158 -0
  187. package/dist/types/image/index.d.ts +1 -0
  188. package/dist/types/index.d.ts +12 -0
  189. package/dist/types/insight/index.d.ts +31 -0
  190. package/dist/types/insight/utils.d.ts +2 -0
  191. package/dist/types/report.d.ts +12 -0
  192. package/dist/types/tree.d.ts +1 -0
  193. package/dist/types/types.d.ts +414 -0
  194. package/dist/types/utils.d.ts +40 -0
  195. package/dist/types/yaml/builder.d.ts +2 -0
  196. package/dist/types/yaml/index.d.ts +3 -0
  197. package/dist/types/yaml/player.d.ts +34 -0
  198. package/dist/types/yaml/utils.d.ts +9 -0
  199. package/dist/types/yaml.d.ts +178 -0
  200. package/package.json +108 -0
@@ -0,0 +1,569 @@
1
+ import type { BaseElement, DeviceAction, ElementTreeNode, RpasceneYamlFlowItem, PlanningAction, Rect, Size } from '../types';
2
+ import type { ChatCompletionMessageParam } from 'openai/resources/index';
3
+ import type { PlanningLocateParam } from '../types';
4
+ import type { TVlModeTypes } from '@rpascene/shared/env';
5
+ import { z } from 'zod';
6
+ export type AIArgs = ChatCompletionMessageParam[];
7
+ export declare enum AIActionType {
8
+ ASSERT = 0,
9
+ INSPECT_ELEMENT = 1,
10
+ EXTRACT_DATA = 2,
11
+ PLAN = 3,
12
+ DESCRIBE_ELEMENT = 4,
13
+ TEXT = 5
14
+ }
15
+ export declare function fillBboxParam(locate: PlanningLocateParam, width: number, height: number, rightLimit: number, bottomLimit: number, vlMode: TVlModeTypes | undefined): PlanningLocateParam;
16
+ export declare function adaptQwenBbox(bbox: number[]): [number, number, number, number];
17
+ export declare function adaptDoubaoBbox(bbox: string[] | number[] | string, width: number, height: number): [number, number, number, number];
18
+ export declare function adaptBbox(bbox: number[], width: number, height: number, rightLimit: number, bottomLimit: number, vlMode: TVlModeTypes | undefined): [number, number, number, number];
19
+ export declare function normalized01000(bbox: number[], width: number, height: number): [number, number, number, number];
20
+ export declare function adaptGeminiBbox(bbox: number[], width: number, height: number): [number, number, number, number];
21
+ export declare function adaptBboxToRect(bbox: number[], width: number, height: number, offsetX?: number, offsetY?: number, rightLimit?: number, bottomLimit?: number, vlMode?: TVlModeTypes | undefined): Rect;
22
+ export declare function warnGPT4oSizeLimit(size: Size, modelName: string): void;
23
+ export declare function mergeRects(rects: Rect[]): {
24
+ left: number;
25
+ top: number;
26
+ width: number;
27
+ height: number;
28
+ };
29
+ export declare function expandSearchArea(rect: Rect, screenSize: Size, vlMode: TVlModeTypes | undefined): Rect;
30
+ export declare function markupImageForLLM(screenshotBase64: string, tree: ElementTreeNode<BaseElement>, size: Size): Promise<string>;
31
+ export declare function buildYamlFlowFromPlans(plans: PlanningAction[], actionSpace: DeviceAction<any>[], sleep?: number): RpasceneYamlFlowItem[];
32
+ export declare const PointSchema: z.ZodObject<{
33
+ left: z.ZodNumber;
34
+ top: z.ZodNumber;
35
+ }, "strip", z.ZodTypeAny, {
36
+ left: number;
37
+ top: number;
38
+ }, {
39
+ left: number;
40
+ top: number;
41
+ }>;
42
+ export declare const SizeSchema: z.ZodObject<{
43
+ width: z.ZodNumber;
44
+ height: z.ZodNumber;
45
+ dpr: z.ZodOptional<z.ZodNumber>;
46
+ }, "strip", z.ZodTypeAny, {
47
+ width: number;
48
+ height: number;
49
+ dpr?: number | undefined;
50
+ }, {
51
+ width: number;
52
+ height: number;
53
+ dpr?: number | undefined;
54
+ }>;
55
+ export declare const RectSchema: z.ZodIntersection<z.ZodIntersection<z.ZodObject<{
56
+ left: z.ZodNumber;
57
+ top: z.ZodNumber;
58
+ }, "strip", z.ZodTypeAny, {
59
+ left: number;
60
+ top: number;
61
+ }, {
62
+ left: number;
63
+ top: number;
64
+ }>, z.ZodObject<{
65
+ width: z.ZodNumber;
66
+ height: z.ZodNumber;
67
+ dpr: z.ZodOptional<z.ZodNumber>;
68
+ }, "strip", z.ZodTypeAny, {
69
+ width: number;
70
+ height: number;
71
+ dpr?: number | undefined;
72
+ }, {
73
+ width: number;
74
+ height: number;
75
+ dpr?: number | undefined;
76
+ }>>, z.ZodObject<{
77
+ zoom: z.ZodOptional<z.ZodNumber>;
78
+ }, "strip", z.ZodTypeAny, {
79
+ zoom?: number | undefined;
80
+ }, {
81
+ zoom?: number | undefined;
82
+ }>>;
83
+ export declare const TMultimodalPromptSchema: z.ZodObject<{
84
+ images: z.ZodOptional<z.ZodArray<z.ZodObject<{
85
+ name: z.ZodString;
86
+ url: z.ZodString;
87
+ }, "strip", z.ZodTypeAny, {
88
+ name: string;
89
+ url: string;
90
+ }, {
91
+ name: string;
92
+ url: string;
93
+ }>, "many">>;
94
+ convertHttpImage2Base64: z.ZodOptional<z.ZodBoolean>;
95
+ }, "strip", z.ZodTypeAny, {
96
+ images?: {
97
+ name: string;
98
+ url: string;
99
+ }[] | undefined;
100
+ convertHttpImage2Base64?: boolean | undefined;
101
+ }, {
102
+ images?: {
103
+ name: string;
104
+ url: string;
105
+ }[] | undefined;
106
+ convertHttpImage2Base64?: boolean | undefined;
107
+ }>;
108
+ export declare const TUserPromptSchema: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
109
+ prompt: z.ZodString;
110
+ }, "strip", z.ZodTypeAny, {
111
+ prompt: string;
112
+ }, {
113
+ prompt: string;
114
+ }>, z.ZodObject<{
115
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
116
+ name: z.ZodString;
117
+ url: z.ZodString;
118
+ }, "strip", z.ZodTypeAny, {
119
+ name: string;
120
+ url: string;
121
+ }, {
122
+ name: string;
123
+ url: string;
124
+ }>, "many">>>;
125
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
126
+ }, "strip", z.ZodTypeAny, {
127
+ images?: {
128
+ name: string;
129
+ url: string;
130
+ }[] | undefined;
131
+ convertHttpImage2Base64?: boolean | undefined;
132
+ }, {
133
+ images?: {
134
+ name: string;
135
+ url: string;
136
+ }[] | undefined;
137
+ convertHttpImage2Base64?: boolean | undefined;
138
+ }>>]>;
139
+ export type TMultimodalPrompt = z.infer<typeof TMultimodalPromptSchema>;
140
+ export type TUserPrompt = z.infer<typeof TUserPromptSchema>;
141
+ declare const RpasceneLocationInput: z.ZodObject<{
142
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
143
+ prompt: z.ZodString;
144
+ }, "strip", z.ZodTypeAny, {
145
+ prompt: string;
146
+ }, {
147
+ prompt: string;
148
+ }>, z.ZodObject<{
149
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
150
+ name: z.ZodString;
151
+ url: z.ZodString;
152
+ }, "strip", z.ZodTypeAny, {
153
+ name: string;
154
+ url: string;
155
+ }, {
156
+ name: string;
157
+ url: string;
158
+ }>, "many">>>;
159
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
160
+ }, "strip", z.ZodTypeAny, {
161
+ images?: {
162
+ name: string;
163
+ url: string;
164
+ }[] | undefined;
165
+ convertHttpImage2Base64?: boolean | undefined;
166
+ }, {
167
+ images?: {
168
+ name: string;
169
+ url: string;
170
+ }[] | undefined;
171
+ convertHttpImage2Base64?: boolean | undefined;
172
+ }>>]>;
173
+ deepThink: z.ZodOptional<z.ZodBoolean>;
174
+ cacheable: z.ZodOptional<z.ZodBoolean>;
175
+ xpath: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodBoolean]>>;
176
+ }, "passthrough", z.ZodTypeAny, z.objectOutputType<{
177
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
178
+ prompt: z.ZodString;
179
+ }, "strip", z.ZodTypeAny, {
180
+ prompt: string;
181
+ }, {
182
+ prompt: string;
183
+ }>, z.ZodObject<{
184
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
185
+ name: z.ZodString;
186
+ url: z.ZodString;
187
+ }, "strip", z.ZodTypeAny, {
188
+ name: string;
189
+ url: string;
190
+ }, {
191
+ name: string;
192
+ url: string;
193
+ }>, "many">>>;
194
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
195
+ }, "strip", z.ZodTypeAny, {
196
+ images?: {
197
+ name: string;
198
+ url: string;
199
+ }[] | undefined;
200
+ convertHttpImage2Base64?: boolean | undefined;
201
+ }, {
202
+ images?: {
203
+ name: string;
204
+ url: string;
205
+ }[] | undefined;
206
+ convertHttpImage2Base64?: boolean | undefined;
207
+ }>>]>;
208
+ deepThink: z.ZodOptional<z.ZodBoolean>;
209
+ cacheable: z.ZodOptional<z.ZodBoolean>;
210
+ xpath: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodBoolean]>>;
211
+ }, z.ZodTypeAny, "passthrough">, z.objectInputType<{
212
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
213
+ prompt: z.ZodString;
214
+ }, "strip", z.ZodTypeAny, {
215
+ prompt: string;
216
+ }, {
217
+ prompt: string;
218
+ }>, z.ZodObject<{
219
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
220
+ name: z.ZodString;
221
+ url: z.ZodString;
222
+ }, "strip", z.ZodTypeAny, {
223
+ name: string;
224
+ url: string;
225
+ }, {
226
+ name: string;
227
+ url: string;
228
+ }>, "many">>>;
229
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
230
+ }, "strip", z.ZodTypeAny, {
231
+ images?: {
232
+ name: string;
233
+ url: string;
234
+ }[] | undefined;
235
+ convertHttpImage2Base64?: boolean | undefined;
236
+ }, {
237
+ images?: {
238
+ name: string;
239
+ url: string;
240
+ }[] | undefined;
241
+ convertHttpImage2Base64?: boolean | undefined;
242
+ }>>]>;
243
+ deepThink: z.ZodOptional<z.ZodBoolean>;
244
+ cacheable: z.ZodOptional<z.ZodBoolean>;
245
+ xpath: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodBoolean]>>;
246
+ }, z.ZodTypeAny, "passthrough">>;
247
+ declare const RpasceneLocationResult: z.ZodObject<{
248
+ rpascene_location_field_flag: z.ZodLiteral<true>;
249
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
250
+ prompt: z.ZodString;
251
+ }, "strip", z.ZodTypeAny, {
252
+ prompt: string;
253
+ }, {
254
+ prompt: string;
255
+ }>, z.ZodObject<{
256
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
257
+ name: z.ZodString;
258
+ url: z.ZodString;
259
+ }, "strip", z.ZodTypeAny, {
260
+ name: string;
261
+ url: string;
262
+ }, {
263
+ name: string;
264
+ url: string;
265
+ }>, "many">>>;
266
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
267
+ }, "strip", z.ZodTypeAny, {
268
+ images?: {
269
+ name: string;
270
+ url: string;
271
+ }[] | undefined;
272
+ convertHttpImage2Base64?: boolean | undefined;
273
+ }, {
274
+ images?: {
275
+ name: string;
276
+ url: string;
277
+ }[] | undefined;
278
+ convertHttpImage2Base64?: boolean | undefined;
279
+ }>>]>;
280
+ deepThink: z.ZodOptional<z.ZodBoolean>;
281
+ cacheable: z.ZodOptional<z.ZodBoolean>;
282
+ xpath: z.ZodOptional<z.ZodBoolean>;
283
+ center: z.ZodTuple<[z.ZodNumber, z.ZodNumber], null>;
284
+ rect: z.ZodIntersection<z.ZodIntersection<z.ZodObject<{
285
+ left: z.ZodNumber;
286
+ top: z.ZodNumber;
287
+ }, "strip", z.ZodTypeAny, {
288
+ left: number;
289
+ top: number;
290
+ }, {
291
+ left: number;
292
+ top: number;
293
+ }>, z.ZodObject<{
294
+ width: z.ZodNumber;
295
+ height: z.ZodNumber;
296
+ dpr: z.ZodOptional<z.ZodNumber>;
297
+ }, "strip", z.ZodTypeAny, {
298
+ width: number;
299
+ height: number;
300
+ dpr?: number | undefined;
301
+ }, {
302
+ width: number;
303
+ height: number;
304
+ dpr?: number | undefined;
305
+ }>>, z.ZodObject<{
306
+ zoom: z.ZodOptional<z.ZodNumber>;
307
+ }, "strip", z.ZodTypeAny, {
308
+ zoom?: number | undefined;
309
+ }, {
310
+ zoom?: number | undefined;
311
+ }>>;
312
+ }, "passthrough", z.ZodTypeAny, z.objectOutputType<{
313
+ rpascene_location_field_flag: z.ZodLiteral<true>;
314
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
315
+ prompt: z.ZodString;
316
+ }, "strip", z.ZodTypeAny, {
317
+ prompt: string;
318
+ }, {
319
+ prompt: string;
320
+ }>, z.ZodObject<{
321
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
322
+ name: z.ZodString;
323
+ url: z.ZodString;
324
+ }, "strip", z.ZodTypeAny, {
325
+ name: string;
326
+ url: string;
327
+ }, {
328
+ name: string;
329
+ url: string;
330
+ }>, "many">>>;
331
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
332
+ }, "strip", z.ZodTypeAny, {
333
+ images?: {
334
+ name: string;
335
+ url: string;
336
+ }[] | undefined;
337
+ convertHttpImage2Base64?: boolean | undefined;
338
+ }, {
339
+ images?: {
340
+ name: string;
341
+ url: string;
342
+ }[] | undefined;
343
+ convertHttpImage2Base64?: boolean | undefined;
344
+ }>>]>;
345
+ deepThink: z.ZodOptional<z.ZodBoolean>;
346
+ cacheable: z.ZodOptional<z.ZodBoolean>;
347
+ xpath: z.ZodOptional<z.ZodBoolean>;
348
+ center: z.ZodTuple<[z.ZodNumber, z.ZodNumber], null>;
349
+ rect: z.ZodIntersection<z.ZodIntersection<z.ZodObject<{
350
+ left: z.ZodNumber;
351
+ top: z.ZodNumber;
352
+ }, "strip", z.ZodTypeAny, {
353
+ left: number;
354
+ top: number;
355
+ }, {
356
+ left: number;
357
+ top: number;
358
+ }>, z.ZodObject<{
359
+ width: z.ZodNumber;
360
+ height: z.ZodNumber;
361
+ dpr: z.ZodOptional<z.ZodNumber>;
362
+ }, "strip", z.ZodTypeAny, {
363
+ width: number;
364
+ height: number;
365
+ dpr?: number | undefined;
366
+ }, {
367
+ width: number;
368
+ height: number;
369
+ dpr?: number | undefined;
370
+ }>>, z.ZodObject<{
371
+ zoom: z.ZodOptional<z.ZodNumber>;
372
+ }, "strip", z.ZodTypeAny, {
373
+ zoom?: number | undefined;
374
+ }, {
375
+ zoom?: number | undefined;
376
+ }>>;
377
+ }, z.ZodTypeAny, "passthrough">, z.objectInputType<{
378
+ rpascene_location_field_flag: z.ZodLiteral<true>;
379
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
380
+ prompt: z.ZodString;
381
+ }, "strip", z.ZodTypeAny, {
382
+ prompt: string;
383
+ }, {
384
+ prompt: string;
385
+ }>, z.ZodObject<{
386
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
387
+ name: z.ZodString;
388
+ url: z.ZodString;
389
+ }, "strip", z.ZodTypeAny, {
390
+ name: string;
391
+ url: string;
392
+ }, {
393
+ name: string;
394
+ url: string;
395
+ }>, "many">>>;
396
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
397
+ }, "strip", z.ZodTypeAny, {
398
+ images?: {
399
+ name: string;
400
+ url: string;
401
+ }[] | undefined;
402
+ convertHttpImage2Base64?: boolean | undefined;
403
+ }, {
404
+ images?: {
405
+ name: string;
406
+ url: string;
407
+ }[] | undefined;
408
+ convertHttpImage2Base64?: boolean | undefined;
409
+ }>>]>;
410
+ deepThink: z.ZodOptional<z.ZodBoolean>;
411
+ cacheable: z.ZodOptional<z.ZodBoolean>;
412
+ xpath: z.ZodOptional<z.ZodBoolean>;
413
+ center: z.ZodTuple<[z.ZodNumber, z.ZodNumber], null>;
414
+ rect: z.ZodIntersection<z.ZodIntersection<z.ZodObject<{
415
+ left: z.ZodNumber;
416
+ top: z.ZodNumber;
417
+ }, "strip", z.ZodTypeAny, {
418
+ left: number;
419
+ top: number;
420
+ }, {
421
+ left: number;
422
+ top: number;
423
+ }>, z.ZodObject<{
424
+ width: z.ZodNumber;
425
+ height: z.ZodNumber;
426
+ dpr: z.ZodOptional<z.ZodNumber>;
427
+ }, "strip", z.ZodTypeAny, {
428
+ width: number;
429
+ height: number;
430
+ dpr?: number | undefined;
431
+ }, {
432
+ width: number;
433
+ height: number;
434
+ dpr?: number | undefined;
435
+ }>>, z.ZodObject<{
436
+ zoom: z.ZodOptional<z.ZodNumber>;
437
+ }, "strip", z.ZodTypeAny, {
438
+ zoom?: number | undefined;
439
+ }, {
440
+ zoom?: number | undefined;
441
+ }>>;
442
+ }, z.ZodTypeAny, "passthrough">>;
443
+ export type RpasceneLocationResultType = z.infer<typeof RpasceneLocationResult>;
444
+ export type RpasceneLocationInputType = z.infer<typeof RpasceneLocationInput>;
445
+ /**
446
+ * Returns the schema for locator fields.
447
+ * This now returns the input schema which is more permissive and suitable for validation.
448
+ */
449
+ export declare const getRpasceneLocationSchema: () => z.ZodObject<{
450
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
451
+ prompt: z.ZodString;
452
+ }, "strip", z.ZodTypeAny, {
453
+ prompt: string;
454
+ }, {
455
+ prompt: string;
456
+ }>, z.ZodObject<{
457
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
458
+ name: z.ZodString;
459
+ url: z.ZodString;
460
+ }, "strip", z.ZodTypeAny, {
461
+ name: string;
462
+ url: string;
463
+ }, {
464
+ name: string;
465
+ url: string;
466
+ }>, "many">>>;
467
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
468
+ }, "strip", z.ZodTypeAny, {
469
+ images?: {
470
+ name: string;
471
+ url: string;
472
+ }[] | undefined;
473
+ convertHttpImage2Base64?: boolean | undefined;
474
+ }, {
475
+ images?: {
476
+ name: string;
477
+ url: string;
478
+ }[] | undefined;
479
+ convertHttpImage2Base64?: boolean | undefined;
480
+ }>>]>;
481
+ deepThink: z.ZodOptional<z.ZodBoolean>;
482
+ cacheable: z.ZodOptional<z.ZodBoolean>;
483
+ xpath: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodBoolean]>>;
484
+ }, "passthrough", z.ZodTypeAny, z.objectOutputType<{
485
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
486
+ prompt: z.ZodString;
487
+ }, "strip", z.ZodTypeAny, {
488
+ prompt: string;
489
+ }, {
490
+ prompt: string;
491
+ }>, z.ZodObject<{
492
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
493
+ name: z.ZodString;
494
+ url: z.ZodString;
495
+ }, "strip", z.ZodTypeAny, {
496
+ name: string;
497
+ url: string;
498
+ }, {
499
+ name: string;
500
+ url: string;
501
+ }>, "many">>>;
502
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
503
+ }, "strip", z.ZodTypeAny, {
504
+ images?: {
505
+ name: string;
506
+ url: string;
507
+ }[] | undefined;
508
+ convertHttpImage2Base64?: boolean | undefined;
509
+ }, {
510
+ images?: {
511
+ name: string;
512
+ url: string;
513
+ }[] | undefined;
514
+ convertHttpImage2Base64?: boolean | undefined;
515
+ }>>]>;
516
+ deepThink: z.ZodOptional<z.ZodBoolean>;
517
+ cacheable: z.ZodOptional<z.ZodBoolean>;
518
+ xpath: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodBoolean]>>;
519
+ }, z.ZodTypeAny, "passthrough">, z.objectInputType<{
520
+ prompt: z.ZodUnion<[z.ZodString, z.ZodIntersection<z.ZodObject<{
521
+ prompt: z.ZodString;
522
+ }, "strip", z.ZodTypeAny, {
523
+ prompt: string;
524
+ }, {
525
+ prompt: string;
526
+ }>, z.ZodObject<{
527
+ images: z.ZodOptional<z.ZodOptional<z.ZodArray<z.ZodObject<{
528
+ name: z.ZodString;
529
+ url: z.ZodString;
530
+ }, "strip", z.ZodTypeAny, {
531
+ name: string;
532
+ url: string;
533
+ }, {
534
+ name: string;
535
+ url: string;
536
+ }>, "many">>>;
537
+ convertHttpImage2Base64: z.ZodOptional<z.ZodOptional<z.ZodBoolean>>;
538
+ }, "strip", z.ZodTypeAny, {
539
+ images?: {
540
+ name: string;
541
+ url: string;
542
+ }[] | undefined;
543
+ convertHttpImage2Base64?: boolean | undefined;
544
+ }, {
545
+ images?: {
546
+ name: string;
547
+ url: string;
548
+ }[] | undefined;
549
+ convertHttpImage2Base64?: boolean | undefined;
550
+ }>>]>;
551
+ deepThink: z.ZodOptional<z.ZodBoolean>;
552
+ cacheable: z.ZodOptional<z.ZodBoolean>;
553
+ xpath: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodBoolean]>>;
554
+ }, z.ZodTypeAny, "passthrough">>;
555
+ export declare const ifRpasceneLocatorField: (field: any) => boolean;
556
+ export declare const dumpRpasceneLocatorField: (field: any) => string;
557
+ export declare const findAllRpasceneLocatorField: (zodType?: z.ZodType<any>, requiredOnly?: boolean) => string[];
558
+ export declare const dumpActionParam: (jsonObject: Record<string, any>, zodSchema: z.ZodType<any>) => Record<string, any>;
559
+ export declare const loadActionParam: (jsonObject: Record<string, any>, zodSchema: z.ZodType<any>) => Record<string, any>;
560
+ /**
561
+ * Parse and validate action parameters using Zod schema.
562
+ * All fields are validated through Zod, EXCEPT locator fields which are skipped.
563
+ * Default values defined in the schema are automatically applied.
564
+ *
565
+ * Locator fields are special business logic fields with complex validation requirements,
566
+ * so they are intentionally excluded from Zod parsing and use existing validation logic.
567
+ */
568
+ export declare const parseActionParam: (rawParam: Record<string, any>, zodSchema: z.ZodType<any>) => Record<string, any>;
569
+ export {};
@@ -0,0 +1,18 @@
1
+ import type { ChatCompletionMessageParam } from 'openai/resources/index';
2
+ export interface ConversationHistoryOptions {
3
+ maxUserImageMessages?: number;
4
+ initialMessages?: ChatCompletionMessageParam[];
5
+ }
6
+ export declare class ConversationHistory {
7
+ private readonly maxUserImageMessages;
8
+ private readonly messages;
9
+ constructor(options?: ConversationHistoryOptions);
10
+ append(message: ChatCompletionMessageParam): void;
11
+ seed(messages: ChatCompletionMessageParam[]): void;
12
+ reset(): void;
13
+ snapshot(): ChatCompletionMessageParam[];
14
+ get length(): number;
15
+ [Symbol.iterator](): IterableIterator<ChatCompletionMessageParam>;
16
+ toJSON(): ChatCompletionMessageParam[];
17
+ private pruneOldestUserMessageIfNecessary;
18
+ }
@@ -0,0 +1,13 @@
1
+ export { callAIWithStringResponse, callAIWithObjectResponse, callAI, } from './service-caller/index';
2
+ export { systemPromptToLocateElement } from './prompt/llm-locator';
3
+ export { describeUserPage, elementByPositionWithElementInfo, } from './prompt/util';
4
+ export { generatePlaywrightTest, generatePlaywrightTestStream, } from './prompt/playwright-generator';
5
+ export { generateYamlTest, generateYamlTestStream, } from './prompt/yaml-generator';
6
+ export type { ChatCompletionMessageParam } from 'openai/resources/index';
7
+ export { AiLocateElement, AiExtractElementInfo, AiLocateSection, } from './inspect';
8
+ export { plan } from './llm-planning';
9
+ export { adaptBboxToRect } from './common';
10
+ export { uiTarsPlanning, resizeImageForUiTars } from './ui-tars-planning';
11
+ export { ConversationHistory, type ConversationHistoryOptions, } from './conversation-history';
12
+ export { AIActionType, type AIArgs } from './common';
13
+ export { getRpasceneLocationSchema, type RpasceneLocationResultType, PointSchema, SizeSchema, RectSchema, TMultimodalPromptSchema, TUserPromptSchema, type TMultimodalPrompt, type TUserPrompt, findAllRpasceneLocatorField, dumpActionParam, loadActionParam, parseActionParam, } from './common';
@@ -0,0 +1,46 @@
1
+ import type { AIDataExtractionResponse, AIElementLocatorResponse, AIElementResponse, AIUsageInfo, BaseElement, ElementById, InsightExtractOption, Rect, ReferenceImage, UIContext } from '../types';
2
+ import type { IModelConfig } from '@rpascene/shared/env';
3
+ import type { ChatCompletionSystemMessageParam, ChatCompletionUserMessageParam } from 'openai/resources/index';
4
+ import type { TMultimodalPrompt, TUserPrompt } from './common';
5
+ import { callAIWithObjectResponse } from './service-caller/index';
6
+ export type AIArgs = [
7
+ ChatCompletionSystemMessageParam,
8
+ ...ChatCompletionUserMessageParam[]
9
+ ];
10
+ export declare function AiLocateElement<ElementType extends BaseElement = BaseElement>(options: {
11
+ context: UIContext<ElementType>;
12
+ targetElementDescription: TUserPrompt;
13
+ referenceImage?: ReferenceImage;
14
+ callAIFn: typeof callAIWithObjectResponse<AIElementResponse | [number, number]>;
15
+ searchConfig?: Awaited<ReturnType<typeof AiLocateSection>>;
16
+ modelConfig: IModelConfig;
17
+ }): Promise<{
18
+ parseResult: AIElementLocatorResponse;
19
+ rect?: Rect;
20
+ rawResponse: string;
21
+ elementById: ElementById;
22
+ usage?: AIUsageInfo;
23
+ isOrderSensitive?: boolean;
24
+ }>;
25
+ export declare function AiLocateSection(options: {
26
+ context: UIContext<BaseElement>;
27
+ sectionDescription: TUserPrompt;
28
+ modelConfig: IModelConfig;
29
+ }): Promise<{
30
+ rect?: Rect;
31
+ imageBase64?: string;
32
+ error?: string;
33
+ rawResponse: string;
34
+ usage?: AIUsageInfo;
35
+ }>;
36
+ export declare function AiExtractElementInfo<T, ElementType extends BaseElement = BaseElement>(options: {
37
+ dataQuery: string | Record<string, string>;
38
+ multimodalPrompt?: TMultimodalPrompt;
39
+ context: UIContext<ElementType>;
40
+ extractOption?: InsightExtractOption;
41
+ modelConfig: IModelConfig;
42
+ }): Promise<{
43
+ parseResult: AIDataExtractionResponse<T>;
44
+ elementById: (idOrIndexId: string) => ElementType;
45
+ usage: AIUsageInfo | undefined;
46
+ }>;
@@ -0,0 +1,11 @@
1
+ import type { DeviceAction, InterfaceType, PlanningAIResponse, UIContext } from '../types';
2
+ import type { IModelConfig } from '@rpascene/shared/env';
3
+ import type { ConversationHistory } from './conversation-history';
4
+ export declare function plan(userInstruction: string, opts: {
5
+ context: UIContext;
6
+ interfaceType: InterfaceType;
7
+ actionSpace: DeviceAction<any>[];
8
+ actionContext?: string;
9
+ modelConfig: IModelConfig;
10
+ conversationHistory?: ConversationHistory;
11
+ }): Promise<PlanningAIResponse>;
@@ -0,0 +1,2 @@
1
+ import type { ResponseFormatJSONSchema } from 'openai/resources/index';
2
+ export declare const assertSchema: ResponseFormatJSONSchema;
@@ -0,0 +1,2 @@
1
+ import type { TVlModeTypes } from '@rpascene/shared/env';
2
+ export declare function bboxDescription(vlMode: TVlModeTypes | undefined): "box_2d bounding box for the target element, should be [ymin, xmin, ymax, xmax] normalized to 0-1000." | "2d bounding box as [xmin, ymin, xmax, ymax]";
@@ -0,0 +1 @@
1
+ export declare const elementDescriberInstruction: () => string;
@@ -0,0 +1,4 @@
1
+ import type { ResponseFormatJSONSchema } from 'openai/resources/index';
2
+ export declare function systemPromptToExtract(): string;
3
+ export declare const extractDataQueryPrompt: (pageDescription: string, dataQuery: string | Record<string, string>) => Promise<string>;
4
+ export declare const extractDataSchema: ResponseFormatJSONSchema;
@@ -0,0 +1,9 @@
1
+ import { PromptTemplate } from '@langchain/core/prompts';
2
+ import type { TVlModeTypes } from '@rpascene/shared/env';
3
+ import type { ResponseFormatJSONSchema } from 'openai/resources/index';
4
+ export declare function systemPromptToLocateElement(vlMode: TVlModeTypes | undefined): string;
5
+ export declare const locatorSchema: ResponseFormatJSONSchema;
6
+ export declare const findElementPrompt: PromptTemplate<{
7
+ pageDescription: any;
8
+ targetElementDescription: any;
9
+ }, any>;