@donggui/core 1.5.4-donggui.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/README.md +9 -0
- package/dist/es/agent/agent.mjs +709 -0
- package/dist/es/agent/agent.mjs.map +1 -0
- package/dist/es/agent/common.mjs +0 -0
- package/dist/es/agent/execution-session.mjs +41 -0
- package/dist/es/agent/execution-session.mjs.map +1 -0
- package/dist/es/agent/index.mjs +6 -0
- package/dist/es/agent/task-builder.mjs +330 -0
- package/dist/es/agent/task-builder.mjs.map +1 -0
- package/dist/es/agent/task-cache.mjs +186 -0
- package/dist/es/agent/task-cache.mjs.map +1 -0
- package/dist/es/agent/tasks.mjs +422 -0
- package/dist/es/agent/tasks.mjs.map +1 -0
- package/dist/es/agent/ui-utils.mjs +91 -0
- package/dist/es/agent/ui-utils.mjs.map +1 -0
- package/dist/es/agent/utils.mjs +198 -0
- package/dist/es/agent/utils.mjs.map +1 -0
- package/dist/es/ai-model/auto-glm/actions.mjs +224 -0
- package/dist/es/ai-model/auto-glm/actions.mjs.map +1 -0
- package/dist/es/ai-model/auto-glm/index.mjs +6 -0
- package/dist/es/ai-model/auto-glm/parser.mjs +239 -0
- package/dist/es/ai-model/auto-glm/parser.mjs.map +1 -0
- package/dist/es/ai-model/auto-glm/planning.mjs +71 -0
- package/dist/es/ai-model/auto-glm/planning.mjs.map +1 -0
- package/dist/es/ai-model/auto-glm/prompt.mjs +222 -0
- package/dist/es/ai-model/auto-glm/prompt.mjs.map +1 -0
- package/dist/es/ai-model/auto-glm/util.mjs +9 -0
- package/dist/es/ai-model/auto-glm/util.mjs.map +1 -0
- package/dist/es/ai-model/conversation-history.mjs +195 -0
- package/dist/es/ai-model/conversation-history.mjs.map +1 -0
- package/dist/es/ai-model/index.mjs +11 -0
- package/dist/es/ai-model/inspect.mjs +386 -0
- package/dist/es/ai-model/inspect.mjs.map +1 -0
- package/dist/es/ai-model/llm-planning.mjs +233 -0
- package/dist/es/ai-model/llm-planning.mjs.map +1 -0
- package/dist/es/ai-model/prompt/common.mjs +7 -0
- package/dist/es/ai-model/prompt/common.mjs.map +1 -0
- package/dist/es/ai-model/prompt/describe.mjs +66 -0
- package/dist/es/ai-model/prompt/describe.mjs.map +1 -0
- package/dist/es/ai-model/prompt/extraction.mjs +129 -0
- package/dist/es/ai-model/prompt/extraction.mjs.map +1 -0
- package/dist/es/ai-model/prompt/llm-locator.mjs +51 -0
- package/dist/es/ai-model/prompt/llm-locator.mjs.map +1 -0
- package/dist/es/ai-model/prompt/llm-planning.mjs +364 -0
- package/dist/es/ai-model/prompt/llm-planning.mjs.map +1 -0
- package/dist/es/ai-model/prompt/llm-section-locator.mjs +44 -0
- package/dist/es/ai-model/prompt/llm-section-locator.mjs.map +1 -0
- package/dist/es/ai-model/prompt/order-sensitive-judge.mjs +35 -0
- package/dist/es/ai-model/prompt/order-sensitive-judge.mjs.map +1 -0
- package/dist/es/ai-model/prompt/playwright-generator.mjs +117 -0
- package/dist/es/ai-model/prompt/playwright-generator.mjs.map +1 -0
- package/dist/es/ai-model/prompt/ui-tars-planning.mjs +36 -0
- package/dist/es/ai-model/prompt/ui-tars-planning.mjs.map +1 -0
- package/dist/es/ai-model/prompt/util.mjs +59 -0
- package/dist/es/ai-model/prompt/util.mjs.map +1 -0
- package/dist/es/ai-model/prompt/yaml-generator.mjs +219 -0
- package/dist/es/ai-model/prompt/yaml-generator.mjs.map +1 -0
- package/dist/es/ai-model/service-caller/index.mjs +466 -0
- package/dist/es/ai-model/service-caller/index.mjs.map +1 -0
- package/dist/es/ai-model/ui-tars-planning.mjs +249 -0
- package/dist/es/ai-model/ui-tars-planning.mjs.map +1 -0
- package/dist/es/common.mjs +371 -0
- package/dist/es/common.mjs.map +1 -0
- package/dist/es/device/device-options.mjs +0 -0
- package/dist/es/device/index.mjs +300 -0
- package/dist/es/device/index.mjs.map +1 -0
- package/dist/es/dump/html-utils.mjs +211 -0
- package/dist/es/dump/html-utils.mjs.map +1 -0
- package/dist/es/dump/image-restoration.mjs +43 -0
- package/dist/es/dump/image-restoration.mjs.map +1 -0
- package/dist/es/dump/index.mjs +3 -0
- package/dist/es/index.mjs +15 -0
- package/dist/es/index.mjs.map +1 -0
- package/dist/es/report-generator.mjs +134 -0
- package/dist/es/report-generator.mjs.map +1 -0
- package/dist/es/report.mjs +111 -0
- package/dist/es/report.mjs.map +1 -0
- package/dist/es/screenshot-item.mjs +105 -0
- package/dist/es/screenshot-item.mjs.map +1 -0
- package/dist/es/service/index.mjs +256 -0
- package/dist/es/service/index.mjs.map +1 -0
- package/dist/es/service/utils.mjs +15 -0
- package/dist/es/service/utils.mjs.map +1 -0
- package/dist/es/skill/index.mjs +38 -0
- package/dist/es/skill/index.mjs.map +1 -0
- package/dist/es/task-runner.mjs +258 -0
- package/dist/es/task-runner.mjs.map +1 -0
- package/dist/es/task-timing.mjs +12 -0
- package/dist/es/task-timing.mjs.map +1 -0
- package/dist/es/tree.mjs +13 -0
- package/dist/es/tree.mjs.map +1 -0
- package/dist/es/types.mjs +196 -0
- package/dist/es/types.mjs.map +1 -0
- package/dist/es/utils.mjs +218 -0
- package/dist/es/utils.mjs.map +1 -0
- package/dist/es/yaml/builder.mjs +13 -0
- package/dist/es/yaml/builder.mjs.map +1 -0
- package/dist/es/yaml/index.mjs +4 -0
- package/dist/es/yaml/player.mjs +418 -0
- package/dist/es/yaml/player.mjs.map +1 -0
- package/dist/es/yaml/utils.mjs +73 -0
- package/dist/es/yaml/utils.mjs.map +1 -0
- package/dist/es/yaml.mjs +0 -0
- package/dist/lib/agent/agent.js +757 -0
- package/dist/lib/agent/agent.js.map +1 -0
- package/dist/lib/agent/common.js +5 -0
- package/dist/lib/agent/execution-session.js +75 -0
- package/dist/lib/agent/execution-session.js.map +1 -0
- package/dist/lib/agent/index.js +81 -0
- package/dist/lib/agent/index.js.map +1 -0
- package/dist/lib/agent/task-builder.js +367 -0
- package/dist/lib/agent/task-builder.js.map +1 -0
- package/dist/lib/agent/task-cache.js +238 -0
- package/dist/lib/agent/task-cache.js.map +1 -0
- package/dist/lib/agent/tasks.js +465 -0
- package/dist/lib/agent/tasks.js.map +1 -0
- package/dist/lib/agent/ui-utils.js +143 -0
- package/dist/lib/agent/ui-utils.js.map +1 -0
- package/dist/lib/agent/utils.js +275 -0
- package/dist/lib/agent/utils.js.map +1 -0
- package/dist/lib/ai-model/auto-glm/actions.js +258 -0
- package/dist/lib/ai-model/auto-glm/actions.js.map +1 -0
- package/dist/lib/ai-model/auto-glm/index.js +66 -0
- package/dist/lib/ai-model/auto-glm/index.js.map +1 -0
- package/dist/lib/ai-model/auto-glm/parser.js +282 -0
- package/dist/lib/ai-model/auto-glm/parser.js.map +1 -0
- package/dist/lib/ai-model/auto-glm/planning.js +105 -0
- package/dist/lib/ai-model/auto-glm/planning.js.map +1 -0
- package/dist/lib/ai-model/auto-glm/prompt.js +259 -0
- package/dist/lib/ai-model/auto-glm/prompt.js.map +1 -0
- package/dist/lib/ai-model/auto-glm/util.js +46 -0
- package/dist/lib/ai-model/auto-glm/util.js.map +1 -0
- package/dist/lib/ai-model/conversation-history.js +229 -0
- package/dist/lib/ai-model/conversation-history.js.map +1 -0
- package/dist/lib/ai-model/index.js +125 -0
- package/dist/lib/ai-model/index.js.map +1 -0
- package/dist/lib/ai-model/inspect.js +429 -0
- package/dist/lib/ai-model/inspect.js.map +1 -0
- package/dist/lib/ai-model/llm-planning.js +270 -0
- package/dist/lib/ai-model/llm-planning.js.map +1 -0
- package/dist/lib/ai-model/prompt/common.js +41 -0
- package/dist/lib/ai-model/prompt/common.js.map +1 -0
- package/dist/lib/ai-model/prompt/describe.js +100 -0
- package/dist/lib/ai-model/prompt/describe.js.map +1 -0
- package/dist/lib/ai-model/prompt/extraction.js +169 -0
- package/dist/lib/ai-model/prompt/extraction.js.map +1 -0
- package/dist/lib/ai-model/prompt/llm-locator.js +88 -0
- package/dist/lib/ai-model/prompt/llm-locator.js.map +1 -0
- package/dist/lib/ai-model/prompt/llm-planning.js +401 -0
- package/dist/lib/ai-model/prompt/llm-planning.js.map +1 -0
- package/dist/lib/ai-model/prompt/llm-section-locator.js +81 -0
- package/dist/lib/ai-model/prompt/llm-section-locator.js.map +1 -0
- package/dist/lib/ai-model/prompt/order-sensitive-judge.js +72 -0
- package/dist/lib/ai-model/prompt/order-sensitive-judge.js.map +1 -0
- package/dist/lib/ai-model/prompt/playwright-generator.js +178 -0
- package/dist/lib/ai-model/prompt/playwright-generator.js.map +1 -0
- package/dist/lib/ai-model/prompt/ui-tars-planning.js +73 -0
- package/dist/lib/ai-model/prompt/ui-tars-planning.js.map +1 -0
- package/dist/lib/ai-model/prompt/util.js +105 -0
- package/dist/lib/ai-model/prompt/util.js.map +1 -0
- package/dist/lib/ai-model/prompt/yaml-generator.js +280 -0
- package/dist/lib/ai-model/prompt/yaml-generator.js.map +1 -0
- package/dist/lib/ai-model/service-caller/index.js +531 -0
- package/dist/lib/ai-model/service-caller/index.js.map +1 -0
- package/dist/lib/ai-model/ui-tars-planning.js +283 -0
- package/dist/lib/ai-model/ui-tars-planning.js.map +1 -0
- package/dist/lib/common.js +480 -0
- package/dist/lib/common.js.map +1 -0
- package/dist/lib/device/device-options.js +20 -0
- package/dist/lib/device/device-options.js.map +1 -0
- package/dist/lib/device/index.js +418 -0
- package/dist/lib/device/index.js.map +1 -0
- package/dist/lib/dump/html-utils.js +281 -0
- package/dist/lib/dump/html-utils.js.map +1 -0
- package/dist/lib/dump/image-restoration.js +77 -0
- package/dist/lib/dump/image-restoration.js.map +1 -0
- package/dist/lib/dump/index.js +60 -0
- package/dist/lib/dump/index.js.map +1 -0
- package/dist/lib/index.js +146 -0
- package/dist/lib/index.js.map +1 -0
- package/dist/lib/report-generator.js +172 -0
- package/dist/lib/report-generator.js.map +1 -0
- package/dist/lib/report.js +145 -0
- package/dist/lib/report.js.map +1 -0
- package/dist/lib/screenshot-item.js +139 -0
- package/dist/lib/screenshot-item.js.map +1 -0
- package/dist/lib/service/index.js +290 -0
- package/dist/lib/service/index.js.map +1 -0
- package/dist/lib/service/utils.js +49 -0
- package/dist/lib/service/utils.js.map +1 -0
- package/dist/lib/skill/index.js +72 -0
- package/dist/lib/skill/index.js.map +1 -0
- package/dist/lib/task-runner.js +295 -0
- package/dist/lib/task-runner.js.map +1 -0
- package/dist/lib/task-timing.js +46 -0
- package/dist/lib/task-timing.js.map +1 -0
- package/dist/lib/tree.js +53 -0
- package/dist/lib/tree.js.map +1 -0
- package/dist/lib/types.js +285 -0
- package/dist/lib/types.js.map +1 -0
- package/dist/lib/utils.js +297 -0
- package/dist/lib/utils.js.map +1 -0
- package/dist/lib/yaml/builder.js +57 -0
- package/dist/lib/yaml/builder.js.map +1 -0
- package/dist/lib/yaml/index.js +81 -0
- package/dist/lib/yaml/index.js.map +1 -0
- package/dist/lib/yaml/player.js +452 -0
- package/dist/lib/yaml/player.js.map +1 -0
- package/dist/lib/yaml/utils.js +126 -0
- package/dist/lib/yaml/utils.js.map +1 -0
- package/dist/lib/yaml.js +20 -0
- package/dist/lib/yaml.js.map +1 -0
- package/dist/types/agent/agent.d.ts +190 -0
- package/dist/types/agent/common.d.ts +0 -0
- package/dist/types/agent/execution-session.d.ts +36 -0
- package/dist/types/agent/index.d.ts +10 -0
- package/dist/types/agent/task-builder.d.ts +34 -0
- package/dist/types/agent/task-cache.d.ts +48 -0
- package/dist/types/agent/tasks.d.ts +70 -0
- package/dist/types/agent/ui-utils.d.ts +14 -0
- package/dist/types/agent/utils.d.ts +29 -0
- package/dist/types/ai-model/auto-glm/actions.d.ts +77 -0
- package/dist/types/ai-model/auto-glm/index.d.ts +6 -0
- package/dist/types/ai-model/auto-glm/parser.d.ts +18 -0
- package/dist/types/ai-model/auto-glm/planning.d.ts +10 -0
- package/dist/types/ai-model/auto-glm/prompt.d.ts +27 -0
- package/dist/types/ai-model/auto-glm/util.d.ts +13 -0
- package/dist/types/ai-model/conversation-history.d.ts +105 -0
- package/dist/types/ai-model/index.d.ts +14 -0
- package/dist/types/ai-model/inspect.d.ts +58 -0
- package/dist/types/ai-model/llm-planning.d.ts +19 -0
- package/dist/types/ai-model/prompt/common.d.ts +2 -0
- package/dist/types/ai-model/prompt/describe.d.ts +1 -0
- package/dist/types/ai-model/prompt/extraction.d.ts +7 -0
- package/dist/types/ai-model/prompt/llm-locator.d.ts +3 -0
- package/dist/types/ai-model/prompt/llm-planning.d.ts +10 -0
- package/dist/types/ai-model/prompt/llm-section-locator.d.ts +3 -0
- package/dist/types/ai-model/prompt/order-sensitive-judge.d.ts +2 -0
- package/dist/types/ai-model/prompt/playwright-generator.d.ts +26 -0
- package/dist/types/ai-model/prompt/ui-tars-planning.d.ts +2 -0
- package/dist/types/ai-model/prompt/util.d.ts +33 -0
- package/dist/types/ai-model/prompt/yaml-generator.d.ts +100 -0
- package/dist/types/ai-model/service-caller/index.d.ts +49 -0
- package/dist/types/ai-model/ui-tars-planning.d.ts +72 -0
- package/dist/types/common.d.ts +288 -0
- package/dist/types/device/device-options.d.ts +142 -0
- package/dist/types/device/index.d.ts +2315 -0
- package/dist/types/dump/html-utils.d.ts +52 -0
- package/dist/types/dump/image-restoration.d.ts +6 -0
- package/dist/types/dump/index.d.ts +5 -0
- package/dist/types/index.d.ts +17 -0
- package/dist/types/report-generator.d.ts +48 -0
- package/dist/types/report.d.ts +15 -0
- package/dist/types/screenshot-item.d.ts +66 -0
- package/dist/types/service/index.d.ts +23 -0
- package/dist/types/service/utils.d.ts +2 -0
- package/dist/types/skill/index.d.ts +25 -0
- package/dist/types/task-runner.d.ts +48 -0
- package/dist/types/task-timing.d.ts +8 -0
- package/dist/types/tree.d.ts +4 -0
- package/dist/types/types.d.ts +645 -0
- package/dist/types/utils.d.ts +40 -0
- package/dist/types/yaml/builder.d.ts +2 -0
- package/dist/types/yaml/index.d.ts +4 -0
- package/dist/types/yaml/player.d.ts +34 -0
- package/dist/types/yaml/utils.d.ts +9 -0
- package/dist/types/yaml.d.ts +203 -0
- package/package.json +111 -0
|
@@ -0,0 +1,105 @@
|
|
|
1
|
+
import { readFileSync } from "node:fs";
|
|
2
|
+
import { uuid } from "@midscene/shared/utils";
|
|
3
|
+
import { extractImageByIdSync } from "./dump/html-utils.mjs";
|
|
4
|
+
function _define_property(obj, key, value) {
|
|
5
|
+
if (key in obj) Object.defineProperty(obj, key, {
|
|
6
|
+
value: value,
|
|
7
|
+
enumerable: true,
|
|
8
|
+
configurable: true,
|
|
9
|
+
writable: true
|
|
10
|
+
});
|
|
11
|
+
else obj[key] = value;
|
|
12
|
+
return obj;
|
|
13
|
+
}
|
|
14
|
+
function detectFormat(base64) {
|
|
15
|
+
if (base64.startsWith('data:image/jpeg')) return 'jpeg';
|
|
16
|
+
if (base64.startsWith('data:image/jpg')) return 'jpeg';
|
|
17
|
+
return 'png';
|
|
18
|
+
}
|
|
19
|
+
class ScreenshotItem {
|
|
20
|
+
static create(base64, capturedAt) {
|
|
21
|
+
return new ScreenshotItem(uuid(), base64, capturedAt);
|
|
22
|
+
}
|
|
23
|
+
get id() {
|
|
24
|
+
return this._id;
|
|
25
|
+
}
|
|
26
|
+
get format() {
|
|
27
|
+
return this._format;
|
|
28
|
+
}
|
|
29
|
+
get extension() {
|
|
30
|
+
return 'jpeg' === this._format ? 'jpeg' : 'png';
|
|
31
|
+
}
|
|
32
|
+
get capturedAt() {
|
|
33
|
+
return this._capturedAt;
|
|
34
|
+
}
|
|
35
|
+
get base64() {
|
|
36
|
+
if (null !== this._base64) return this._base64;
|
|
37
|
+
if (null !== this._persistedPath) {
|
|
38
|
+
const buffer = readFileSync(this._persistedPath);
|
|
39
|
+
return `data:image/${this._format};base64,${buffer.toString('base64')}`;
|
|
40
|
+
}
|
|
41
|
+
if (null !== this._persistedHtmlPath) {
|
|
42
|
+
const data = extractImageByIdSync(this._persistedHtmlPath, this._id);
|
|
43
|
+
if (data) return data;
|
|
44
|
+
throw new Error(`Screenshot ${this._id}: cannot recover from HTML (id not found in ${this._persistedHtmlPath})`);
|
|
45
|
+
}
|
|
46
|
+
throw new Error(`Screenshot ${this._id}: base64 data released without recovery path`);
|
|
47
|
+
}
|
|
48
|
+
hasBase64() {
|
|
49
|
+
return null !== this._base64;
|
|
50
|
+
}
|
|
51
|
+
markPersistedInline(htmlPath) {
|
|
52
|
+
this._persistedAs = {
|
|
53
|
+
$screenshot: this._id,
|
|
54
|
+
capturedAt: this._capturedAt
|
|
55
|
+
};
|
|
56
|
+
this._persistedHtmlPath = htmlPath;
|
|
57
|
+
this._base64 = null;
|
|
58
|
+
}
|
|
59
|
+
markPersistedToPath(relativePath, absolutePath) {
|
|
60
|
+
this._persistedAs = {
|
|
61
|
+
base64: relativePath,
|
|
62
|
+
capturedAt: this._capturedAt
|
|
63
|
+
};
|
|
64
|
+
this._persistedPath = absolutePath;
|
|
65
|
+
this._base64 = null;
|
|
66
|
+
}
|
|
67
|
+
toSerializable() {
|
|
68
|
+
return this._persistedAs ?? {
|
|
69
|
+
$screenshot: this._id,
|
|
70
|
+
capturedAt: this._capturedAt
|
|
71
|
+
};
|
|
72
|
+
}
|
|
73
|
+
static isSerialized(value) {
|
|
74
|
+
if ('object' != typeof value || null === value) return false;
|
|
75
|
+
const record = value;
|
|
76
|
+
if ('$screenshot' in record && 'string' == typeof record.$screenshot) {
|
|
77
|
+
if (!('capturedAt' in record) || 'number' != typeof record.capturedAt) return false;
|
|
78
|
+
return true;
|
|
79
|
+
}
|
|
80
|
+
if ('base64' in record && 'string' == typeof record.base64) {
|
|
81
|
+
if (!('capturedAt' in record) || 'number' != typeof record.capturedAt) return false;
|
|
82
|
+
return true;
|
|
83
|
+
}
|
|
84
|
+
return false;
|
|
85
|
+
}
|
|
86
|
+
get rawBase64() {
|
|
87
|
+
return this.base64.replace(/^data:image\/(png|jpeg|jpg);base64,/, '');
|
|
88
|
+
}
|
|
89
|
+
constructor(id, base64, capturedAt){
|
|
90
|
+
_define_property(this, "_id", void 0);
|
|
91
|
+
_define_property(this, "_base64", void 0);
|
|
92
|
+
_define_property(this, "_format", void 0);
|
|
93
|
+
_define_property(this, "_capturedAt", void 0);
|
|
94
|
+
_define_property(this, "_persistedAs", null);
|
|
95
|
+
_define_property(this, "_persistedPath", null);
|
|
96
|
+
_define_property(this, "_persistedHtmlPath", null);
|
|
97
|
+
this._id = id;
|
|
98
|
+
this._base64 = base64;
|
|
99
|
+
this._format = detectFormat(base64);
|
|
100
|
+
this._capturedAt = capturedAt;
|
|
101
|
+
}
|
|
102
|
+
}
|
|
103
|
+
export { ScreenshotItem };
|
|
104
|
+
|
|
105
|
+
//# sourceMappingURL=screenshot-item.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"screenshot-item.mjs","sources":["../../src/screenshot-item.ts"],"sourcesContent":["import { readFileSync } from 'node:fs';\nimport { uuid } from '@midscene/shared/utils';\nimport { extractImageByIdSync } from './dump/html-utils';\n\n/**\n * Serialization format for ScreenshotItem\n * - { $screenshot: \"id\" } - inline mode, references imageMap in HTML\n * - { base64: \"path\" } - directory mode, references external file path\n */\nexport type ScreenshotSerializeFormat =\n | { $screenshot: string; capturedAt: number }\n | { base64: string; capturedAt: number };\n\n/**\n * Detect image format from base64 data URI prefix.\n */\nfunction detectFormat(base64: string): 'png' | 'jpeg' {\n if (base64.startsWith('data:image/jpeg')) return 'jpeg';\n if (base64.startsWith('data:image/jpg')) return 'jpeg';\n return 'png';\n}\n\n/**\n * ScreenshotItem encapsulates screenshot data.\n *\n * Supports lazy loading after memory release:\n * - inline mode: reads from HTML file using streaming (extractImageByIdSync)\n * - directory mode: reads from file on disk\n *\n * After persistence, memory is released but the screenshot can be recovered\n * on-demand from disk, making it safe to release memory at any time.\n */\nexport class ScreenshotItem {\n private _id: string;\n private _base64: string | null;\n private _format: 'png' | 'jpeg';\n private _capturedAt: number;\n private _persistedAs: ScreenshotSerializeFormat | null = null;\n private _persistedPath: string | null = null;\n private _persistedHtmlPath: string | null = null;\n\n private constructor(id: string, base64: string, capturedAt: number) {\n this._id = id;\n this._base64 = base64;\n this._format = detectFormat(base64);\n this._capturedAt = capturedAt;\n }\n\n /** Create a new ScreenshotItem from base64 data */\n static create(base64: string, capturedAt: number): ScreenshotItem {\n return new ScreenshotItem(uuid(), base64, capturedAt);\n }\n\n get id(): string {\n return this._id;\n }\n\n /** Get the image format (png or jpeg) */\n get format(): 'png' | 'jpeg' {\n return this._format;\n }\n\n /** Get the file extension for this screenshot */\n get extension(): string {\n return this._format === 'jpeg' ? 'jpeg' : 'png';\n }\n\n /** Get screenshot capture timestamp in milliseconds */\n get capturedAt(): number {\n return this._capturedAt;\n }\n\n get base64(): string {\n // If data is in memory, return it directly\n if (this._base64 !== null) {\n return this._base64;\n }\n\n // Directory mode: recover from file\n if (this._persistedPath !== null) {\n const buffer = readFileSync(this._persistedPath);\n return `data:image/${this._format};base64,${buffer.toString('base64')}`;\n }\n\n // Inline mode: recover from HTML file using streaming\n if (this._persistedHtmlPath !== null) {\n const data = extractImageByIdSync(this._persistedHtmlPath, this._id);\n if (data) {\n return data;\n }\n throw new Error(\n `Screenshot ${this._id}: cannot recover from HTML (id not found in ${this._persistedHtmlPath})`,\n );\n }\n\n throw new Error(\n `Screenshot ${this._id}: base64 data released without recovery path`,\n );\n }\n\n /** Check if base64 data is still available in memory (not yet released) */\n hasBase64(): boolean {\n return this._base64 !== null;\n }\n\n /**\n * Mark as persisted to HTML (inline mode).\n * Releases base64 memory, but keeps HTML path for lazy loading recovery.\n * @param htmlPath - absolute path to the HTML file containing the image\n */\n markPersistedInline(htmlPath: string): void {\n this._persistedAs = {\n $screenshot: this._id,\n capturedAt: this._capturedAt,\n };\n this._persistedHtmlPath = htmlPath;\n this._base64 = null;\n }\n\n /**\n * Mark as persisted to file (directory mode).\n * Releases base64 memory, but keeps file path for lazy loading recovery.\n * @param relativePath - relative path for serialization (e.g., \"./screenshots/id.jpeg\")\n * @param absolutePath - absolute path for lazy loading recovery\n */\n markPersistedToPath(relativePath: string, absolutePath: string): void {\n this._persistedAs = {\n base64: relativePath,\n capturedAt: this._capturedAt,\n };\n this._persistedPath = absolutePath;\n this._base64 = null;\n }\n\n /** Serialize for JSON - format depends on persistence state */\n toSerializable(): ScreenshotSerializeFormat {\n return (\n this._persistedAs ?? {\n $screenshot: this._id,\n capturedAt: this._capturedAt,\n }\n );\n }\n\n /** Check if a value is a serialized ScreenshotItem reference (inline or directory mode) */\n static isSerialized(value: unknown): value is ScreenshotSerializeFormat {\n if (typeof value !== 'object' || value === null) return false;\n const record = value as Record<string, unknown>;\n // Check for inline mode: { $screenshot: string }\n if ('$screenshot' in record && typeof record.$screenshot === 'string') {\n if (!('capturedAt' in record) || typeof record.capturedAt !== 'number') {\n return false;\n }\n return true;\n }\n // Check for directory mode: { base64: string } where base64 is a path\n if ('base64' in record && typeof record.base64 === 'string') {\n if (!('capturedAt' in record) || typeof record.capturedAt !== 'number') {\n return false;\n }\n return true;\n }\n return false;\n }\n\n /**\n * Get base64 data without the data URI prefix.\n * Useful for writing raw binary data to files.\n */\n get rawBase64(): string {\n return this.base64.replace(/^data:image\\/(png|jpeg|jpg);base64,/, '');\n }\n}\n"],"names":["detectFormat","base64","ScreenshotItem","capturedAt","uuid","buffer","readFileSync","data","extractImageByIdSync","Error","htmlPath","relativePath","absolutePath","value","record","id"],"mappings":";;;;;;;;;;;;;AAgBA,SAASA,aAAaC,MAAc;IAClC,IAAIA,OAAO,UAAU,CAAC,oBAAoB,OAAO;IACjD,IAAIA,OAAO,UAAU,CAAC,mBAAmB,OAAO;IAChD,OAAO;AACT;AAYO,MAAMC;IAiBX,OAAO,OAAOD,MAAc,EAAEE,UAAkB,EAAkB;QAChE,OAAO,IAAID,eAAeE,QAAQH,QAAQE;IAC5C;IAEA,IAAI,KAAa;QACf,OAAO,IAAI,CAAC,GAAG;IACjB;IAGA,IAAI,SAAyB;QAC3B,OAAO,IAAI,CAAC,OAAO;IACrB;IAGA,IAAI,YAAoB;QACtB,OAAO,AAAiB,WAAjB,IAAI,CAAC,OAAO,GAAc,SAAS;IAC5C;IAGA,IAAI,aAAqB;QACvB,OAAO,IAAI,CAAC,WAAW;IACzB;IAEA,IAAI,SAAiB;QAEnB,IAAI,AAAiB,SAAjB,IAAI,CAAC,OAAO,EACd,OAAO,IAAI,CAAC,OAAO;QAIrB,IAAI,AAAwB,SAAxB,IAAI,CAAC,cAAc,EAAW;YAChC,MAAME,SAASC,aAAa,IAAI,CAAC,cAAc;YAC/C,OAAO,CAAC,WAAW,EAAE,IAAI,CAAC,OAAO,CAAC,QAAQ,EAAED,OAAO,QAAQ,CAAC,WAAW;QACzE;QAGA,IAAI,AAA4B,SAA5B,IAAI,CAAC,kBAAkB,EAAW;YACpC,MAAME,OAAOC,qBAAqB,IAAI,CAAC,kBAAkB,EAAE,IAAI,CAAC,GAAG;YACnE,IAAID,MACF,OAAOA;YAET,MAAM,IAAIE,MACR,CAAC,WAAW,EAAE,IAAI,CAAC,GAAG,CAAC,4CAA4C,EAAE,IAAI,CAAC,kBAAkB,CAAC,CAAC,CAAC;QAEnG;QAEA,MAAM,IAAIA,MACR,CAAC,WAAW,EAAE,IAAI,CAAC,GAAG,CAAC,4CAA4C,CAAC;IAExE;IAGA,YAAqB;QACnB,OAAO,AAAiB,SAAjB,IAAI,CAAC,OAAO;IACrB;IAOA,oBAAoBC,QAAgB,EAAQ;QAC1C,IAAI,CAAC,YAAY,GAAG;YAClB,aAAa,IAAI,CAAC,GAAG;YACrB,YAAY,IAAI,CAAC,WAAW;QAC9B;QACA,IAAI,CAAC,kBAAkB,GAAGA;QAC1B,IAAI,CAAC,OAAO,GAAG;IACjB;IAQA,oBAAoBC,YAAoB,EAAEC,YAAoB,EAAQ;QACpE,IAAI,CAAC,YAAY,GAAG;YAClB,QAAQD;YACR,YAAY,IAAI,CAAC,WAAW;QAC9B;QACA,IAAI,CAAC,cAAc,GAAGC;QACtB,IAAI,CAAC,OAAO,GAAG;IACjB;IAGA,iBAA4C;QAC1C,OACE,IAAI,CAAC,YAAY,IAAI;YACnB,aAAa,IAAI,CAAC,GAAG;YACrB,YAAY,IAAI,CAAC,WAAW;QAC9B;IAEJ;IAGA,OAAO,aAAaC,KAAc,EAAsC;QACtE,IAAI,AAAiB,YAAjB,OAAOA,SAAsBA,AAAU,SAAVA,OAAgB,OAAO;QACxD,MAAMC,SAASD;QAEf,IAAI,iBAAiBC,UAAU,AAA8B,YAA9B,OAAOA,OAAO,WAAW,EAAe;YACrE,IAAI,CAAE,iBAAgBA,MAAK,KAAM,AAA6B,YAA7B,OAAOA,OAAO,UAAU,EACvD,OAAO;YAET,OAAO;QACT;QAEA,IAAI,YAAYA,UAAU,AAAyB,YAAzB,OAAOA,OAAO,MAAM,EAAe;YAC3D,IAAI,CAAE,iBAAgBA,MAAK,KAAM,AAA6B,YAA7B,OAAOA,OAAO,UAAU,EACvD,OAAO;YAET,OAAO;QACT;QACA,OAAO;IACT;IAMA,IAAI,YAAoB;QACtB,OAAO,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,uCAAuC;IACpE;IAlIA,YAAoBC,EAAU,EAAEd,MAAc,EAAEE,UAAkB,CAAE;QARpE,uBAAQ,OAAR;QACA,uBAAQ,WAAR;QACA,uBAAQ,WAAR;QACA,uBAAQ,eAAR;QACA,uBAAQ,gBAAiD;QACzD,uBAAQ,kBAAgC;QACxC,uBAAQ,sBAAoC;QAG1C,IAAI,CAAC,GAAG,GAAGY;QACX,IAAI,CAAC,OAAO,GAAGd;QACf,IAAI,CAAC,OAAO,GAAGD,aAAaC;QAC5B,IAAI,CAAC,WAAW,GAAGE;IACrB;AA8HF"}
|
|
@@ -0,0 +1,256 @@
|
|
|
1
|
+
import { isAutoGLM } from "../ai-model/auto-glm/util.mjs";
|
|
2
|
+
import { AIResponseParseError, AiExtractElementInfo, AiLocateElement, callAIWithObjectResponse } from "../ai-model/index.mjs";
|
|
3
|
+
import { AiLocateSection } from "../ai-model/inspect.mjs";
|
|
4
|
+
import { elementDescriberInstruction } from "../ai-model/prompt/describe.mjs";
|
|
5
|
+
import { expandSearchArea } from "../common.mjs";
|
|
6
|
+
import { ServiceError } from "../types.mjs";
|
|
7
|
+
import { compositeElementInfoImg, cropByRect } from "@midscene/shared/img";
|
|
8
|
+
import { getDebug } from "@midscene/shared/logger";
|
|
9
|
+
import { assert } from "@midscene/shared/utils";
|
|
10
|
+
import { createServiceDump } from "./utils.mjs";
|
|
11
|
+
function _define_property(obj, key, value) {
|
|
12
|
+
if (key in obj) Object.defineProperty(obj, key, {
|
|
13
|
+
value: value,
|
|
14
|
+
enumerable: true,
|
|
15
|
+
configurable: true,
|
|
16
|
+
writable: true
|
|
17
|
+
});
|
|
18
|
+
else obj[key] = value;
|
|
19
|
+
return obj;
|
|
20
|
+
}
|
|
21
|
+
const debug = getDebug('ai:service');
|
|
22
|
+
class Service {
|
|
23
|
+
async locate(query, opt, modelConfig, abortSignal) {
|
|
24
|
+
const queryPrompt = 'string' == typeof query ? query : query.prompt;
|
|
25
|
+
assert(queryPrompt, 'query is required for locate');
|
|
26
|
+
assert('object' == typeof query, 'query should be an object for locate');
|
|
27
|
+
let searchAreaPrompt;
|
|
28
|
+
if (query.deepLocate) searchAreaPrompt = query.prompt;
|
|
29
|
+
const { modelFamily } = modelConfig;
|
|
30
|
+
if (searchAreaPrompt && !modelFamily) {
|
|
31
|
+
console.warn('The "deepLocate" feature is not supported with multimodal LLM. Please config VL model for Midscene. https://midscenejs.com/model-config');
|
|
32
|
+
searchAreaPrompt = void 0;
|
|
33
|
+
}
|
|
34
|
+
if (searchAreaPrompt && isAutoGLM(modelFamily)) {
|
|
35
|
+
console.warn('The "deepLocate" feature is not supported with AutoGLM.');
|
|
36
|
+
searchAreaPrompt = void 0;
|
|
37
|
+
}
|
|
38
|
+
const context = opt?.context || await this.contextRetrieverFn();
|
|
39
|
+
let searchArea;
|
|
40
|
+
let searchAreaRawResponse;
|
|
41
|
+
let searchAreaUsage;
|
|
42
|
+
let searchAreaResponse;
|
|
43
|
+
if (searchAreaPrompt) {
|
|
44
|
+
searchAreaResponse = await AiLocateSection({
|
|
45
|
+
context,
|
|
46
|
+
sectionDescription: searchAreaPrompt,
|
|
47
|
+
modelConfig,
|
|
48
|
+
abortSignal
|
|
49
|
+
});
|
|
50
|
+
assert(searchAreaResponse.rect, `cannot find search area for "${searchAreaPrompt}"${searchAreaResponse.error ? `: ${searchAreaResponse.error}` : ''}`);
|
|
51
|
+
searchAreaRawResponse = searchAreaResponse.rawResponse;
|
|
52
|
+
searchAreaUsage = searchAreaResponse.usage;
|
|
53
|
+
searchArea = searchAreaResponse.rect;
|
|
54
|
+
}
|
|
55
|
+
const startTime = Date.now();
|
|
56
|
+
const { parseResult, rect, rawResponse, usage, reasoning_content } = await AiLocateElement({
|
|
57
|
+
context,
|
|
58
|
+
targetElementDescription: queryPrompt,
|
|
59
|
+
searchConfig: searchAreaResponse,
|
|
60
|
+
modelConfig,
|
|
61
|
+
abortSignal
|
|
62
|
+
});
|
|
63
|
+
const timeCost = Date.now() - startTime;
|
|
64
|
+
const taskInfo = {
|
|
65
|
+
...this.taskInfo ? this.taskInfo : {},
|
|
66
|
+
durationMs: timeCost,
|
|
67
|
+
rawResponse: JSON.stringify(rawResponse),
|
|
68
|
+
formatResponse: JSON.stringify(parseResult),
|
|
69
|
+
usage,
|
|
70
|
+
searchArea,
|
|
71
|
+
searchAreaRawResponse,
|
|
72
|
+
searchAreaUsage,
|
|
73
|
+
reasoning_content
|
|
74
|
+
};
|
|
75
|
+
let errorLog;
|
|
76
|
+
if (parseResult.errors?.length) errorLog = `failed to locate element: \n${parseResult.errors.join('\n')}`;
|
|
77
|
+
const dumpData = {
|
|
78
|
+
type: 'locate',
|
|
79
|
+
userQuery: {
|
|
80
|
+
element: queryPrompt
|
|
81
|
+
},
|
|
82
|
+
matchedElement: [],
|
|
83
|
+
matchedRect: rect,
|
|
84
|
+
data: null,
|
|
85
|
+
taskInfo,
|
|
86
|
+
deepLocate: !!searchArea,
|
|
87
|
+
error: errorLog
|
|
88
|
+
};
|
|
89
|
+
const elements = parseResult.elements || [];
|
|
90
|
+
const dump = createServiceDump({
|
|
91
|
+
...dumpData,
|
|
92
|
+
matchedElement: elements
|
|
93
|
+
});
|
|
94
|
+
if (errorLog) throw new ServiceError(errorLog, dump);
|
|
95
|
+
if (elements.length > 1) throw new ServiceError(`locate: multiple elements found, length = ${elements.length}`, dump);
|
|
96
|
+
if (1 === elements.length) return {
|
|
97
|
+
element: {
|
|
98
|
+
center: elements[0].center,
|
|
99
|
+
rect: elements[0].rect,
|
|
100
|
+
description: elements[0].description
|
|
101
|
+
},
|
|
102
|
+
rect,
|
|
103
|
+
dump
|
|
104
|
+
};
|
|
105
|
+
return {
|
|
106
|
+
element: null,
|
|
107
|
+
rect,
|
|
108
|
+
dump
|
|
109
|
+
};
|
|
110
|
+
}
|
|
111
|
+
async extract(dataDemand, modelConfig, opt, pageDescription, multimodalPrompt, context) {
|
|
112
|
+
assert(context, 'context is required for extract');
|
|
113
|
+
assert('object' == typeof dataDemand || 'string' == typeof dataDemand, `dataDemand should be object or string, but get ${typeof dataDemand}`);
|
|
114
|
+
const startTime = Date.now();
|
|
115
|
+
let parseResult;
|
|
116
|
+
let rawResponse;
|
|
117
|
+
let usage;
|
|
118
|
+
let reasoning_content;
|
|
119
|
+
try {
|
|
120
|
+
const result = await AiExtractElementInfo({
|
|
121
|
+
context,
|
|
122
|
+
dataQuery: dataDemand,
|
|
123
|
+
multimodalPrompt,
|
|
124
|
+
extractOption: opt,
|
|
125
|
+
modelConfig,
|
|
126
|
+
pageDescription
|
|
127
|
+
});
|
|
128
|
+
parseResult = result.parseResult;
|
|
129
|
+
rawResponse = result.rawResponse;
|
|
130
|
+
usage = result.usage;
|
|
131
|
+
reasoning_content = result.reasoning_content;
|
|
132
|
+
} catch (error) {
|
|
133
|
+
if (error instanceof AIResponseParseError) {
|
|
134
|
+
const timeCost = Date.now() - startTime;
|
|
135
|
+
const taskInfo = {
|
|
136
|
+
...this.taskInfo ? this.taskInfo : {},
|
|
137
|
+
durationMs: timeCost,
|
|
138
|
+
rawResponse: error.rawResponse,
|
|
139
|
+
usage: error.usage
|
|
140
|
+
};
|
|
141
|
+
const dump = createServiceDump({
|
|
142
|
+
type: 'extract',
|
|
143
|
+
userQuery: {
|
|
144
|
+
dataDemand
|
|
145
|
+
},
|
|
146
|
+
matchedElement: [],
|
|
147
|
+
data: null,
|
|
148
|
+
taskInfo,
|
|
149
|
+
error: error.message
|
|
150
|
+
});
|
|
151
|
+
throw new ServiceError(error.message, dump);
|
|
152
|
+
}
|
|
153
|
+
throw error;
|
|
154
|
+
}
|
|
155
|
+
const timeCost = Date.now() - startTime;
|
|
156
|
+
const taskInfo = {
|
|
157
|
+
...this.taskInfo ? this.taskInfo : {},
|
|
158
|
+
durationMs: timeCost,
|
|
159
|
+
rawResponse,
|
|
160
|
+
formatResponse: JSON.stringify(parseResult),
|
|
161
|
+
usage,
|
|
162
|
+
reasoning_content
|
|
163
|
+
};
|
|
164
|
+
let errorLog;
|
|
165
|
+
if (parseResult.errors?.length) errorLog = `AI response error: \n${parseResult.errors.join('\n')}`;
|
|
166
|
+
const dumpData = {
|
|
167
|
+
type: 'extract',
|
|
168
|
+
userQuery: {
|
|
169
|
+
dataDemand
|
|
170
|
+
},
|
|
171
|
+
matchedElement: [],
|
|
172
|
+
data: null,
|
|
173
|
+
taskInfo,
|
|
174
|
+
error: errorLog
|
|
175
|
+
};
|
|
176
|
+
const { data, thought } = parseResult || {};
|
|
177
|
+
const dump = createServiceDump({
|
|
178
|
+
...dumpData,
|
|
179
|
+
data
|
|
180
|
+
});
|
|
181
|
+
if (errorLog && !data) throw new ServiceError(errorLog, dump);
|
|
182
|
+
return {
|
|
183
|
+
data,
|
|
184
|
+
thought,
|
|
185
|
+
usage,
|
|
186
|
+
reasoning_content,
|
|
187
|
+
dump
|
|
188
|
+
};
|
|
189
|
+
}
|
|
190
|
+
async describe(target, modelConfig, opt) {
|
|
191
|
+
assert(target, 'target is required for service.describe');
|
|
192
|
+
const context = await this.contextRetrieverFn();
|
|
193
|
+
const { shotSize } = context;
|
|
194
|
+
const screenshotBase64 = context.screenshot.base64;
|
|
195
|
+
assert(screenshotBase64, 'screenshot is required for service.describe');
|
|
196
|
+
const { modelFamily } = modelConfig;
|
|
197
|
+
const systemPrompt = elementDescriberInstruction();
|
|
198
|
+
const defaultRectSize = 30;
|
|
199
|
+
const targetRect = Array.isArray(target) ? {
|
|
200
|
+
left: Math.floor(target[0] - defaultRectSize / 2),
|
|
201
|
+
top: Math.floor(target[1] - defaultRectSize / 2),
|
|
202
|
+
width: defaultRectSize,
|
|
203
|
+
height: defaultRectSize
|
|
204
|
+
} : target;
|
|
205
|
+
let imagePayload = await compositeElementInfoImg({
|
|
206
|
+
inputImgBase64: screenshotBase64,
|
|
207
|
+
size: shotSize,
|
|
208
|
+
elementsPositionInfo: [
|
|
209
|
+
{
|
|
210
|
+
rect: targetRect
|
|
211
|
+
}
|
|
212
|
+
],
|
|
213
|
+
borderThickness: 3
|
|
214
|
+
});
|
|
215
|
+
if (opt?.deepLocate) {
|
|
216
|
+
const searchArea = expandSearchArea(targetRect, shotSize);
|
|
217
|
+
debug('describe: cropping to searchArea', searchArea);
|
|
218
|
+
const croppedResult = await cropByRect(imagePayload, searchArea, 'qwen2.5-vl' === modelFamily);
|
|
219
|
+
imagePayload = croppedResult.imageBase64;
|
|
220
|
+
}
|
|
221
|
+
const msgs = [
|
|
222
|
+
{
|
|
223
|
+
role: 'system',
|
|
224
|
+
content: systemPrompt
|
|
225
|
+
},
|
|
226
|
+
{
|
|
227
|
+
role: 'user',
|
|
228
|
+
content: [
|
|
229
|
+
{
|
|
230
|
+
type: 'image_url',
|
|
231
|
+
image_url: {
|
|
232
|
+
url: imagePayload,
|
|
233
|
+
detail: 'high'
|
|
234
|
+
}
|
|
235
|
+
}
|
|
236
|
+
]
|
|
237
|
+
}
|
|
238
|
+
];
|
|
239
|
+
const res = await callAIWithObjectResponse(msgs, modelConfig);
|
|
240
|
+
const { content } = res;
|
|
241
|
+
assert(!content.error, `describe failed: ${content.error}`);
|
|
242
|
+
assert(content.description, 'failed to describe the element');
|
|
243
|
+
return content;
|
|
244
|
+
}
|
|
245
|
+
constructor(context, opt){
|
|
246
|
+
_define_property(this, "contextRetrieverFn", void 0);
|
|
247
|
+
_define_property(this, "taskInfo", void 0);
|
|
248
|
+
assert(context, 'context is required for Service');
|
|
249
|
+
if ('function' == typeof context) this.contextRetrieverFn = context;
|
|
250
|
+
else this.contextRetrieverFn = ()=>Promise.resolve(context);
|
|
251
|
+
if (void 0 !== opt?.taskInfo) this.taskInfo = opt.taskInfo;
|
|
252
|
+
}
|
|
253
|
+
}
|
|
254
|
+
export { Service as default };
|
|
255
|
+
|
|
256
|
+
//# sourceMappingURL=index.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"service/index.mjs","sources":["../../../src/service/index.ts"],"sourcesContent":["import { isAutoGLM, isUITars } from '@/ai-model/auto-glm/util';\nimport {\n AIResponseParseError,\n AiExtractElementInfo,\n AiLocateElement,\n callAIWithObjectResponse,\n} from '@/ai-model/index';\nimport { AiLocateSection } from '@/ai-model/inspect';\nimport { elementDescriberInstruction } from '@/ai-model/prompt/describe';\nimport { type AIArgs, expandSearchArea } from '@/common';\nimport type {\n AIDescribeElementResponse,\n AIUsageInfo,\n DetailedLocateParam,\n LocateResultWithDump,\n PartialServiceDumpFromSDK,\n Rect,\n ServiceExtractOption,\n ServiceExtractParam,\n ServiceExtractResult,\n ServiceTaskInfo,\n UIContext,\n} from '@/types';\nimport { ServiceError } from '@/types';\nimport type { IModelConfig } from '@midscene/shared/env';\nimport { compositeElementInfoImg, cropByRect } from '@midscene/shared/img';\nimport { getDebug } from '@midscene/shared/logger';\nimport { assert } from '@midscene/shared/utils';\nimport type { TMultimodalPrompt } from '../common';\nimport { createServiceDump } from './utils';\n\nexport interface LocateOpts {\n context?: UIContext;\n}\n\nexport type AnyValue<T> = {\n [K in keyof T]: unknown extends T[K] ? any : T[K];\n};\n\ninterface ServiceOptions {\n taskInfo?: Omit<ServiceTaskInfo, 'durationMs'>;\n}\n\nconst debug = getDebug('ai:service');\nexport default class Service {\n contextRetrieverFn: () => Promise<UIContext> | UIContext;\n\n taskInfo?: Omit<ServiceTaskInfo, 'durationMs'>;\n\n constructor(\n context: UIContext | (() => Promise<UIContext> | UIContext),\n opt?: ServiceOptions,\n ) {\n assert(context, 'context is required for Service');\n if (typeof context === 'function') {\n this.contextRetrieverFn = context;\n } else {\n this.contextRetrieverFn = () => Promise.resolve(context);\n }\n\n if (typeof opt?.taskInfo !== 'undefined') {\n this.taskInfo = opt.taskInfo;\n }\n }\n\n async locate(\n query: DetailedLocateParam,\n opt: LocateOpts,\n modelConfig: IModelConfig,\n abortSignal?: AbortSignal,\n ): Promise<LocateResultWithDump> {\n const queryPrompt = typeof query === 'string' ? query : query.prompt;\n assert(queryPrompt, 'query is required for locate');\n\n assert(typeof query === 'object', 'query should be an object for locate');\n\n let searchAreaPrompt;\n if (query.deepLocate) {\n searchAreaPrompt = query.prompt;\n }\n\n const { modelFamily } = modelConfig;\n\n if (searchAreaPrompt && !modelFamily) {\n console.warn(\n 'The \"deepLocate\" feature is not supported with multimodal LLM. Please config VL model for Midscene. https://midscenejs.com/model-config',\n );\n searchAreaPrompt = undefined;\n }\n\n if (searchAreaPrompt && isAutoGLM(modelFamily)) {\n console.warn('The \"deepLocate\" feature is not supported with AutoGLM.');\n searchAreaPrompt = undefined;\n }\n\n const context = opt?.context || (await this.contextRetrieverFn());\n\n let searchArea: Rect | undefined = undefined;\n let searchAreaRawResponse: string | undefined = undefined;\n let searchAreaUsage: AIUsageInfo | undefined = undefined;\n let searchAreaResponse:\n | Awaited<ReturnType<typeof AiLocateSection>>\n | undefined = undefined;\n if (searchAreaPrompt) {\n searchAreaResponse = await AiLocateSection({\n context,\n sectionDescription: searchAreaPrompt,\n modelConfig,\n abortSignal,\n });\n assert(\n searchAreaResponse.rect,\n `cannot find search area for \"${searchAreaPrompt}\"${\n searchAreaResponse.error ? `: ${searchAreaResponse.error}` : ''\n }`,\n );\n searchAreaRawResponse = searchAreaResponse.rawResponse;\n searchAreaUsage = searchAreaResponse.usage;\n searchArea = searchAreaResponse.rect;\n }\n\n const startTime = Date.now();\n const { parseResult, rect, rawResponse, usage, reasoning_content } =\n await AiLocateElement({\n context,\n targetElementDescription: queryPrompt,\n searchConfig: searchAreaResponse,\n modelConfig,\n abortSignal,\n });\n\n const timeCost = Date.now() - startTime;\n const taskInfo: ServiceTaskInfo = {\n ...(this.taskInfo ? this.taskInfo : {}),\n durationMs: timeCost,\n rawResponse: JSON.stringify(rawResponse),\n formatResponse: JSON.stringify(parseResult),\n usage,\n searchArea,\n searchAreaRawResponse,\n searchAreaUsage,\n reasoning_content,\n };\n\n let errorLog: string | undefined;\n if (parseResult.errors?.length) {\n errorLog = `failed to locate element: \\n${parseResult.errors.join('\\n')}`;\n }\n\n const dumpData: PartialServiceDumpFromSDK = {\n type: 'locate',\n userQuery: {\n element: queryPrompt,\n },\n matchedElement: [],\n matchedRect: rect,\n data: null,\n taskInfo,\n deepLocate: !!searchArea,\n error: errorLog,\n };\n\n const elements = parseResult.elements || [];\n\n const dump = createServiceDump({\n ...dumpData,\n matchedElement: elements,\n });\n\n if (errorLog) {\n throw new ServiceError(errorLog, dump);\n }\n\n if (elements.length > 1) {\n throw new ServiceError(\n `locate: multiple elements found, length = ${elements.length}`,\n dump,\n );\n }\n\n if (elements.length === 1) {\n return {\n element: {\n center: elements[0]!.center,\n rect: elements[0]!.rect,\n description: elements[0]!.description,\n },\n rect,\n dump,\n };\n }\n\n return {\n element: null,\n rect,\n dump,\n };\n }\n\n async extract<T>(\n dataDemand: ServiceExtractParam,\n modelConfig: IModelConfig,\n opt?: ServiceExtractOption,\n pageDescription?: string,\n multimodalPrompt?: TMultimodalPrompt,\n context?: UIContext,\n ): Promise<ServiceExtractResult<T>> {\n assert(context, 'context is required for extract');\n assert(\n typeof dataDemand === 'object' || typeof dataDemand === 'string',\n `dataDemand should be object or string, but get ${typeof dataDemand}`,\n );\n\n const startTime = Date.now();\n\n let parseResult: Awaited<\n ReturnType<typeof AiExtractElementInfo<T>>\n >['parseResult'];\n let rawResponse: string;\n let usage: Awaited<ReturnType<typeof AiExtractElementInfo<T>>>['usage'];\n let reasoning_content: string | undefined;\n\n try {\n const result = await AiExtractElementInfo<T>({\n context,\n dataQuery: dataDemand,\n multimodalPrompt,\n extractOption: opt,\n modelConfig,\n pageDescription,\n });\n parseResult = result.parseResult;\n rawResponse = result.rawResponse;\n usage = result.usage;\n reasoning_content = result.reasoning_content;\n } catch (error) {\n if (error instanceof AIResponseParseError) {\n // Create dump with usage and rawResponse from the error\n const timeCost = Date.now() - startTime;\n const taskInfo: ServiceTaskInfo = {\n ...(this.taskInfo ? this.taskInfo : {}),\n durationMs: timeCost,\n rawResponse: error.rawResponse,\n usage: error.usage,\n };\n const dump = createServiceDump({\n type: 'extract',\n userQuery: { dataDemand },\n matchedElement: [],\n data: null,\n taskInfo,\n error: error.message,\n });\n throw new ServiceError(error.message, dump);\n }\n throw error;\n }\n\n const timeCost = Date.now() - startTime;\n const taskInfo: ServiceTaskInfo = {\n ...(this.taskInfo ? this.taskInfo : {}),\n durationMs: timeCost,\n rawResponse,\n formatResponse: JSON.stringify(parseResult),\n usage,\n reasoning_content,\n };\n\n let errorLog: string | undefined;\n if (parseResult.errors?.length) {\n errorLog = `AI response error: \\n${parseResult.errors.join('\\n')}`;\n }\n\n const dumpData: PartialServiceDumpFromSDK = {\n type: 'extract',\n userQuery: {\n dataDemand,\n },\n matchedElement: [],\n data: null,\n taskInfo,\n error: errorLog,\n };\n\n const { data, thought } = parseResult || {};\n\n const dump = createServiceDump({\n ...dumpData,\n data,\n });\n\n if (errorLog && !data) {\n throw new ServiceError(errorLog, dump);\n }\n\n return {\n data,\n thought,\n usage,\n reasoning_content,\n dump,\n };\n }\n\n async describe(\n target: Rect | [number, number],\n modelConfig: IModelConfig,\n opt?: {\n deepLocate?: boolean;\n },\n ): Promise<Pick<AIDescribeElementResponse, 'description'>> {\n assert(target, 'target is required for service.describe');\n const context = await this.contextRetrieverFn();\n const { shotSize } = context;\n const screenshotBase64 = context.screenshot.base64;\n assert(screenshotBase64, 'screenshot is required for service.describe');\n // The result of the \"describe\" function will be used for positioning, so essentially it is a form of grounding.\n const { modelFamily } = modelConfig;\n const systemPrompt = elementDescriberInstruction();\n\n // Convert [x,y] center point to Rect if needed\n const defaultRectSize = 30;\n const targetRect: Rect = Array.isArray(target)\n ? {\n left: Math.floor(target[0] - defaultRectSize / 2),\n top: Math.floor(target[1] - defaultRectSize / 2),\n width: defaultRectSize,\n height: defaultRectSize,\n }\n : target;\n\n let imagePayload = await compositeElementInfoImg({\n inputImgBase64: screenshotBase64,\n size: shotSize,\n elementsPositionInfo: [\n {\n rect: targetRect,\n },\n ],\n borderThickness: 3,\n });\n\n if (opt?.deepLocate) {\n const searchArea = expandSearchArea(targetRect, shotSize);\n // Always crop in describe mode. Unlike locate's deepLocate (where\n // cropping too small loses context for finding elements), describe's\n // deepLocate intentionally zooms in so the model produces a more\n // precise description from a focused view. expandSearchArea already\n // guarantees a minimum 400x400 area with surrounding context.\n debug('describe: cropping to searchArea', searchArea);\n const croppedResult = await cropByRect(\n imagePayload,\n searchArea,\n modelFamily === 'qwen2.5-vl',\n );\n imagePayload = croppedResult.imageBase64;\n }\n\n const msgs: AIArgs = [\n { role: 'system', content: systemPrompt },\n {\n role: 'user',\n content: [\n {\n type: 'image_url',\n image_url: {\n url: imagePayload,\n detail: 'high',\n },\n },\n ],\n },\n ];\n\n const res = await callAIWithObjectResponse<AIDescribeElementResponse>(\n msgs,\n modelConfig,\n );\n\n const { content } = res;\n assert(!content.error, `describe failed: ${content.error}`);\n assert(content.description, 'failed to describe the element');\n return content;\n }\n}\n"],"names":["debug","getDebug","Service","query","opt","modelConfig","abortSignal","queryPrompt","assert","searchAreaPrompt","modelFamily","console","undefined","isAutoGLM","context","searchArea","searchAreaRawResponse","searchAreaUsage","searchAreaResponse","AiLocateSection","startTime","Date","parseResult","rect","rawResponse","usage","reasoning_content","AiLocateElement","timeCost","taskInfo","JSON","errorLog","dumpData","elements","dump","createServiceDump","ServiceError","dataDemand","pageDescription","multimodalPrompt","result","AiExtractElementInfo","error","AIResponseParseError","data","thought","target","shotSize","screenshotBase64","systemPrompt","elementDescriberInstruction","defaultRectSize","targetRect","Array","Math","imagePayload","compositeElementInfoImg","expandSearchArea","croppedResult","cropByRect","msgs","res","callAIWithObjectResponse","content","Promise"],"mappings":";;;;;;;;;;;;;;;;;;;;AA2CA,MAAMA,QAAQC,SAAS;AACR,MAAMC;IAqBnB,MAAM,OACJC,KAA0B,EAC1BC,GAAe,EACfC,WAAyB,EACzBC,WAAyB,EACM;QAC/B,MAAMC,cAAc,AAAiB,YAAjB,OAAOJ,QAAqBA,QAAQA,MAAM,MAAM;QACpEK,OAAOD,aAAa;QAEpBC,OAAO,AAAiB,YAAjB,OAAOL,OAAoB;QAElC,IAAIM;QACJ,IAAIN,MAAM,UAAU,EAClBM,mBAAmBN,MAAM,MAAM;QAGjC,MAAM,EAAEO,WAAW,EAAE,GAAGL;QAExB,IAAII,oBAAoB,CAACC,aAAa;YACpCC,QAAQ,IAAI,CACV;YAEFF,mBAAmBG;QACrB;QAEA,IAAIH,oBAAoBI,UAAUH,cAAc;YAC9CC,QAAQ,IAAI,CAAC;YACbF,mBAAmBG;QACrB;QAEA,MAAME,UAAUV,KAAK,WAAY,MAAM,IAAI,CAAC,kBAAkB;QAE9D,IAAIW;QACJ,IAAIC;QACJ,IAAIC;QACJ,IAAIC;QAGJ,IAAIT,kBAAkB;YACpBS,qBAAqB,MAAMC,gBAAgB;gBACzCL;gBACA,oBAAoBL;gBACpBJ;gBACAC;YACF;YACAE,OACEU,mBAAmB,IAAI,EACvB,CAAC,6BAA6B,EAAET,iBAAiB,CAAC,EAChDS,mBAAmB,KAAK,GAAG,CAAC,EAAE,EAAEA,mBAAmB,KAAK,EAAE,GAAG,IAC7D;YAEJF,wBAAwBE,mBAAmB,WAAW;YACtDD,kBAAkBC,mBAAmB,KAAK;YAC1CH,aAAaG,mBAAmB,IAAI;QACtC;QAEA,MAAME,YAAYC,KAAK,GAAG;QAC1B,MAAM,EAAEC,WAAW,EAAEC,IAAI,EAAEC,WAAW,EAAEC,KAAK,EAAEC,iBAAiB,EAAE,GAChE,MAAMC,gBAAgB;YACpBb;YACA,0BAA0BP;YAC1B,cAAcW;YACdb;YACAC;QACF;QAEF,MAAMsB,WAAWP,KAAK,GAAG,KAAKD;QAC9B,MAAMS,WAA4B;YAChC,GAAI,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC,QAAQ,GAAG,CAAC,CAAC;YACtC,YAAYD;YACZ,aAAaE,KAAK,SAAS,CAACN;YAC5B,gBAAgBM,KAAK,SAAS,CAACR;YAC/BG;YACAV;YACAC;YACAC;YACAS;QACF;QAEA,IAAIK;QACJ,IAAIT,YAAY,MAAM,EAAE,QACtBS,WAAW,CAAC,4BAA4B,EAAET,YAAY,MAAM,CAAC,IAAI,CAAC,OAAO;QAG3E,MAAMU,WAAsC;YAC1C,MAAM;YACN,WAAW;gBACT,SAASzB;YACX;YACA,gBAAgB,EAAE;YAClB,aAAagB;YACb,MAAM;YACNM;YACA,YAAY,CAAC,CAACd;YACd,OAAOgB;QACT;QAEA,MAAME,WAAWX,YAAY,QAAQ,IAAI,EAAE;QAE3C,MAAMY,OAAOC,kBAAkB;YAC7B,GAAGH,QAAQ;YACX,gBAAgBC;QAClB;QAEA,IAAIF,UACF,MAAM,IAAIK,aAAaL,UAAUG;QAGnC,IAAID,SAAS,MAAM,GAAG,GACpB,MAAM,IAAIG,aACR,CAAC,0CAA0C,EAAEH,SAAS,MAAM,EAAE,EAC9DC;QAIJ,IAAID,AAAoB,MAApBA,SAAS,MAAM,EACjB,OAAO;YACL,SAAS;gBACP,QAAQA,QAAQ,CAAC,EAAE,CAAE,MAAM;gBAC3B,MAAMA,QAAQ,CAAC,EAAE,CAAE,IAAI;gBACvB,aAAaA,QAAQ,CAAC,EAAE,CAAE,WAAW;YACvC;YACAV;YACAW;QACF;QAGF,OAAO;YACL,SAAS;YACTX;YACAW;QACF;IACF;IAEA,MAAM,QACJG,UAA+B,EAC/BhC,WAAyB,EACzBD,GAA0B,EAC1BkC,eAAwB,EACxBC,gBAAoC,EACpCzB,OAAmB,EACe;QAClCN,OAAOM,SAAS;QAChBN,OACE,AAAsB,YAAtB,OAAO6B,cAA2B,AAAsB,YAAtB,OAAOA,YACzC,CAAC,+CAA+C,EAAE,OAAOA,YAAY;QAGvE,MAAMjB,YAAYC,KAAK,GAAG;QAE1B,IAAIC;QAGJ,IAAIE;QACJ,IAAIC;QACJ,IAAIC;QAEJ,IAAI;YACF,MAAMc,SAAS,MAAMC,qBAAwB;gBAC3C3B;gBACA,WAAWuB;gBACXE;gBACA,eAAenC;gBACfC;gBACAiC;YACF;YACAhB,cAAckB,OAAO,WAAW;YAChChB,cAAcgB,OAAO,WAAW;YAChCf,QAAQe,OAAO,KAAK;YACpBd,oBAAoBc,OAAO,iBAAiB;QAC9C,EAAE,OAAOE,OAAO;YACd,IAAIA,iBAAiBC,sBAAsB;gBAEzC,MAAMf,WAAWP,KAAK,GAAG,KAAKD;gBAC9B,MAAMS,WAA4B;oBAChC,GAAI,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC,QAAQ,GAAG,CAAC,CAAC;oBACtC,YAAYD;oBACZ,aAAac,MAAM,WAAW;oBAC9B,OAAOA,MAAM,KAAK;gBACpB;gBACA,MAAMR,OAAOC,kBAAkB;oBAC7B,MAAM;oBACN,WAAW;wBAAEE;oBAAW;oBACxB,gBAAgB,EAAE;oBAClB,MAAM;oBACNR;oBACA,OAAOa,MAAM,OAAO;gBACtB;gBACA,MAAM,IAAIN,aAAaM,MAAM,OAAO,EAAER;YACxC;YACA,MAAMQ;QACR;QAEA,MAAMd,WAAWP,KAAK,GAAG,KAAKD;QAC9B,MAAMS,WAA4B;YAChC,GAAI,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC,QAAQ,GAAG,CAAC,CAAC;YACtC,YAAYD;YACZJ;YACA,gBAAgBM,KAAK,SAAS,CAACR;YAC/BG;YACAC;QACF;QAEA,IAAIK;QACJ,IAAIT,YAAY,MAAM,EAAE,QACtBS,WAAW,CAAC,qBAAqB,EAAET,YAAY,MAAM,CAAC,IAAI,CAAC,OAAO;QAGpE,MAAMU,WAAsC;YAC1C,MAAM;YACN,WAAW;gBACTK;YACF;YACA,gBAAgB,EAAE;YAClB,MAAM;YACNR;YACA,OAAOE;QACT;QAEA,MAAM,EAAEa,IAAI,EAAEC,OAAO,EAAE,GAAGvB,eAAe,CAAC;QAE1C,MAAMY,OAAOC,kBAAkB;YAC7B,GAAGH,QAAQ;YACXY;QACF;QAEA,IAAIb,YAAY,CAACa,MACf,MAAM,IAAIR,aAAaL,UAAUG;QAGnC,OAAO;YACLU;YACAC;YACApB;YACAC;YACAQ;QACF;IACF;IAEA,MAAM,SACJY,MAA+B,EAC/BzC,WAAyB,EACzBD,GAEC,EACwD;QACzDI,OAAOsC,QAAQ;QACf,MAAMhC,UAAU,MAAM,IAAI,CAAC,kBAAkB;QAC7C,MAAM,EAAEiC,QAAQ,EAAE,GAAGjC;QACrB,MAAMkC,mBAAmBlC,QAAQ,UAAU,CAAC,MAAM;QAClDN,OAAOwC,kBAAkB;QAEzB,MAAM,EAAEtC,WAAW,EAAE,GAAGL;QACxB,MAAM4C,eAAeC;QAGrB,MAAMC,kBAAkB;QACxB,MAAMC,aAAmBC,MAAM,OAAO,CAACP,UACnC;YACE,MAAMQ,KAAK,KAAK,CAACR,MAAM,CAAC,EAAE,GAAGK,kBAAkB;YAC/C,KAAKG,KAAK,KAAK,CAACR,MAAM,CAAC,EAAE,GAAGK,kBAAkB;YAC9C,OAAOA;YACP,QAAQA;QACV,IACAL;QAEJ,IAAIS,eAAe,MAAMC,wBAAwB;YAC/C,gBAAgBR;YAChB,MAAMD;YACN,sBAAsB;gBACpB;oBACE,MAAMK;gBACR;aACD;YACD,iBAAiB;QACnB;QAEA,IAAIhD,KAAK,YAAY;YACnB,MAAMW,aAAa0C,iBAAiBL,YAAYL;YAMhD/C,MAAM,oCAAoCe;YAC1C,MAAM2C,gBAAgB,MAAMC,WAC1BJ,cACAxC,YACAL,AAAgB,iBAAhBA;YAEF6C,eAAeG,cAAc,WAAW;QAC1C;QAEA,MAAME,OAAe;YACnB;gBAAE,MAAM;gBAAU,SAASX;YAAa;YACxC;gBACE,MAAM;gBACN,SAAS;oBACP;wBACE,MAAM;wBACN,WAAW;4BACT,KAAKM;4BACL,QAAQ;wBACV;oBACF;iBACD;YACH;SACD;QAED,MAAMM,MAAM,MAAMC,yBAChBF,MACAvD;QAGF,MAAM,EAAE0D,OAAO,EAAE,GAAGF;QACpBrD,OAAO,CAACuD,QAAQ,KAAK,EAAE,CAAC,iBAAiB,EAAEA,QAAQ,KAAK,EAAE;QAC1DvD,OAAOuD,QAAQ,WAAW,EAAE;QAC5B,OAAOA;IACT;IA9UA,YACEjD,OAA2D,EAC3DV,GAAoB,CACpB;QAPF;QAEA;QAMEI,OAAOM,SAAS;QAChB,IAAI,AAAmB,cAAnB,OAAOA,SACT,IAAI,CAAC,kBAAkB,GAAGA;aAE1B,IAAI,CAAC,kBAAkB,GAAG,IAAMkD,QAAQ,OAAO,CAAClD;QAGlD,IAAI,AAAyB,WAAlBV,KAAK,UACd,IAAI,CAAC,QAAQ,GAAGA,IAAI,QAAQ;IAEhC;AAiUF"}
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
import { uuid } from "@midscene/shared/utils";
|
|
2
|
+
function createServiceDump(data) {
|
|
3
|
+
const baseData = {
|
|
4
|
+
logTime: Date.now()
|
|
5
|
+
};
|
|
6
|
+
const finalData = {
|
|
7
|
+
logId: uuid(),
|
|
8
|
+
...baseData,
|
|
9
|
+
...data
|
|
10
|
+
};
|
|
11
|
+
return finalData;
|
|
12
|
+
}
|
|
13
|
+
export { createServiceDump };
|
|
14
|
+
|
|
15
|
+
//# sourceMappingURL=utils.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"service/utils.mjs","sources":["../../../src/service/utils.ts"],"sourcesContent":["import type { DumpMeta, PartialServiceDumpFromSDK, ServiceDump } from '@/types';\nimport { uuid } from '@midscene/shared/utils';\n\nexport function createServiceDump(\n data: PartialServiceDumpFromSDK,\n): ServiceDump {\n const baseData: DumpMeta = {\n logTime: Date.now(),\n };\n const finalData: ServiceDump = {\n logId: uuid(),\n ...baseData,\n ...data,\n };\n\n return finalData;\n}\n"],"names":["createServiceDump","data","baseData","Date","finalData","uuid"],"mappings":";AAGO,SAASA,kBACdC,IAA+B;IAE/B,MAAMC,WAAqB;QACzB,SAASC,KAAK,GAAG;IACnB;IACA,MAAMC,YAAyB;QAC7B,OAAOC;QACP,GAAGH,QAAQ;QACX,GAAGD,IAAI;IACT;IAEA,OAAOG;AACT"}
|
|
@@ -0,0 +1,38 @@
|
|
|
1
|
+
import { CLIError, runToolsCLI } from "@midscene/shared/cli";
|
|
2
|
+
import { BaseMidsceneTools } from "@midscene/shared/mcp";
|
|
3
|
+
import { Agent } from "../agent/agent.mjs";
|
|
4
|
+
function _define_property(obj, key, value) {
|
|
5
|
+
if (key in obj) Object.defineProperty(obj, key, {
|
|
6
|
+
value: value,
|
|
7
|
+
enumerable: true,
|
|
8
|
+
configurable: true,
|
|
9
|
+
writable: true
|
|
10
|
+
});
|
|
11
|
+
else obj[key] = value;
|
|
12
|
+
return obj;
|
|
13
|
+
}
|
|
14
|
+
class SkillMidsceneTools extends BaseMidsceneTools {
|
|
15
|
+
createTemporaryDevice() {
|
|
16
|
+
return new this.DeviceClass();
|
|
17
|
+
}
|
|
18
|
+
async ensureAgent() {
|
|
19
|
+
if (!this.agent) {
|
|
20
|
+
const device = new this.DeviceClass();
|
|
21
|
+
this.agent = new Agent(device);
|
|
22
|
+
}
|
|
23
|
+
return this.agent;
|
|
24
|
+
}
|
|
25
|
+
constructor(DeviceClass){
|
|
26
|
+
super(), _define_property(this, "DeviceClass", void 0), this.DeviceClass = DeviceClass;
|
|
27
|
+
}
|
|
28
|
+
}
|
|
29
|
+
function runSkillCLI(options) {
|
|
30
|
+
const tools = new SkillMidsceneTools(options.DeviceClass);
|
|
31
|
+
return runToolsCLI(tools, options.scriptName).catch((e)=>{
|
|
32
|
+
if (!(e instanceof CLIError)) console.error(e);
|
|
33
|
+
process.exit(e instanceof CLIError ? e.exitCode : 1);
|
|
34
|
+
});
|
|
35
|
+
}
|
|
36
|
+
export { runSkillCLI };
|
|
37
|
+
|
|
38
|
+
//# sourceMappingURL=index.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"skill/index.mjs","sources":["../../../src/skill/index.ts"],"sourcesContent":["import { CLIError, runToolsCLI } from '@midscene/shared/cli';\nimport { BaseMidsceneTools } from '@midscene/shared/mcp';\nimport type { BaseAgent, BaseDevice } from '@midscene/shared/mcp';\nimport { Agent } from '../agent/agent';\nimport type { AbstractInterface } from '../device';\n\ntype DeviceClass = new (...args: any[]) => AbstractInterface;\n\n/**\n * Skill tools manager that lazily creates Agent from a Device class.\n * Used by runSkillCLI for CLI / Agent Skills scenarios where no agent exists at startup.\n */\nclass SkillMidsceneTools extends BaseMidsceneTools<BaseAgent> {\n constructor(private DeviceClass: DeviceClass) {\n super();\n }\n\n protected createTemporaryDevice(): BaseDevice {\n return new this.DeviceClass() as unknown as BaseDevice;\n }\n\n protected async ensureAgent(): Promise<BaseAgent> {\n if (!this.agent) {\n const device = new this.DeviceClass();\n this.agent = new Agent(device) as unknown as BaseAgent;\n }\n return this.agent;\n }\n}\n\nexport interface SkillCLIOptions {\n scriptName: string;\n DeviceClass: DeviceClass;\n}\n\n/**\n * Launch a Skill CLI for a custom interface Device class.\n * This enables AI coding assistants (Claude Code, Cline, etc.) to control\n * your custom interface through CLI commands.\n *\n * @example\n * ```typescript\n * #!/usr/bin/env node\n * import { runSkillCLI } from '@midscene/core/skill';\n * import { SampleDevice } from './sample-device';\n *\n * runSkillCLI({\n * DeviceClass: SampleDevice,\n * scriptName: 'my-device',\n * });\n * ```\n */\nexport function runSkillCLI(options: SkillCLIOptions): Promise<void> {\n const tools = new SkillMidsceneTools(options.DeviceClass);\n return runToolsCLI(tools, options.scriptName).catch((e) => {\n if (!(e instanceof CLIError)) console.error(e);\n process.exit(e instanceof CLIError ? e.exitCode : 1);\n });\n}\n"],"names":["SkillMidsceneTools","BaseMidsceneTools","device","Agent","DeviceClass","runSkillCLI","options","tools","runToolsCLI","e","CLIError","console","process"],"mappings":";;;;;;;;;;;;;AAYA,MAAMA,2BAA2BC;IAKrB,wBAAoC;QAC5C,OAAO,IAAI,IAAI,CAAC,WAAW;IAC7B;IAEA,MAAgB,cAAkC;QAChD,IAAI,CAAC,IAAI,CAAC,KAAK,EAAE;YACf,MAAMC,SAAS,IAAI,IAAI,CAAC,WAAW;YACnC,IAAI,CAAC,KAAK,GAAG,IAAIC,MAAMD;QACzB;QACA,OAAO,IAAI,CAAC,KAAK;IACnB;IAdA,YAAoBE,WAAwB,CAAE;QAC5C,KAAK,wDADaA,WAAW,GAAXA;IAEpB;AAaF;AAwBO,SAASC,YAAYC,OAAwB;IAClD,MAAMC,QAAQ,IAAIP,mBAAmBM,QAAQ,WAAW;IACxD,OAAOE,YAAYD,OAAOD,QAAQ,UAAU,EAAE,KAAK,CAAC,CAACG;QACnD,IAAI,CAAEA,CAAAA,aAAaC,QAAO,GAAIC,QAAQ,KAAK,CAACF;QAC5CG,QAAQ,IAAI,CAACH,aAAaC,WAAWD,EAAE,QAAQ,GAAG;IACpD;AACF"}
|