@midscene/core 1.0.5-beta-20251230135517.0 → 1.0.5-beta-20251231065132.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42):
  1. package/dist/es/agent/agent.mjs +3 -5
  2. package/dist/es/agent/agent.mjs.map +1 -1
  3. package/dist/es/agent/task-builder.mjs +1 -0
  4. package/dist/es/agent/task-builder.mjs.map +1 -1
  5. package/dist/es/agent/tasks.mjs +6 -4
  6. package/dist/es/agent/tasks.mjs.map +1 -1
  7. package/dist/es/agent/utils.mjs +1 -1
  8. package/dist/es/ai-model/inspect.mjs +4 -2
  9. package/dist/es/ai-model/inspect.mjs.map +1 -1
  10. package/dist/es/ai-model/llm-planning.mjs +3 -2
  11. package/dist/es/ai-model/llm-planning.mjs.map +1 -1
  12. package/dist/es/ai-model/service-caller/index.mjs +48 -9
  13. package/dist/es/ai-model/service-caller/index.mjs.map +1 -1
  14. package/dist/es/service/index.mjs +7 -4
  15. package/dist/es/service/index.mjs.map +1 -1
  16. package/dist/es/types.mjs.map +1 -1
  17. package/dist/es/utils.mjs +2 -2
  18. package/dist/lib/agent/agent.js +3 -5
  19. package/dist/lib/agent/agent.js.map +1 -1
  20. package/dist/lib/agent/task-builder.js +1 -0
  21. package/dist/lib/agent/task-builder.js.map +1 -1
  22. package/dist/lib/agent/tasks.js +6 -4
  23. package/dist/lib/agent/tasks.js.map +1 -1
  24. package/dist/lib/agent/utils.js +1 -1
  25. package/dist/lib/ai-model/inspect.js +4 -2
  26. package/dist/lib/ai-model/inspect.js.map +1 -1
  27. package/dist/lib/ai-model/llm-planning.js +3 -2
  28. package/dist/lib/ai-model/llm-planning.js.map +1 -1
  29. package/dist/lib/ai-model/service-caller/index.js +50 -8
  30. package/dist/lib/ai-model/service-caller/index.js.map +1 -1
  31. package/dist/lib/service/index.js +7 -4
  32. package/dist/lib/service/index.js.map +1 -1
  33. package/dist/lib/types.js.map +1 -1
  34. package/dist/lib/utils.js +2 -2
  35. package/dist/types/agent/agent.d.ts +1 -1
  36. package/dist/types/agent/tasks.d.ts +1 -1
  37. package/dist/types/ai-model/inspect.d.ts +2 -0
  38. package/dist/types/ai-model/llm-planning.d.ts +1 -1
  39. package/dist/types/ai-model/service-caller/index.d.ts +12 -2
  40. package/dist/types/types.d.ts +4 -0
  41. package/dist/types/yaml.d.ts +0 -1
  42. package/package.json +2 -2
@@ -7,7 +7,7 @@ import { TaskCache } from './task-cache';
7
7
  import { TaskExecutor } from './tasks';
8
8
  export type AiActOptions = {
9
9
  cacheable?: boolean;
10
- qwen3_vl_enable_thinking?: boolean;
10
+ deepThink?: boolean;
11
11
  };
12
12
  export declare class Agent<InterfaceType extends AbstractInterface = AbstractInterface> {
13
13
  interface: InterfaceType;
@@ -46,7 +46,7 @@ export declare class TaskExecutor {
46
46
  runner: TaskRunner;
47
47
  }>;
48
48
  runPlans(title: string, plans: PlanningAction[], modelConfigForPlanning: IModelConfig, modelConfigForDefaultIntent: IModelConfig): Promise<ExecutionResult>;
49
- action(userPrompt: string, modelConfigForPlanning: IModelConfig, modelConfigForDefaultIntent: IModelConfig, includeBboxInPlanning: boolean, aiActContext?: string, cacheable?: boolean, replanningCycleLimitOverride?: number, imagesIncludeCount?: number, qwen3_vl_enable_thinking?: boolean): Promise<ExecutionResult<{
49
+ action(userPrompt: string, modelConfigForPlanning: IModelConfig, modelConfigForDefaultIntent: IModelConfig, includeBboxInPlanning: boolean, aiActContext?: string, cacheable?: boolean, replanningCycleLimitOverride?: number, imagesIncludeCount?: number, deepThink?: boolean): Promise<ExecutionResult<{
50
50
  yamlFlow?: MidsceneYamlFlowItem[];
51
51
  } | undefined>>;
52
52
  private createTypeQueryTask;
@@ -23,6 +23,7 @@ export declare function AiLocateElement(options: {
23
23
  rect?: Rect;
24
24
  rawResponse: string;
25
25
  usage?: AIUsageInfo;
26
+ reasoning_content?: string;
26
27
  }>;
27
28
  export declare function AiLocateSection(options: {
28
29
  context: UIContext;
@@ -45,6 +46,7 @@ export declare function AiExtractElementInfo<T>(options: {
45
46
  }): Promise<{
46
47
  parseResult: AIDataExtractionResponse<T>;
47
48
  usage: AIUsageInfo | undefined;
49
+ reasoning_content: string | undefined;
48
50
  }>;
49
51
  export declare function AiJudgeOrderSensitive(description: string, callAIFn: typeof callAIWithObjectResponse<{
50
52
  isOrderSensitive: boolean;
@@ -10,5 +10,5 @@ export declare function plan(userInstruction: string, opts: {
10
10
  conversationHistory: ConversationHistory;
11
11
  includeBbox: boolean;
12
12
  imagesIncludeCount?: number;
13
- qwen3_vl_enable_thinking?: boolean;
13
+ deepThink?: boolean;
14
14
  }): Promise<PlanningAIResponse>;
@@ -6,18 +6,20 @@ import type { AIActionType, AIArgs } from '../../common';
6
6
  export declare function callAI(messages: ChatCompletionMessageParam[], AIActionTypeValue: AIActionType, modelConfig: IModelConfig, options?: {
7
7
  stream?: boolean;
8
8
  onChunk?: StreamingCallback;
9
- qwen3_vl_enable_thinking?: boolean;
9
+ deepThink?: boolean;
10
10
  }): Promise<{
11
11
  content: string;
12
+ reasoning_content?: string;
12
13
  usage?: AIUsageInfo;
13
14
  isStreamed: boolean;
14
15
  }>;
15
16
  export declare function callAIWithObjectResponse<T>(messages: ChatCompletionMessageParam[], AIActionTypeValue: AIActionType, modelConfig: IModelConfig, options?: {
16
- qwen3_vl_enable_thinking?: boolean;
17
+ deepThink?: boolean;
17
18
  }): Promise<{
18
19
  content: T;
19
20
  contentString: string;
20
21
  usage?: AIUsageInfo;
22
+ reasoning_content?: string;
21
23
  }>;
22
24
  export declare function callAIWithStringResponse(msgs: AIArgs, AIActionTypeValue: AIActionType, modelConfig: IModelConfig): Promise<{
23
25
  content: string;
@@ -25,4 +27,12 @@ export declare function callAIWithStringResponse(msgs: AIArgs, AIActionTypeValue
25
27
  }>;
26
28
  export declare function extractJSONFromCodeBlock(response: string): string;
27
29
  export declare function preprocessDoubaoBboxJson(input: string): string;
30
+ export declare function resolveDeepThinkConfig({ deepThink, vlMode, }: {
31
+ deepThink?: boolean;
32
+ vlMode?: TVlModeTypes;
33
+ }): {
34
+ config: Record<string, unknown>;
35
+ debugMessage?: string;
36
+ warningMessage?: string;
37
+ };
28
38
  export declare function safeParseJson(input: string, vlMode: TVlModeTypes | undefined): any;
@@ -105,6 +105,7 @@ export interface ServiceTaskInfo {
105
105
  searchArea?: Rect;
106
106
  searchAreaRawResponse?: string;
107
107
  searchAreaUsage?: AIUsageInfo;
108
+ reasoning_content?: string;
108
109
  }
109
110
  export interface DumpMeta {
110
111
  logTime: number;
@@ -140,6 +141,7 @@ export interface ServiceExtractResult<T> extends ServiceResultBase {
140
141
  data: T;
141
142
  thought?: string;
142
143
  usage?: AIUsageInfo;
144
+ reasoning_content?: string;
143
145
  }
144
146
  export declare class ServiceError extends Error {
145
147
  dump: ServiceDump;
@@ -193,6 +195,7 @@ export interface PlanningAIResponse extends Omit<RawResponsePlanningAIResponse,
193
195
  yamlFlow?: MidsceneYamlFlowItem[];
194
196
  yamlString?: string;
195
197
  error?: string;
198
+ reasoning_content?: string;
196
199
  }
197
200
  export interface PlanningActionParamSleep {
198
201
  timeMs: number;
@@ -269,6 +272,7 @@ export type ExecutionTask<E extends ExecutionTaskApply<any, any, any> = Executio
269
272
  };
270
273
  usage?: AIUsageInfo;
271
274
  searchAreaUsage?: AIUsageInfo;
275
+ reasoning_content?: string;
272
276
  };
273
277
  export interface ExecutionDump extends DumpMeta {
274
278
  name: string;
@@ -129,7 +129,6 @@ export interface MidsceneYamlFlowItemAIAction {
129
129
  aiAct?: string;
130
130
  aiActionProgressTips?: string[];
131
131
  cacheable?: boolean;
132
- _deepThink?: boolean;
133
132
  [key: string]: unknown;
134
133
  }
135
134
  export interface MidsceneYamlFlowItemAIAssert {
package/package.json CHANGED
@@ -1,7 +1,7 @@
1
1
  {
2
2
  "name": "@midscene/core",
3
3
  "description": "Automate browser actions, extract data, and perform assertions using AI. It offers JavaScript SDK, Chrome extension, and support for scripting in YAML. See https://midscenejs.com/ for details.",
4
- "version": "1.0.5-beta-20251230135517.0",
4
+ "version": "1.0.5-beta-20251231065132.0",
5
5
  "repository": "https://github.com/web-infra-dev/midscene",
6
6
  "homepage": "https://midscenejs.com/",
7
7
  "main": "./dist/lib/index.js",
@@ -89,7 +89,7 @@
89
89
  "semver": "7.5.2",
90
90
  "js-yaml": "4.1.0",
91
91
  "zod": "3.24.3",
92
- "@midscene/shared": "1.0.5-beta-20251230135517.0"
92
+ "@midscene/shared": "1.0.5-beta-20251231065132.0"
93
93
  },
94
94
  "devDependencies": {
95
95
  "@rslib/core": "^0.18.3",