npm - @midscene/core - Versions diffs - 1.0.5-beta-20260104042628.0 → 1.0.5-beta-20260105023603.0 - Mend

@midscene/core 1.0.5-beta-20260104042628.0 → 1.0.5-beta-20260105023603.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42)

package/dist/es/agent/agent.mjs +3 -4
package/dist/es/agent/agent.mjs.map +1 -1
package/dist/es/agent/task-builder.mjs +1 -0
package/dist/es/agent/task-builder.mjs.map +1 -1
package/dist/es/agent/tasks.mjs +7 -4
package/dist/es/agent/tasks.mjs.map +1 -1
package/dist/es/agent/utils.mjs +1 -1
package/dist/es/ai-model/inspect.mjs +4 -2
package/dist/es/ai-model/inspect.mjs.map +1 -1
package/dist/es/ai-model/llm-planning.mjs +4 -1
package/dist/es/ai-model/llm-planning.mjs.map +1 -1
package/dist/es/ai-model/service-caller/index.mjs +52 -7
package/dist/es/ai-model/service-caller/index.mjs.map +1 -1
package/dist/es/service/index.mjs +7 -4
package/dist/es/service/index.mjs.map +1 -1
package/dist/es/types.mjs.map +1 -1
package/dist/es/utils.mjs +2 -2
package/dist/lib/agent/agent.js +3 -4
package/dist/lib/agent/agent.js.map +1 -1
package/dist/lib/agent/task-builder.js +1 -0
package/dist/lib/agent/task-builder.js.map +1 -1
package/dist/lib/agent/tasks.js +7 -4
package/dist/lib/agent/tasks.js.map +1 -1
package/dist/lib/agent/utils.js +1 -1
package/dist/lib/ai-model/inspect.js +4 -2
package/dist/lib/ai-model/inspect.js.map +1 -1
package/dist/lib/ai-model/llm-planning.js +4 -1
package/dist/lib/ai-model/llm-planning.js.map +1 -1
package/dist/lib/ai-model/service-caller/index.js +54 -6
package/dist/lib/ai-model/service-caller/index.js.map +1 -1
package/dist/lib/service/index.js +7 -4
package/dist/lib/service/index.js.map +1 -1
package/dist/lib/types.js.map +1 -1
package/dist/lib/utils.js +2 -2
package/dist/types/agent/agent.d.ts +2 -1
package/dist/types/agent/tasks.d.ts +2 -2
package/dist/types/ai-model/inspect.d.ts +2 -0
package/dist/types/ai-model/llm-planning.d.ts +2 -1
package/dist/types/ai-model/service-caller/index.d.ts +15 -2
package/dist/types/types.d.ts +5 -0
package/dist/types/yaml.d.ts +0 -1
package/package.json +2 -2

package/dist/types/agent/agent.d.ts CHANGED

@@ -1,4 +1,4 @@
-import { type ActionParam, type ActionReturn, type AgentAssertOpt, type AgentDescribeElementAtPointResult, type AgentOpt, type AgentWaitForOpt, type DeviceAction, type ExecutionDump, type GroupedActionDump, type LocateOption, type LocateResultElement, type LocateValidatorResult, type LocatorValidatorOption, type OnTaskStartTip, type ScrollParam, Service, type ServiceAction, type ServiceExtractOption, type ServiceExtractParam, type TUserPrompt, type UIContext } from '../index';
+import { type ActionParam, type ActionReturn, type AgentAssertOpt, type AgentDescribeElementAtPointResult, type AgentOpt, type AgentWaitForOpt, type DeepThinkOption, type DeviceAction, type ExecutionDump, type GroupedActionDump, type LocateOption, type LocateResultElement, type LocateValidatorResult, type LocatorValidatorOption, type OnTaskStartTip, type ScrollParam, Service, type ServiceAction, type ServiceExtractOption, type ServiceExtractParam, type TUserPrompt, type UIContext } from '../index';
 export type TestStatus = 'passed' | 'failed' | 'timedOut' | 'skipped' | 'interrupted';
 import type { AbstractInterface } from '../device';
 import type { TaskRunner } from '../task-runner';
@@ -7,6 +7,7 @@ import { TaskCache } from './task-cache';
 import { TaskExecutor } from './tasks';
 export type AiActOptions = {
     cacheable?: boolean;
+    deepThink?: DeepThinkOption;
 };
 export declare class Agent<InterfaceType extends AbstractInterface = AbstractInterface> {
     interface: InterfaceType;

package/dist/types/agent/tasks.d.ts CHANGED

@@ -3,7 +3,7 @@ import type { AbstractInterface } from '../device';
 import type Service from '../service';
 import type { TaskRunner } from '../task-runner';
 import { TaskExecutionError } from '../task-runner';
-import type { DeviceAction, ExecutionTaskApply, ExecutionTaskProgressOptions, MidsceneYamlFlowItem, PlanningAction, PlanningActionParamSleep, PlanningActionParamWaitFor, ServiceExtractOption, ServiceExtractParam } from '../types';
+import type { DeepThinkOption, DeviceAction, ExecutionTaskApply, ExecutionTaskProgressOptions, MidsceneYamlFlowItem, PlanningAction, PlanningActionParamSleep, PlanningActionParamWaitFor, ServiceExtractOption, ServiceExtractParam } from '../types';
 import type { IModelConfig } from '@midscene/shared/env';
 import type { TaskCache } from './task-cache';
 export { locatePlanForLocate } from './task-builder';
@@ -46,7 +46,7 @@ export declare class TaskExecutor {
         runner: TaskRunner;
     }>;
     runPlans(title: string, plans: PlanningAction[], modelConfigForPlanning: IModelConfig, modelConfigForDefaultIntent: IModelConfig): Promise<ExecutionResult>;
-    action(userPrompt: string, modelConfigForPlanning: IModelConfig, modelConfigForDefaultIntent: IModelConfig, includeBboxInPlanning: boolean, aiActContext?: string, cacheable?: boolean, replanningCycleLimitOverride?: number, imagesIncludeCount?: number): Promise<ExecutionResult<{
+    action(userPrompt: string, modelConfigForPlanning: IModelConfig, modelConfigForDefaultIntent: IModelConfig, includeBboxInPlanning: boolean, aiActContext?: string, cacheable?: boolean, replanningCycleLimitOverride?: number, imagesIncludeCount?: number, deepThink?: DeepThinkOption): Promise<ExecutionResult<{
         yamlFlow?: MidsceneYamlFlowItem[];
     } | undefined>>;
     private createTypeQueryTask;

package/dist/types/ai-model/inspect.d.ts CHANGED

@@ -23,6 +23,7 @@ export declare function AiLocateElement(options: {
     rect?: Rect;
     rawResponse: string;
     usage?: AIUsageInfo;
+    reasoning_content?: string;
 }>;
 export declare function AiLocateSection(options: {
     context: UIContext;
@@ -45,6 +46,7 @@ export declare function AiExtractElementInfo<T>(options: {
 }): Promise<{
     parseResult: AIDataExtractionResponse<T>;
     usage: AIUsageInfo | undefined;
+    reasoning_content: string | undefined;
 }>;
 export declare function AiJudgeOrderSensitive(description: string, callAIFn: typeof callAIWithObjectResponse<{
     isOrderSensitive: boolean;

package/dist/types/ai-model/llm-planning.d.ts CHANGED

@@ -1,4 +1,4 @@
-import type { DeviceAction, InterfaceType, PlanningAIResponse, UIContext } from '../types';
+import type { DeepThinkOption, DeviceAction, InterfaceType, PlanningAIResponse, UIContext } from '../types';
 import type { IModelConfig } from '@midscene/shared/env';
 import type { ConversationHistory } from './conversation-history';
 export declare function plan(userInstruction: string, opts: {
@@ -10,4 +10,5 @@ export declare function plan(userInstruction: string, opts: {
     conversationHistory: ConversationHistory;
     includeBbox: boolean;
     imagesIncludeCount?: number;
+    deepThink?: DeepThinkOption;
 }): Promise<PlanningAIResponse>;

package/dist/types/ai-model/service-caller/index.d.ts CHANGED

@@ -1,4 +1,4 @@
-import { type AIUsageInfo } from '../../types';
+import { type AIUsageInfo, type DeepThinkOption } from '../../types';
 import type { StreamingCallback } from '../../types';
 import { type IModelConfig, type TVlModeTypes } from '@midscene/shared/env';
 import type { ChatCompletionMessageParam } from 'openai/resources/index';
@@ -6,15 +6,20 @@ import type { AIActionType, AIArgs } from '../../common';
 export declare function callAI(messages: ChatCompletionMessageParam[], AIActionTypeValue: AIActionType, modelConfig: IModelConfig, options?: {
     stream?: boolean;
     onChunk?: StreamingCallback;
+    deepThink?: DeepThinkOption;
 }): Promise<{
     content: string;
+    reasoning_content?: string;
     usage?: AIUsageInfo;
     isStreamed: boolean;
 }>;
-export declare function callAIWithObjectResponse<T>(messages: ChatCompletionMessageParam[], AIActionTypeValue: AIActionType, modelConfig: IModelConfig): Promise<{
+export declare function callAIWithObjectResponse<T>(messages: ChatCompletionMessageParam[], AIActionTypeValue: AIActionType, modelConfig: IModelConfig, options?: {
+    deepThink?: DeepThinkOption;
+}): Promise<{
     content: T;
     contentString: string;
     usage?: AIUsageInfo;
+    reasoning_content?: string;
 }>;
 export declare function callAIWithStringResponse(msgs: AIArgs, AIActionTypeValue: AIActionType, modelConfig: IModelConfig): Promise<{
     content: string;
@@ -22,4 +27,12 @@ export declare function callAIWithStringResponse(msgs: AIArgs, AIActionTypeValue
 }>;
 export declare function extractJSONFromCodeBlock(response: string): string;
 export declare function preprocessDoubaoBboxJson(input: string): string;
+export declare function resolveDeepThinkConfig({ deepThink, vlMode, }: {
+    deepThink?: DeepThinkOption;
+    vlMode?: TVlModeTypes;
+}): {
+    config: Record<string, unknown>;
+    debugMessage?: string;
+    warningMessage?: string;
+};
 export declare function safeParseJson(input: string, vlMode: TVlModeTypes | undefined): any;

package/dist/types/types.d.ts CHANGED

@@ -97,6 +97,7 @@ export interface LocateResult {
     rect?: Rect;
 }
 export type ThinkingLevel = 'off' | 'medium' | 'high';
+export type DeepThinkOption = 'unset' | true | false;
 export interface ServiceTaskInfo {
     durationMs: number;
     formatResponse?: string;
@@ -105,6 +106,7 @@ export interface ServiceTaskInfo {
     searchArea?: Rect;
     searchAreaRawResponse?: string;
     searchAreaUsage?: AIUsageInfo;
+    reasoning_content?: string;
 }
 export interface DumpMeta {
     logTime: number;
@@ -140,6 +142,7 @@ export interface ServiceExtractResult<T> extends ServiceResultBase {
     data: T;
     thought?: string;
     usage?: AIUsageInfo;
+    reasoning_content?: string;
 }
 export declare class ServiceError extends Error {
     dump: ServiceDump;
@@ -193,6 +196,7 @@ export interface PlanningAIResponse extends Omit<RawResponsePlanningAIResponse,
     yamlFlow?: MidsceneYamlFlowItem[];
     yamlString?: string;
     error?: string;
+    reasoning_content?: string;
 }
 export interface PlanningActionParamSleep {
     timeMs: number;
@@ -269,6 +273,7 @@ export type ExecutionTask<E extends ExecutionTaskApply<any, any, any> = Executio
     };
     usage?: AIUsageInfo;
     searchAreaUsage?: AIUsageInfo;
+    reasoning_content?: string;
 };
 export interface ExecutionDump extends DumpMeta {
     name: string;

package/dist/types/yaml.d.ts CHANGED

@@ -129,7 +129,6 @@ export interface MidsceneYamlFlowItemAIAction {
     aiAct?: string;
     aiActionProgressTips?: string[];
     cacheable?: boolean;
-    _deepThink?: boolean;
     [key: string]: unknown;
 }
 export interface MidsceneYamlFlowItemAIAssert {

package/package.json CHANGED

@@ -1,7 +1,7 @@
 {
   "name": "@midscene/core",
   "description": "Automate browser actions, extract data, and perform assertions using AI. It offers JavaScript SDK, Chrome extension, and support for scripting in YAML. See https://midscenejs.com/ for details.",
-  "version": "1.0.5-beta-20260104042628.0",
+  "version": "1.0.5-beta-20260105023603.0",
   "repository": "https://github.com/web-infra-dev/midscene",
   "homepage": "https://midscenejs.com/",
   "main": "./dist/lib/index.js",
@@ -89,7 +89,7 @@
     "semver": "7.5.2",
     "js-yaml": "4.1.0",
     "zod": "3.24.3",
-    "@midscene/shared": "1.0.5-beta-20260104042628.0"
+    "@midscene/shared": "1.0.5-beta-20260105023603.0"
   },
   "devDependencies": {
     "@rslib/core": "^0.18.3",