npm - @midscene/core - Versions diffs - 1.4.9 → 1.5.0 - Mend

@midscene/core 1.4.9 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39)

package/dist/es/agent/task-builder.mjs +12 -4
package/dist/es/agent/task-builder.mjs.map +1 -1
package/dist/es/agent/utils.mjs +1 -1
package/dist/es/ai-model/conversation-history.mjs +19 -0
package/dist/es/ai-model/conversation-history.mjs.map +1 -1
package/dist/es/ai-model/llm-planning.mjs +23 -7
package/dist/es/ai-model/llm-planning.mjs.map +1 -1
package/dist/es/ai-model/prompt/llm-planning.mjs +239 -25
package/dist/es/ai-model/prompt/llm-planning.mjs.map +1 -1
package/dist/es/device/index.mjs.map +1 -1
package/dist/es/task-runner.mjs +5 -0
package/dist/es/task-runner.mjs.map +1 -1
package/dist/es/task-timing.mjs +12 -0
package/dist/es/task-timing.mjs.map +1 -0
package/dist/es/types.mjs.map +1 -1
package/dist/es/utils.mjs +2 -2
package/dist/lib/agent/task-builder.js +12 -4
package/dist/lib/agent/task-builder.js.map +1 -1
package/dist/lib/agent/utils.js +1 -1
package/dist/lib/ai-model/conversation-history.js +19 -0
package/dist/lib/ai-model/conversation-history.js.map +1 -1
package/dist/lib/ai-model/llm-planning.js +22 -6
package/dist/lib/ai-model/llm-planning.js.map +1 -1
package/dist/lib/ai-model/prompt/llm-planning.js +239 -25
package/dist/lib/ai-model/prompt/llm-planning.js.map +1 -1
package/dist/lib/device/index.js.map +1 -1
package/dist/lib/task-runner.js +5 -0
package/dist/lib/task-runner.js.map +1 -1
package/dist/lib/task-timing.js +46 -0
package/dist/lib/task-timing.js.map +1 -0
package/dist/lib/types.js.map +1 -1
package/dist/lib/utils.js +2 -2
package/dist/types/ai-model/conversation-history.d.ts +8 -0
package/dist/types/ai-model/prompt/llm-planning.d.ts +2 -2
package/dist/types/device/device-options.d.ts +18 -0
package/dist/types/device/index.d.ts +1 -1
package/dist/types/task-timing.d.ts +8 -0
package/dist/types/types.d.ts +10 -0
package/package.json +2 -2

package/dist/types/ai-model/conversation-history.d.ts CHANGED Viewed

@@ -28,6 +28,14 @@ export declare class ConversationHistory {
      * Automatically marks the first pending goal as running.
      */
     setSubGoals(subGoals: SubGoal[]): void;
+    /**
+     * Merge sub-goals from update-plan-content.
+     * Preserves existing descriptions when incoming description is empty.
+     *
+     * This handles compact XML updates like:
+     * <sub-goal index="1" status="finished" />
+     */
+    mergeSubGoals(subGoals: SubGoal[]): void;
     /**
      * Update a single sub-goal by index.
      * Clears logs if status or description actually changes.

package/dist/types/ai-model/prompt/llm-planning.d.ts CHANGED Viewed

@@ -1,10 +1,10 @@
 import type { DeviceAction } from '../../types';
 import type { TModelFamily } from '@midscene/shared/env';
 export declare const descriptionForAction: (action: DeviceAction<any>, locatorSchemaTypeDescription: string) => string;
-export declare function systemPromptToTaskPlanning({ actionSpace, modelFamily, includeBbox, includeThought, deepThink, }: {
+export declare function systemPromptToTaskPlanning({ actionSpace, modelFamily, includeBbox, includeThought, includeSubGoals, }: {
     actionSpace: DeviceAction<any>[];
     modelFamily: TModelFamily | undefined;
     includeBbox: boolean;
     includeThought?: boolean;
-    deepThink?: boolean;
+    includeSubGoals?: boolean;
 }): Promise<string>;

package/dist/types/device/device-options.d.ts CHANGED Viewed

@@ -122,3 +122,21 @@ export type IOSDeviceOpt = {
     /** WDA MJPEG server port for real-time screen streaming (default: 9100) */
     wdaMjpegPort?: number;
 } & IOSDeviceInputOpt;
+/**
+ * HarmonyOS device input options
+ */
+export type HarmonyDeviceInputOpt = {
+    /** Automatically dismiss the keyboard after input is completed */
+    autoDismissKeyboard?: boolean;
+};
+/**
+ * HarmonyOS device options
+ */
+export type HarmonyDeviceOpt = {
+    /** Path to the HDC executable */
+    hdcPath?: string;
+    /** Custom device actions to register */
+    customActions?: DeviceAction<any>[];
+    /** Screenshot resize scale factor */
+    screenshotResizeScale?: number;
+} & HarmonyDeviceInputOpt;

package/dist/types/device/index.d.ts CHANGED Viewed

@@ -2247,4 +2247,4 @@ export type ActionSleepParam = {
 };
 export declare const defineActionSleep: () => DeviceAction<ActionSleepParam>;
 export type { DeviceAction } from '../types';
-export type { AndroidDeviceOpt, AndroidDeviceInputOpt, IOSDeviceOpt, IOSDeviceInputOpt, } from './device-options';
+export type { AndroidDeviceOpt, AndroidDeviceInputOpt, IOSDeviceOpt, IOSDeviceInputOpt, HarmonyDeviceOpt, HarmonyDeviceInputOpt, } from './device-options';

package/dist/types/task-timing.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+import type { ExecutionTask } from './types';
+type ExecutionTaskTiming = NonNullable<ExecutionTask['timing']>;
+type NumericTimingField = {
+    [K in keyof ExecutionTaskTiming]-?: ExecutionTaskTiming[K] extends number | undefined ? K : never;
+}[keyof ExecutionTaskTiming];
+export type TimingSettableField = Exclude<NumericTimingField, 'start' | 'end' | 'cost'>;
+export declare function setTimingFieldOnce(timing: ExecutionTaskTiming | undefined, field: TimingSettableField): void;
+export {};

package/dist/types/types.d.ts CHANGED Viewed

@@ -287,6 +287,16 @@ export type ExecutionTask<E extends ExecutionTaskApply<any, any, any> = Executio
     errorStack?: string;
     timing?: {
         start: number;
+        getUiContextStart?: number;
+        getUiContextEnd?: number;
+        beforeInvokeActionHookStart?: number;
+        beforeInvokeActionHookEnd?: number;
+        callActionStart?: number;
+        callActionEnd?: number;
+        afterInvokeActionHookStart?: number;
+        afterInvokeActionHookEnd?: number;
+        captureAfterCallingSnapshotStart?: number;
+        captureAfterCallingSnapshotEnd?: number;
         end?: number;
         cost?: number;
     };

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@midscene/core",
   "description": "Automate browser actions, extract data, and perform assertions using AI. It offers JavaScript SDK, Chrome extension, and support for scripting in YAML. See https://midscenejs.com/ for details.",
-  "version": "1.4.9",
+  "version": "1.5.0",
   "repository": "https://github.com/web-infra-dev/midscene",
   "homepage": "https://midscenejs.com/",
   "main": "./dist/lib/index.js",
@@ -89,7 +89,7 @@
     "semver": "7.5.2",
     "undici": "^6.0.0",
     "zod": "3.24.3",
-    "@midscene/shared": "1.4.9"
+    "@midscene/shared": "1.5.0"
   },
   "devDependencies": {
     "@rslib/core": "^0.18.3",