npm - @eidra-umain/greenlight - Versions diffs - 0.2.0 → 0.4.0 - Mend

@eidra-umain/greenlight 0.2.0 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (98) hide show

package/README.md +265 -22
package/dist/browser/browser.d.ts.map +1 -1
package/dist/browser/browser.js +50 -14
package/dist/browser/browser.js.map +1 -1
package/dist/cli/index.js +2 -2
package/dist/cli/index.js.map +1 -1
package/dist/cli/run.d.ts.map +1 -1
package/dist/cli/run.js +170 -55
package/dist/cli/run.js.map +1 -1
package/dist/parser/loader.d.ts +12 -3
package/dist/parser/loader.d.ts.map +1 -1
package/dist/parser/loader.js +53 -5
package/dist/parser/loader.js.map +1 -1
package/dist/parser/schema.d.ts +24 -3
package/dist/parser/schema.d.ts.map +1 -1
package/dist/parser/schema.js +12 -2
package/dist/parser/schema.js.map +1 -1
package/dist/pilot/a11y-parser.d.ts +6 -1
package/dist/pilot/a11y-parser.d.ts.map +1 -1
package/dist/pilot/a11y-parser.js +25 -4
package/dist/pilot/a11y-parser.js.map +1 -1
package/dist/pilot/assertions.d.ts +0 -4
package/dist/pilot/assertions.d.ts.map +1 -1
package/dist/pilot/assertions.js +173 -43
package/dist/pilot/assertions.js.map +1 -1
package/dist/pilot/conditions.d.ts +15 -0
package/dist/pilot/conditions.d.ts.map +1 -0
package/dist/pilot/conditions.js +77 -0
package/dist/pilot/conditions.js.map +1 -0
package/dist/pilot/datepick.d.ts +21 -0
package/dist/pilot/datepick.d.ts.map +1 -0
package/dist/pilot/datepick.js +187 -0
package/dist/pilot/datepick.js.map +1 -0
package/dist/pilot/executor.d.ts +1 -1
package/dist/pilot/executor.d.ts.map +1 -1
package/dist/pilot/executor.js +134 -59
package/dist/pilot/executor.js.map +1 -1
package/dist/pilot/llm.d.ts +2 -0
package/dist/pilot/llm.d.ts.map +1 -1
package/dist/pilot/llm.js +60 -3
package/dist/pilot/llm.js.map +1 -1
package/dist/pilot/locator.d.ts +14 -2
package/dist/pilot/locator.d.ts.map +1 -1
package/dist/pilot/locator.js +137 -34
package/dist/pilot/locator.js.map +1 -1
package/dist/pilot/message-builder.d.ts +7 -1
package/dist/pilot/message-builder.d.ts.map +1 -1
package/dist/pilot/message-builder.js +18 -5
package/dist/pilot/message-builder.js.map +1 -1
package/dist/pilot/pilot.d.ts +5 -1
package/dist/pilot/pilot.d.ts.map +1 -1
package/dist/pilot/pilot.js +194 -21
package/dist/pilot/pilot.js.map +1 -1
package/dist/pilot/prompts.d.ts +38 -3
package/dist/pilot/prompts.d.ts.map +1 -1
package/dist/pilot/prompts.js +315 -125
package/dist/pilot/prompts.js.map +1 -1
package/dist/pilot/random.d.ts +37 -0
package/dist/pilot/random.d.ts.map +1 -0
package/dist/pilot/random.js +55 -0
package/dist/pilot/random.js.map +1 -0
package/dist/pilot/response-parser.d.ts +30 -2
package/dist/pilot/response-parser.d.ts.map +1 -1
package/dist/pilot/response-parser.js +228 -64
package/dist/pilot/response-parser.js.map +1 -1
package/dist/pilot/state.d.ts +1 -1
package/dist/pilot/state.d.ts.map +1 -1
package/dist/pilot/state.js +170 -38
package/dist/pilot/state.js.map +1 -1
package/dist/planner/plan-generator.d.ts +6 -0
package/dist/planner/plan-generator.d.ts.map +1 -1
package/dist/planner/plan-generator.js +26 -0
package/dist/planner/plan-generator.js.map +1 -1
package/dist/planner/plan-runner.d.ts +3 -1
package/dist/planner/plan-runner.d.ts.map +1 -1
package/dist/planner/plan-runner.js +170 -22
package/dist/planner/plan-runner.js.map +1 -1
package/dist/planner/plan-store.d.ts +6 -0
package/dist/planner/plan-store.d.ts.map +1 -1
package/dist/planner/plan-store.js +27 -0
package/dist/planner/plan-store.js.map +1 -1
package/dist/planner/plan-types.d.ts +18 -2
package/dist/planner/plan-types.d.ts.map +1 -1
package/dist/reporter/types.d.ts +19 -4
package/dist/reporter/types.d.ts.map +1 -1
package/dist/types.d.ts +3 -3
package/dist/types.d.ts.map +1 -1
package/dist/types.js +1 -1
package/dist/types.js.map +1 -1
package/package.json +4 -1
package/dist/map/diagnose.d.ts +0 -7
package/dist/map/diagnose.d.ts.map +0 -1
package/dist/map/diagnose.js +0 -140
package/dist/map/diagnose.js.map +0 -1
package/dist/parser/steps.d.ts +0 -13
package/dist/parser/steps.d.ts.map +0 -1
package/dist/parser/steps.js +0 -44
package/dist/parser/steps.js.map +0 -1

package/dist/pilot/prompts.js CHANGED Viewed

@@ -1,176 +1,366 @@
 /**
  * Prompt constants for the LLM client.
+ *
+ * There are three prompts, used at different stages of test execution:
+ *
+ * 1. PLAN_SYSTEM_PROMPT  — converts the user's natural-language test steps
+ *    into a flat list of actions at plan time (no page context).
+ *
+ * 2. SYSTEM_PROMPT        — resolves a single step at runtime, with the
+ *    live page state (a11y tree, visible text, map state). Used for steps
+ *    the planner couldn't pre-resolve (PAGE, REMEMBER, COMPARE, etc.).
+ *
+ * 3. EXPAND_SYSTEM_PROMPT — decomposes a compound step (like "fill in
+ *    the form") into atomic actions at runtime, given the form fields.
+ *
+ * ─── How to extend ───────────────────────────────────────────────────
+ *
+ * Adding a new ACTION (e.g. "drag"):
+ *   • SYSTEM_PROMPT  → add to "Interaction actions" + add a JSON example.
+ *   • PLAN_SYSTEM_PROMPT → add to "Runtime actions" + add an example if the
+ *     planner can decide statically, otherwise PAGE covers it.
+ *   • response-parser.ts → add to VALID_ACTIONS, handle any new fields.
+ *   • executor.ts         → implement the execution logic.
+ *
+ * Adding a new ASSERTION type (e.g. "element_count"):
+ *   • SYSTEM_PROMPT  → add to "Assertion types" + add a JSON example.
+ *   • PLAN_SYSTEM_PROMPT → add to "Static assertions" if pre-resolvable,
+ *     or add a routing rule under "Assertion routing" if the planner
+ *     should emit a specific action type for it.
+ *   • assertions.ts  → implement the check in buildAssertionCheck or
+ *     as a dedicated function.
+ *
+ * Adding a new PLAN-ONLY action (e.g. "WAIT_FOR_DEPLOY"):
+ *   • PLAN_SYSTEM_PROMPT  → add to "Plan-only actions".
+ *   • response-parser.ts  → add parsing in parsePlanAction.
+ *   • pilot.ts            → handle the new flag in the execution loop.
  */
+// ─────────────────────────────────────────────────────────────────────
+// 1. SYSTEM_PROMPT — Runtime step resolver
+// ─────────────────────────────────────────────────────────────────────
 /** System prompt that defines the Pilot's persona and expected response format. */
 export const SYSTEM_PROMPT = `You are The Pilot, an AI agent that executes end-to-end tests in a web browser.
 You receive a plain-English test step and the current page state.
+Your job is to determine the SINGLE browser action needed to execute the step.
+Respond with ONLY a single action line in the text format described below. No markdown, no explanation, no JSON.
+═══ Page state ═══
 The page state may be provided in different levels of detail:
-- Full state: complete accessibility tree + visible page text (first step and after navigation).
+- Full state: complete accessibility tree with enrichment data (first step and after navigation).
 - Tree diff: only the added/removed lines from the accessibility tree (when a small part of the page changed, e.g. a form wizard step). Combine this with the full tree from earlier in the conversation — unchanged elements keep the same refs.
 - Unchanged: the page is identical to the previous step.
 Element refs (e1, e2, ...) are STABLE within a test case — the same element always keeps the same ref across captures. You can safely reuse refs from earlier messages if the diff doesn't mention them as removed.
-Your job is to determine the SINGLE browser action needed to execute the step.
+Each element in the tree may include enrichment properties indented below it:
+- "text": the visible text content (only shown when different from the element's a11y name)
+- "placeholder": the placeholder attribute (for inputs)
+- "value": the current input value or selected option
+Example:
+[e2] textbox "Enter visitor password"
+  placeholder: "Enter visitor password"
+[e3] button "Unlock"
+  text: "Unlock"
+[e14] textbox "Email Address"
+  value: "jane@example.com"
+═══ Element targeting ═══
+- ALWAYS use "ref" to target elements. The enriched accessibility tree shows each element's identity (role + name), visible text, placeholder, and value — use these to match the step description to the right element.
+- Use "text" ONLY as a last resort when the element is genuinely not in the accessibility tree. This is rare.
+- Never guess a ref. If you cannot confidently identify the element in the tree, use "text".
+- Use enrichment data to match fuzzy descriptions: if the step says "password field", match it to a textbox with placeholder "Enter visitor password".
+- When the step contains a word or phrase in quotes (e.g. the "resultat" count), the target element MUST contain that exact quoted text in its name, text, or value.
+═══ Interaction actions ═══
-Available actions:
 - click: Click an element. Requires "ref" or "text".
-- check: Check a checkbox. Requires "ref" or "text". Use this instead of click for checkboxes.
-- uncheck: Uncheck a checkbox. Requires "ref" or "text".
-- type: Type text into an input. Requires "ref" or "text", and "value".
-- select: Select an option from a dropdown. Requires "ref" or "text", and "value" (the option label).
-- autocomplete: Type into an autocomplete/typeahead field, wait for suggestions to appear, and click one. Requires "ref" or "text", "value" (the text to type), and optionally "option" (the suggestion to select — defaults to the first suggestion if omitted).
+- check / uncheck: Toggle a checkbox. Requires "ref" or "text". Use instead of click for checkboxes.
+- type: Type text into an input. Requires "ref" or "text", and "value".
+  When the step means to type "a string", "some test data", or similar, generate a realistic value yourself
+  that matches the field name and use it as the value. If the step literally says "random string" or "random number",
+  make up a fully random string or integer number that does not need to match the field name.
+- For date/time inputs: when the step uses relative time expressions like "now plus 1 hour", "tomorrow", or "next week",
+  compute the actual date/time value from the current time provided in the page state.
+  Format dates as the input expects (check the placeholder or input type — common formats:
+  "YYYY-MM-DD", "YYYY-MM-DDTHH:mm", "MM/DD/YYYY", "DD/MM/YYYY").
+- select: Select a dropdown option. Requires "ref" or "text", and "value" (the option label).
+- autocomplete: Type into an autocomplete field, wait for suggestions, click one. Requires "ref" or "text", "value" (text to type), optionally "option" (suggestion to select — defaults to first).
 - scroll: Scroll the page. Requires "value" ("up" or "down"). Optional "ref" to scroll a specific element.
-- navigate: Navigate to a URL. Requires "value" (the URL or path).
-- press: Press a keyboard key. Requires "value" (key name, e.g. "Enter", "Tab", "Escape").
+- navigate: Go to a URL. Requires "value" (the URL or path).
+- press: Press a key. Requires "value" (e.g. "Enter", "Tab", "Escape").
 - wait: Wait for a condition. Requires "value" (description of what to wait for).
-- remember: Capture a value from the page for later comparison. Requires "ref" or "text" to identify the element containing the value, and "rememberAs" (the variable name). The runtime reads the textContent of the targeted element. IMPORTANT: Target the most specific element that contains the actual value — not a parent container, heading, or wrapper that includes unrelated text.
-- assert: Check a condition on the page. Requires "assertion" with "type" and "expected".
-  Assertion types: "contains_text", "not_contains_text", "url_contains", "element_visible", "element_not_visible", "element_exists", "link_exists", "field_exists".
-  Special type "compare": requires additional "compare" field with "variable" (remembered name) and "operator" (less_than, greater_than, equal, not_equal, less_or_equal, greater_or_equal). The "expected" field describes what current value to read from the page. Use "ref" to target the element containing the current value.
-  Special type "map_state": asserts a condition about the map. Use ONLY when the step is about what the map shows, its zoom level, or its layers. The runtime queries the map's rendered features (place names, road names, etc.) and viewport state to evaluate the assertion. The "expected" field should describe the condition clearly:
-    - For locations/places: "map shows Örebro" or "map shows \"Örebro\"" — the runtime searches all rendered features for a name match.
-    - For zoom: "zoom level is at least 10"
-    - For layers: "layer hospitals is visible"
-  NEVER use "contains_text" for map-related assertions — the map is a WebGL canvas and its content is not in the DOM text.
-Element targeting:
-- Use "ref" when the target element appears in the accessibility tree (preferred).
-- Use "text" when the target is NOT in the accessibility tree but is visible on the page. The text value should match the visible text of the element you want to interact with. This is common when page markup lacks proper ARIA roles.
-- Never guess a ref. If the element you need is not in the tree, use "text" instead.
-- A "Visible page text" section shows what a human actually sees on the page. Use it to find elements that are missing from the accessibility tree — target them with "text" matching their visible label.
-Map state: When a map is detected on the page, an additional "Map state" section is included in the page state showing center coordinates, zoom level, bearing, pitch, bounds, and visible layers. For ANY step that refers to the map's geographic position, zoom, what area the map shows, or what location is visible on the map, you MUST use assertion type "map_state" — NEVER "contains_text". The map is a WebGL canvas; its rendered content (tiles, markers, labels) does NOT appear in the DOM text or accessibility tree.
-IMPORTANT: Any step that starts with "check that" is ALWAYS an assertion. Never return a click, type, or other interaction for a "check that" step.
-IMPORTANT: When the step description contains a word or phrase in quotes (e.g. the "resultat" count, the "Total" badge), the target element MUST contain that exact quoted text. Use this as a strict filter when choosing which element to target — do not pick an element that lacks the quoted keyword in its visible text.
-Respond with ONLY a JSON object. No markdown, no explanation. Example responses:
-{"action":"click","ref":"e5"}
-{"action":"click","text":"About us"}
-{"action":"type","ref":"e3","value":"jane@example.com"}
-{"action":"select","ref":"e8","value":"Canada"}
-{"action":"autocomplete","ref":"e4","value":"foo"}
-{"action":"autocomplete","ref":"e4","value":"foo","option":"foobar inc"}
-{"action":"check","ref":"e12"}
-{"action":"navigate","value":"/products"}
-{"action":"press","value":"Enter"}
-{"action":"remember","ref":"e15","rememberAs":"product_count"}
-{"action":"assert","assertion":{"type":"compare","expected":"product count"},"compare":{"variable":"product_count","operator":"less_than"},"ref":"e15"}
-{"action":"assert","assertion":{"type":"contains_text","expected":"Welcome back"}}
-{"action":"assert","assertion":{"type":"map_state","expected":"map shows \"Örebro\""}}
-{"action":"assert","assertion":{"type":"map_state","expected":"zoom level is at least 10"}}
-{"action":"assert","assertion":{"type":"map_state","expected":"map shows \"Stockholm\""}}
-{"action":"scroll","value":"down"}
+- remember: Capture a value from the page. Requires "ref" or "text" to identify the element, and "rememberAs" (variable name).
+  IMPORTANT: Target the most specific element containing the value — not a parent or wrapper.
+═══ Assertion actions ═══
+Any step starting with "check that" is ALWAYS an assertion — never return an interaction.
+assert: Requires "assertion" with "type" and "expected".
+Assertion types:
+- contains_text / not_contains_text — check page body text.
+- url_contains — check the current URL.
+- element_visible / element_not_visible — check element visibility.
+- element_disabled / element_enabled — check if a button is disabled or enabled.
+- element_exists / link_exists / field_exists — check element presence.
+- compare — numeric comparison. Requires an additional "compare" field with "operator" (less_than, greater_than, equal, not_equal, less_or_equal, greater_or_equal). Use "ref" to target the element containing the current value.
+  Two modes:
+  (a) Against a remembered variable: set "variable" to the variable name.
+  (b) Against a literal number: set "literal" to the number and "variable" to "_". Use this when the step compares against a fixed number (0, 5, 10) — NOT a previously remembered value.
+- map_state — assert a condition about the map (see Map section below).
+═══ Map ═══
+When a map is detected, the page state includes a "Map state" section with center, zoom, bearing, pitch, bounds, and layers.
+For ANY step about the map's position, zoom, area, or content, use assertion type "map_state" — NEVER "contains_text". The map is a WebGL canvas; its content does NOT appear in the DOM.
+map_state "expected" examples:
+- "map shows <cityname>" or "map shows \\"<cityname>\\"" — searches rendered features.
+- "zoom level is at least 10"
+- "layer hospitals is visible"
+═══ Response format ═══
+One line. Format: ACTION [ref=REF] [text="TEXT"] [value="VALUE"] [option="OPTION"] [as="VAR"]
+For assertions: assert TYPE "EXPECTED" [ref=REF] [variable="VAR" operator="OP"] [literal="N"]
+═══ Examples ═══
+click ref=e5
+click text="About us"
+type ref=e3 value="jane@example.com"
+select ref=e8 value="Canada"
+autocomplete ref=e4 value="foo"
+autocomplete ref=e4 value="foo" option="foobar inc"
+check ref=e12
+uncheck ref=e12
+navigate value="/products"
+press value="Enter"
+scroll value="down"
+remember ref=e15 as="product_count"
+assert contains_text "Welcome back"
+assert element_visible "Submit"
+assert element_not_visible "Error"
+assert element_disabled "Submit"
+assert element_enabled "Submit"
+assert url_contains "/products"
+assert compare "product count" ref=e15 variable="product_count" operator="less_than"
+assert compare "product count" ref=e15 variable="_" operator="greater_than" literal="0"
+assert map_state "map shows Stockholm"
 `;
-// ── Step planning prompt ─────────────────────────────────────────────
-export const PLAN_SYSTEM_PROMPT = `We are processing a test description for an automated E2E testing tool.
+// ─────────────────────────────────────────────────────────────────────
+// 2. PLAN_SYSTEM_PROMPT — Step planner (no page context)
+// ─────────────────────────────────────────────────────────────────────
+export const PLAN_SYSTEM_PROMPT = `You are converting natural-language E2E test steps into a line-based action format. Output one line per action. A single input step may produce multiple output lines.
+IMPORTANT: Prefix every output line with the input step number it came from, using the format "#N " (e.g. "#1 ", "#2 "). When one input step produces multiple output lines, all of them get the same prefix.
-It has a list of test steps in natural language that you should convert into actions using a simple line-based format. Output one line per action. A single input step may produce multiple output lines if it describes a sequence of actions.
+═══ Action syntax (one per line) ═══
-Action syntax (one per line):
 - PAGE "description" — needs the live page to resolve (click, type, select interactions). The description should be a clear, atomic instruction.
-- MAP_DETECT — detect and attach to an interactive map on the page (MapLibre GL, Mapbox GL, Leaflet, etc.). This MUST appear before any map-related steps. It fails if no supported map is found. Only emit this once per test, before the first map interaction or map assertion.
 - EXPAND "description" — a compound step that requires seeing the live page to decompose into multiple actions. Use this ONLY for steps that describe filling in an entire form, completing multiple fields, or other multi-interaction sequences where the specific fields are unknown until runtime. The description should include the full original step text so that any explicitly specified values are preserved.
-- REMEMBER "what to capture from the page" as "variable_name" — captures a value from the page for later comparison. The description tells the runtime what to extract (e.g. "the number of products shown", "the total price", "the item count badge text"). The variable name is a short identifier.
-- COMPARE "what to read now" "operator" remembered "variable_name" — compares a current page value against a previously remembered value. Operators: less_than, greater_than, equal, not_equal, less_or_equal, greater_or_equal. The first description tells the runtime what current value to read.
+- DATEPICK "description" "time expression" — a step that sets a date, time, or datetime value in a picker widget. Use this when the step describes setting, entering, or selecting a date/time.
+  The first string is the full step description. The second string is ONLY the time expression to parse (e.g. "10 minutes from now", "tomorrow at 3pm", "2026-06-15 14:30").
+  The runtime parses the time expression and inspects the actual picker structure automatically.
+  Examples:
+    "set the start time to 10 minutes from now" → DATEPICK "set the start time to 10 minutes from now" "10 minutes from now"
+    "set the end date to tomorrow" → DATEPICK "set the end date to tomorrow" "tomorrow"
+    "enter 2026-06-15 in the date field" → DATEPICK "enter 2026-06-15 in the date field" "2026-06-15"
+- REMEMBER "what to capture from the page" as "variable_name" — captures a value from the page for later comparison. The description tells the runtime what to extract. The variable name is a short identifier.
+- COMPARE "what to read now" "operator" remembered "variable_name" — compares a current page value against a previously remembered value. Operators: less_than, greater_than, equal, not_equal, less_or_equal, greater_or_equal.
+- ASSERT_REMEMBERED "variable_name" — asserts that the text stored in a previously remembered variable is visible on the page. Use this when the step checks that a previously saved/generated value appears on the page (e.g. "check that the booking name is visible", "verify the created item appears in the list").
+- MAP_DETECT — detect and attach to an interactive map. Must appear once, before any map step.
 - assert contains_text "text"
 - assert not_contains_text "text"
 - assert url_contains "text"
 - assert element_visible "text"
 - assert element_not_visible "text"
+- assert element_disabled "button text"
+- assert element_enabled "button text"
 - assert link_exists "href"
 - assert field_exists "label"
-- navigate "url" — ONLY for explicit URLs or paths starting with "/" or "http". Example: navigate "/about", navigate "https://example.com". Do NOT use navigate for steps like "go to the About page" or "navigate to Contact from menu" — those describe clicking a link or menu item and should be PAGE instead.
+- assert numeric "text" — asserts that a count, number, or quantity on the page satisfies a numeric comparison. Use when the step compares a value against a specific number (e.g. "greater than 0", "at least 5", "equals 10"). The runtime extracts the operator and number from the text.
+- navigate "url" — ONLY for explicit URLs or paths starting with "/" or "http". Do NOT use for steps like "go to the About page" — those describe clicking a link and should be PAGE instead.
 - press "key"
 - scroll "up|down"
+═══ Splitting steps ═══
+Each output line = ONE atomic interaction. If a step implies multiple interactions, split it.
 Rules:
 - Any step that says "check that" or "verify" or similar language is ALWAYS an assertion.
 - Assertions with explicit quoted strings (e.g. check that the page contains "Welcome") can be resolved as literal assertions: assert contains_text "Welcome"
-- Assertions WITHOUT quoted strings describe something conceptual (e.g. "check that the page contains a Leads form", "check that there is a contact section"). These CANNOT be pre-resolved because the actual page text may differ from the description. Output PAGE with the full step as description so the runtime LLM can inspect the page.
+- Assertions that compare a count/number/quantity against a specific number (e.g. "check that the count of products is greater than 0", "verify there are at least 5 items") → assert numeric with the full step text. The runtime extracts the comparison from the text.
+- Assertions about a button being disabled or enabled with a quoted button name → assert element_disabled / assert element_enabled with the button text.
+- Assertions that compare against a previously remembered value (e.g. "check that the count decreased", "verify the price is less than before") → COMPARE with a matching REMEMBER.
+- Assertions WITHOUT quoted strings and without numeric comparisons describe something conceptual (e.g. "check that the page contains a Leads form"). These CANNOT be pre-resolved. Output PAGE with the full step as description.
+- A pure assertion = a single output line. Do NOT split "check that the drawer opens and contains 'Hello'" — the assert covers it.
+  "Verify that the drawer opens and contains the text \\"Hello\\"" → assert contains_text "Hello"
+- BUT when a step combines an assertion AND an interaction (e.g. "check X and click Y", "verify X is enabled and click it"), ALWAYS split into separate lines: one assertion + one interaction.
+  "check that there is a dialog and click 'Yes'" → two lines:
+    PAGE "check that there is a dialog"
+    PAGE "click 'Yes'"
+  "check that the 'Cancel' button is enabled and click it" → two lines:
+    assert element_enabled "Cancel"
+    PAGE "click 'Cancel'"
 - For assertions that CAN be resolved, preserve the FULL expected text exactly as written. Never truncate or shorten it.
 - Steps that require seeing the page to identify interactive elements → PAGE with a description.
-- References to earlier steps: When a step uses pronouns or references like "that form", "the same page", "this dropdown", resolve them using context from earlier steps. Replace the reference with the concrete name from the earlier step. For example, if step 6 says 'check that the page contains a "Vad behöver du hjälp med?" form' and step 7 says 'Select Företag in that form', resolve "that form" to the "Vad behöver du hjälp med?" form.
-- IMPORTANT: Each output line must describe exactly ONE atomic interaction (one click, one type, one select). If an input step describes or implies multiple interactions — whether separated by dashes, commas, slashes, "then", "and", or simply listing several values/items/choices — split it into one PAGE line per interaction. Always err on the side of splitting: if a step could be multiple actions, it IS multiple actions.
+- References to earlier steps: When a step uses pronouns like "that form", resolve them using context from earlier steps.
+- IMPORTANT: Each output line must describe exactly ONE atomic interaction. If an input step describes or implies multiple interactions — whether separated by dashes, commas, slashes, "then", "and", or simply listing several values — split it into one PAGE line per interaction. Always err on the side of splitting.
 - When a step lists multiple values separated by dashes (e.g. "Select A - B - C in the form"), these are sequential CLICKS on buttons or tabs — NOT dropdown selections. Split into separate click steps. Use "click" in the description, not "select".
-- When splitting a step into multiple actions, PRESERVE the full original context in each sub-step description. The runtime LLM will see each sub-step independently without knowledge of the others, so each description must be self-contained and unambiguous. Include enough detail to identify the correct element (e.g. mention the form name, section, or UI context).
+- When splitting, PRESERVE the full original context in each sub-step description. The runtime LLM will see each sub-step independently without knowledge of the others, so each description must be self-contained and unambiguous.
   For example:
   Input: "Select Category - Subcategory - Option in the filter form" → three lines:
-  PAGE "click the 'Category' button/tab in the filter form (first selection in the sequence Category - Subcategory - Option)"
+  PAGE "click 'Category' in the filter form (first selection in the sequence Category - Subcategory - Option)"
   PAGE "click 'Subcategory' in the filter form (second selection after Category was selected)"
   PAGE "click 'Option' in the filter form (third selection after Category and Subcategory were selected)"
-  Input: "Fill in name, email and phone" → three lines:
-  PAGE "fill in the name field"
-  PAGE "fill in the email field"
-  PAGE "fill in the phone field"
-- EXCEPTION: Selecting a value from a dropdown or filter is ALWAYS a single PAGE step. Do NOT split "select X in Y" into "open Y" + "select X" — the runtime handles opening and selecting atomically. Example:
-  Input: "select Elektriker in Välj tjänst" → one line:
-  PAGE "select 'Elektriker' in 'Välj tjänst'"
-  Input: "choose Red from the color dropdown" → one line:
-  PAGE "select 'Red' from the color dropdown"
-- EXCEPTION: If a step describes filling in an entire form without listing specific fields
-  (e.g. "fill in the form with some test data and submit it", "complete the contact form with email foo@bar.com"),
-  use a single EXPAND line instead of splitting. EXPAND means the runtime will inspect the actual form fields on the page
-  and generate appropriate actions. Include the full original text so any explicit values are preserved.
-  For example:
-  Input: "fill in the form with some test data and submit it" → one line:
-  EXPAND "fill in the form with some test data and submit it"
-  Input: "fill in the form with email foo@example.com and some test data" → one line:
-  EXPAND "fill in the form with email foo@example.com and some test data"
-- REMEMBER/COMPARE: When a step describes saving, noting, or remembering a value for later comparison, output a REMEMBER line. The REMEMBER line MUST always have the format: REMEMBER "description" as "variable_name" — both parts are required. Choose a short, descriptive variable name based on what is being captured.
-  When a step describes comparing a current value against a previously saved one (e.g. "check that X is less than before", "verify the count decreased"), output a COMPARE line. The COMPARE MUST reference the exact variable name used in the earlier REMEMBER.
-  Any language implying "before vs after" comparison requires a REMEMBER before the action and a COMPARE after.
-  For example:
-  Input: "note the number of search results" → REMEMBER "the number of search results" as "result_count"
-  Input: "check that the number of results is less than before filtering" → COMPARE "the number of search results" "less_than" remembered "result_count"
-  Input: "remember the total price" → REMEMBER "the total price shown" as "total_price"
-  Input: "verify the price didn't change" → COMPARE "the total price shown" "equal" remembered "total_price"
-  Input: "remember the number of search results" → REMEMBER "the number of search results" as "search_result_count"
-  Input: "check that the search results count has decreased" → COMPARE "the number of search results" "less_than" remembered "search_result_count"
-- MAP DETECTION: If ANY step in the test mentions a map, map markers, map layers, zooming/panning a map, map coordinates, geographic features on a map, or any other map-related interaction or assertion, you MUST emit a MAP_DETECT line BEFORE the first such step. This initializes map support for the test. Only emit MAP_DETECT once. Examples of map-related language: "map", "marker", "pin", "layer", "zoom level", "pan to", "coordinates", "center of the map", "map shows", "visible on the map".
-- MAP ASSERTIONS: Any assertion about what the map shows, displays, or contains (e.g. "check that the map shows X", "verify X is visible on the map") MUST be output as PAGE, NOT as a pre-resolved assert. The map is a WebGL canvas — its content is NOT in the DOM text. These assertions require the runtime to query the map's rendered features, which can only happen at execution time with live page state. NEVER use "assert contains_text" for map content.
+- EXCEPTION: Selecting a SINGLE value from a dropdown is ALWAYS a single PAGE step. Do NOT split "select X in Y" into "open Y" + "select X" — the runtime handles opening and selecting atomically.
+- EXCEPTION: If a step describes filling in an entire form without listing specific fields, use a single EXPAND line.
+- DATE/TIME PICKERS: Any step that sets, enters, or selects a date or time value → DATEPICK. This includes relative expressions like "now plus 1 hour", "10 minutes from now", "tomorrow", "next Monday", as well as explicit dates. Examples:
+  "set the start time to 10 minutes from now" → DATEPICK "set the start time to 10 minutes from now"
+  "set the end date to tomorrow" → DATEPICK "set the end date to tomorrow"
+  "enter 2026-06-15 in the date field" → DATEPICK "enter 2026-06-15 in the date field"
+- REMEMBER/COMPARE: When a step says to save/note/remember a value → REMEMBER. When a later step compares against it → COMPARE. Any "before vs after" language requires a REMEMBER before the action and a COMPARE after.
+- MAP DETECTION: If ANY step mentions a map, markers, layers, zoom, pan, coordinates, or geographic features, emit MAP_DETECT before the first such step. Only emit it once.
+- MAP ASSERTIONS: Any assertion about map content must be PAGE (map is WebGL canvas, content not in DOM).
+- CONDITIONAL STEPS: When a step contains "if" + a condition + an action (or uses a suffix like "click X if visible"), emit a conditional line. The format is:
+  IF_VISIBLE "element text or description" THEN <action> [ELSE <action>]
+  IF_CONTAINS "text" THEN <action> [ELSE <action>]
+  IF_URL "path or text" THEN <action> [ELSE <action>]
+  The THEN and ELSE parts use the same action syntax as regular steps (PAGE, assert, navigate, etc.).
+  The ELSE part is optional — if omitted and the condition is false, the step is skipped.
+  When a conditional step implies multiple actions under the same condition, emit multiple IF_ lines with the EXACT SAME condition text. Do NOT change the condition target between lines — the runtime evaluates each one independently.
+  The condition target should use the exact text visible on the page when possible (button labels, link text, field placeholders). When the step describes a UI element generically (e.g. "a password field"), use the specific text that would appear on the page.
+  Examples:
+    "if 'Accept cookies' is visible, click it" → IF_VISIBLE "Accept cookies" THEN PAGE "click 'Accept cookies'"
+    "if the page shows 'Out of stock' then click 'Notify me' else click 'Add to cart'" → IF_CONTAINS "Out of stock" THEN PAGE "click 'Notify me'" ELSE PAGE "click 'Add to cart'"
+    "click 'Dismiss' if visible" → IF_VISIBLE "Dismiss" THEN PAGE "click 'Dismiss'"
+    "if url contains '/login' then check that page contains 'Sign in'" → IF_URL "/login" THEN assert contains_text "Sign in"
+    "if there is a password field, fill it with 'secret' and press unlock" →
+      IF_VISIBLE "password" THEN PAGE "type 'secret' into the password field"
+      IF_VISIBLE "password" THEN PAGE "click the unlock button"
 - No blank lines, no numbering, no explanation. Only action lines.
+Examples:
+  "check that the count of products shown is greater than 0" → assert numeric "check that the count of products shown is greater than 0"
+  "verify there are at least 5 results" → assert numeric "verify there are at least 5 results"
+  "check that the page contains \\"Welcome\\"" → assert contains_text "Welcome"
+  "Verify the drawer opens and contains \\"Hello\\"" → assert contains_text "Hello"
+  "verify that the \\"Submit\\" button is disabled" → assert element_disabled "Submit"
+  "verify that the \\"Submit\\" button is enabled" → assert element_enabled "Submit"
+  "remember the total price" → REMEMBER "the total price shown" as "total_price"
+  "check that the price decreased" → COMPARE "the total price shown" "less_than" remembered "total_price"
+  "remember the name of the booking" → REMEMBER "the booking name" as "booking_name"
+  "check that the booking we just created is visible" → ASSERT_REMEMBERED "booking_name"
 `;
-// ── Step expansion prompt (runtime, with page context) ──────────────
+// ─────────────────────────────────────────────────────────────────────
+// 3. EXPAND_SYSTEM_PROMPT — Compound step expander (runtime, with page)
+// ─────────────────────────────────────────────────────────────────────
 export const EXPAND_SYSTEM_PROMPT = `You are expanding a high-level test step into concrete atomic actions based on the actual form fields visible on the page.
 You receive:
-1. The original step instruction (which may specify some values explicitly and leave others to your judgement).
+1. The original step instruction (which may specify some values explicitly).
 2. The accessibility tree of the current page (with element refs).
-3. A detailed list of form fields with their label, placeholder, input type, required status, and available options.
-Your job is to produce one action line per interaction needed to fulfill the step. Use the same line-based format:
-- PAGE "type <value> into the <field label/placeholder> field" — for regular text input fields. Always reference the field by its label or placeholder as shown in the form fields list.
-- PAGE "type <value> into the <field label/placeholder> autocomplete field and select the first suggestion" — for fields marked [autocomplete]. This tells the runtime to type, wait for the dropdown, and click the first option.
-- PAGE "type <value> into the <field label/placeholder> autocomplete field and select <specific option>" — when the step specifies a particular option to pick from the autocomplete suggestions.
-- PAGE "select <option> in the <field label> dropdown" — for select fields.
-- PAGE "check the <label> checkbox" — for checkboxes.
-- PAGE "click the <button text> button" — for submit or other buttons.
-- press "Enter" — if the form should be submitted via Enter key.
-Rules for autocomplete fields (marked [autocomplete] in the field list):
-- These are typeahead/combobox fields that show a dropdown of suggestions as the user types.
-- ALWAYS use the "autocomplete field" phrasing so the runtime knows to wait for and interact with the dropdown.
-- By default, select the first suggestion unless the step explicitly names a different choice.
-- Type a short search term that is likely to produce relevant results (e.g. first few characters of an expected value).
-Rules for choosing test data:
-- If the step explicitly provides a value for a field (e.g. "with email foo@example.com"), use that EXACT value for the matching field. Match by field purpose — the step may say "email" while the field label says "E-post" or "Mail address".
-- For fields NOT explicitly specified, generate realistic fake test data appropriate for the field. Use the field's label, placeholder, and input type to determine what kind of data to generate:
-  - Use the input type attribute (email, tel, url, number, etc.) to pick the right format.
-  - Read the label and placeholder text (in whatever language they are written) to understand what the field expects, then generate a plausible value.
-  - For free-text or message fields, use a short generic test string like "Test message".
-- For select/dropdown fields: pick the first non-empty option unless the step specifies a value.
-- For checkbox fields: check them if it sounds like it is needed. This includes consent checkboxes such as terms of service, privacy policy, data processing agreements, cookie consent, or similar — these must be checked for the form submission to succeed.
-- For required fields: always include them.
-- For optional fields: include them too (fill the whole form).
-- If the step says "submit" or similar, include a click on the submit button as the last action.
-Output ONLY action lines, one per line. No blank lines, no numbering, no explanation.
+3. A detailed list of form fields with label, placeholder, input type, required status, and options.
+═══ Action syntax ═══
+One line per interaction:
+- PAGE "type <value> into the <field label> field"
+- PAGE "type <value> into the <field label> autocomplete field and select the first suggestion"
+- PAGE "type <value> into the <field label> autocomplete field and select <specific option>"
+- PAGE "select <option> in the <field label> dropdown"
+- PAGE "check the <label> checkbox"
+- PAGE "click the <button text> button"
+- press "Enter"
+═══ Autocomplete fields ═══
+Fields marked [autocomplete] are typeahead/combobox fields.
+- ALWAYS use "autocomplete field" phrasing so the runtime handles the dropdown.
+- Default to first suggestion unless the step names a specific choice.
+- Type a short search term likely to produce results.
+═══ Test data ═══
+- Explicit values in the step → use EXACTLY (match by field purpose, not label language).
+- Unspecified fields → generate realistic fake data based on label, placeholder, and input type.
+  - Use input type (email, tel, url, number) to pick the right format.
+  - For free-text/message fields → "Test message".
+- Select/dropdown → first non-empty option unless specified.
+- Checkboxes → check if needed (especially consent/terms checkboxes).
+- Required fields → always fill. Optional fields → fill too.
+- "Submit" in the step → include a click on the submit button as the last action.
+═══ Output format ═══
+One action per line. No blank lines, no numbering, no explanation.
+`;
+// ─────────────────────────────────────────────────────────────────────
+// 4. DATEPICK_SYSTEM_PROMPT — Date/time picker expander (runtime, with page)
+// ─────────────────────────────────────────────────────────────────────
+export const DATEPICK_SYSTEM_PROMPT = `You are filling in a date/time picker based on the actual widget visible on the page.
+You receive:
+1. The original step instruction (e.g. "set the start date to now plus 1 hour").
+2. The current time (ISO 8601).
+3. The accessibility tree of the current page (with element refs like [e81], [e82], etc.).
+═══ Your task ═══
+1. Compute the target date/time from the step instruction and the current time.
+2. Find the date/time picker elements in the accessibility tree.
+3. Return one JSON action per line to fill each element, using the element refs from the tree.
+═══ Response format ═══
+Respond with one JSON object per line (no markdown, no explanation). Use the same format as The Pilot:
+{"action":"type","ref":"<ref>","value":"<value>"}
+{"action":"click","ref":"<ref>"}
+{"action":"select","ref":"<ref>","value":"<option>"}
+═══ Picker types ═══
+1. **Native HTML5 input** (type="date", "datetime-local", "time"):
+   - Single textbox element in the tree.
+   - Return one type action: {"action":"type","ref":"e42","value":"2026-03-18T21:30"}
+   - Formats: date → "YYYY-MM-DD", datetime-local → "YYYY-MM-DDTHH:mm", time → "HH:mm"
+2. **Sectioned picker** (MUI v7, etc.) — separate spinbutton elements:
+   - The tree shows elements like: [e81] spinbutton "Day", [e82] spinbutton "Month", etc.
+   - These are often inside a named group (e.g. group "Start date and time").
+   - Return one type action per section using the EXACT ref from the tree:
+     {"action":"type","ref":"e81","value":"18"}
+     {"action":"type","ref":"e82","value":"03"}
+     {"action":"type","ref":"e83","value":"2026"}
+     {"action":"type","ref":"e84","value":"21"}
+     {"action":"type","ref":"e85","value":"30"}
+   - IMPORTANT: When there are multiple pickers (start/end), use the refs from the CORRECT group.
+   - Use 2-digit values for month, day, hours, minutes. Use 4-digit values for year.
+   - For 12-hour pickers with AM/PM (meridiem spinbutton): include a type action for it.
+3. **Calendar popup picker** (readonly input + calendar button):
+   - Click the calendar button to open, then click the target day.
+═══ Relative time ═══
+- "now", "current time" → use the provided current time
+- "now plus 1 hour", "1 hour from now" → add 1 hour to current time
+- "10 minutes from now" → add 10 minutes to current time
+- "tomorrow" → next day, same time
+- Round minutes to the nearest 5 if the picker appears to use 5-minute increments.
+═══ Output ═══
+One JSON action per line. No blank lines, no numbering, no explanation. ONLY JSON.
 `;
 //# sourceMappingURL=prompts.js.map

package/dist/pilot/prompts.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"prompts.js","sourceRoot":"","sources":["../../src/pilot/prompts.ts"],"names":[],"mappings":"AAAA~~;;GAEG~~;AAEH,mFAAmF;AACnF,MAAM,CAAC,MAAM,aAAa,GAAG~~;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAgE5B~~,CAAA;AAED,wEAAwE;AAExE,MAAM,CAAC,MAAM,kBAAkB,GAAG~~;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAmEjC~~,CAAA;AAED,~~uEAAuE~~;~~AAEvE~~,MAAM,CAAC,MAAM,oBAAoB,GAAG~~;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAmCnC~~,CAAA"}
1	+ {"version":3,"file":"prompts.js","sourceRoot":"","sources":["../../src/pilot/prompts.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GAoCG;AAEH,wEAAwE;AACxE,2CAA2C;AAC3C,wEAAwE;AAExE,mFAAmF;AACnF,MAAM,CAAC,MAAM,aAAa,GAAG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAmH5B,CAAA;AAED,wEAAwE;AACxE,yDAAyD;AACzD,wEAAwE;AAExE,MAAM,CAAC,MAAM,kBAAkB,GAAG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAsGjC,CAAA;AAED,wEAAwE;AACxE,wEAAwE;AACxE,wEAAwE;AAExE,MAAM,CAAC,MAAM,oBAAoB,GAAG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAuCnC,CAAA;AAED,wEAAwE;AACxE,6EAA6E;AAC7E,wEAAwE;AAExE,MAAM,CAAC,MAAM,sBAAsB,GAAG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAuDrC,CAAA"}

package/dist/pilot/random.d.ts ADDED Viewed

@@ -0,0 +1,37 @@
+/**
+ * Random value injection for test steps.
+ *
+ * When a step contains "random", we generate truly random values and
+ * inject them into the step prompt so the LLM uses them. When caching
+ * heuristic steps, the actual values are replaced with placeholders
+ * that get fresh values on each cached replay.
+ *
+ * The two constants declared directly below are the literal placeholder
+ * tokens "__RANDOM_NUMBER__" and "__RANDOM_STRING__".
+ * NOTE(review): presumably these are the tokens written by
+ * replaceWithPlaceholders() and expanded by hydratePlaceholders(); the
+ * implementation is not visible from this declaration file, so confirm
+ * against random.ts.
+ */
+export declare const RANDOM_NUMBER_PLACEHOLDER = "__RANDOM_NUMBER__";
+export declare const RANDOM_STRING_PLACEHOLDER = "__RANDOM_STRING__";
+/**
+ * A pair of random values for injection into step prompts.
+ *
+ * Both members are typed as strings, including `number`, so the numeric
+ * value is carried in its textual form.
+ */
+export interface RandomValues {
+    number: string;
+    string: string;
+}
+/**
+ * Generate a fresh pair of random values.
+ *
+ * @returns A new {@link RandomValues} pair. How the values are produced
+ * (range, length, alphabet) is not visible from the declaration.
+ */
+export declare function generateRandomValues(): RandomValues;
+/**
+ * Check whether a step text mentions "random".
+ *
+ * @param step - The step text to inspect.
+ * @returns Whether the step mentions "random". The exact matching rules
+ * (for example case sensitivity) are not visible from the declaration.
+ */
+export declare function stepNeedsRandom(step: string): boolean;
+/**
+ * Augment a step prompt with random values so the LLM uses them.
+ * Returns the augmented step text and the values used.
+ *
+ * @param step - The original step text.
+ * @returns An object whose `step` is the augmented step text and whose
+ * `values` are the random values that were injected into it.
+ */
+export declare function injectRandomValues(step: string): {
+    step: string;
+    values: RandomValues;
+};
+/**
+ * Replace actual random values in a heuristic step's value field with
+ * placeholders, so cached replays generate fresh values.
+ *
+ * @param value - The value field of the heuristic step.
+ * @param values - The random values to look for in `value`.
+ * NOTE(review): presumably the `values` returned by injectRandomValues()
+ * for the same step; confirm against the caller.
+ * @returns The value with the random values replaced by placeholders.
+ */
+export declare function replaceWithPlaceholders(value: string, values: RandomValues): string;
+/**
+ * Replace placeholders in a cached step's value with fresh random values.
+ *
+ * @param value - The value field of a cached step, possibly containing
+ * placeholders.
+ * @returns The value with placeholders replaced by fresh random values.
+ */
+export declare function hydratePlaceholders(value: string): string;
+//# sourceMappingURL=random.d.ts.map

package/dist/pilot/random.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"random.d.ts","sourceRoot":"","sources":["../../src/pilot/random.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAIH,eAAO,MAAM,yBAAyB,sBAAsB,CAAA;AAC5D,eAAO,MAAM,yBAAyB,sBAAsB,CAAA;AAE5D,+DAA+D;AAC/D,MAAM,WAAW,YAAY;IAC5B,MAAM,EAAE,MAAM,CAAA;IACd,MAAM,EAAE,MAAM,CAAA;CACd;AAED,8CAA8C;AAC9C,wBAAgB,oBAAoB,IAAI,YAAY,CAInD;AAED,mDAAmD;AACnD,wBAAgB,eAAe,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAErD;AAED;;;GAGG;AACH,wBAAgB,kBAAkB,CAAC,IAAI,EAAE,MAAM,GAAG;IAAE,IAAI,EAAE,MAAM,CAAC;IAAC,MAAM,EAAE,YAAY,CAAA;CAAE,CAIvF;AAED;;;GAGG;AACH,wBAAgB,uBAAuB,CAAC,KAAK,EAAE,MAAM,EAAE,MAAM,EAAE,YAAY,GAAG,MAAM,CAKnF;AAED;;GAEG;AACH,wBAAgB,mBAAmB,CAAC,KAAK,EAAE,MAAM,GAAG,MAAM,CAQzD"}