npm - @testdriverai/agent - Versions diffs - 7.8.0-test.38 - Mend

@testdriverai/agent 7.8.0-test.38

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (528) hide show

package/.claude/settings.local.json +7 -0
package/.env.example +4 -0
package/.prettierignore +4 -0
package/.prettierrc +1 -0
package/CHANGELOG.md +953 -0
package/README.md +81 -0
package/agent/events.js +135 -0
package/agent/index.js +2450 -0
package/agent/interface.js +35 -0
package/agent/lib/analytics.js +22 -0
package/agent/lib/censorship.js +75 -0
package/agent/lib/commander.js +246 -0
package/agent/lib/commands.js +1684 -0
package/agent/lib/config.js +60 -0
package/agent/lib/generator.js +91 -0
package/agent/lib/http.js +144 -0
package/agent/lib/logger.js +56 -0
package/agent/lib/outputs.js +29 -0
package/agent/lib/parser.js +209 -0
package/agent/lib/redraw.js +386 -0
package/agent/lib/resources/cursor-2.png +0 -0
package/agent/lib/sandbox.js +1104 -0
package/agent/lib/sdk.js +633 -0
package/agent/lib/session.js +25 -0
package/agent/lib/source-mapper.js +342 -0
package/agent/lib/subimage/index.js +77 -0
package/agent/lib/subimage/opencv.js +69 -0
package/agent/lib/system.js +204 -0
package/agent/lib/theme.js +14 -0
package/agent/lib/valid-version.js +21 -0
package/agent/lib/validation.js +169 -0
package/ai/.claude-plugin/plugin.json +9 -0
package/ai/agents/testdriver.md +638 -0
package/ai/skills/testdriver-ai/SKILL.md +204 -0
package/ai/skills/testdriver-assert/SKILL.md +315 -0
package/ai/skills/testdriver-aws-setup/SKILL.md +448 -0
package/ai/skills/testdriver-cache/SKILL.md +221 -0
package/ai/skills/testdriver-caching/SKILL.md +124 -0
package/ai/skills/testdriver-captcha/SKILL.md +158 -0
package/ai/skills/testdriver-ci-cd/SKILL.md +602 -0
package/ai/skills/testdriver-click/SKILL.md +286 -0
package/ai/skills/testdriver-client/SKILL.md +477 -0
package/ai/skills/testdriver-cloud/SKILL.md +119 -0
package/ai/skills/testdriver-customizing-devices/SKILL.md +319 -0
package/ai/skills/testdriver-dashcam/SKILL.md +418 -0
package/ai/skills/testdriver-debugging-with-screenshots/SKILL.md +401 -0
package/ai/skills/testdriver-device-config/SKILL.md +317 -0
package/ai/skills/testdriver-double-click/SKILL.md +102 -0
package/ai/skills/testdriver-elements/SKILL.md +605 -0
package/ai/skills/testdriver-enterprise/SKILL.md +114 -0
package/ai/skills/testdriver-errors/SKILL.md +246 -0
package/ai/skills/testdriver-events/SKILL.md +356 -0
package/ai/skills/testdriver-examples/SKILL.md +7 -0
package/ai/skills/testdriver-exec/SKILL.md +317 -0
package/ai/skills/testdriver-find/SKILL.md +829 -0
package/ai/skills/testdriver-focus-application/SKILL.md +293 -0
package/ai/skills/testdriver-generating-tests/SKILL.md +36 -0
package/ai/skills/testdriver-hover/SKILL.md +278 -0
package/ai/skills/testdriver-locating-elements/SKILL.md +71 -0
package/ai/skills/testdriver-making-assertions/SKILL.md +32 -0
package/ai/skills/testdriver-mcp/SKILL.md +7 -0
package/ai/skills/testdriver-mcp-workflow/SKILL.md +410 -0
package/ai/skills/testdriver-mouse-down/SKILL.md +161 -0
package/ai/skills/testdriver-mouse-up/SKILL.md +164 -0
package/ai/skills/testdriver-parse/SKILL.md +236 -0
package/ai/skills/testdriver-performing-actions/SKILL.md +54 -0
package/ai/skills/testdriver-press-keys/SKILL.md +348 -0
package/ai/skills/testdriver-provision/SKILL.md +331 -0
package/ai/skills/testdriver-quickstart/SKILL.md +144 -0
package/ai/skills/testdriver-redraw/SKILL.md +214 -0
package/ai/skills/testdriver-reusable-code/SKILL.md +249 -0
package/ai/skills/testdriver-right-click/SKILL.md +123 -0
package/ai/skills/testdriver-running-tests/SKILL.md +185 -0
package/ai/skills/testdriver-screenshot/SKILL.md +248 -0
package/ai/skills/testdriver-screenshots/SKILL.md +184 -0
package/ai/skills/testdriver-scroll/SKILL.md +335 -0
package/ai/skills/testdriver-secrets/SKILL.md +115 -0
package/ai/skills/testdriver-self-hosted/SKILL.md +65 -0
package/ai/skills/testdriver-test-writer/SKILL.md +448 -0
package/ai/skills/testdriver-testdriver/SKILL.md +628 -0
package/ai/skills/testdriver-testdriver-mechanic/SKILL.md +165 -0
package/ai/skills/testdriver-type/SKILL.md +357 -0
package/ai/skills/testdriver-variables/SKILL.md +111 -0
package/ai/skills/testdriver-wait/SKILL.md +50 -0
package/ai/skills/testdriver-waiting-for-elements/SKILL.md +90 -0
package/ai/skills/testdriver-what-is-testdriver/SKILL.md +54 -0
package/bin/testdriverai.js +22 -0
package/debugger/bg.png +0 -0
package/debugger/icon.png +0 -0
package/debugger/index.html +469 -0
package/debugger/td.png +0 -0
package/debugger/tray-buffered.png +0 -0
package/debugger/tray.png +0 -0
package/docs/GITHUB_COMMENTS.md +330 -0
package/docs/GITHUB_COMMENTS_ANNOUNCEMENT.md +167 -0
package/docs/QUICK-START-GITHUB-COMMENTS.md +84 -0
package/docs/TEST-GITHUB-COMMENTS.md +129 -0
package/docs/_data/examples-manifest.json +177 -0
package/docs/_data/examples-manifest.schema.json +41 -0
package/docs/_scripts/extract-example-urls.js +165 -0
package/docs/_scripts/generate-examples.js +560 -0
package/docs/_scripts/generate-skills.js +154 -0
package/docs/_scripts/link-replacer.js +164 -0
package/docs/_scripts/upload-docs-to-openai.js +284 -0
package/docs/changelog.mdx +161 -0
package/docs/claude-mcp-plugin.mdx +160 -0
package/docs/docs.json +442 -0
package/docs/github-integration-setup.md +266 -0
package/docs/guide/best-practices-polling.mdx +174 -0
package/docs/images/content/account/newprojectsettings.png +0 -0
package/docs/images/content/account/projectpage.png +0 -0
package/docs/images/content/account/projectreplays.png +0 -0
package/docs/images/content/account/team-manage.png +0 -0
package/docs/images/content/account/teampage.png +0 -0
package/docs/images/content/extension/cursor.svg +1 -0
package/docs/images/content/extension/vscode.svg +57 -0
package/docs/images/content/extension/windsurf.svg +3 -0
package/docs/images/content/parse/output.png +0 -0
package/docs/images/content/self-hosted/launchtemplateid.png +0 -0
package/docs/images/content/side-by-side.png +0 -0
package/docs/images/content/vscode/ide-full.png +0 -0
package/docs/images/content/vscode/running.png +0 -0
package/docs/images/content/vscode/v7-chat.png +0 -0
package/docs/images/content/vscode/v7-choose-agent.png +0 -0
package/docs/images/content/vscode/v7-full.png +0 -0
package/docs/images/content/vscode/v7-onboarding.png +0 -0
package/docs/images/content/vscode/vscode-2-assert.png +0 -0
package/docs/images/content/vscode/vscode-agent-preview.png +0 -0
package/docs/images/content/vscode/vscode-copilot-ask.png +0 -0
package/docs/images/content/vscode/vscode-file-creation.png +0 -0
package/docs/images/content/vscode/vscode-install.png +0 -0
package/docs/images/content/vscode/vscode-overview.png +0 -0
package/docs/images/content/vscode/vscode-setup-walkthrough.png +0 -0
package/docs/images/content/vscode/vscode-stopchat.png +0 -0
package/docs/images/content/vscode/vscode-stoptest.png +0 -0
package/docs/images/content/vscode/vscode-tdservice.png +0 -0
package/docs/images/content/vscode/vscode-test-output.png +0 -0
package/docs/images/content/vscode/vscode-testhistory.png +0 -0
package/docs/images/content/vscode/vscode-testpane-runtests.png +0 -0
package/docs/images/content/vscode/vscode-testpane.png +0 -0
package/docs/images/template/dark.png +0 -0
package/docs/images/template/icon.png +0 -0
package/docs/images/template/light.png +0 -0
package/docs/snippets/calendar-link.mdx +4 -0
package/docs/snippets/gitignore-warning.mdx +7 -0
package/docs/snippets/lifecycle-warning.mdx +6 -0
package/docs/snippets/test-prereqs.mdx +12 -0
package/docs/snippets/tests/assert-replay.mdx +7 -0
package/docs/snippets/tests/assert-yaml.mdx +8 -0
package/docs/snippets/tests/exec-js-replay.mdx +7 -0
package/docs/snippets/tests/exec-js-yaml.mdx +32 -0
package/docs/snippets/tests/exec-shell-replay.mdx +7 -0
package/docs/snippets/tests/exec-shell-yaml.mdx +15 -0
package/docs/snippets/tests/hover-image-replay.mdx +7 -0
package/docs/snippets/tests/hover-image-yaml.mdx +17 -0
package/docs/snippets/tests/hover-text-replay.mdx +7 -0
package/docs/snippets/tests/hover-text-with-description-replay.mdx +7 -0
package/docs/snippets/tests/hover-text-with-description-yaml.mdx +24 -0
package/docs/snippets/tests/hover-text-yaml.mdx +14 -0
package/docs/snippets/tests/match-image-replay.mdx +7 -0
package/docs/snippets/tests/match-image-yaml.mdx +17 -0
package/docs/snippets/tests/press-keys-replay.mdx +7 -0
package/docs/snippets/tests/press-keys-yaml.mdx +36 -0
package/docs/snippets/tests/remember-replay.mdx +7 -0
package/docs/snippets/tests/remember-yaml.mdx +28 -0
package/docs/snippets/tests/scroll-replay.mdx +7 -0
package/docs/snippets/tests/scroll-until-image-replay.mdx +7 -0
package/docs/snippets/tests/scroll-until-image-yaml.mdx +14 -0
package/docs/snippets/tests/scroll-until-text-replay.mdx +7 -0
package/docs/snippets/tests/scroll-until-text-yaml.mdx +17 -0
package/docs/snippets/tests/scroll-yaml.mdx +30 -0
package/docs/snippets/tests/type-repeated-replay.mdx +7 -0
package/docs/snippets/tests/type-repeated-yaml.mdx +22 -0
package/docs/snippets/tests/type-replay.mdx +7 -0
package/docs/snippets/tests/type-yaml.mdx +28 -0
package/docs/snippets/tests/wait-for-image-replay.mdx +7 -0
package/docs/snippets/tests/wait-for-image-yaml.mdx +18 -0
package/docs/snippets/tests/wait-for-text-replay.mdx +7 -0
package/docs/snippets/tests/wait-for-text-yaml.mdx +18 -0
package/docs/snippets/tests/wait-replay.mdx +7 -0
package/docs/snippets/tests/wait-yaml.mdx +13 -0
package/docs/styles.css +65 -0
package/docs/v6/account/dashboard.mdx +16 -0
package/docs/v6/account/enterprise.mdx +110 -0
package/docs/v6/account/pricing.mdx +33 -0
package/docs/v6/account/projects.mdx +33 -0
package/docs/v6/account/team.mdx +35 -0
package/docs/v6/action/ami.mdx +109 -0
package/docs/v6/action/performance.mdx +105 -0
package/docs/v6/action/secrets.mdx +93 -0
package/docs/v6/apps/chrome-extensions.mdx +48 -0
package/docs/v6/apps/desktop-apps.mdx +93 -0
package/docs/v6/apps/mobile-apps.mdx +26 -0
package/docs/v6/apps/static-websites.mdx +54 -0
package/docs/v6/apps/tauri-apps.mdx +361 -0
package/docs/v6/bugs/jira.mdx +232 -0
package/docs/v6/cli/overview.mdx +66 -0
package/docs/v6/commands/assert.mdx +45 -0
package/docs/v6/commands/exec.mdx +276 -0
package/docs/v6/commands/focus-application.mdx +44 -0
package/docs/v6/commands/hover-image.mdx +69 -0
package/docs/v6/commands/hover-text.mdx +47 -0
package/docs/v6/commands/if.mdx +53 -0
package/docs/v6/commands/match-image.mdx +67 -0
package/docs/v6/commands/press-keys.mdx +87 -0
package/docs/v6/commands/remember.mdx +49 -0
package/docs/v6/commands/run.mdx +44 -0
package/docs/v6/commands/scroll-until-image.mdx +66 -0
package/docs/v6/commands/scroll-until-text.mdx +60 -0
package/docs/v6/commands/scroll.mdx +69 -0
package/docs/v6/commands/type.mdx +45 -0
package/docs/v6/commands/wait-for-image.mdx +54 -0
package/docs/v6/commands/wait-for-text.mdx +48 -0
package/docs/v6/commands/wait.mdx +45 -0
package/docs/v6/exporting/junit.mdx +218 -0
package/docs/v6/exporting/playwright.mdx +197 -0
package/docs/v6/features/auto-healing.mdx +144 -0
package/docs/v6/features/generation.mdx +116 -0
package/docs/v6/features/parallel-testing.mdx +151 -0
package/docs/v6/features/reusable-snippets.mdx +131 -0
package/docs/v6/features/selectorless.mdx +80 -0
package/docs/v6/features/visual-assertions.mdx +139 -0
package/docs/v6/getting-started/ci.mdx +146 -0
package/docs/v6/getting-started/cli.mdx +91 -0
package/docs/v6/getting-started/editing.mdx +100 -0
package/docs/v6/getting-started/playwright.mdx +342 -0
package/docs/v6/getting-started/running.mdx +48 -0
package/docs/v6/getting-started/self-hosting.mdx +408 -0
package/docs/v6/getting-started/vscode.mdx +88 -0
package/docs/v6/guide/assertions.mdx +189 -0
package/docs/v6/guide/authentication.mdx +136 -0
package/docs/v6/guide/code.mdx +65 -0
package/docs/v6/guide/dashcam.mdx +118 -0
package/docs/v6/guide/environment-variables.mdx +26 -0
package/docs/v6/guide/lifecycle.mdx +242 -0
package/docs/v6/guide/locating.mdx +141 -0
package/docs/v6/guide/protips.mdx +43 -0
package/docs/v6/guide/variables.mdx +143 -0
package/docs/v6/guide/waiting.mdx +130 -0
package/docs/v6/importing/csv.mdx +196 -0
package/docs/v6/importing/gherkin.mdx +143 -0
package/docs/v6/importing/jira.mdx +164 -0
package/docs/v6/importing/testrail.mdx +162 -0
package/docs/v6/integrations/electron.mdx +146 -0
package/docs/v6/integrations/netlify.mdx +100 -0
package/docs/v6/integrations/vercel.mdx +125 -0
package/docs/v6/interactive/explore.mdx +99 -0
package/docs/v6/interactive/run.mdx +52 -0
package/docs/v6/interactive/save.mdx +63 -0
package/docs/v6/overview/comparison.mdx +101 -0
package/docs/v6/overview/faq.mdx +162 -0
package/docs/v6/overview/performance.mdx +52 -0
package/docs/v6/overview/quickstart.mdx +137 -0
package/docs/v6/overview/what-is-testdriver.mdx +85 -0
package/docs/v6/scenarios/ai-chatbot.mdx +28 -0
package/docs/v6/scenarios/cookie-banner.mdx +32 -0
package/docs/v6/scenarios/file-upload.mdx +33 -0
package/docs/v6/scenarios/form-filling.mdx +32 -0
package/docs/v6/scenarios/log-in.mdx +75 -0
package/docs/v6/scenarios/pdf-generation.mdx +25 -0
package/docs/v6/scenarios/spell-check.mdx +22 -0
package/docs/v6/security/action.mdx +84 -0
package/docs/v6/security/agent.mdx +73 -0
package/docs/v6/security/platform.mdx +77 -0
package/docs/v6/tutorials/advanced-test.mdx +81 -0
package/docs/v6/tutorials/basic-test.mdx +45 -0
package/docs/v7/_drafts/agents.mdx +843 -0
package/docs/v7/_drafts/architecture.mdx +399 -0
package/docs/v7/_drafts/auto-cache-key.mdx +167 -0
package/docs/v7/_drafts/awesome-logs-quick-ref.mdx +100 -0
package/docs/v7/_drafts/best-practices.mdx +486 -0
package/docs/v7/_drafts/caching-ai.mdx +215 -0
package/docs/v7/_drafts/caching-selectors.mdx +424 -0
package/docs/v7/_drafts/caching.mdx +366 -0
package/docs/v7/_drafts/cli-to-sdk-migration.mdx +425 -0
package/docs/v7/_drafts/commands/assert.mdx +45 -0
package/docs/v7/_drafts/commands/exec.mdx +276 -0
package/docs/v7/_drafts/commands/focus-application.mdx +44 -0
package/docs/v7/_drafts/commands/hover-image.mdx +69 -0
package/docs/v7/_drafts/commands/hover-text.mdx +47 -0
package/docs/v7/_drafts/commands/if.mdx +53 -0
package/docs/v7/_drafts/commands/match-image.mdx +67 -0
package/docs/v7/_drafts/commands/press-keys.mdx +87 -0
package/docs/v7/_drafts/commands/remember.mdx +49 -0
package/docs/v7/_drafts/commands/run.mdx +44 -0
package/docs/v7/_drafts/commands/scroll-until-image.mdx +66 -0
package/docs/v7/_drafts/commands/scroll-until-text.mdx +60 -0
package/docs/v7/_drafts/commands/scroll.mdx +69 -0
package/docs/v7/_drafts/commands/type.mdx +45 -0
package/docs/v7/_drafts/commands/wait-for-image.mdx +54 -0
package/docs/v7/_drafts/commands/wait-for-text.mdx +48 -0
package/docs/v7/_drafts/commands/wait.mdx +45 -0
package/docs/v7/_drafts/configuration.mdx +378 -0
package/docs/v7/_drafts/contributing.mdx +174 -0
package/docs/v7/_drafts/core.mdx +458 -0
package/docs/v7/_drafts/dashcam-title-feature.mdx +89 -0
package/docs/v7/_drafts/debugging.mdx +349 -0
package/docs/v7/_drafts/error-handling.mdx +501 -0
package/docs/v7/_drafts/faq.mdx +393 -0
package/docs/v7/_drafts/hooks.mdx +360 -0
package/docs/v7/_drafts/init-command.mdx +95 -0
package/docs/v7/_drafts/installation.mdx +420 -0
package/docs/v7/_drafts/migration.mdx +562 -0
package/docs/v7/_drafts/observable.mdx +604 -0
package/docs/v7/_drafts/playwright.mdx +342 -0
package/docs/v7/_drafts/plugin-migration.mdx +220 -0
package/docs/v7/_drafts/powerful.mdx +419 -0
package/docs/v7/_drafts/presets.mdx +210 -0
package/docs/v7/_drafts/progressive-disclosure.mdx +230 -0
package/docs/v7/_drafts/prompt-cache.mdx +200 -0
package/docs/v7/_drafts/provision.mdx +390 -0
package/docs/v7/_drafts/quick-start-test-recording.mdx +214 -0
package/docs/v7/_drafts/readme.mdx +135 -0
package/docs/v7/_drafts/reports.mdx +414 -0
package/docs/v7/_drafts/scalable.mdx +763 -0
package/docs/v7/_drafts/screenshot.mdx +155 -0
package/docs/v7/_drafts/sdk-awesome-logs.mdx +468 -0
package/docs/v7/_drafts/sdk-browser-rendering.mdx +167 -0
package/docs/v7/_drafts/sdk-migration.mdx +474 -0
package/docs/v7/_drafts/sdk-v7-complete.mdx +345 -0
package/docs/v7/_drafts/self-hosting.mdx +369 -0
package/docs/v7/_drafts/test-recording.mdx +382 -0
package/docs/v7/_drafts/troubleshooting.mdx +526 -0
package/docs/v7/_drafts/vitest-plugin.mdx +477 -0
package/docs/v7/_drafts/vitest.mdx +535 -0
package/docs/v7/_drafts/writing-tests.mdx +25 -0
package/docs/v7/ai.mdx +205 -0
package/docs/v7/assert.mdx +316 -0
package/docs/v7/aws-setup.mdx +449 -0
package/docs/v7/cache.mdx +223 -0
package/docs/v7/caching.mdx +128 -0
package/docs/v7/captcha.mdx +159 -0
package/docs/v7/ci-cd.mdx +603 -0
package/docs/v7/click.mdx +287 -0
package/docs/v7/client.mdx +478 -0
package/docs/v7/copilot/auto-healing.mdx +265 -0
package/docs/v7/copilot/creating-tests.mdx +156 -0
package/docs/v7/copilot/github.mdx +143 -0
package/docs/v7/copilot/running-tests.mdx +149 -0
package/docs/v7/copilot/setup.mdx +143 -0
package/docs/v7/customizing-devices.mdx +319 -0
package/docs/v7/dashcam.mdx +419 -0
package/docs/v7/debugging-with-screenshots.mdx +402 -0
package/docs/v7/device-config.mdx +317 -0
package/docs/v7/double-click.mdx +102 -0
package/docs/v7/elements.mdx +606 -0
package/docs/v7/enterprise.mdx +9 -0
package/docs/v7/errors.mdx +248 -0
package/docs/v7/events.mdx +358 -0
package/docs/v7/examples/ai.mdx +72 -0
package/docs/v7/examples/assert.mdx +72 -0
package/docs/v7/examples/captcha-api.mdx +92 -0
package/docs/v7/examples/chrome-extension.mdx +132 -0
package/docs/v7/examples/drag-and-drop.mdx +100 -0
package/docs/v7/examples/element-not-found.mdx +67 -0
package/docs/v7/examples/exec-output.mdx +85 -0
package/docs/v7/examples/exec-pwsh.mdx +83 -0
package/docs/v7/examples/focus-window.mdx +62 -0
package/docs/v7/examples/hover-image.mdx +94 -0
package/docs/v7/examples/hover-text.mdx +69 -0
package/docs/v7/examples/installer.mdx +91 -0
package/docs/v7/examples/launch-vscode-linux.mdx +101 -0
package/docs/v7/examples/match-image.mdx +96 -0
package/docs/v7/examples/press-keys.mdx +92 -0
package/docs/v7/examples/scroll-keyboard.mdx +79 -0
package/docs/v7/examples/scroll-until-image.mdx +81 -0
package/docs/v7/examples/scroll-until-text.mdx +109 -0
package/docs/v7/examples/scroll.mdx +81 -0
package/docs/v7/examples/type.mdx +92 -0
package/docs/v7/examples/windows-installer.mdx +89 -0
package/docs/v7/exec.mdx +318 -0
package/docs/v7/find.mdx +830 -0
package/docs/v7/focus-application.mdx +294 -0
package/docs/v7/generating-tests.mdx +36 -0
package/docs/v7/hosted.mdx +158 -0
package/docs/v7/hover.mdx +279 -0
package/docs/v7/locating-elements.mdx +71 -0
package/docs/v7/making-assertions.mdx +32 -0
package/docs/v7/mcp.mdx +9 -0
package/docs/v7/mouse-down.mdx +161 -0
package/docs/v7/mouse-up.mdx +164 -0
package/docs/v7/parse.mdx +237 -0
package/docs/v7/performing-actions.mdx +54 -0
package/docs/v7/press-keys.mdx +349 -0
package/docs/v7/provision.mdx +333 -0
package/docs/v7/quickstart.mdx +173 -0
package/docs/v7/redraw.mdx +216 -0
package/docs/v7/reusable-code.mdx +249 -0
package/docs/v7/right-click.mdx +123 -0
package/docs/v7/running-tests.mdx +185 -0
package/docs/v7/screenshot.mdx +249 -0
package/docs/v7/screenshots.mdx +186 -0
package/docs/v7/scroll.mdx +336 -0
package/docs/v7/secrets.mdx +115 -0
package/docs/v7/self-hosted.mdx +149 -0
package/docs/v7/type.mdx +358 -0
package/docs/v7/variables.mdx +111 -0
package/docs/v7/wait.mdx +52 -0
package/docs/v7/waiting-for-elements.mdx +90 -0
package/docs/v7/what-is-testdriver.mdx +54 -0
package/eslint.config.js +67 -0
package/examples/ai.test.mjs +31 -0
package/examples/assert.test.mjs +47 -0
package/examples/chrome-extension.test.mjs +97 -0
package/examples/config.mjs +5 -0
package/examples/element-not-found.test.mjs +27 -0
package/examples/exec-output.test.mjs +60 -0
package/examples/exec-pwsh.test.mjs +58 -0
package/examples/findall-coffee-icons.test.mjs +42 -0
package/examples/focus-window.test.mjs +37 -0
package/examples/formatted-logging.test.mjs +27 -0
package/examples/hover-image.test.mjs +53 -0
package/examples/hover-text-with-description.test.mjs +57 -0
package/examples/hover-text.test.mjs +28 -0
package/examples/installer.test.mjs +50 -0
package/examples/launch-vscode-linux.test.mjs +55 -0
package/examples/match-image.test.mjs +55 -0
package/examples/parse.test.mjs +19 -0
package/examples/press-keys.test.mjs +44 -0
package/examples/prompt.test.mjs +34 -0
package/examples/scroll-keyboard.test.mjs +38 -0
package/examples/scroll-until-image.test.mjs +40 -0
package/examples/scroll.test.mjs +42 -0
package/examples/type.test.mjs +46 -0
package/examples/windows-installer.test.mjs +54 -0
package/index.js +2 -0
package/interfaces/cli/commands/init.js +438 -0
package/interfaces/cli/commands/setup.js +382 -0
package/interfaces/cli/lib/base.js +285 -0
package/interfaces/cli.js +20 -0
package/interfaces/junit-reporter.js +290 -0
package/interfaces/logger.js +388 -0
package/interfaces/readline.js +234 -0
package/interfaces/shared-test-state.mjs +64 -0
package/interfaces/vitest-plugin.d.ts +115 -0
package/interfaces/vitest-plugin.mjs +1698 -0
package/lib/captcha/solver.js +358 -0
package/lib/core/Dashcam.js +533 -0
package/lib/core/index.d.ts +172 -0
package/lib/core/index.js +12 -0
package/lib/environments.json +18 -0
package/lib/github-comment-formatter.js +263 -0
package/lib/github-comment.mjs +452 -0
package/lib/init-project.js +575 -0
package/lib/presets/index.mjs +331 -0
package/lib/resolve-channel.js +46 -0
package/lib/sentry.js +417 -0
package/lib/vitest/hooks.d.ts +57 -0
package/lib/vitest/hooks.mjs +674 -0
package/lib/vitest/setup-aws.mjs +247 -0
package/lib/vitest/setup-self-hosted.mjs +151 -0
package/lib/vitest/setup.mjs +46 -0
package/manual/captcha-api.test.mjs +51 -0
package/manual/drag-and-drop.test.mjs +59 -0
package/manual/flake-diffthreshold-001.test.mjs +9 -0
package/manual/flake-diffthreshold-01.test.mjs +9 -0
package/manual/flake-diffthreshold-05.test.mjs +9 -0
package/manual/flake-noredraw-cache.test.mjs +9 -0
package/manual/flake-noredraw-nocache.test.mjs +9 -0
package/manual/flake-redraw-cache.test.mjs +9 -0
package/manual/flake-redraw-nocache.test.mjs +9 -0
package/manual/flake-rocket-match.test.mjs +30 -0
package/manual/flake-shared.mjs +51 -0
package/manual/no-provision.test.mjs +31 -0
package/manual/packer-hover-image.test.mjs +176 -0
package/manual/scroll-until-text.test.mjs +68 -0
package/manual/test-init-command.js +223 -0
package/mcp-server/README.md +322 -0
package/mcp-server/dist/codegen.d.ts +9 -0
package/mcp-server/dist/codegen.js +165 -0
package/mcp-server/dist/mcp-app.html +114 -0
package/mcp-server/dist/package.json +1 -0
package/mcp-server/dist/provision-types.d.ts +290 -0
package/mcp-server/dist/provision-types.js +174 -0
package/mcp-server/dist/server.d.ts +6 -0
package/mcp-server/dist/server.mjs +1925 -0
package/mcp-server/dist/session.d.ts +85 -0
package/mcp-server/dist/session.js +152 -0
package/mcp-server/mcp-app.html +28 -0
package/mcp-server/mcp-config.example.json +19 -0
package/mcp-server/package-lock.json +4027 -0
package/mcp-server/package.json +31 -0
package/mcp-server/src/codegen.ts +189 -0
package/mcp-server/src/mcp-app.css +360 -0
package/mcp-server/src/mcp-app.ts +547 -0
package/mcp-server/src/provision-types.ts +209 -0
package/mcp-server/src/server.ts +2391 -0
package/mcp-server/src/session.ts +194 -0
package/mcp-server/tsconfig.json +16 -0
package/mcp-server/vite.config.ts +23 -0
package/package.json +158 -0
package/schema.json +1046 -0
package/scripts/generate-skills.js +94 -0
package/sdk-log-formatter.js +1157 -0
package/sdk.d.ts +1486 -0
package/sdk.js +4336 -0
package/setup/aws/cloudformation.yaml +463 -0
package/setup/aws/disable-defender.sh +42 -0
package/setup/aws/install-dev-runner.sh +79 -0
package/setup/aws/spawn-runner.sh +289 -0
package/test/captcha-solver.test.mjs +152 -0
package/test/chrome-remote-debugging.test.mjs +66 -0
package/test/duckduckgo/experiment.test.mjs +28 -0
package/test/duckduckgo/setup.test.mjs +29 -0
package/test/manual/debug-locate-response.js +82 -0
package/test/manual/reconnect-provision.test.mjs +49 -0
package/test/manual/test-console-logs.test.mjs +42 -0
package/test/manual/test-find-api.js +73 -0
package/test/manual/test-init.sh +54 -0
package/test/manual/test-prompt-cache.js +97 -0
package/test/manual/test-provision-auth.mjs +22 -0
package/test/manual/test-sandbox-render.js +29 -0
package/test/manual/test-sdk-methods.js +15 -0
package/test/manual/test-sdk-refactor.js +53 -0
package/test/manual/test-stack-trace.mjs +57 -0
package/test/manual/verify-element-api.js +89 -0
package/test/manual/verify-types.js +0 -0
package/test/manual-unawaited-promise.test.mjs +31 -0
package/vitest.config.mjs +58 -0
package/vitest.runner.config.mjs +33 -0
package/vscode-extension/.vscodeignore +12 -0
package/vscode-extension/README.md +94 -0
package/vscode-extension/media/icon.png +0 -0
package/vscode-extension/package-lock.json +4126 -0
package/vscode-extension/package.json +86 -0
package/vscode-extension/src/extension.ts +829 -0
package/vscode-extension/testdriverai-0.1.0.vsix +0 -0
package/vscode-extension/tsconfig.json +16 -0

package/agent/index.js ADDED Viewed

@@ -0,0 +1,2450 @@
+// disable deprecation warnings
+process.removeAllListeners("warning");
+// package.json is included to get the version number
+const packageJson = require("../package.json");
+// nodejs modules
+const fs = require("fs");
+const os = require("os");
+// third party modules
+const path = require("path");
+const yaml = require("js-yaml");
+const sanitizeFilename = require("sanitize-filename");
+const { EventEmitter2 } = require("eventemitter2");
+const diff = require("diff");
+// global utilities
+const generator = require("./lib/generator.js");
+const theme = require("./lib/theme.js");
+const SourceMapper = require("./lib/source-mapper.js");
+// agent modules
+const { createParser } = require("./lib/parser.js");
+const { createSystem } = require("./lib/system.js");
+const { createCommander } = require("./lib/commander.js");
+const { createCommands } = require("./lib/commands.js");
+const { createSandbox } = require("./lib/sandbox.js");
+const { createCommandDefinitions } = require("./interface.js");
+const { createSDK } = require("./lib/sdk.js");
+const { createConfig } = require("./lib/config.js");
+const { createAnalytics } = require("./lib/analytics.js");
+const { createSession } = require("./lib/session.js");
+const { createOutputs } = require("./lib/outputs.js");
+const isValidVersion = require("./lib/valid-version.js");
+const { events, createEmitter } = require("./events.js");
+const logger = require("./lib/logger.js");
+class TestDriverAgent extends EventEmitter2 {
+  constructor(environment = {}, cliArgs = {}) {
+    super({
+      wildcard: true,
+      delimiter: ":",
+      newListener: false,
+      removeListener: false,
+      maxListeners: 20,
+      verboseMemoryLeak: false,
+      ignoreErrors: false,
+    }); // Create the agent's own emitter for internal events
+    this.emitter = createEmitter();
+    // Create config instance for this agent using provided environment
+    this.config = createConfig(environment);
+    // Store CLI arguments passed to this agent
+    this.cliArgs = cliArgs;
+    // Derive properties from cliArgs
+    const flags = cliArgs.options || {};
+    const firstArg = cliArgs.args && cliArgs.args[0];
+    // All commands (run, edit, generate) use the same pattern:
+    // first argument is the main file to work with
+    this.thisFile = firstArg || this.config.TD_DEFAULT_TEST_FILE;
+    this.resultFile = flags.resultFile || null;
+    this.newSandbox = flags.newSandbox || false;
+    this.healMode = flags.healMode || flags.heal || false;
+    this.sandboxId = flags["sandbox-id"] || null;
+    this.sandboxAmi = flags["sandbox-ami"] || null;
+    this.sandboxInstance = flags["sandbox-instance"] || null;
+    this.sandboxOs = flags.os || "linux";
+    this.ip = flags.ip || null;
+    this.workingDir = flags.workingDir || process.cwd();
+    // Resolve thisFile to absolute path with proper extension
+    if (this.thisFile) {
+      if (this.thisFile === ".") {
+        this.thisFile = path.join(this.workingDir, "testdriver.yaml");
+      } else {
+        this.thisFile = path.join(this.workingDir, this.thisFile);
+        if (
+          !this.thisFile.endsWith(".yaml") &&
+          !this.thisFile.endsWith(".yml")
+        ) {
+          this.thisFile += ".yaml";
+        }
+      }
+    }
+    // Create parser instance with this agent's emitter
+    this.parser = createParser(this.emitter);
+    // Create session instance for this agent
+    this.session = createSession();
+    // Create outputs instance for this agent
+    this.outputs = createOutputs();
+    // Create SDK instance with this agent's emitter, config, session, and abort signal
+    this.sdk = createSDK(this.emitter, this.config, this.session);
+    // Create analytics instance with this agent's emitter, config, and session
+    this.analytics = createAnalytics(this.emitter, this.config, this.session);
+    // Create sandbox instance with this agent's emitter, analytics, and session
+    this.sandbox = createSandbox(this.emitter, this.analytics, this.session);
+    // Attach Sentry log listeners to capture CLI logs as breadcrumbs
+    const sentry = require("../lib/sentry");
+    sentry.attachLogListeners(this.emitter);
+    // Set the OS for the sandbox to use
+    this.sandbox.os = this.sandboxOs;
+    // Create system instance with emitter, sandbox and config
+    this.system = createSystem(this.emitter, this.sandbox, this.config);
+    // Create commands instance with this agent's emitter and system
+    const commandsResult = createCommands(
+      this.emitter,
+      this.system,
+      this.sandbox,
+      this.config,
+      this.session,
+      () => this.sourceMapper.currentFilePath || this.thisFile,
+      this.cliArgs.options.redrawThreshold,
+      null, // getDashcamElapsedTime - will be set by SDK when dashcam is available
+      () => this.softAssertMode, // getter for soft assert mode (used by act())
+    );
+    this.commands = commandsResult.commands;
+    this.redraw = commandsResult.redraw;
+    // Create commander instance with this agent's emitter and commands
+    this.commander = createCommander(
+      this.emitter,
+      this.commands,
+      this.analytics,
+      this.config,
+      this.outputs,
+      this.session,
+    );
+    // these are "in-memory" globals
+    // they represent the current state of the agent
+    this.lastPrompt = ""; // the last prompt to be input
+    this.executionHistory = []; // a history of commands run in the current session
+    this.errorCounts = {}; // counts of different errors encountered in this session
+    this.errorLimit = 3; // the max number of times an error can be encountered before exiting
+    this.checkCount = 0; // the number of times the AI has checked the task
+    this.checkLimit = 7; // the max number of times the AI can check the task before exiting
+    this.lastScreenshot = null; // the last screenshot taken by the agent
+    this.readlineInterface = null; // the readline interface for interactive mode
+    this.tasks = []; // list of prompts that the user has given us
+    this.hasRunPostrun = false; // whether the postrun lifecycle has been run. prevents infinite loops
+    this.lastCommand = new Date().getTime();
+    this.csv = [["command,time"]];
+    // Source mapping for YAML files
+    this.sourceMapper = new SourceMapper();
+    // temporary file for command history
+    this.commandHistoryFile = path.join(os.homedir(), ".testdriver_history");
+    // Flag to indicate if the agent should stop execution
+    this.stopped = false;
+    // Flag to suppress assertion throws (used by act() to make check-phase assertions non-fatal)
+    this.softAssertMode = false;
+    this.emitter.emit(events.log.log, JSON.stringify(environment));
+    this.emitter.emit(events.log.log, JSON.stringify(cliArgs));
+  }
+  // Stop method to immediately halt execution
+  stop() {
+    this.stopped = true;
+    this.emitter.emit(
+      events.log.narration,
+      theme.dim("stopping execution..."),
+      true,
+    );
+  }
+  // single function to handle all program exits
+  // allows us to save the current state, run lifecycle hooks, and track analytics
+  async exit(failed = true, shouldSave = false, shouldRunPostrun = false) {
+    const { formatter } = require("../sdk-log-formatter.js");
+    this.emitter.emit(
+      events.log.narration,
+      formatter.getPrefix("disconnect") +
+        " " +
+        theme.yellow.bold("Exiting") +
+        theme.dim("..."),
+      true,
+    );
+    // Clean up redraw interval
+    if (this.redraw && this.redraw.cleanup) {
+      this.redraw.cleanup();
+    }
+    // Close sandbox connection to release the connection slot
+    if (this.sandbox) {
+      try {
+        this.sandbox.close();
+      } catch (err) {
+        // Ignore sandbox close errors during exit
+      }
+    }
+    shouldRunPostrun =
+      !this.hasRunPostrun &&
+      (shouldRunPostrun || this.cliArgs?.command == "run");
+    if (shouldSave) {
+      await this.save();
+    }
+    this.analytics.track("exit", { failed });
+    if (shouldRunPostrun) {
+      this.hasRunPostrun = true;
+      await this.runLifecycle("postrun");
+    }
+    // Emit exit event with exit code and close readline interface
+    this.readlineInterface?.close();
+    this.emitter.emit(events.exit, failed ? 1 : 0);
+    // we purposly never resolve this promise so the process will hang
+    return new Promise(() => {
+      // The process exit should be handled by the base/entry point listening to the exit event
+    });
+  }
+  // fatal errors always exit the program
+  // this ensure we log the error, summarize it, and exit cleanly
+  // Reports a fatal error and exits with a failure code.
+  //   error:       the error being reported
+  //   skipPostrun: when true, exit immediately without summarizing or
+  //                forcing the postrun lifecycle
+  async dieOnFatal(error, skipPostrun = false) {
+    // Prefer the source-annotated form of the error when the mapper has one
+    const fatalPayload =
+      this.sourceMapper.getErrorWithSourceContext(error) || error;
+    this.emitter.emit(events.error.fatal, fatalPayload);
+
+    if (skipPostrun) {
+      return await this.exit(true);
+    }
+
+    try {
+      await this.summarize(error.message);
+    } catch (summaryFailure) {
+      // A failed summary is only a warning; postrun must still get its turn
+      this.emitter.emit(
+        events.log.warn,
+        theme.yellow(`Failed to summarize: ${summaryFailure.message}`),
+      );
+    }
+
+    // Always run postrun lifecycle script, even for fatal errors
+    return await this.exit(true, false, true);
+  }
+  // creates a new "thread" in which the AI is given an error
+  // and responds. notice `actOnMarkdown` which will continue
+  // the thread until there are no more codeblocks to execute
+  // Sends an error (plus the markdown that caused it) to the "error" API
+  // endpoint and executes whatever codeblocks come back.
+  //   error:      Error object or plain message; `fatal` and
+  //               `attachScreenshot` properties are honoured when present
+  //   markdown:   the YAML/markdown that was being executed when it failed
+  //   depth:      current recursion depth, forwarded to actOnMarkdown
+  //   undo:       when true, drop the failing step from the execution history
+  //   shouldSave: forwarded to actOnMarkdown
+  // Returns the result of actOnMarkdown, or undefined when the API reply has
+  // no data. Exits through dieOnFatal/exit when heal mode is off, the error
+  // is fatal, the same error keeps repeating, or the API call itself fails.
+  async haveAIResolveError(
+    error,
+    markdown,
+    depth = 0,
+    undo = true,
+    shouldSave,
+  ) {
+    // healMode must be required to attempt to recover from errors
+    // otherwise we go directly to fatal
+    if (!this.healMode) {
+      this.emitter.emit(
+        events.error.general,
+        theme.red("Error detected, but recovery mode is not enabled."),
+      );
+      this.emitter.emit(
+        events.log.log,
+        "To attempt automatic recovery, re-run with the --heal flag.",
+      );
+      return await this.dieOnFatal(error);
+    }
+    // errors flagged as fatal are never sent to the AI
+    if (error.fatal) {
+      return await this.dieOnFatal(error);
+    }
+    // Get error message
+    let eMessage = error.message ? error.message : error;
+    // Truncate error message if too long to prevent 400 errors from API
+    // Keep first 5000 characters as a reasonable limit for API payloads
+    const MAX_ERROR_LENGTH = 5000;
+    if (typeof eMessage === "string" && eMessage.length > MAX_ERROR_LENGTH) {
+      eMessage =
+        eMessage.substring(0, MAX_ERROR_LENGTH) +
+        "\n\n[Error message truncated - message was too long]";
+    }
+    // the JSON-encoded (untruncated) message is the key in the errorCounts object
+    let safeKey = JSON.stringify(error.message ? error.message : error);
+    this.errorCounts[safeKey] = this.errorCounts[safeKey]
+      ? this.errorCounts[safeKey] + 1
+      : 1;
+    this.emitter.emit(
+      events.log.warn,
+      theme.red("Error detected. Attempting to recover (via --heal)..."),
+    );
+    // Show error with source context if available
+    const errorContext = this.sourceMapper.getErrorWithSourceContext(error);
+    if (errorContext) {
+      this.emitter.emit(events.log.warn, errorContext);
+    } else {
+      this.emitter.emit(events.log.markdown.static, eMessage);
+    }
+    this.emitter.emit(events.log.debug, error);
+    this.emitter.emit(events.log.debug, error.stack);
+    // once the same error has been seen `errorLimit` times, give up and exit
+    if (this.errorCounts[safeKey] > this.errorLimit - 1) {
+      this.emitter.emit(
+        events.log.log,
+        theme.red("Error loop detected. Exiting."),
+      );
+      this.emitter.emit(events.log.log, this.getErrorWithPosition(error));
+      await this.summarize(eMessage);
+      return await this.exit(true);
+    }
+    // remove this step from the execution history
+    if (undo) {
+      await this.popFromHistory();
+    }
+    // ask the AI what to do; a screenshot is only attached when the error asks for one
+    let image;
+    if (error.attachScreenshot) {
+      image = await this.system.captureScreenBase64();
+    } else {
+      image = null;
+    }
+    this.emitter.emit(events.log.narration, theme.dim("thinking..."), true);
+    // the id ties together the start/chunk/end events of the streamed reply
+    const streamId = `error-${Date.now()}`;
+    this.emitter.emit(events.log.markdown.start, streamId);
+    // Truncate markdown if too long to prevent 400 errors
+    const MAX_MARKDOWN_LENGTH = 10000;
+    let truncatedMarkdown = markdown;
+    if (typeof markdown === "string" && markdown.length > MAX_MARKDOWN_LENGTH) {
+      truncatedMarkdown =
+        markdown.substring(0, MAX_MARKDOWN_LENGTH) +
+        "\n\n[Markdown truncated - content was too long]";
+    }
+    let response;
+    try {
+      response = await this.sdk.req(
+        "error",
+        {
+          description: eMessage,
+          markdown: truncatedMarkdown,
+          image,
+        },
+        (chunk) => {
+          // forward streamed data chunks to the markdown log as they arrive
+          if (chunk.type === "data" && chunk.data) {
+            this.emitter.emit(events.log.markdown.chunk, streamId, chunk.data);
+          }
+        },
+      );
+    } catch (apiError) {
+      // If the error API call itself fails, prevent infinite loop
+      // by not retrying and instead treating as fatal
+      // NOTE(review): this path returns before the markdown.end event below
+      // is emitted for streamId
+      this.emitter.emit(
+        events.log.error,
+        theme.red(`Failed to get AI error resolution: ${apiError.message}`),
+      );
+      this.emitter.emit(events.log.log, "Original error: " + eMessage);
+      return await this.dieOnFatal(error);
+    }
+    this.emitter.emit(events.log.markdown.end, streamId);
+    // if the response worked, we try to execute the codeblocks in the response,
+    // which begins the recursive process of executing codeblocks
+    if (response?.data) {
+      return await this.actOnMarkdown(
+        response.data,
+        depth,
+        true,
+        false,
+        shouldSave,
+      );
+    }
+  }
+  // this is run after all possible codeblocks have been executed, but only at depth 0, which is the top level
+  // this checks that the task is "really done" using a screenshot of the desktop state
+  // it's likely that the task will not be complete and the AI will respond with more codeblocks to execute
+  async check() {
+    // Check if execution has been stopped
+    if (this.stopped) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim("execution stopped"),
+        true,
+      );
+      return;
+    }
+    this.checkCount++;
+    if (this.checkCount >= this.checkLimit) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.red("Exploratory loop detected. Exiting."),
+      );
+      await this.summarize("Check loop detected.");
+      return await this.exit(true);
+    }
+    this.emitter.emit(events.log.narration, theme.dim("checking..."));
+    // check asks the ai if the task is complete
+    // Parallelize system calls for better performance
+    const [thisScreenshot, mousePosition, activeWindow] = await Promise.all([
+      this.system.captureScreenBase64(1, false, true),
+      this.system.getMousePosition(),
+      this.system.activeWin(),
+    ]);
+    let images = [this.lastScreenshot, thisScreenshot];
+    let response = await this.sdk.req("check", {
+      tasks: this.tasks,
+      images,
+      mousePosition,
+      activeWindow,
+    });
+    // Use log.log (not markdown.static) so output goes through console spy to sandbox
+    this.emitter.emit(events.log.log, response.data);
+    this.lastScreenshot = thisScreenshot;
+    return response.data;
+  }
+  // command is transformed from a single yml entry generated by the AI into a JSON object
+  // it is mapped via `commander` to the `commands` module so the yaml
+  // parameters can be mapped to actual functions
+  async runCommand(command, depth, shouldSave, pushToHistory) {
+    let yml = await yaml.dump(command);
+    const commandName = command.command;
+    const startTime = Date.now();
+    // Get current source position
+    const sourcePosition = this.sourceMapper.getCurrentSourcePosition();
+    // Emit command start event with source mapping
+    this.emitter.emit(events.command.start, {
+      command: commandName,
+      depth,
+      data: command,
+      timestamp: startTime,
+      sourcePosition: sourcePosition,
+    });
+    // Log current execution position for debugging
+    if (this.sourceMapper.currentFileSourceMap) {
+      this.emitter.emit(events.log.log, "");
+      this.emitter.emit(
+        events.log.log,
+        theme.dim(`${this.sourceMapper.getCurrentPositionDescription()}`),
+      );
+    }
+    try {
+      let response;
+      // "run" and "if" commands are special meta commands
+      // that change the flow of execution
+      if (command.command == "run") {
+        response = await this.embed(command.file, depth, pushToHistory);
+      } else if (command.command == "if") {
+        response = await this.iffy(
+          command.condition,
+          command.then,
+          command.else,
+          depth,
+        );
+      } else {
+        response = await this.commander.run(command, depth);
+      }
+      const endTime = Date.now();
+      const duration = endTime - startTime;
+      // Emit command success event with source mapping
+      this.emitter.emit(events.command.success, {
+        command: commandName,
+        depth,
+        data: command,
+        duration,
+        response,
+        timestamp: endTime,
+        sourcePosition: sourcePosition,
+      });
+      // if the result of a command contains more commands, we perform the process again
+      if (response && typeof response === "string") {
+        return await this.actOnMarkdown(response, depth, false, false, false);
+      }
+    } catch (error) {
+      const endTime = Date.now();
+      const duration = endTime - startTime;
+      // Emit command error event with source mapping
+      this.emitter.emit(events.command.error, {
+        command: commandName,
+        depth,
+        data: command,
+        error: error.message,
+        duration,
+        timestamp: endTime,
+        sourcePosition: sourcePosition,
+      });
+      return await this.haveAIResolveError(
+        error,
+        yaml.dump({ commands: [yml] }),
+        depth,
+        true,
+        shouldSave,
+      );
+    }
+  }
+  async executeCommands(
+    commands,
+    depth,
+    pushToHistory = false,
+    dry = false,
+    shouldSave = false,
+  ) {
+    // Check if execution has been stopped
+    if (this.stopped) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim("execution stopped"),
+        true,
+      );
+      return;
+    }
+    if (commands?.length) {
+      for (const command of commands) {
+        // Check if execution has been stopped before each command
+        if (this.stopped) {
+          this.emitter.emit(
+            events.log.narration,
+            theme.dim("execution stopped"),
+            true,
+          );
+          return;
+        }
+        // Update current command tracking
+        const commandIndex = commands.indexOf(command);
+        this.sourceMapper.setCurrentCommand(commandIndex);
+        if (pushToHistory) {
+          this.executionHistory[
+            this.executionHistory.length - 1
+          ]?.commands.push(command);
+        }
+        if (shouldSave) {
+          await this.save({ silent: true });
+        }
+        if (!dry) {
+          await this.runCommand(command, depth, shouldSave);
+        }
+        let timeToComplete = (new Date().getTime() - this.lastCommand) / 1000;
+        // this.emitter.emit(events.log.log, timeToComplete, 'seconds')
+        this.csv.push([command.command, timeToComplete]);
+        this.lastCommand = new Date().getTime();
+      }
+    }
+  }
+  // codeblocks are ```yml ... ``` blocks found in ai responses
+  // this is similar to "function calling" in other ai frameworks
+  // here we parse the codeblocks and execute the commands within them
+  async executeCodeBlocks(
+    codeblocks,
+    depth,
+    pushToHistory = false,
+    dry = false,
+    shouldSave = false,
+  ) {
+    // Check if execution has been stopped
+    if (this.stopped) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim("execution stopped"),
+        true,
+      );
+      return;
+    }
+    depth = depth + 1;
+    for (const codeblock of codeblocks) {
+      // Check if execution has been stopped before each codeblock
+      if (this.stopped) {
+        this.emitter.emit(
+          events.log.narration,
+          theme.dim("execution stopped"),
+          true,
+        );
+        return;
+      }
+      let commands;
+      try {
+        commands = await this.parser.getCommands(codeblock);
+      } catch (e) {
+        // For parser errors
+        return await this.haveAIResolveError(
+          e,
+          yaml.dump(this.parser.getYAMLFromCodeBlock(codeblock)),
+          depth,
+          shouldSave,
+        );
+      }
+      await this.executeCommands(
+        commands,
+        depth,
+        pushToHistory,
+        dry,
+        shouldSave,
+      );
+    }
+  }
+  // this is the main function that interacts with the ai, runs commands, and checks the results
+  // notice that depth is 0 here. when this function resolves, the task is considered complete
+  // notice the call to `check()` which validates the prompt is complete
+  async aiExecute(
+    message,
+    validateAndLoop = false,
+    dry = false,
+    shouldSave = false,
+    isLoopContinuation = false,
+  ) {
+    // Check if execution has been stopped
+    if (this.stopped) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim("execution stopped"),
+        true,
+      );
+      return;
+    }
+    // Only create new execution history entry if this is not a loop continuation
+    if (!isLoopContinuation) {
+      this.executionHistory.push({ prompt: this.lastPrompt, commands: [] });
+    }
+    if (shouldSave) {
+      await this.save({ silent: true });
+    }
+    this.emitter.emit(events.log.debug, "kicking off exploratory loop");
+    // kick everything off
+    await this.actOnMarkdown(message, 0, true, dry, shouldSave);
+    // this calls the "check" function to validate the task is complete"
+    // the ai determines if it's complete or not
+    // if it is incomplete, the ai will likely return more codeblocks to execute
+    if (validateAndLoop) {
+      this.emitter.emit(
+        events.log.debug,
+        "exploratory loop resolved, check your work",
+      );
+      let response = await this.check();
+      let checkCodeblocks = [];
+      try {
+        checkCodeblocks = await this.parser.findCodeBlocks(response);
+      } catch (error) {
+        return await this.haveAIResolveError(error, response, 0, true, true);
+      }
+      this.emitter.emit(
+        events.log.debug,
+        `found ${checkCodeblocks.length} codeblocks`,
+      );
+      if (checkCodeblocks.length > 0) {
+        this.emitter.emit(
+          events.log.debug,
+          "check thinks more needs to be done",
+        );
+        return await this.aiExecute(
+          response,
+          validateAndLoop,
+          dry,
+          shouldSave,
+          true,
+        );
+      } else {
+        this.emitter.emit(events.log.debug, "seems complete, returning");
+        this.emitter.emit(events.log.log, theme.green("success!"));
+        return response;
+      }
+    }
+  }
+  // reads a yaml file and interprets the variables found within it
+  // Reads `file`, validates it, interpolates ${VAR} placeholders and parses
+  // it with source mapping.
+  //   file: path of the YAML file to load
+  // Returns the parsed YAML object, or {} when the file is empty. A missing
+  // file or invalid YAML is reported as fatal and ends in exit(true).
+  async loadYML(file) {
+    const startTime = Date.now();
+    // Emit file load start event
+    this.emitter.emit(events.file.start, {
+      operation: "load",
+      filePath: file,
+      timestamp: startTime,
+    });
+    let yml;
+    // read inside try/catch so an unreadable file produces a user-facing error
+    try {
+      yml = fs.readFileSync(file, "utf-8");
+      // Emit file load success event
+      this.emitter.emit(events.file.load, {
+        filePath: file,
+        size: yml.length,
+        timestamp: Date.now(),
+      });
+    } catch (e) {
+      // Emit file error event
+      this.emitter.emit(events.file.error, {
+        operation: "load",
+        filePath: file,
+        error: e.message,
+        timestamp: Date.now(),
+      });
+      this.emitter.emit(events.error.fatal, `File not found: ${file}`);
+      await this.summarize("File not found");
+      await this.exit(true);
+    }
+    // an empty file yields an empty object
+    if (!yml) {
+      return {};
+    }
+    yml = await this.parser.validateYAML(yml);
+    // Inject environment variables into any ${VAR} strings
+    yml = this.parser.interpolate(yml, {
+      TD_THIS_FILE: file,
+      ...this.config._environment,
+    });
+    // Show Unreplaced Variables
+    let unreplacedVars = this.parser.collectUnreplacedVariables(yml);
+    // Ignore variables that start with "OUTPUT." - these are special
+    unreplacedVars = unreplacedVars.filter((v) => {
+      return !v.startsWith("OUTPUT.");
+    });
+    if (unreplacedVars.length > 0) {
+      this.emitter.emit(
+        events.log.warn,
+        theme.yellow(
+          `Unreplaced variables in YAML: ${unreplacedVars.join(", ")}`,
+        ),
+      );
+    }
+    let ymlObj = null;
+    let sourceMap = null;
+    try {
+      // Parse YAML with source mapping
+      const parseResult = this.sourceMapper.parseYamlWithSourceMap(yml, file);
+      ymlObj = parseResult.yamlObj;
+      sourceMap = parseResult.sourceMap;
+      const endTime = Date.now();
+      // Emit file load completion event with source mapping
+      this.emitter.emit(events.file.stop, {
+        operation: "load",
+        filePath: file,
+        duration: endTime - startTime,
+        success: true,
+        sourceMap: sourceMap,
+        timestamp: endTime,
+      });
+    } catch (e) {
+      const endTime = Date.now();
+      // Emit file error event
+      this.emitter.emit(events.file.error, {
+        operation: "parse",
+        filePath: file,
+        error: e.message,
+        duration: endTime - startTime,
+        timestamp: endTime,
+      });
+      this.emitter.emit(events.error.fatal, e.message);
+      await this.summarize("Invalid YAML");
+      await this.exit(true);
+    }
+    return ymlObj;
+  }
+  // this is a rarely used command that likely doesn't need to exist
+  // it's used to call /assert in interactive mode
+  // @todo remove assert() command from agent.js
+  async assert(expect) {
+    this.analytics.track("assert");
+    let task = expect;
+    if (!task) {
+      // set task to last value of tasks
+      let task = this.tasks[this.tasks.length - 1];
+      // throw error if no task
+      if (!task) {
+        throw new Error("No task to assert");
+      }
+    }
+    this.emitter.emit(events.log.narration, theme.dim("thinking..."), true);
+    let response = `\`\`\`yaml
+commands:
+  - command: assert
+    expect: ${expect}
+\`\`\``;
+    await this.aiExecute(response);
+    await this.save({ silent: true });
+  }
+  // this function responds to the result of `promptUser()` which is the user input
+  // it kicks off the exploratory loop, which is the main function that interacts with the AI
+  async exploratoryLoop(
+    currentTask,
+    dry = false,
+    validateAndLoop = false,
+    shouldSave = true,
+  ) {
+    // Check if execution has been stopped
+    if (this.stopped) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim("execution stopped"),
+        true,
+      );
+      return;
+    }
+    this.lastPrompt = currentTask;
+    this.checkCount = 0;
+    this.emitter.emit(events.log.debug, "exploratoryLoop called");
+    this.tasks.push(currentTask);
+    this.emitter.emit(events.log.narration, theme.dim("thinking..."), true);
+    // Parallelize system calls for better performance
+    const [screenshot, mousePosition, activeWindow] = await Promise.all([
+      this.system.captureScreenBase64(),
+      this.system.getMousePosition(),
+      this.system.activeWin(),
+    ]);
+    this.lastScreenshot = screenshot;
+    let message = await this.sdk.req("input", {
+      input: currentTask,
+      mousePosition,
+      activeWindow,
+      image: this.lastScreenshot,
+    });
+    this.emitter.emit(events.log.log, message.data);
+    if (message && message.data) {
+      await this.aiExecute(message.data, validateAndLoop, dry, shouldSave);
+      this.emitter.emit(
+        events.log.debug,
+        "showing prompt from exploratoryLoop response check",
+      );
+    }
+    return;
+  }
+  // generate asks the AI to come up with ideas for test files
+  // based on the current state of the system (primarily the current screenshot)
+  // it will generate files that contain only "prompts"
+  // @todo revisit the generate command
+  async generate(count = 1, prompt = null) {
+    this.emitter.emit(
+      events.log.debug,
+      `generate called with count: ${count}, prompt: ${prompt}`,
+    );
+    await this.runLifecycle("prerun");
+    this.emitter.emit(events.log.narration, theme.dim("thinking..."), true);
+    const streamId = `generate-${Date.now()}`;
+    this.emitter.emit(events.log.markdown.start, streamId);
+    // Parallelize system calls for better performance
+    const [image, mouse, activeWindow] = await Promise.all([
+      this.system.captureScreenBase64(),
+      this.system.getMousePosition(),
+      this.system.activeWin(),
+    ]);
+    let message = await this.sdk.req(
+      "generate",
+      {
+        prompt: prompt || "make sure to do a spellcheck",
+        image,
+        mousePosition: mouse,
+        activeWindow: activeWindow,
+        count,
+        stream: false,
+      },
+      (chunk) => {
+        if (chunk.type === "data") {
+          this.emitter.emit(events.log.markdown.chunk, streamId, chunk.data);
+        }
+      },
+    );
+    this.emitter.emit(events.log.markdown.end, streamId);
+    let testPrompts = await this.parser.findGenerativePrompts(message.data);
+    // for each testPrompt
+    for (const testPrompt of testPrompts) {
+      // with the contents of the testPrompt
+      let fileName =
+        sanitizeFilename(testPrompt.name)
+          .trim()
+          .replace(/ /g, "-")
+          .replace(/['"`]/g, "")
+          .replace(/[^a-zA-Z0-9-]/g, "") // remove any non-alphanumeric chars except hyphens
+          .toLowerCase() + ".yaml";
+      let path1 = path.join(
+        this.workingDir,
+        "testdriver",
+        "generate",
+        fileName,
+      );
+      // create generate directory if it doesn't exist
+      const generateDir = path.join(this.workingDir, "testdriver", "generate");
+      if (!fs.existsSync(generateDir)) {
+        fs.mkdirSync(generateDir);
+        logger.log("Created generate directory:", generateDir);
+      } else {
+        logger.log("Generate directory already exists:", generateDir);
+      }
+      let list = testPrompt.steps;
+      let contents = yaml.dump({
+        version: packageJson.version,
+        steps: list,
+      });
+      this.emitter.emit(events.log.debug, `writing file ${path1} ${contents}`);
+      fs.writeFileSync(path1, contents);
+    }
+    await this.runLifecycle("postrun");
+    this.exit(false);
+  }
+  // this is the functionality for "undo"
+  async popFromHistory(fullStep) {
+    this.emitter.emit(events.log.narration, theme.dim("undoing..."), true);
+    if (this.executionHistory.length) {
+      if (fullStep) {
+        this.executionHistory.pop();
+      } else {
+        this.executionHistory[this.executionHistory.length - 1].commands.pop();
+      }
+      if (
+        !this.executionHistory[this.executionHistory.length - 1].commands.length
+      ) {
+        this.executionHistory.pop();
+      }
+    }
+  }
+  async undo() {
+    this.analytics.track("undo");
+    this.popFromHistory();
+    await this.save();
+  }
+  // this allows the user to input "flattened yaml"
+  // like "command='focus-application' name='Google Chrome'"
+  async manualInput(commandString) {
+    this.analytics.track("manual input");
+    let yml = await generator.manualToYml(commandString);
+    let message = `\`\`\`yaml
+${yml}
+\`\`\``;
+    await this.aiExecute(message, false);
+    await this.save({ silent: true });
+  }
+  // this function is responsible for starting the recursive process of executing codeblocks
+  async actOnMarkdown(
+    content,
+    depth,
+    pushToHistory = false,
+    dry = false,
+    shouldSave = false,
+  ) {
+    let codeblocks = [];
+    try {
+      codeblocks = await this.parser.findCodeBlocks(content);
+    } catch (error) {
+      pushToHistory = false;
+      return await this.haveAIResolveError(
+        error,
+        content,
+        depth,
+        false,
+        shouldSave,
+      );
+    }
+    if (codeblocks.length) {
+      let executions = await this.executeCodeBlocks(
+        codeblocks,
+        depth,
+        pushToHistory,
+        dry,
+        shouldSave,
+      );
+      return executions;
+    } else {
+      return true;
+    }
+  }
+  // this function is responsible for summarizing the test script that has already executed
+  // it is what is saved to the `/tmp/testdriver-summary.md` file and output to the action as a summary
+  // Captures a screenshot, requests a "summarize" reply from the SDK while
+  // streaming its chunks as markdown events, and writes the reply to disk.
+  //   error - optional error whose string form is sent along with the request
+  // The summary goes to this.resultFile when it is set, otherwise to
+  // testdriver-summary.md inside the OS temp directory.
+  async summarize(error = null) {
+    this.analytics.track("summarize");
+    this.emitter.emit(
+      events.log.narration,
+      theme.dim("reviewing test..."),
+      true,
+    );
+    const image = await this.system.captureScreenBase64();
+    this.emitter.emit(events.log.narration, theme.dim("summarizing..."), true);
+    const streamId = `summarize-${Date.now()}`;
+    this.emitter.emit(events.log.markdown.start, streamId);
+    const reply = await this.sdk.req(
+      "summarize",
+      {
+        image,
+        error: error?.toString(),
+        tasks: this.tasks,
+      },
+      (chunk) => {
+        if (chunk.type === "data") {
+          this.emitter.emit(events.log.markdown.chunk, streamId, chunk.data);
+        }
+      },
+    );
+    this.emitter.emit(events.log.markdown.end, streamId);
+    // A missing reply (or one without data) is written as an empty summary in
+    // both branches instead of throwing from the property access or the write.
+    const summary = reply?.data ?? "";
+    let targetFile;
+    if (this.resultFile) {
+      targetFile = this.resultFile;
+      // make sure the directory of the requested result file exists
+      fs.mkdirSync(path.dirname(targetFile), { recursive: true });
+    } else {
+      targetFile = path.join(os.tmpdir(), "testdriver-summary.md");
+    }
+    fs.writeFileSync(targetFile, summary);
+    this.emitter.emit(
+      events.log.log,
+      theme.dim(`Summary written to: ${targetFile}`),
+    );
+  }
+  // this function is responsible for saving the regression test script to a file
+  async save({ filepath = this.thisFile, silent = false } = {}) {
+    const startTime = Date.now();
+    // Emit file save start event
+    this.emitter.emit(events.file.start, {
+      operation: "save",
+      filePath: filepath,
+      timestamp: startTime,
+    });
+    this.analytics.track("save", { silent });
+    if (!this.executionHistory.length) {
+      // Emit file save completion event for empty history
+      this.emitter.emit(events.file.stop, {
+        operation: "save",
+        filePath: filepath,
+        duration: Date.now() - startTime,
+        success: true,
+        reason: "empty_history",
+        timestamp: Date.now(),
+      });
+      return;
+    }
+    // Read existing file content for diff comparison
+    let existingContent = "";
+    let fileExists = false;
+    try {
+      if (fs.existsSync(filepath)) {
+        existingContent = fs.readFileSync(filepath, "utf8");
+        fileExists = true;
+      }
+    } catch {
+      // File doesn't exist or can't be read, treat as empty
+      existingContent = "";
+    }
+    // write reply to /tmp/testdriver-summary.md
+    let regression = await generator.dumpToYML(
+      this.executionHistory,
+      this.session,
+    );
+    // Create diff if file exists and content has changed
+    let diffResult = null;
+    if (fileExists && existingContent !== regression) {
+      const patches = diff.structuredPatch(
+        filepath,
+        filepath,
+        existingContent,
+        regression,
+        `${new Date().toISOString()} (before)`,
+        `${new Date().toISOString()} (after)`,
+      );
+      // Create source map-like information for VS Code
+      const diffLines = diff.diffLines(existingContent, regression);
+      const sourceMaps = [];
+      let oldLineNumber = 1;
+      let newLineNumber = 1;
+      diffLines.forEach((part) => {
+        const lineCount = part.value.split("\n").length - 1;
+        if (part.added) {
+          sourceMaps.push({
+            type: "addition",
+            oldStart: oldLineNumber,
+            oldEnd: oldLineNumber,
+            newStart: newLineNumber,
+            newEnd: newLineNumber + lineCount,
+            content: part.value,
+            lines: lineCount,
+          });
+          newLineNumber += lineCount;
+        } else if (part.removed) {
+          sourceMaps.push({
+            type: "deletion",
+            oldStart: oldLineNumber,
+            oldEnd: oldLineNumber + lineCount,
+            newStart: newLineNumber,
+            newEnd: newLineNumber,
+            content: part.value,
+            lines: lineCount,
+          });
+          oldLineNumber += lineCount;
+        } else {
+          // unchanged
+          sourceMaps.push({
+            type: "unchanged",
+            oldStart: oldLineNumber,
+            oldEnd: oldLineNumber + lineCount,
+            newStart: newLineNumber,
+            newEnd: newLineNumber + lineCount,
+            content: part.value,
+            lines: lineCount,
+          });
+          oldLineNumber += lineCount;
+          newLineNumber += lineCount;
+        }
+      });
+      diffResult = {
+        patches,
+        sourceMaps,
+        summary: {
+          additions: diffLines.filter((part) => part.added).length,
+          deletions: diffLines.filter((part) => part.removed).length,
+          modifications: diffLines.filter(
+            (part) => !part.added && !part.removed,
+          ).length,
+        },
+      };
+    }
+    try {
+      fs.writeFileSync(filepath, regression);
+      const endTime = Date.now();
+      // Emit file save success event
+      this.emitter.emit(events.file.save, {
+        filePath: filepath,
+        size: regression.length,
+        timestamp: endTime,
+      });
+      // Emit diff event if there were changes
+      if (diffResult) {
+        this.emitter.emit(events.file.diff, {
+          filePath: filepath,
+          diff: diffResult,
+          timestamp: endTime,
+        });
+      }
+      // Emit file save completion event
+      this.emitter.emit(events.file.stop, {
+        operation: "save",
+        filePath: filepath,
+        duration: endTime - startTime,
+        success: true,
+        timestamp: endTime,
+      });
+    } catch (e) {
+      const endTime = Date.now();
+      // Emit file save error event
+      this.emitter.emit(events.file.error, {
+        operation: "save",
+        filePath: filepath,
+        error: e.message,
+        duration: endTime - startTime,
+        timestamp: endTime,
+      });
+      this.emitter.emit(events.error.fatal, e.message);
+    }
+    if (!silent) {
+      this.emitter.emit(
+        events.log.markdown.static,
+        `Current test script:
+\`\`\`yaml
+${regression}
+\`\`\``,
+      );
+      if (!silent) {
+        this.emitter.emit(events.log.log, theme.dim(`saved as ${filepath}`));
+      }
+    }
+    return;
+  }
+  async runRawYML(yml) {
+    const tmp = require("tmp");
+    let tmpobj = tmp.fileSync();
+    let decoded = decodeURIComponent(yml);
+    // parse the yaml
+    let ymlObj = null;
+    try {
+      ymlObj = await yaml.load(decoded);
+    } catch (e) {
+      this.emitter.emit(events.error.fatal, e);
+    }
+    // add the root key steps: with array of commands:
+    if (ymlObj && !ymlObj.steps) {
+      ymlObj = {
+        version: packageJson.version,
+        steps: [ymlObj],
+      };
+    }
+    // write the yaml to a file
+    fs.writeFileSync(tmpobj.name, yaml.dump(ymlObj));
+    // and run it with run()
+    await this.runLifecycle("prerun");
+    await this.run(tmpobj.name, false, false);
+    await this.runLifecycle("postrun");
+  }
+  // this will load a regression test from a file location
+  // it parses the markdown file and executes the codeblocks exactly as if they were
+  // generated by the AI in a single prompt
+  async run(file = this.thisFile, shouldSave = false, shouldExit = true) {
+    const fileStartTime = Date.now();
+    // Emit file start event (for individual file execution within a test)
+    this.emitter.emit(events.file.start, {
+      operation: "run",
+      filePath: file,
+      timestamp: fileStartTime,
+    });
+    this.emitter.emit(events.log.narration, theme.cyan(`running ${file}...`));
+    let ymlObj = await this.loadYML(file);
+    // Store source mapping for current file
+    const parseResult = this.sourceMapper.parseYamlWithSourceMap(
+      fs.readFileSync(file, "utf-8"),
+      file,
+    );
+    this.sourceMapper.setCurrentContext(file, parseResult.sourceMap, -1, -1);
+    if (ymlObj.version) {
+      let valid = isValidVersion(ymlObj.version);
+      if (!valid) {
+        this.emitter.emit(
+          events.log.warn,
+          theme.yellow(`Version mismatch detected!`),
+        );
+        this.emitter.emit(
+          events.log.warn,
+          theme.yellow(`Running a test created with v${ymlObj.version}.`),
+        );
+        this.emitter.emit(
+          events.log.warn,
+          theme.yellow(
+            `The local testdriverai version is v${packageJson.version}.`,
+          ),
+        );
+      }
+    }
+    this.executionHistory = [];
+    if (!ymlObj.steps || !ymlObj.steps.length) {
+      this.emitter.emit(
+        events.log.log,
+        theme.red("No steps found in the YAML file"),
+      );
+      await this.exit(true, shouldSave, true);
+    }
+    try {
+      for (const step of ymlObj.steps) {
+        const stepIndex = ymlObj.steps.indexOf(step);
+        const stepStartTime = Date.now();
+        // Update current step tracking
+        this.sourceMapper.setCurrentStep(stepIndex);
+        // Get source position for current step
+        const sourcePosition = this.sourceMapper.getCurrentSourcePosition();
+        // Emit step start event with source mapping
+        this.emitter.emit(events.step.start, {
+          stepIndex,
+          prompt: step.prompt,
+          commandCount: step.commands ? step.commands.length : 0,
+          timestamp: stepStartTime,
+          sourcePosition: sourcePosition,
+        });
+        this.emitter.emit(events.log.log, ``, null);
+        this.emitter.emit(
+          events.log.log,
+          theme.yellow(`> ${step.prompt || "no prompt"}`),
+          null,
+        );
+        try {
+          if (!step.commands && !step.prompt) {
+            this.emitter.emit(
+              events.log.log,
+              theme.red("No commands or prompt found"),
+            );
+            this.emitter.emit(events.step.error, {
+              stepIndex,
+              prompt: step.prompt,
+              error: "No commands or prompt found",
+              timestamp: Date.now(),
+            });
+            await this.exit(true, shouldSave, true);
+          } else if (!step.commands) {
+            this.emitter.emit(
+              events.log.log,
+              theme.yellow("No commands found, running exploratory"),
+            );
+            await this.exploratoryLoop(step.prompt, false, true, shouldSave);
+          } else {
+            await this.executeCommands(
+              step.commands,
+              0,
+              true,
+              false,
+              shouldSave,
+            );
+          }
+          const stepEndTime = Date.now();
+          const stepDuration = stepEndTime - stepStartTime;
+          // Emit step success event with source mapping
+          this.emitter.emit(events.step.success, {
+            stepIndex,
+            prompt: step.prompt,
+            commandCount: step.commands ? step.commands.length : 0,
+            duration: stepDuration,
+            timestamp: stepEndTime,
+            sourcePosition: sourcePosition,
+          });
+          if (shouldSave) {
+            await this.save({ silent: true });
+          }
+        } catch (error) {
+          const stepEndTime = Date.now();
+          const stepDuration = stepEndTime - stepStartTime;
+          // Emit step error event with source mapping
+          this.emitter.emit(events.step.error, {
+            stepIndex,
+            prompt: step.prompt,
+            error: error.message,
+            duration: stepDuration,
+            timestamp: stepEndTime,
+            sourcePosition: sourcePosition,
+          });
+          throw error; // Re-throw to maintain existing error handling
+        }
+      }
+      const testEndTime = Date.now();
+      const fileDuration = testEndTime - fileStartTime;
+      // Emit file success event
+      this.emitter.emit(events.file.stop, {
+        operation: "run",
+        filePath: file,
+        duration: fileDuration,
+        success: true,
+        timestamp: testEndTime,
+      });
+      if (shouldSave) {
+        await this.save({ filepath: file, silent: false });
+      }
+      if (shouldExit) {
+        await this.summarize();
+        await this.exit(false, shouldSave, true);
+      }
+    } catch (error) {
+      const testEndTime = Date.now();
+      const fileDuration = testEndTime - fileStartTime;
+      // Emit file error event
+      this.emitter.emit(events.file.error, {
+        operation: "run",
+        filePath: file,
+        error: error.message,
+        duration: fileDuration,
+        timestamp: testEndTime,
+      });
+      // Re-throw the error to maintain existing error handling
+      throw error;
+    }
+  }
+  async iffy(condition, then, otherwise, depth) {
+    this.analytics.track("if", { condition });
+    this.emitter.emit(
+      events.log.log,
+      generator.jsonToManual({ command: "if", condition }),
+    );
+    try {
+      await this.commands.assert(condition, false);
+      return await this.executeCommands(then, ++depth);
+      // eslint-disable-next-line no-unused-vars
+    } catch (error) {
+      return await this.executeCommands(otherwise, ++depth);
+    }
+  }
+  async embed(file, depth, pushToHistory) {
+    let inputFile = JSON.parse(JSON.stringify(file));
+    this.analytics.track("embed", { file });
+    this.emitter.emit(
+      events.log.log,
+      generator.jsonToManual({ command: "run", file }),
+    );
+    depth = depth + 1;
+    this.emitter.emit(events.log.log, `${inputFile} (start)`);
+    // Use the new helper method to resolve file paths relative to testdriver directory
+    const currentFilePath = this.sourceMapper.currentFilePath || this.thisFile;
+    // if the file is not an absolute path, resolve it using the new helper
+    if (!path.isAbsolute(file)) {
+      file = this.resolveTestDriverRelativePath(currentFilePath, file);
+    }
+    // check if the file exists
+    if (!fs.existsSync(file)) {
+      throw `Embedded file not found: ${file}`;
+    }
+    let ymlObj = await this.loadYML(file);
+    // Store current source mapping state
+    const previousContext = this.sourceMapper.saveContext();
+    // Set up source mapping for embedded file
+    const parseResult = this.sourceMapper.parseYamlWithSourceMap(
+      fs.readFileSync(file, "utf-8"),
+      file,
+    );
+    this.sourceMapper.setCurrentContext(file, parseResult.sourceMap, -1, -1);
+    try {
+      for (const step of ymlObj.steps) {
+        const stepIndex = ymlObj.steps.indexOf(step);
+        this.sourceMapper.setCurrentStep(stepIndex);
+        if (!step.commands && !step.prompt) {
+          this.emitter.emit(
+            events.log.log,
+            theme.red("No commands or prompt found"),
+          );
+          await this.exit(true);
+        } else if (!step.commands) {
+          this.emitter.emit(
+            events.log.log,
+            theme.yellow("No commands found, running exploratory"),
+          );
+          await this.exploratoryLoop(step.prompt, false, true, false);
+        } else {
+          await this.executeCommands(step.commands, depth, pushToHistory);
+        }
+      }
+    } finally {
+      // Restore previous source mapping state
+      this.sourceMapper.restoreContext(previousContext);
+    }
+    this.emitter.emit(events.log.log, `${inputFile} (end)`);
+  }
+  async buildEnv(options = {}) {
+    // If instance already exists, do not build environment again
+    if (this.instance) {
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim("sandbox instance already exists, skipping launch."),
+      );
+      return;
+    }
+    let { headless = false, heal, new: createNew = false } = options;
+    // Prioritize this.newSandbox flag if it's set
+    if (this.newSandbox) {
+      createNew = true;
+    }
+    // If CI environment variable is true, always create a new sandbox
+    if (this.config.CI) {
+      createNew = true;
+      this.emitter.emit(
+        events.log.log,
+        theme.dim("CI environment detected, will create a new sandbox"),
+      );
+    }
+    if (heal) this.healMode = heal;
+    // If createNew flag is set, clear sandboxId to prevent reconnection attempts
+    if (createNew) {
+      this.sandboxId = null;
+      if (!this.config.CI && !this.newSandbox) {
+        this.emitter.emit(events.log.log, theme.dim("Creating a new sandbox"));
+      } else if (this.newSandbox) {
+        this.emitter.emit(events.log.log, theme.dim("Creating a new sandbox"));
+      }
+    }
+    // Create session first so session ID is available for Sentry tracing in WebSocket connection
+    await this.newSession();
+    // order is important!
+    await this.connectToSandboxService();
+    // Set sandbox ID for reconnection (only if not creating new and recent ID exists)
+    if (this.ip) {
+      let instance = await this.sandbox.send({
+        type: "direct",
+        resolution: this.config.TD_RESOLUTION,
+        ci: this.config.CI,
+        ip: this.ip,
+        instanceId: this.instanceId || undefined,
+      });
+      // Store connection params for reconnection
+      // For direct IP connections, store as a direct type so reconnection
+      // sends a 'direct' message instead of 'connect' with an IP as sandboxId
+      this.sandbox.setConnectionParams({
+        type: 'direct',
+        ip: this.ip,
+        sandboxId: instance?.instance?.instanceId || instance?.instance?.sandboxId || null,
+        persist: true,
+        keepAlive: this.keepAlive,
+      });
+      // Mark instance socket as connected so console logs are forwarded
+      this.sandbox.instanceSocketConnected = true;
+      this.emitter.emit(events.sandbox.connected);
+      this.instance = instance.instance;
+      await this.renderSandbox(this.instance, headless);
+      await this.runLifecycle("provision");
+      return;
+    } else if (!createNew && this.sandboxId && !this.config.CI) {
+      // Only attempt to connect to existing sandbox if not in CI mode and not creating new
+      // Attempt to connect to known instance
+      this.emitter.emit(
+        events.log.narration,
+        theme.dim(`connecting to sandbox ${this.sandboxId}...`),
+      );
+      try {
+        let instance = await this.connectToSandboxDirect(
+          this.sandboxId,
+          true, // always persist by default
+          this.keepAlive, // pass keepAlive TTL
+        );
+        this.instance = instance;
+        await this.renderSandbox(instance, headless);
+        return;
+      } catch (error) {
+        // If connection fails, fall through to creating a new sandbox
+        this.emitter.emit(
+          events.log.narration,
+          theme.dim(`failed to connect to recent sandbox, creating new one...`),
+        );
+        console.error("Failed to reconnect to sandbox:", error);
+      }
+    }
+    // Create new sandbox (either because createNew is true, or no existing sandbox to connect to)
+    if (!this.instance) {
+      const { formatter } = require("../sdk-log-formatter.js");
+      this.emitter.emit(
+        events.log.narration,
+        formatter.getPrefix("connect") +
+          " " +
+          theme.green.bold("Creating") +
+          " " +
+          theme.cyan(`new sandbox...`),
+      );
+      let newSandbox = await this.createNewSandbox();
+      // Extract the sandbox ID from the newly created sandbox
+      this.sandboxId =
+        newSandbox?.sandbox?.sandboxId || newSandbox?.sandbox?.instanceId;
+      // E2B sandboxes return a url directly from create — no separate
+      // connect step needed (the API proxies commands via Ably).
+      if (newSandbox?.sandbox?.url) {
+        this.sandbox.setConnectionParams({
+          sandboxId: this.sandboxId,
+          persist: true,
+          keepAlive: this.keepAlive,
+        });
+        this.emitter.emit(events.sandbox.connected);
+        this.instance = newSandbox.sandbox;
+        await this.renderSandbox(this.instance, headless);
+        await this.runLifecycle("provision");
+      } else {
+        let instance = await this.connectToSandboxDirect(
+          this.sandboxId,
+          true, // always persist by default
+          this.keepAlive, // pass keepAlive TTL
+        );
+        this.instance = instance;
+        await this.renderSandbox(instance, headless);
+        await this.runLifecycle("provision");
+      }
+    }
+  }
+  async start() {
+    try {
+      this.emitter.emit(
+        events.log.log,
+        theme.green(`Howdy! I'm TestDriver v${packageJson.version}`),
+      );
+      // Emit test start event for the entire test execution
+      this.emitter.emit(events.test.start, {
+        filePath: this.thisFile,
+        timestamp: Date.now(),
+      });
+      // Debugger UI is hosted on the web app (console.testdriver.ai/debugger/)
+      // No local debugger server needed
+      this.emitter.emit(events.log.log, `This is beta software!`);
+      this.emitter.emit(events.log.log, ``);
+      this.emitter.emit(
+        events.log.log,
+        theme.yellow(`Join our Discord for help`),
+      );
+      this.emitter.emit(
+        events.log.log,
+        `https://discord.com/invite/cWDFW8DzPm`,
+      );
+      this.emitter.emit(events.log.log, ``);
+      // make testdriver directory if it doesn't exist
+      let testdriverFolder = path.join(this.workingDir);
+      if (!fs.existsSync(testdriverFolder)) {
+        fs.mkdirSync(testdriverFolder);
+        // log
+        this.emitter.emit(
+          events.log.log,
+          theme.dim(`Created testdriver directory: ${testdriverFolder}`),
+        );
+      }
+      // if the directory for thisFile doesn't exist, create it
+      if (
+        this.cliArgs.command !== "sandbox" &&
+        this.cliArgs.command !== "generate"
+      ) {
+        const dir = path.dirname(this.thisFile);
+        if (!fs.existsSync(dir)) {
+          fs.mkdirSync(dir, { recursive: true });
+          this.emitter.emit(
+            events.log.log,
+            theme.dim(`Created directory ${dir}`),
+          );
+        }
+        // if thisFile doesn't exist, create it
+        // thisFile def to testdriver/testdriver.yaml, during init, it just creates an empty file
+        if (!fs.existsSync(this.thisFile)) {
+          fs.writeFileSync(this.thisFile, "");
+          this.emitter.emit(
+            events.log.log,
+            theme.dim(`Created ${this.thisFile}`),
+          );
+        }
+      }
+      if (this.config.TD_API_KEY) {
+        await this.sdk.auth();
+      }
+      if (
+        this.cliArgs.command !== "sandbox" &&
+        this.cliArgs.command !== "generate"
+      ) {
+        this.emitter.emit(
+          events.log.log,
+          theme.dim(`Working on ${this.thisFile}`),
+        );
+        this.loadYML(this.thisFile);
+      }
+      this.analytics.track("command", {
+        command: this.cliArgs.command,
+        file: this.thisFile,
+      });
+      // Dynamically handle all available commands (except edit which is handled by CLI)
+      const availableCommands = Object.keys(this.getCommandDefinitions());
+      if (
+        availableCommands.includes(this.cliArgs.command) &&
+        this.cliArgs.command !== "edit"
+      ) {
+        await this.executeUnifiedCommand(
+          this.cliArgs.command,
+          this.cliArgs.args,
+          this.cliArgs.options,
+          this.cliArgs.options._optionValues,
+        );
+      } else if (this.cliArgs.command !== "edit") {
+        this.emitter.emit(
+          events.error.fatal,
+          `Unknown command: ${this.cliArgs.command}`,
+        );
+        await this.exit(true);
+      }
+    } catch (error) {
+      this.emitter.emit(events.error.fatal, error.message || error);
+      await this.exit(true);
+    }
+  }
+  async renderSandbox(instance, headless = false) {
+    if (!headless) {
+      let url;
+      // If the instance already has a URL (from reconnection), use it
+      if (instance.url) {
+        url = instance.url;
+      } else if (instance.ip || instance.publicIp) {
+        // Otherwise construct it from IP and port
+        url =
+          "http://" +
+          (instance.ip || instance.publicIp) +
+          ":" +
+          (instance.vncPort || "5800") +
+          "/vnc_lite.html?token=V3b8wG9";
+      } else {
+        // If we don't have URL or IP, we can't render
+        logger.warn("renderSandbox: Missing URL and IP in instance", instance);
+        return;
+      }
+      let data = {
+        resolution: this.config.TD_RESOLUTION,
+        url: url,
+        token: "V3b8wG9",
+        testFile: this.testFile || null,
+        os: this.sandboxOs || "linux",
+      };
+      // Base64 encode the data (the debugger expects base64, not URL encoding)
+      const encodedData = Buffer.from(JSON.stringify(data)).toString("base64");
+      // Build debugger URL — hosted on S3 (v7-vnc bucket)
+      const debuggerBase = process.env.TD_DEBUGGER_BASE_URL || "http://v7-vnc.s3.us-east-2.amazonaws.com";
+      // URL-encode the base64 data to handle +, /, = characters safely
+      const urlToOpen = `${debuggerBase}/index.html?data=${encodeURIComponent(encodedData)}`;
+      // Check preview mode from CLI options (SDK passes it directly)
+      const previewMode = (this.cliArgs.options && this.cliArgs.options.preview) || this.config.TD_PREVIEW || "browser";
+      if (previewMode === "ide") {
+        // Send session to VS Code extension via HTTP
+        this.writeIdeSessionFile(urlToOpen, data);
+      } else if (previewMode !== "none") {
+        // Open in browser (default behavior)
+        this.emitter.emit(events.showWindow, urlToOpen);
+      }
+      // If preview is "none", don't open anything
+    }
+  }
+  // Get the console (web app) URL for the given API root
+  _getConsoleUrl(apiRoot) {
+    // Allow explicit override via env (e.g. VITE_DOMAIN from .env)
+    if (process.env.VITE_DOMAIN) return process.env.VITE_DOMAIN;
+    const environments = require("../lib/environments.json");
+    const mapping = {
+      "https://v6.testdriver.ai": environments.stable.consoleUrl,
+    };
+    for (const env of Object.values(environments)) {
+      mapping[env.apiRoot] = env.consoleUrl;
+    }
+    if (mapping[apiRoot]) return mapping[apiRoot];
+    // Local dev: API on localhost:1337 -> Web on localhost:3001
+    if (apiRoot.includes("localhost:1337") || apiRoot.includes("127.0.0.1:1337")) {
+      return "http://localhost:3001";
+    }
+    return environments.stable.consoleUrl;
+  }
+  // Write session file for IDE preview (VSCode extension watches for these)
+  writeIdeSessionFile(debuggerUrl, data) {
+    const fs = require("fs");
+    const path = require("path");
+    const sessionId = `${Date.now()}-${Math.random().toString(36).substring(2, 8)}`;
+    const previewsDir = path.join(process.cwd(), ".testdriver", ".previews");
+    // Create the previews directory if it doesn't exist
+    if (!fs.existsSync(previewsDir)) {
+      fs.mkdirSync(previewsDir, { recursive: true });
+    }
+    const sessionData = {
+      sessionId,
+      debuggerUrl,
+      resolution: Array.isArray(data.resolution) ? data.resolution : (data.resolution ? data.resolution.split("x").map(Number) : [1920, 1080]),
+      testFile: data.testFile || this.testFile || null,
+      os: data.os || this.sandboxOs || "linux",
+      timestamp: Date.now(),
+    };
+    const filePath = path.join(previewsDir, `${sessionId}.json`);
+    fs.writeFileSync(filePath, JSON.stringify(sessionData, null, 2));
+    logger.log(`IDE preview session written to ${filePath}`);
+  }
+  // Find the VS Code instance that contains the test file
+  findTargetIdeInstance(testFilePath) {
+    const fs = require("fs");
+    const os = require("os");
+    const path = require("path");
+    const instancesDir = path.join(os.homedir(), ".testdriver", "ide-instances");
+    if (!fs.existsSync(instancesDir)) {
+      return null;
+    }
+    const files = fs.readdirSync(instancesDir);
+    const normalizedTestPath = testFilePath ? path.normalize(testFilePath) : null;
+    let matchingInstance = null;
+    let longestMatchLength = 0;
+    for (const file of files) {
+      if (!file.endsWith('.json')) continue;
+      try {
+        const registrationPath = path.join(instancesDir, file);
+        const registration = JSON.parse(fs.readFileSync(registrationPath, 'utf-8'));
+        // Check if this instance is still alive (registration within last 60 seconds or process exists)
+        const isRecent = Date.now() - registration.timestamp < 60000;
+        // Skip stale registrations
+        if (!isRecent) {
+          // Try to clean up stale file
+          try { fs.unlinkSync(registrationPath); } catch {}
+          continue;
+        }
+        // If we have a test file path, find the best matching workspace
+        if (normalizedTestPath && registration.workspacePaths) {
+          for (const workspacePath of registration.workspacePaths) {
+            const normalizedWorkspace = path.normalize(workspacePath);
+            if (normalizedTestPath.startsWith(normalizedWorkspace + path.sep) ||
+                normalizedTestPath === normalizedWorkspace) {
+              // Prefer longest match (most specific workspace)
+              if (normalizedWorkspace.length > longestMatchLength) {
+                longestMatchLength = normalizedWorkspace.length;
+                matchingInstance = registration;
+              }
+            }
+          }
+        } else if (!matchingInstance) {
+          // If no test file path, just use the first available instance
+          matchingInstance = registration;
+        }
+      } catch (error) {
+        // Ignore malformed registration files
+      }
+    }
+    return matchingInstance;
+  }
+  // Send session notification to VS Code extension via HTTP
+  sendIdeSessionNotification(debuggerUrl, data) {
+    const http = require("http");
+    const path = require("path");
+    const testFilePath = data.testFile || this.thisFile;
+    const targetInstance = this.findTargetIdeInstance(testFilePath);
+    if (!targetInstance) {
+      logger.warn("No VS Code instance found for IDE preview. Make sure VS Code with TestDriver extension is open.");
+      // Fall back to browser
+      this.emitter.emit(events.showWindow, debuggerUrl);
+      return;
+    }
+    // Generate a unique session ID
+    const testFileName = (testFilePath || "test")
+      .split(path.sep).pop()
+      .replace(/\.[^/.]+$/, "");
+    const sessionId = `${testFileName}-${Date.now()}-${Math.random().toString(36).substring(2, 8)}`;
+    const sessionData = {
+      sessionId: sessionId,
+      debuggerUrl: debuggerUrl,
+      resolution: data.resolution || this.config.TD_RESOLUTION,
+      testFile: testFilePath,
+      os: data.os || this.sandboxOs || "linux",
+      timestamp: Date.now(),
+    };
+    const postData = JSON.stringify(sessionData);
+    const options = {
+      hostname: '127.0.0.1',
+      port: targetInstance.port,
+      path: '/session',
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        'Content-Length': Buffer.byteLength(postData)
+      },
+      timeout: 5000
+    };
+    const req = http.request(options, (res) => {
+      if (res.statusCode === 200) {
+        logger.log(`IDE session notification sent to port ${targetInstance.port}`);
+      } else {
+        logger.warn(`IDE session notification failed with status ${res.statusCode}`);
+        // Fall back to browser on failure
+        this.emitter.emit(events.showWindow, debuggerUrl);
+      }
+    });
+    req.on('error', (error) => {
+      logger.warn(`Failed to send IDE session notification: ${error.message}`);
+      // Fall back to browser on error
+      this.emitter.emit(events.showWindow, debuggerUrl);
+    });
+    req.on('timeout', () => {
+      req.destroy();
+      logger.warn('IDE session notification timed out');
+      // Fall back to browser on timeout
+      this.emitter.emit(events.showWindow, debuggerUrl);
+    });
+    req.write(postData);
+    req.end();
+  }
+  async connectToSandboxService() {
+    this.emitter.emit(
+      events.log.narration,
+      theme.dim(`establishing connection...`),
+    );
+    let ableToBoot = await this.sandbox.boot(this.config.TD_API_ROOT);
+    if (!ableToBoot) {
+      return await this.dieOnFatal(
+        `Unable to connect to TestDriver sandbox service at ${this.config.TD_API_ROOT}.
+Please check your network connection, TD_API_KEY, or the service status.`,
+        true,
+      );
+    }
+    const { formatter } = require("../sdk-log-formatter.js");
+    this.emitter.emit(
+      events.log.narration,
+      formatter.getPrefix("connect") +
+        " " +
+        theme.green.bold("Authenticating") +
+        theme.dim("..."),
+    );
+    let ableToAuth = await this.sandbox.auth(this.config.TD_API_KEY);
+    if (!ableToAuth) {
+      return await this.dieOnFatal(
+        `Unable to authorize with TestDriver sandbox service at ${this.config.TD_API_ROOT}.
+Please check your network connection, TD_API_KEY, or the service status.`,
+        true,
+      );
+    }
+  }
+  async connectToSandboxDirect(sandboxId, persist = false, keepAlive = null) {
+    const { formatter } = require("../sdk-log-formatter.js");
+    this.emitter.emit(
+      events.log.narration,
+      formatter.getPrefix("connect") +
+        " " +
+        theme.green.bold("Connecting") +
+        " " +
+        theme.cyan(`to sandbox...`),
+    );
+    let reply = await this.sandbox.connect(sandboxId, persist, keepAlive);
+    // reply includes { success, url, sandbox: {...} }
+    // For renderSandbox, we need the sandbox object with url merged in
+    const sandbox = reply.sandbox || {};
+    // If reply has a URL at top level, merge it into the sandbox object
+    if (reply.url && !sandbox.url) {
+      sandbox.url = reply.url;
+    }
+    return sandbox;
+  }
+  async createNewSandbox() {
+    const sandboxConfig = {
+      type: "create",
+      resolution: this.config.TD_RESOLUTION,
+      ci: this.config.CI,
+      os: this.sandboxOs || "linux",
+    };
+    // Add AMI and instance type if specified
+    if (this.sandboxAmi) {
+      sandboxConfig.ami = this.sandboxAmi;
+    }
+    if (this.sandboxInstance) {
+      sandboxConfig.instanceType = this.sandboxInstance;
+    }
+    // Add keepAlive TTL if specified
+    if (this.keepAlive !== undefined && this.keepAlive !== null) {
+      sandboxConfig.keepAlive = this.keepAlive;
+    }
+    const { formatter } = require("../sdk-log-formatter.js");
+    const retryDelay = 15000; // 15 seconds between retries
+    while (true) {
+      let response = await this.sandbox.send(sandboxConfig, 60000 * 8);
+      // Check if queued (all slots in use)
+      if (response.type === "create.queued") {
+        this.emitter.emit(
+          events.log.narration,
+          formatter.getPrefix("queue") +
+            " " +
+            theme.yellow.bold("Waiting") +
+            " " +
+            theme.dim(response.message),
+        );
+        // Wait then retry
+        await new Promise((resolve) => setTimeout(resolve, retryDelay));
+        continue;
+      }
+      // Success - got a sandbox
+      return response;
+    }
+  }
+  async newSession() {
+    // should be start of new session
+    // If sandbox is connected, get system info; otherwise pass empty objects
+    const isSandboxConnected = this.sandbox.apiSocketConnected;
+    const sessionRes = await this.sdk.req("session/start", {
+      systemInformationOsInfo: isSandboxConnected
+        ? await this.system.getSystemInformationOsInfo()
+        : {},
+      mousePosition: isSandboxConnected
+        ? await this.system.getMousePosition()
+        : {},
+      activeWindow: isSandboxConnected ? await this.system.activeWin() : {},
+    });
+    if (!sessionRes) {
+      throw new Error(
+        "Unable to start TestDriver session.  Check your network connection or restart the CLI.",
+      );
+    }
+    this.session.set(sessionRes.data.id);
+    // Set Sentry session trace context for distributed tracing
+    // This links CLI errors/logs to the same trace as API calls
+    try {
+      const sentry = require("../lib/sentry");
+      sentry.setSessionTraceContext(sessionRes.data.id);
+    } catch (e) {
+      // Sentry module may not be available, ignore
+    }
+  }
+  // Helper method to find testdriver directory by traversing up from a file path
+  findTestDriverDirectory(filePath) {
+    // Start from the directory containing the file, or use workingDir as fallback
+    let currentDir = filePath
+      ? path.dirname(path.resolve(filePath))
+      : this.workingDir;
+    while (currentDir !== path.dirname(currentDir)) {
+      // Continue until we reach the root
+      const testdriverPath = path.join(currentDir, "testdriver");
+      if (
+        fs.existsSync(testdriverPath) &&
+        fs.statSync(testdriverPath).isDirectory()
+      ) {
+        return testdriverPath;
+      }
+      currentDir = path.dirname(currentDir);
+    }
+    // Fallback to workingDir/testdriver if not found
+    return path.join(this.workingDir, "testdriver");
+  }
+  // Helper method to resolve file paths relative to the testdriver directory
+  // This handles both snippets and other relative files that should be resolved
+  // relative to the nearest testdriver directory
+  resolveTestDriverRelativePath(filePath, relativePath) {
+    // If it's already an absolute path, return as-is
+    if (path.isAbsolute(relativePath)) {
+      return relativePath;
+    }
+    // Check if this looks like a snippet or lifecycle reference
+    if (
+      relativePath.startsWith("snippets/") ||
+      relativePath.startsWith("lifecycle/")
+    ) {
+      // First, check if there's a local directory in the same directory as the current file
+      if (filePath) {
+        const currentFileDir = path.dirname(path.resolve(filePath));
+        const localPath = path.join(currentFileDir, relativePath);
+        if (fs.existsSync(localPath)) {
+          return localPath;
+        }
+      }
+      // If no local file found, fall back to the testdriver directory
+      const testdriverDir = this.findTestDriverDirectory(filePath);
+      return path.join(testdriverDir, relativePath);
+    }
+    // For other relative paths, resolve relative to the current file's directory
+    if (filePath) {
+      return path.resolve(path.dirname(filePath), relativePath);
+    }
+    // Fallback to workingDir
+    return path.resolve(this.workingDir, relativePath);
+  }
+  async runLifecycle(lifecycleName) {
+    // Use the current file path from sourceMapper to find the lifecycle directory
+    // If sourceMapper doesn't have a current file, use thisFile which should be the file being run
+    let currentFilePath = this.sourceMapper.currentFilePath || this.thisFile;
+    // If we still don't have a currentFilePath, fall back to the default testdriver directory
+    if (!currentFilePath) {
+      currentFilePath = path.join(
+        this.workingDir,
+        "testdriver",
+        "testdriver.yaml",
+      );
+    }
+    // Ensure we have an absolute path
+    if (currentFilePath && !path.isAbsolute(currentFilePath)) {
+      currentFilePath = path.resolve(this.workingDir, currentFilePath);
+    }
+    let lifecycleFile = null;
+    // First, check if there's a local lifecycle directory in the same directory as the current file
+    if (currentFilePath) {
+      const currentFileDir = path.dirname(currentFilePath);
+      const localLifecycleDir = path.join(currentFileDir, "lifecycle");
+      const localLifecycleFile = path.join(
+        localLifecycleDir,
+        `${lifecycleName}.yaml`,
+      );
+      // If there's a local lifecycle directory, only look there (don't fall back to global)
+      if (
+        fs.existsSync(localLifecycleDir) &&
+        fs.statSync(localLifecycleDir).isDirectory()
+      ) {
+        if (fs.existsSync(localLifecycleFile)) {
+          lifecycleFile = localLifecycleFile;
+        }
+        // Stop here - don't fall back to global if local lifecycle directory exists
+      } else {
+        // Only fall back to global if there's no local lifecycle directory
+        const testdriverDir = this.findTestDriverDirectory(currentFilePath);
+        const globalLifecycleFile = path.join(
+          testdriverDir,
+          "lifecycle",
+          `${lifecycleName}.yaml`,
+        );
+        if (fs.existsSync(globalLifecycleFile)) {
+          lifecycleFile = globalLifecycleFile;
+        }
+      }
+    }
+    this.emitter.emit(events.log.log, lifecycleFile);
+    if (lifecycleFile) {
+      // Store current source mapping state before running lifecycle file
+      const previousContext = this.sourceMapper.saveContext();
+      try {
+        await this.run(lifecycleFile, false, false);
+      } finally {
+        // Restore previous source mapping state after lifecycle file execution
+        this.sourceMapper.restoreContext(previousContext);
+      }
+    }
+  } // Unified command definitions that work for both CLI and interactive modes
+  getCommandDefinitions() {
+    return createCommandDefinitions(this);
+  }
+  // Execute a unified command
+  async executeUnifiedCommand(commandName, args = {}, options = {}) {
+    const commands = this.getCommandDefinitions();
+    const command = commands[commandName];
+    if (!command) {
+      throw new Error(`Unknown command: ${commandName}`);
+    }
+    // Convert args array to object if needed
+    const argsObj = {};
+    if (Array.isArray(args)) {
+      // Get argument definitions from the command
+      const argDefs = command.args ? Object.values(command.args) : [];
+      const argNames = command.args ? Object.keys(command.args) : [];
+      // Handle both positional args (/run myfile) and named args (/run file=myfile)
+      args.forEach((arg, index) => {
+        if (typeof arg === "string" && arg.includes("=")) {
+          // Named argument: file=myfile or path=myfile
+          const [key, value] = arg.split("=", 2);
+          // Support both 'file' and 'path' for the run command
+          if (commandName === "run" && key === "path") {
+            argsObj["file"] = value;
+          } else {
+            argsObj[key] = value;
+          }
+        } else {
+          // Positional argument: myfile
+          const argName = argNames[index];
+          if (argName) {
+            const argDef = argDefs[index];
+            if (argDef && argDef.variadic) {
+              argsObj[argName] = args.slice(index);
+            } else {
+              argsObj[argName] = arg;
+            }
+          }
+        }
+      });
+      // Apply defaults for any missing arguments
+      argNames.forEach((argName, index) => {
+        const argDef = argDefs[index];
+        if (argsObj[argName] === undefined && argDef && argDef.default) {
+          argsObj[argName] = argDef.default;
+        }
+      });
+    } else {
+      Object.assign(argsObj, args);
+    }
+    // Move environment setup and special handling here
+    if (["edit", "run", "generate"].includes(commandName)) {
+      await this.buildEnv(options);
+    }
+    if (commandName === "run") {
+      this.errorLimit = 100;
+    }
+    await command.handler(argsObj, options);
+  }
+}
+module.exports = TestDriverAgent;