npm - codeceptjs - Versions diffs - 4.0.0-rc.17 → 4.0.0-rc.19 - Mend

codeceptjs 4.0.0-rc.17 → 4.0.0-rc.19

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (240)

package/bin/codecept.js +15 -2
package/bin/codeceptq.js +49 -0
package/bin/mcp-server.js +733 -196
package/docs/advanced.md +201 -0
package/docs/agents.md +159 -0
package/docs/ai.md +537 -0
package/docs/aitrace.md +266 -0
package/docs/api.md +332 -0
package/docs/assertions.md +415 -0
package/docs/auth.md +318 -0
package/docs/basics.md +424 -0
package/docs/bdd.md +539 -0
package/docs/best.md +240 -0
package/docs/bootstrap.md +132 -0
package/docs/commands.md +352 -0
package/docs/community-helpers.md +63 -0
package/docs/configuration.md +230 -0
package/docs/continuous-integration.md +497 -0
package/docs/custom-helpers.md +297 -0
package/docs/data.md +448 -0
package/docs/debugging.md +332 -0
package/docs/detox.md +235 -0
package/docs/docker.md +136 -0
package/docs/effects.md +179 -0
package/docs/element-based-testing.md +295 -0
package/docs/element-selection.md +125 -0
package/docs/els.md +328 -0
package/docs/examples.md +161 -0
package/docs/heal.md +213 -0
package/docs/helpers/ApiDataFactory.md +267 -0
package/docs/helpers/Appium.md +1405 -0
package/docs/helpers/Detox.md +665 -0
package/docs/helpers/ExpectHelper.md +275 -0
package/docs/helpers/FileSystem.md +152 -0
package/docs/helpers/GraphQL.md +152 -0
package/docs/helpers/GraphQLDataFactory.md +226 -0
package/docs/helpers/JSONResponse.md +255 -0
package/docs/helpers/Mochawesome.md +8 -0
package/docs/helpers/MockRequest.md +377 -0
package/docs/helpers/MockServer.md +212 -0
package/docs/helpers/Playwright.md +2969 -0
package/docs/helpers/Polly.md +44 -0
package/docs/helpers/Protractor.md +1769 -0
package/docs/helpers/Puppeteer-firefox.md +86 -0
package/docs/helpers/Puppeteer.md +2690 -0
package/docs/helpers/REST.md +289 -0
package/docs/helpers/SoftExpectHelper.md +352 -0
package/docs/helpers/WebDriver.md +2682 -0
package/docs/hooks.md +339 -0
package/docs/index.md +111 -0
package/docs/installation.md +83 -0
package/docs/internal-api.md +265 -0
package/docs/internal-test-server.md +89 -0
package/docs/locators.md +355 -0
package/docs/mcp.md +485 -0
package/docs/migration-4.md +556 -0
package/docs/mobile.md +338 -0
package/docs/pageobjects.md +399 -0
package/docs/parallel.md +585 -0
package/docs/playwright.md +714 -0
package/docs/plugins.md +866 -0
package/docs/puppeteer.md +314 -0
package/docs/quickstart.md +120 -0
package/docs/react.md +70 -0
package/docs/reports.md +483 -0
package/docs/retry.md +274 -0
package/docs/secrets.md +150 -0
package/docs/sessions.md +80 -0
package/docs/shadow.md +68 -0
package/docs/test-structure.md +275 -0
package/docs/timeouts.md +183 -0
package/docs/translation.md +247 -0
package/docs/tutorial.md +271 -0
package/docs/typescript.md +374 -0
package/docs/web-element.md +251 -0
package/docs/webdriver.md +708 -0
package/docs/within.md +55 -0
package/lib/aria.js +260 -0
package/lib/command/dryRun.js +23 -3
package/lib/command/init.js +247 -266
package/lib/command/list.js +150 -10
package/lib/command/query.js +218 -0
package/lib/config.js +77 -4
package/lib/container.js +34 -2
package/lib/element/WebElement.js +37 -0
package/lib/globals.js +11 -10
package/lib/helper/Playwright.js +5 -6
package/lib/helper/extras/PlaywrightReactVueLocator.js +45 -36
package/lib/html.js +90 -16
package/lib/index.js +9 -1
package/lib/locator.js +2 -2
package/lib/mocha/factory.js +5 -1
package/lib/mocha/inject.js +1 -1
package/lib/parser.js +2 -2
package/lib/pause.js +38 -4
package/lib/plugin/aiTrace.js +72 -84
package/lib/plugin/browser.js +77 -0
package/lib/plugin/expose.js +159 -0
package/lib/plugin/heal.js +44 -1
package/lib/plugin/pageInfo.js +51 -48
package/lib/plugin/pause.js +131 -0
package/lib/plugin/pauseOnFail.js +10 -34
package/lib/plugin/screencast.js +287 -0
package/lib/plugin/screenshot.js +563 -0
package/lib/plugin/screenshotOnFail.js +8 -170
package/lib/utils/pluginParser.js +151 -0
package/lib/utils/trace.js +297 -0
package/lib/utils.js +25 -0
package/lib/workers.js +1 -15
package/package.json +12 -10
package/typings/index.d.ts +0 -5
package/docs/webapi/amOnPage.mustache +0 -11
package/docs/webapi/appendField.mustache +0 -16
package/docs/webapi/attachFile.mustache +0 -24
package/docs/webapi/blur.mustache +0 -18
package/docs/webapi/checkOption.mustache +0 -13
package/docs/webapi/clearCookie.mustache +0 -9
package/docs/webapi/clearField.mustache +0 -14
package/docs/webapi/click.mustache +0 -29
package/docs/webapi/clickLink.mustache +0 -8
package/docs/webapi/closeCurrentTab.mustache +0 -7
package/docs/webapi/closeOtherTabs.mustache +0 -8
package/docs/webapi/dontSee.mustache +0 -11
package/docs/webapi/dontSeeCheckboxIsChecked.mustache +0 -10
package/docs/webapi/dontSeeCookie.mustache +0 -8
package/docs/webapi/dontSeeCurrentPathEquals.mustache +0 -10
package/docs/webapi/dontSeeCurrentUrlEquals.mustache +0 -10
package/docs/webapi/dontSeeElement.mustache +0 -12
package/docs/webapi/dontSeeElementInDOM.mustache +0 -8
package/docs/webapi/dontSeeInCurrentUrl.mustache +0 -4
package/docs/webapi/dontSeeInField.mustache +0 -16
package/docs/webapi/dontSeeInSource.mustache +0 -8
package/docs/webapi/dontSeeInTitle.mustache +0 -8
package/docs/webapi/dontSeeTraffic.mustache +0 -13
package/docs/webapi/doubleClick.mustache +0 -13
package/docs/webapi/downloadFile.mustache +0 -12
package/docs/webapi/dragAndDrop.mustache +0 -9
package/docs/webapi/dragSlider.mustache +0 -11
package/docs/webapi/executeAsyncScript.mustache +0 -24
package/docs/webapi/executeScript.mustache +0 -26
package/docs/webapi/fillField.mustache +0 -21
package/docs/webapi/flushNetworkTraffics.mustache +0 -5
package/docs/webapi/focus.mustache +0 -13
package/docs/webapi/forceClick.mustache +0 -28
package/docs/webapi/forceRightClick.mustache +0 -18
package/docs/webapi/grabAllWindowHandles.mustache +0 -7
package/docs/webapi/grabAttributeFrom.mustache +0 -10
package/docs/webapi/grabAttributeFromAll.mustache +0 -9
package/docs/webapi/grabBrowserLogs.mustache +0 -9
package/docs/webapi/grabCookie.mustache +0 -11
package/docs/webapi/grabCssPropertyFrom.mustache +0 -11
package/docs/webapi/grabCssPropertyFromAll.mustache +0 -10
package/docs/webapi/grabCurrentUrl.mustache +0 -9
package/docs/webapi/grabCurrentWindowHandle.mustache +0 -6
package/docs/webapi/grabDataFromPerformanceTiming.mustache +0 -20
package/docs/webapi/grabElementBoundingRect.mustache +0 -20
package/docs/webapi/grabGeoLocation.mustache +0 -8
package/docs/webapi/grabHTMLFrom.mustache +0 -10
package/docs/webapi/grabHTMLFromAll.mustache +0 -9
package/docs/webapi/grabNumberOfOpenTabs.mustache +0 -8
package/docs/webapi/grabNumberOfVisibleElements.mustache +0 -9
package/docs/webapi/grabPageScrollPosition.mustache +0 -8
package/docs/webapi/grabPopupText.mustache +0 -5
package/docs/webapi/grabRecordedNetworkTraffics.mustache +0 -10
package/docs/webapi/grabSource.mustache +0 -8
package/docs/webapi/grabTextFrom.mustache +0 -10
package/docs/webapi/grabTextFromAll.mustache +0 -9
package/docs/webapi/grabTitle.mustache +0 -8
package/docs/webapi/grabValueFrom.mustache +0 -9
package/docs/webapi/grabValueFromAll.mustache +0 -8
package/docs/webapi/grabWebElement.mustache +0 -9
package/docs/webapi/grabWebElements.mustache +0 -9
package/docs/webapi/moveCursorTo.mustache +0 -16
package/docs/webapi/openNewTab.mustache +0 -7
package/docs/webapi/pressKey.mustache +0 -12
package/docs/webapi/pressKeyDown.mustache +0 -12
package/docs/webapi/pressKeyUp.mustache +0 -12
package/docs/webapi/pressKeyWithKeyNormalization.mustache +0 -60
package/docs/webapi/refreshPage.mustache +0 -6
package/docs/webapi/resizeWindow.mustache +0 -6
package/docs/webapi/rightClick.mustache +0 -14
package/docs/webapi/saveElementScreenshot.mustache +0 -10
package/docs/webapi/saveScreenshot.mustache +0 -12
package/docs/webapi/say.mustache +0 -10
package/docs/webapi/scrollIntoView.mustache +0 -11
package/docs/webapi/scrollPageToBottom.mustache +0 -6
package/docs/webapi/scrollPageToTop.mustache +0 -6
package/docs/webapi/scrollTo.mustache +0 -12
package/docs/webapi/see.mustache +0 -11
package/docs/webapi/seeAttributesOnElements.mustache +0 -9
package/docs/webapi/seeCheckboxIsChecked.mustache +0 -10
package/docs/webapi/seeCookie.mustache +0 -8
package/docs/webapi/seeCssPropertiesOnElements.mustache +0 -9
package/docs/webapi/seeCurrentPathEquals.mustache +0 -10
package/docs/webapi/seeCurrentUrlEquals.mustache +0 -11
package/docs/webapi/seeElement.mustache +0 -12
package/docs/webapi/seeElementInDOM.mustache +0 -8
package/docs/webapi/seeInCurrentUrl.mustache +0 -8
package/docs/webapi/seeInField.mustache +0 -17
package/docs/webapi/seeInPopup.mustache +0 -8
package/docs/webapi/seeInSource.mustache +0 -7
package/docs/webapi/seeInTitle.mustache +0 -8
package/docs/webapi/seeNumberOfElements.mustache +0 -11
package/docs/webapi/seeNumberOfVisibleElements.mustache +0 -10
package/docs/webapi/seeTextEquals.mustache +0 -9
package/docs/webapi/seeTitleEquals.mustache +0 -8
package/docs/webapi/seeTraffic.mustache +0 -36
package/docs/webapi/selectOption.mustache +0 -26
package/docs/webapi/setCookie.mustache +0 -16
package/docs/webapi/setGeoLocation.mustache +0 -12
package/docs/webapi/startRecordingTraffic.mustache +0 -8
package/docs/webapi/startRecordingWebSocketMessages.mustache +0 -8
package/docs/webapi/stopRecordingTraffic.mustache +0 -5
package/docs/webapi/stopRecordingWebSocketMessages.mustache +0 -7
package/docs/webapi/switchTo.mustache +0 -9
package/docs/webapi/switchToNextTab.mustache +0 -10
package/docs/webapi/switchToPreviousTab.mustache +0 -10
package/docs/webapi/type.mustache +0 -21
package/docs/webapi/uncheckOption.mustache +0 -13
package/docs/webapi/wait.mustache +0 -8
package/docs/webapi/waitForClickable.mustache +0 -11
package/docs/webapi/waitForCookie.mustache +0 -9
package/docs/webapi/waitForDetached.mustache +0 -10
package/docs/webapi/waitForDisabled.mustache +0 -6
package/docs/webapi/waitForElement.mustache +0 -11
package/docs/webapi/waitForEnabled.mustache +0 -6
package/docs/webapi/waitForFunction.mustache +0 -17
package/docs/webapi/waitForInvisible.mustache +0 -10
package/docs/webapi/waitForNumberOfTabs.mustache +0 -9
package/docs/webapi/waitForText.mustache +0 -13
package/docs/webapi/waitForValue.mustache +0 -10
package/docs/webapi/waitForVisible.mustache +0 -10
package/docs/webapi/waitInUrl.mustache +0 -9
package/docs/webapi/waitNumberOfVisibleElements.mustache +0 -10
package/docs/webapi/waitToHide.mustache +0 -10
package/docs/webapi/waitUrlEquals.mustache +0 -10
package/lib/helper/AI.js +0 -214
package/lib/plugin/pauseOn.js +0 -167
package/lib/plugin/stepByStepReport.js +0 -432
package/lib/plugin/subtitles.js +0 -89

package/bin/mcp-server.js CHANGED

@@ -1,18 +1,36 @@
+#!/usr/bin/env node
 import { Server } from '@modelcontextprotocol/sdk/server/index.js'
 import { StdioServerTransport } from '@modelcontextprotocol/sdk/server/stdio.js'
 import { CallToolRequestSchema, ListToolsRequestSchema } from '@modelcontextprotocol/sdk/types.js'
 import Codecept from '../lib/codecept.js'
 import container from '../lib/container.js'
 import { getParamsToString } from '../lib/parser.js'
-import { methodsOfObject } from '../lib/utils.js'
+import { methodsOfObject, safeStringify, truncateString } from '../lib/utils.js'
+import {
+  captureSnapshot,
+  pickActingHelper,
+  traceDirFor,
+  snapshotDirFor,
+  artifactsToFileUrls,
+  writeTraceMarkdown,
+  TraceReader,
+  ariaDiff,
+} from '../lib/utils/trace.js'
 import event from '../lib/event.js'
-import { fileURLToPath } from 'url'
+import recorder from '../lib/recorder.js'
+import WebElement from '../lib/element/WebElement.js'
+import { locate, within, session, secret, inject, pause } from '../lib/index.js'
+import { tryTo, retryTo, hopeThat } from '../lib/effects.js'
+import step from '../lib/steps.js'
+import { element, eachElement, expectElement, expectAnyElement, expectAllElements } from '../lib/els.js'
+import { setPauseHandler, pauseNow } from '../lib/pause.js'
+import { EventEmitter } from 'events'
+import { fileURLToPath, pathToFileURL } from 'url'
 import { dirname, resolve as resolvePath } from 'path'
 import path from 'path'
-import crypto from 'crypto'
 import { spawn } from 'child_process'
 import { createRequire } from 'module'
-import { existsSync, readdirSync, writeFileSync } from 'fs'
+import { existsSync, readdirSync } from 'fs'
 import { mkdirp } from 'mkdirp'
 const require = createRequire(import.meta.url)
@@ -23,6 +41,129 @@ const __dirname = dirname(__filename)
 let codecept = null
 let containerInitialized = false
 let browserStarted = false
+// Session-wide state shared by the tool handlers in this file.
+let shellSessionActive = false  // true between startShellSession() and endShellSession()
+let bootstrapDone = false  // true once codecept.bootstrap() has resolved (see ensureBootstrap)
+let currentPluginsSig = ''  // pluginsSignature() of the overrides the current container was built with
+let currentAiTraceDir = null  // mirrors the dir aiTrace plugin computes per test/session
+let aiTraceEnabled = false  // tracked across the session so tool responses can surface a hint when off
+// Recompute currentAiTraceDir every time a test is about to start so tool
+// responses can point at that test's trace directory.
+event.dispatcher.on(event.test.before, test => {
+  try {
+    // Prefer fullTitle() when the test object has one, then its plain title,
+    // and fall back to 'MCP Session' when neither yields a value.
+    const title = (test && (test.fullTitle ? test.fullTitle() : test.title)) || 'MCP Session'
+    currentAiTraceDir = traceDirFor(test?.file, title, outputBaseDir())
+  } catch {}  // best-effort: on failure the previously computed directory is kept
+})
+/**
+ * Hint text to attach to tool responses while the aiTrace plugin is off.
+ *
+ * @returns {string|undefined} undefined when `aiTraceEnabled` is true,
+ *   otherwise a message telling the agent how to turn the plugin on.
+ */
+function aiTraceHint() {
+  if (aiTraceEnabled) return undefined
+  return 'aiTrace plugin is disabled — re-run start_browser with plugins={ aiTrace: { enabled: true } } to capture per-step DOM/ARIA/console traces for debugging.'
+}
+/**
+ * Forward a title filter to the Mocha instance held by the container.
+ * Does nothing when `grep` is falsy or no usable Mocha instance is found.
+ *
+ * @param {string} [grep] - value handed to `mocha.grep()`
+ */
+function applyMochaGrep(grep) {
+  if (!grep) return
+  // container.mocha may be exposed either as an accessor function or as the instance itself.
+  const mocha = typeof container.mocha === 'function' ? container.mocha() : container.mocha
+  if (mocha && typeof mocha.grep === 'function') mocha.grep(grep)
+}
+/**
+ * Build the predicate that decides whether a step should trigger a pause.
+ *
+ * @param {number|string|null|undefined} pauseAt
+ *   - null/undefined: never matches
+ *   - number: matches the step whose index is strictly equal to it
+ *     (the run_test schema describes this index as 1-based)
+ *   - string of the form `/pattern/flags`: used as a regular expression
+ *   - any other string: case-insensitive literal substring match
+ * @returns {(idx: number, name: string) => boolean} matcher called once per step
+ * @throws {SyntaxError} when a `/pattern/flags` string is not a valid regular expression
+ */
+function pauseAtMatcher(pauseAt) {
+  if (pauseAt == null) return () => false
+  if (typeof pauseAt === 'number') return (idx) => idx === pauseAt
+  if (typeof pauseAt === 'string') {
+    const m = pauseAt.match(/^\/(.+)\/([gimsuy]*)$/)
+    // Escape every regex metacharacter, `*` included: without it "a*c" would
+    // match a bare "c" and a leading "*" would throw "Nothing to repeat".
+    const re = m ? new RegExp(m[1], m[2]) : new RegExp(pauseAt.replace(/[.*+?^${}()|[\]\\]/g, '\\$&'), 'i')
+    return (_idx, name) => {
+      // A user-supplied `g` or `y` flag makes test() resume from lastIndex;
+      // reset it so every step name is matched from its first character.
+      re.lastIndex = 0
+      return re.test(name)
+    }
+  }
+  return () => false
+}
+/**
+ * Run `codecept.bootstrap()` at most once per container.
+ * The flag is set only after bootstrap resolves, so a rejected bootstrap is
+ * attempted again on the next call.
+ * NOTE(review): assumes `codecept` has already been created — confirm every caller inits first.
+ */
+async function ensureBootstrap() {
+  if (bootstrapDone) return
+  await codecept.bootstrap()
+  bootstrapDone = true
+}
+/**
+ * Open a synthetic "MCP Session" so code can run outside a real test.
+ * No-op when a shell session is already active. Otherwise it bootstraps,
+ * starts the recorder, and emits suite.before / test.before with stub
+ * suite and test objects.
+ */
+async function startShellSession() {
+  if (shellSessionActive) return
+  await ensureBootstrap()
+  recorder.start()
+  // Stub suite: carries only the members provided here (fullTitle, tests, retries).
+  event.emit(event.suite.before, {
+    fullTitle: () => 'MCP Session',
+    tests: [],
+    retries: () => {},
+  })
+  // Stub test: no fullTitle(), so title-based consumers fall back to `title`.
+  event.emit(event.test.before, {
+    title: 'MCP Session',
+    artifacts: {},
+    retries: () => {},
+  })
+  shellSessionActive = true
+}
+/**
+ * Close the synthetic session opened by startShellSession.
+ * Emits test.after, suite.after and all.result with empty payloads. Each emit
+ * has its own try/catch so a throwing listener cannot block the later events
+ * or the flag reset. No-op when no shell session is active.
+ */
+async function endShellSession() {
+  if (!shellSessionActive) return
+  try { event.emit(event.test.after, {}) } catch {}
+  try { event.emit(event.suite.after, {}) } catch {}
+  try { event.emit(event.all.result, {}) } catch {}
+  shellSessionActive = false
+}
+/**
+ * Start a shell session unless one is already active or a test is currently
+ * paused (`pausedController` set), in which case nothing is started.
+ */
+async function ensureSession() {
+  if (shellSessionActive || pausedController) return
+  await startShellSession()
+}
+/**
+ * Normalize the `plugins` tool argument into a name → options map.
+ *
+ * @param {*} plugins - raw argument; anything falsy or non-object yields `{}`
+ * @returns {Object<string, *>} new object in which
+ *   - entries whose value is `false` are dropped,
+ *   - `true`, `null` and `undefined` values become `{}`,
+ *   - every other value is passed through by reference.
+ */
+function normalizePluginOverrides(plugins) {
+  if (!plugins || typeof plugins !== 'object') return {}
+  const out = {}
+  for (const [name, opts] of Object.entries(plugins)) {
+    // `false` is skipped rather than recorded, so it adds no override for that plugin.
+    if (opts === false) continue
+    out[name] = (opts === true || opts == null) ? {} : opts
+  }
+  return out
+}
+/**
+ * Merge plugin overrides into `config.plugins`, mutating `config` in place.
+ *
+ * Each override is shallow-merged over the project's existing entry for that
+ * plugin. The plugin is switched on automatically unless the override itself
+ * carries `enabled: false`, which lets a caller opt out of a plugin
+ * (for example `{ aiTrace: { enabled: false } }`).
+ *
+ * @param {object} config - loaded config; `config.plugins` is created when missing
+ * @param {Object<string, object>} plugins - overrides keyed by plugin name
+ */
+function applyPluginOverrides(config, plugins) {
+  config.plugins = config.plugins || {}
+  for (const [name, opts] of Object.entries(plugins)) {
+    // Only an explicit `enabled: false` in the override opts out. A project-level
+    // `enabled: false` is still overridden, so naming a plugin turns it on.
+    const enabled = opts?.enabled !== false
+    config.plugins[name] = { ...(config.plugins[name] || {}), ...opts, enabled }
+  }
+}
+/**
+ * Serialize a plugin-override map into a string used to detect changes.
+ * Top-level plugin names are sorted, so their order does not matter; the
+ * options objects are serialized as-is by JSON.stringify.
+ *
+ * @param {Object<string, *>} plugins
+ * @returns {string} JSON array of `[name, options]` pairs
+ */
+function pluginsSignature(plugins) {
+  const keys = Object.keys(plugins).sort()
+  return JSON.stringify(keys.map(k => [k, plugins[k]]))
+}
+/**
+ * Fully dispose of the current container so a fresh one can be created.
+ * No-op when no container is initialized. Closes the browser, then calls
+ * `codecept.teardown()` when it exists (its errors are swallowed).
+ */
+async function teardownContainer() {
+  if (!containerInitialized) return
+  try {
+    await closeBrowser()
+    try { if (codecept?.teardown) await codecept.teardown() } catch {}
+  } finally {
+    // Reset module state even if closeBrowser() threw, so later calls start clean.
+    containerInitialized = false
+    browserStarted = false
+    bootstrapDone = false
+    aiTraceEnabled = false
+    codecept = null
+    currentPluginsSig = ''
+  }
+}
+// Guards against running teardown more than once across the hooks below.
+let shutdownStarted = false
+/**
+ * Register process-level hooks that tear the container down on exit.
+ * SIGINT and SIGTERM run teardown and then exit explicitly; `beforeExit`
+ * runs teardown without forcing an exit.
+ */
+function installShutdownHooks() {
+  const onSignal = (signal) => {
+    if (shutdownStarted) return
+    shutdownStarted = true
+    // Exit whether or not teardown succeeded: 130 for SIGINT, 0 for any other signal.
+    teardownContainer().finally(() => process.exit(signal === 'SIGINT' ? 130 : 0))
+  }
+  process.on('SIGTERM', () => onSignal('SIGTERM'))
+  process.on('SIGINT', () => onSignal('SIGINT'))
+  process.on('beforeExit', () => {
+    if (shutdownStarted) return
+    shutdownStarted = true
+    // Teardown errors are ignored here; the process is already on its way out.
+    teardownContainer().catch(() => {})
+  })
+}
 let runLock = Promise.resolve()
 async function withLock(fn) {
@@ -224,19 +365,136 @@ async function resolveTestToFile({ cli, root, configPath, test }) {
   return fsFound ? normalizePath(fsFound) : null
 }
-function clearString(str) {
-  return str.replace(/[^a-zA-Z0-9]/g, '_')
+/**
+ * Base directory for generated artifacts.
+ *
+ * @returns {string} `global.output_dir` when set, otherwise `<cwd>/output`
+ */
+function outputBaseDir() {
+  return global.output_dir || resolvePath(process.cwd(), 'output')
+}
+// In-process pause coordination. When running code reaches pause(), the handler
+// registered below via setPauseHandler parks it on a promise, stores a
+// controller in `pausedController`, and emits 'paused' on `pauseEvents`.
+// Calling pausedController.resolveContinue() releases the pause; cancelRun()
+// does so when aborting. NOTE(review): the run_test / continue handlers are
+// not visible in this hunk — presumably they wait on 'paused' and call
+// resolveContinue(); confirm against the tool implementations.
+let pausedController = null  // non-null only while something is parked in pause()
+let pendingRunPromise = null
+let pendingRunResults = null
+let pendingRunCleanup = null
+let pendingTestFile = null
+let pendingStepInfo = null
+let abortRun = false  // while true, any new pause() is rejected instead of parked
+const pauseEvents = new EventEmitter()
+setPauseHandler(({ registeredVariables }) => {
+  // During cancelRun() a fresh pause must not park the run again.
+  if (abortRun) return Promise.reject(new Error('MCP session aborted'))
+  return new Promise(resolve => {
+    pausedController = {
+      registeredVariables,
+      resolveContinue: () => {
+        // Clear the controller before resolving so the run is no longer reported as paused.
+        pausedController = null
+        resolve()
+      },
+    }
+    pauseEvents.emit('paused')
+  })
+})
+/**
+ * Abort the paused or in-flight run, if there is one.
+ *
+ * @returns {Promise<boolean>} false when there was nothing to cancel, true otherwise
+ */
+async function cancelRun() {
+  if (!pendingRunPromise && !pausedController) return false
+  // Make the pause handler reject any further pause() while the run unwinds.
+  abortRun = true
+  if (typeof pendingRunCleanup === 'function') { try { pendingRunCleanup() } catch {} }
+  // Release a parked pause() so the run can proceed toward completion.
+  if (pausedController) { try { pausedController.resolveContinue() } catch {} ; pausedController = null }
+  if (pendingRunPromise) {
+    // Wait for the run to settle, but give up after 5 seconds; a rejected run is treated as settled.
+    try { await Promise.race([pendingRunPromise.catch(() => {}), new Promise(r => setTimeout(r, 5000))]) } catch {}
+  }
+  pendingRunPromise = null
+  pendingRunResults = null
+  pendingTestFile = null
+  pendingStepInfo = null
+  abortRun = false
+  return true
+}
+/**
+ * Stop browser activity while leaving the container itself initialized.
+ * No-op when no container exists. Cancels any pending run, ends the shell
+ * session, then calls `_cleanup` and `_finishTest` on every helper that has
+ * them. Clears `browserStarted` but does not touch `containerInitialized`.
+ */
+async function closeBrowser() {
+  if (!containerInitialized) return
+  await cancelRun()
+  await endShellSession()
+  for (const helper of Object.values(container.helpers() || {})) {
+    // Each hook is isolated so one failing helper does not stop the others.
+    try { if (helper._cleanup) await helper._cleanup() } catch {}
+    try { if (helper._finishTest) await helper._finishTest() } catch {}
+  }
+  browserStarted = false
+}
+/**
+ * Capture a snapshot of the current page through the acting helper.
+ *
+ * @param {string} [prefix='pause'] - prefix passed to captureSnapshot
+ * @returns {Promise<object>} `{}` when no acting helper is available, otherwise
+ *   the result of artifactsToFileUrls() for the captured snapshot
+ */
+async function captureLiveArtifacts(prefix = 'pause') {
+  const helper = pickActingHelper(container.helpers())
+  if (!helper) return {}
+  const dir = snapshotDirFor(outputBaseDir())
+  // Ensure the snapshot directory exists before capturing into it.
+  mkdirp.sync(dir)
+  const captured = await captureSnapshot(helper, { dir, prefix })
+  return artifactsToFileUrls(captured, dir)
+}
+/**
+ * Collect a small summary of the current page from the acting helper.
+ * Every probe is best-effort: a helper method that is missing or throws just
+ * leaves its field out of the result.
+ *
+ * @returns {Promise<{url?: *, title?: *, contentSize?: number|null}>}
+ *   `{}` when no acting helper is available
+ */
+async function gatherPageBrief() {
+  const helper = pickActingHelper(container.helpers())
+  if (!helper) return {}
+  const out = {}
+  try { if (helper.grabCurrentUrl) out.url = await helper.grabCurrentUrl() } catch {}
+  try { if (helper.grabTitle) out.title = await helper.grabTitle() } catch {}
+  try {
+    if (helper.grabSource) {
+      const html = await helper.grabSource()
+      // Report only the size of the page source; null when it is not a string.
+      out.contentSize = typeof html === 'string' ? html.length : null
+    }
+  } catch {}
+  return out
+}
+/**
+ * Build the final response for a finished run and clear the pending-run state.
+ *
+ * @param {string} [errorMessage] - error to report; when absent and no results
+ *   were recorded, a generic "no tests ran" error is used instead
+ * @returns {{status: string, aiTraceDir: *, reporterJson: object, error: string|null, aiTraceHint: string|undefined}}
+ *   `status` is 'failed' whenever `error` is set, otherwise 'completed'
+ */
+function collectRunCompletion(errorMessage) {
+  const results = pendingRunResults || []
+  const stats = {
+    tests: results.length,
+    passes: results.filter(r => r.status === 'passed').length,
+    failures: results.filter(r => r.status === 'failed').length,
+  }
+  // Results are already copied into `results`, so the pending state can be dropped now.
+  if (typeof pendingRunCleanup === 'function') pendingRunCleanup()
+  pendingRunPromise = null
+  pendingRunResults = null
+  pendingTestFile = null
+  pendingStepInfo = null
+  let error = errorMessage || null
+  // An empty result list with no error is reported as a failure, not a silent success.
+  if (!error && results.length === 0) {
+    error = 'No tests ran and no error was reported. The Mocha instance may have been disposed (set mocha.cleanReferencesAfterRun=false in config) or the test file matched no scenarios.'
+  }
+  return {
+    status: error ? 'failed' : 'completed',
+    aiTraceDir: currentAiTraceDir,
+    reporterJson: { stats, tests: results },
+    error,
+    aiTraceHint: aiTraceHint(),
+  }
 }
-function getTraceDir(testTitle, testFile) {
-  const hash = crypto.createHash('sha256').update(testFile + testTitle).digest('hex').slice(0, 8)
-  const cleanTitle = clearString(testTitle).slice(0, 200)
-  const outputDir = global.output_dir || resolvePath(process.cwd(), 'output')
-  return resolvePath(outputDir, `trace_${cleanTitle}_${hash}`)
+/**
+ * Build the response returned while a run is paused.
+ *
+ * @returns {{status: 'paused', file: *, aiTraceDir: *, pausedAfter: *, suggestions: string[]}}
+ *   current pending test file, trace directory and last step info, plus
+ *   next-action suggestions for the agent
+ */
+function pausedPayload() {
+  return {
+    status: 'paused',
+    file: pendingTestFile,
+    aiTraceDir: currentAiTraceDir,
+    pausedAfter: pendingStepInfo,
+    suggestions: [
+      'Call snapshot to capture URL/HTML/ARIA/screenshot/console/storage at this point',
+      'Call run_code to inspect or manipulate state (e.g. return await I.grabText("h1"))',
+      'Call continue to release the pause and let the test run the next step (or finish)',
+      'Query a saved step snapshot offline: codeceptq <locator> --file <aiTraceDir>/<NNNN>_<step>_page.html',
+    ],
+  }
 }
-async function initCodecept(configPath) {
-  if (containerInitialized) return
+async function initCodecept(configPath, pluginOverrides) {
+  const plugins = normalizePluginOverrides(pluginOverrides)
+  const sig = pluginsSignature(plugins)
+  if (containerInitialized) {
+    if (!Object.keys(plugins).length || sig === currentPluginsSig) return
+    await teardownContainer()
+  }
   const testRoot = process.env.CODECEPTJS_PROJECT_DIR || process.cwd()
@@ -261,13 +519,27 @@ async function initCodecept(configPath) {
   const { getConfig } = await import('../lib/command/utils.js')
   const config = await getConfig(configPath)
+  // aiTrace is the canonical per-step ARIA/HTML/screenshot capture for MCP.
+  // Always on so run_code / continue can read the latest snapshot from disk
+  // instead of double-capturing through grabAriaSnapshot etc.
+  applyPluginOverrides(config, { aiTrace: { on: 'step' }, browser: { show: false }, ...plugins })
   codecept = new Codecept(config, {})
   await codecept.init(testRoot)
-  await container.create(config, {})
   await container.started()
   containerInitialized = true
   browserStarted = true
+  aiTraceEnabled = config.plugins?.aiTrace?.enabled === true
+  currentPluginsSig = sig
+}
+/**
+ * Convert WebElement results into their `describe()` output.
+ *
+ * @param {*} value - a WebElement, an array, or anything else
+ * @returns {Promise<*>} `describe()` output for a single WebElement; an array
+ *   of `describe()` outputs for a non-empty array made up only of WebElements;
+ *   otherwise `value` unchanged (including empty and mixed arrays)
+ */
+async function formatReturnValue(value) {
+  if (value instanceof WebElement) return await value.describe()
+  if (Array.isArray(value) && value.length && value.every(v => v instanceof WebElement)) {
+    return await Promise.all(value.map(v => v.describe()))
+  }
+  return value
 }
 const server = new Server(
@@ -275,66 +547,124 @@ const server = new Server(
   { capabilities: { tools: {} } }
 )
+// Shared JSON-schema fragment for the `plugins` argument, reused by the tool
+// definitions that accept plugin overrides.
+const PLUGINS_PROP = {
+  type: 'object',
+  description: 'Plugin configs to enable for this session, keyed by plugin name. Same shape as `plugins` in codecept.conf.js — each value is the plugin\'s config object (`enabled: true` is added automatically). Common entries:\n' +
+    '  • { browser: { show: true } } — visible browser (headed)\n' +
+    '  • { browser: { show: false } } — headless\n' +
+    '  • { browser: { browser: "firefox", windowSize: "1280x720" } } — switch browser + viewport\n' +
+    '  • { pause: { on: "fail" } } / { screenshot: { on: "step" } } / { aiTrace: {} }\n' +
+    'Override or add to whatever the project config already enables.',
+  additionalProperties: { type: 'object' },
+}
+// Shared JSON-schema fragment for the `config` argument (path to the config file).
+const CONFIG_PROP = {
+  type: 'string',
+  description: 'Path to codecept.conf.js (or .cjs). Defaults to $CODECEPTJS_CONFIG, then ./codecept.conf.js in $CODECEPTJS_PROJECT_DIR or cwd. Only needed for projects with a non-standard config location.',
+}
 server.setRequestHandler(ListToolsRequestSchema, async () => ({
   tools: [
     {
       name: 'list_tests',
-      description: 'List all tests in the CodeceptJS project',
-      inputSchema: { type: 'object', properties: { config: { type: 'string' } } },
+      description: 'List all tests in the CodeceptJS project. Uses the active session if start_browser was called, otherwise auto-inits with project defaults.',
+      inputSchema: { type: 'object', properties: {} },
     },
     {
       name: 'list_actions',
-      description: 'List all available CodeceptJS actions (I.* methods)',
-      inputSchema: { type: 'object', properties: { config: { type: 'string' } } },
+      description: 'List all available CodeceptJS actions (I.* methods). Uses the active session if start_browser was called, otherwise auto-inits with project defaults.',
+      inputSchema: { type: 'object', properties: {} },
     },
     {
       name: 'run_code',
-      description: 'Run arbitrary CodeceptJS code.',
+      description: 'Run arbitrary CodeceptJS code. Response includes `availableObjects` listing every symbol in scope (I, helpers, container, step, tryTo, within, etc.).',
       inputSchema: {
         type: 'object',
         properties: {
           code: { type: 'string' },
           timeout: { type: 'number' },
-          config: { type: 'string' },
           saveArtifacts: { type: 'boolean' },
+          settleMs: { type: 'number', description: 'Wait N ms after the code finishes before capturing artifacts. Default 300. Set higher (1000+) when actions trigger slow re-renders, or 0 to skip.' },
         },
         required: ['code'],
       },
     },
     {
       name: 'run_test',
-      description: 'Run a specific test.',
+      description: 'Run a specific test. Returns reporter JSON with one entry per scenario; each entry has a `traceFile` (file:// URL) pointing to the aiTrace markdown for that scenario — Read it on failures to see the failing step\'s DOM/ARIA/screenshot. If aiTrace is disabled the response includes an `aiTraceHint`. If the test calls pause() — or if pauseAt is set and reached — returns early with status "paused" so the agent can inspect via run_code and release with continue. To learn step indices for pauseAt, call run_step_by_step first. Auto-inits with project defaults if no session is active — call start_browser first to customize launch (e.g. plugins={ browser: { show: true } } to watch the run).',
       inputSchema: {
         type: 'object',
         properties: {
           test: { type: 'string' },
           timeout: { type: 'number' },
-          config: { type: 'string' },
+          grep: { type: 'string', description: 'Filter scenarios by title (passed to mocha.grep). Mirrors --grep on the CLI.' },
+          pauseAt: {
+            description: 'Programmatic breakpoint. Either a 1-based step index (number) or a step-name match (string — substring case-insensitive, or `/regex/i` literal). Examples: 5 / "fill field" / "/grab.*url/i".',
+            oneOf: [{ type: 'number' }, { type: 'string' }],
+          },
+          plugins: PLUGINS_PROP,
         },
         required: ['test'],
       },
     },
     {
       name: 'run_step_by_step',
-      description: 'Run a test step by step with pauses between steps.',
+      description: 'Run a test interactively, pausing after every step. Returns paused payload after the first step (URL/title/contentSize, last step info, suggestions). Call continue to advance one step (and re-pause), or run_code/snapshot to inspect state. On completion each scenario in `reporterJson.tests[]` has a `traceFile` (file:// URL) for the per-step aiTrace markdown — Read it for the full execution log. Much more useful when start_browser was called with plugins={ browser: { show: true } } so you can watch what happens between pauses.',
       inputSchema: {
         type: 'object',
         properties: {
           test: { type: 'string' },
           timeout: { type: 'number' },
-          config: { type: 'string' },
+          grep: { type: 'string', description: 'Filter scenarios by title (passed to mocha.grep). Mirrors --grep on the CLI.' },
+          plugins: PLUGINS_PROP,
         },
         required: ['test'],
       },
     },
     {
       name: 'start_browser',
-      description: 'Start the browser session.',
-      inputSchema: { type: 'object', properties: { config: { type: 'string' } } },
+      description: 'Start the session — initializes the codeceptjs container, loads helpers, and applies any plugin overrides. This is the only tool that customizes initialization; every other tool either uses the active session or auto-inits with project defaults.\n\n' +
+        'MCP enforces two plugin defaults so the agent gets useful telemetry:\n' +
+        '  • aiTrace: { on: "step", enabled: true } — per-step DOM/ARIA/console/screenshot traces for debugging\n' +
+        '  • browser: { show: false, enabled: true } — headless by default\n' +
+        'Both can be overridden via the `plugins` arg. To watch the run live: plugins={ browser: { show: true } }. To skip per-step trace overhead on a re-run: plugins={ aiTrace: { enabled: false } } (or { on: "fail" } to only capture failures). To switch config or plugins mid-session, call stop_browser first.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          config: CONFIG_PROP,
+          plugins: PLUGINS_PROP,
+        },
+      },
     },
     {
       name: 'stop_browser',
-      description: 'Stop the browser session.',
+      description: 'Stop the session, close browsers, and tear down the container. Required before re-initing with different config or plugins.',
+      inputSchema: { type: 'object', properties: {} },
+    },
+    {
+      name: 'snapshot',
+      description: 'Capture current browser state (HTML, ARIA, screenshot, console, URL) without performing any action. Returns `traceFile` (file:// URL) to a markdown trace bundling the captured artifacts — Read it for full context. Auto-inits with project defaults if no session is active.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          fullPage: { type: 'boolean' },
+          settleMs: { type: 'number', description: 'Wait N ms before capturing. Default 300. Set higher when the previous action is still re-rendering, or 0 to skip.' },
+        },
+      },
+    },
+    {
+      name: 'continue',
+      description: 'Release a paused test (one that called pause() during run_test) and let it run to completion. Returns the final reporter result. Use run_code to inspect or manipulate state while the test is paused — both tools share the same container.',
+      inputSchema: {
+        type: 'object',
+        properties: {
+          timeout: { type: 'number' },
+        },
+      },
+    },
+    {
+      name: 'cancel',
+      description: 'Abort the currently paused or in-progress test run without closing the browser. Use when you want to bail out of a paused test and start something else without going through stop_browser/start_browser. The browser session and Mocha state stay alive.',
       inputSchema: { type: 'object', properties: {} },
     },
   ],
@@ -346,8 +676,7 @@ server.setRequestHandler(CallToolRequestSchema, async (request) => {
   try {
     switch (name) {
       case 'list_tests': {
-        const configPath = args?.config
-        await initCodecept(configPath)
+        await initCodecept()
         codecept.loadTests()
         const tests = codecept.testFiles.map(testFile => {
@@ -362,8 +691,7 @@ server.setRequestHandler(CallToolRequestSchema, async (request) => {
       }
       case 'list_actions': {
-        const configPath = args?.config
-        await initCodecept(configPath)
+        await initCodecept()
         const helpers = container.helpers()
         const supportI = container.support('I')
@@ -391,225 +719,433 @@ server.setRequestHandler(CallToolRequestSchema, async (request) => {
       }
       case 'start_browser': {
-        const configPath = args?.config
-        if (browserStarted) {
-          return { content: [{ type: 'text', text: JSON.stringify({ status: 'Browser already started' }, null, 2) }] }
+        const { config: configPath, plugins } = args || {}
+        if (browserStarted && shellSessionActive) {
+          return { content: [{ type: 'text', text: JSON.stringify({ status: 'Session already active', plugins: plugins ?? null }, null, 2) }] }
+        }
+        await initCodecept(configPath, plugins)
+        if (containerInitialized && !browserStarted) {
+          for (const helper of Object.values(container.helpers() || {})) {
+            try { if (helper._beforeSuite) await helper._beforeSuite() } catch {}
+          }
+          browserStarted = true
         }
-        await initCodecept(configPath)
-        return { content: [{ type: 'text', text: JSON.stringify({ status: 'Browser started successfully' }, null, 2) }] }
+        await startShellSession()
+        return { content: [{ type: 'text', text: JSON.stringify({ status: 'Session started — run_code and snapshot are now available', plugins: plugins ?? null }, null, 2) }] }
       }
       case 'stop_browser': {
         if (!containerInitialized) {
           return { content: [{ type: 'text', text: JSON.stringify({ status: 'Browser not initialized' }, null, 2) }] }
         }
+        await closeBrowser()
+        return { content: [{ type: 'text', text: JSON.stringify({ status: 'Browser stopped — Mocha and config preserved; call start_browser to reopen' }, null, 2) }] }
+      }
-        const helpers = container.helpers()
-        for (const helperName in helpers) {
-          const helper = helpers[helperName]
-          try { if (helper._finish) await helper._finish() } catch {}
+      case 'snapshot': {
+        const { fullPage = false, settleMs = 300 } = args || {}
+        await initCodecept()
+        await ensureSession()
+        const helper = pickActingHelper(container.helpers())
+        if (!helper) throw new Error('No supported acting helper available (Playwright, Puppeteer, WebDriver).')
+        const dir = snapshotDirFor(outputBaseDir())
+        mkdirp.sync(dir)
+        if (settleMs > 0) await new Promise(r => setTimeout(r, settleMs))
+        const captured = await captureSnapshot(helper, { dir, prefix: 'snapshot', fullPage })
+        const traceFile = writeTraceMarkdown({
+          dir,
+          title: 'snapshot',
+          file: 'mcp',
+          durationMs: 0,
+          commands: [],
+          captured,
+        })
+        return {
+          content: [{
+            type: 'text',
+            text: JSON.stringify({
+              status: 'success',
+              dir,
+              traceFile: pathToFileURL(traceFile).href,
+              artifacts: artifactsToFileUrls(captured, dir),
+              aiTraceHint: aiTraceHint(),
+            }, null, 2),
+          }],
         }
+      }
+      case 'continue': {
+        if (!pausedController) throw new Error('No paused test. Run a test first via run_test or run_step_by_step; this tool becomes available if the test pauses.')
+        const { timeout = 60000 } = args || {}
+        return await withSilencedIO(async () => {
+          pausedController.resolveContinue()
+          if (!pendingRunPromise) {
+            return { content: [{ type: 'text', text: JSON.stringify({ status: 'continued' }, null, 2) }] }
+          }
+          // Race: test pauses again (step-by-step or another pause()) vs test finishes.
+          const pausedAgain = new Promise(resolve => pauseEvents.once('paused', () => resolve('paused')))
+          const completed = pendingRunPromise.then(() => 'completed', () => 'completed')
+          const which = await Promise.race([
+            pausedAgain,
+            completed,
+            new Promise((_, reject) => setTimeout(() => reject(new Error(`Timeout after ${timeout}ms`)), timeout)),
+          ])
-        browserStarted = false
-        containerInitialized = false
+          if (which === 'paused') {
+            const page = await gatherPageBrief()
+            return { content: [{ type: 'text', text: JSON.stringify({ ...pausedPayload(), page }, null, 2) }] }
+          }
+          let runError = null
+          try { await pendingRunPromise } catch (err) { runError = err }
+          const file = pendingTestFile
+          const final = collectRunCompletion(runError?.message)
+          return { content: [{ type: 'text', text: JSON.stringify({ ...final, file }, null, 2) }] }
+        })
+      }
-        return { content: [{ type: 'text', text: JSON.stringify({ status: 'Browser stopped successfully' }, null, 2) }] }
+      case 'cancel': {
+        const cancelled = await cancelRun()
+        await ensureSession()
+        return { content: [{ type: 'text', text: JSON.stringify({ status: cancelled ? 'Run cancelled — browser kept open' : 'No run in progress' }, null, 2) }] }
       }
       case 'run_code': {
-        const { code, timeout = 60000, config: configPath, saveArtifacts = true } = args
-        await initCodecept(configPath)
+        const { code, timeout = 60000, saveArtifacts = true, settleMs = 300 } = args
+        await initCodecept()
+        await ensureSession()
+        const support = container.supportObjects() || {}
+        if (!support.I) throw new Error('I object not available. Make sure helpers are configured.')
+        const result = { status: 'unknown', output: '', error: null, commands: [], artifacts: {} }
+        const commands = []
+        let lastStepValue
+        const onStepAfter = step => {
+          try { commands.push(step.toString()) } catch {}
+        }
+        const onStepPassed = (step, val) => {
+          if (val !== undefined) lastStepValue = val
+        }
+        event.dispatcher.on(event.step.after, onStepAfter)
+        event.dispatcher.on(event.step.passed, onStepPassed)
+        const traceDir = traceDirFor(`mcp_${Date.now()}`, 'run_code', outputBaseDir())
+        mkdirp.sync(traceDir)
+        const startedAt = Date.now()
+        // Pin the latest aiTrace ARIA file before running the code, so we
+        // can diff after. aiTrace owns per-step capture; we just read it.
+        const reader = new TraceReader(currentAiTraceDir)
+        const ariaBefore = reader.last('aria')
+        const MAX_LOG_ENTRIES = 100
+        const MAX_LOG_MSG_BYTES = 2000
+        const MAX_RETURN_BYTES = 20000
+        const consoleLogs = []
+        const consoleMethods = ['log', 'info', 'warn', 'error', 'debug']
+        const origConsoleMethods = {}
+        const captureLog = level => (...args) => {
+          if (consoleLogs.length >= MAX_LOG_ENTRIES) return
+          const message = args.map(a => {
+            if (typeof a === 'string') return a
+            return truncateString(safeStringify(a, [], 2), MAX_LOG_MSG_BYTES).value
+          }).join(' ')
+          consoleLogs.push({ level, message, t: Date.now() - startedAt })
+        }
+        for (const m of consoleMethods) {
+          origConsoleMethods[m] = console[m]
+          console[m] = captureLog(m)
+        }
-        const I = container.support('I')
-        if (!I) throw new Error('I object not available. Make sure helpers are configured.')
+        const scope = {
+          locate, within, session, secret, inject, pause, share: container.share,
+          tryTo, retryTo, hopeThat,
+          step, element, eachElement, expectElement, expectAnyElement, expectAllElements,
+          container, helpers: container.helpers(),
+          ...support,
+        }
+        const paramNames = ['I', ...Object.keys(scope).filter(k => k !== 'I').sort()]
+        const paramValues = paramNames.map(k => scope[k])
-        const result = { status: 'unknown', output: '', error: null, artifacts: {} }
+        const wasPaused = !!pausedController
+        if (wasPaused) recorder.session.start('mcp_run_code')
+        let returnValue
         try {
-          const asyncFn = new Function('I', `return (async () => { ${code} })()`)
-          await Promise.race([
-            asyncFn(I),
+          const asyncFn = new Function(...paramNames, `return (async () => { ${code} })()`)
+          returnValue = await Promise.race([
+            asyncFn(...paramValues),
             new Promise((_, reject) => setTimeout(() => reject(new Error(`Timeout after ${timeout}ms`)), timeout)),
           ])
+          await recorder.promise()
           result.status = 'success'
           result.output = 'Code executed successfully'
-          if (saveArtifacts) {
-            const helpers = container.helpers()
-            const helper = Object.values(helpers)[0]
-            if (helper) {
-              try {
-                const traceDir = getTraceDir('mcp', 'run_code')
-                mkdirp.sync(traceDir)
-                if (helper.grabAriaSnapshot) {
-                  const aria = await helper.grabAriaSnapshot()
-                  const ariaFile = path.join(traceDir, 'aria.txt')
-                  writeFileSync(ariaFile, aria)
-                  result.artifacts.aria = `file://${ariaFile}`
-                }
-                if (helper.grabCurrentUrl) {
-                  result.artifacts.url = await helper.grabCurrentUrl()
-                }
-                if (helper.grabBrowserLogs) {
-                  const logs = (await helper.grabBrowserLogs()) || []
-                  const logsFile = path.join(traceDir, 'console.json')
-                  writeFileSync(logsFile, JSON.stringify(logs, null, 2))
-                  result.artifacts.consoleLogs = `file://${logsFile}`
-                }
-                if (helper.grabSource) {
-                  const html = await helper.grabSource()
-                  const htmlFile = path.join(traceDir, 'page.html')
-                  writeFileSync(htmlFile, html)
-                  result.artifacts.html = `file://${htmlFile}`
-                }
-                if (helper.saveScreenshot) {
-                  const screenshotFile = path.join(traceDir, 'screenshot.png')
-                  await helper.saveScreenshot(screenshotFile)
-                  result.artifacts.screenshot = `file://${screenshotFile}`
-                }
-              } catch (e) {
-                result.output += ` (Warning: ${e.message})`
-              }
-            }
-          }
         } catch (error) {
           result.status = 'failed'
           result.error = error.message
           result.output = error.stack || error.message
+        } finally {
+          for (const m of consoleMethods) console[m] = origConsoleMethods[m]
+          try { event.dispatcher.removeListener(event.step.after, onStepAfter) } catch {}
+          try { event.dispatcher.removeListener(event.step.passed, onStepPassed) } catch {}
+          if (wasPaused) {
+            try { recorder.session.restore('mcp_run_code') } catch {}
+          } else {
+            try { recorder.reset() } catch {}
+          }
+        }
+        result.commands = commands
+        result.logs = consoleLogs
+        if (consoleLogs.length === MAX_LOG_ENTRIES) result.logsTruncated = true
+        result.availableObjects = paramNames
+        if (returnValue === undefined) returnValue = await Promise.resolve(lastStepValue)
+        returnValue = await formatReturnValue(returnValue)
+        if (returnValue !== undefined) {
+          const json = typeof returnValue === 'string' ? returnValue : safeStringify(returnValue, [], 2)
+          const stringified = truncateString(json, MAX_RETURN_BYTES)
+          result.returnValue = stringified.value
+          if (stringified.truncated) result.returnValueTruncated = true
         }
+        let captured = {}
+        if (saveArtifacts) {
+          const helper = pickActingHelper(container.helpers())
+          if (helper) {
+            try {
+              if (settleMs > 0) await new Promise(r => setTimeout(r, settleMs))
+              captured = await captureSnapshot(helper, { dir: traceDir, prefix: 'mcp' })
+              result.artifacts = artifactsToFileUrls(captured, traceDir)
+            } catch (e) {
+              result.output += ` (Warning: ${e.message})`
+            }
+          }
+        }
+        // Diff against the latest aiTrace ARIA file produced by the steps
+        // that just ran inside this run_code call.
+        const ariaAfter = reader.last('aria')
+        if (ariaBefore && ariaAfter && ariaBefore !== ariaAfter) {
+          const diff = ariaDiff(ariaBefore, ariaAfter)
+          if (diff) result.ariaDiff = diff
+        }
+        const traceFile = writeTraceMarkdown({
+          dir: traceDir,
+          title: 'run_code',
+          file: 'mcp',
+          durationMs: Date.now() - startedAt,
+          commands,
+          captured,
+          error: result.error,
+        })
+        result.dir = traceDir
+        result.traceFile = pathToFileURL(traceFile).href
+        result.aiTraceHint = aiTraceHint()
         return { content: [{ type: 'text', text: JSON.stringify(result, null, 2) }] }
       }
       case 'run_test': {
         return await withLock(async () => {
-          const { test, timeout = 60000, config: configPathArg } = args || {}
-          const { configPath, configDir } = resolveConfigPath(configPathArg)
-          const { cli, root } = findCodeceptCliUpwards(configDir)
-          const isNodeScript = cli.endsWith('.js')
+          if (pausedController) {
+            throw new Error('A previous run_test is still paused. Call "continue" first.')
+          }
+          const { test, timeout = 60000, pauseAt, grep, plugins } = args || {}
+          await initCodecept(undefined, plugins)
+          await endShellSession()
+          applyMochaGrep(grep)
+          return await withSilencedIO(async () => {
+            codecept.loadTests()
+            let testFiles = codecept.testFiles
+            if (test) {
+              const testName = normalizePath(test).toLowerCase()
+              testFiles = codecept.testFiles.filter(f => {
+                const filePath = normalizePath(f).toLowerCase()
+                return filePath.includes(testName) || filePath.endsWith(testName)
+              })
+            }
-          const resolvedFile = await resolveTestToFile({ cli, root, configPath, test })
-          const runArgs = ['run', '--config', configPath, '--reporter', 'json']
+            if (!testFiles.length) throw new Error(`No tests found matching: ${test}`)
+            const testFile = testFiles[0]
+            pendingRunResults = []
+            pendingTestFile = testFile
+            pendingStepInfo = null
+            let stepIndex = 0
+            const matchPauseAt = pauseAtMatcher(pauseAt)
+            const onAfter = t => {
+              const aiTrace = t.artifacts?.aiTrace
+              pendingRunResults.push({
+                title: t.title,
+                file: t.file,
+                status: t.err ? 'failed' : 'passed',
+                error: t.err?.message,
+                duration: t.duration,
+                traceFile: aiTrace ? pathToFileURL(aiTrace).href : null,
+              })
+            }
+            const onStepAfter = step => {
+              stepIndex += 1
+              const idx = stepIndex
+              const name = (() => { try { return step.toString() } catch { return '' } })()
+              recorder.add('mcp pause info', () => {
+                pendingStepInfo = { index: idx, name, status: step.status }
+              })
+              if (matchPauseAt(idx, name)) pauseNow()
+            }
+            event.dispatcher.on(event.test.after, onAfter)
+            event.dispatcher.on(event.step.after, onStepAfter)
+            pendingRunCleanup = () => {
+              try { event.dispatcher.removeListener(event.test.after, onAfter) } catch {}
+              try { event.dispatcher.removeListener(event.step.after, onStepAfter) } catch {}
+              pendingRunCleanup = null
+            }
-          if (resolvedFile) runArgs.push(resolvedFile)
-          else if (looksLikePath(test)) runArgs.push(test)
-          else runArgs.push('--grep', String(test))
+            let runError = null
+            const runPromise = (async () => {
+              try {
+                await ensureBootstrap()
+                await codecept.run(testFile)
+              } catch (err) {
+                runError = err
+                throw err
+              }
+            })()
-          const res = isNodeScript
-            ? await runCmd(process.execPath, [cli, ...runArgs], { cwd: root, timeout })
-            : await runCmd(cli, runArgs, { cwd: root, timeout })
+            const pausedPromise = new Promise(resolve => pauseEvents.once('paused', () => resolve('paused')))
+            const completedPromise = runPromise.then(() => 'completed', () => 'completed')
-          const { code, out, err } = res
+            const which = await Promise.race([
+              completedPromise,
+              pausedPromise,
+              new Promise((_, reject) => setTimeout(() => reject(new Error(`Timeout after ${timeout}ms`)), timeout)),
+            ])
-          let parsed = null
-          const jsonStart = out.indexOf('{')
-          const jsonEnd = out.lastIndexOf('}')
-          if (jsonStart !== -1 && jsonEnd !== -1 && jsonEnd > jsonStart) {
-            try { parsed = JSON.parse(out.slice(jsonStart, jsonEnd + 1)) } catch {}
-          }
+            if (which === 'paused') {
+              pendingRunPromise = runPromise
+              const page = await gatherPageBrief()
+              return {
+                content: [{
+                  type: 'text',
+                  text: JSON.stringify({ ...pausedPayload(), page }, null, 2),
+                }],
+              }
+            }
-          return {
-            content: [{
-              type: 'text',
-              text: JSON.stringify({
-                meta: { exitCode: code, cli, root, configPath, args: runArgs, resolvedFile: resolvedFile || null },
-                reporterJson: parsed,
-                stderr: err ? err.slice(0, 20000) : '',
-                rawStdout: parsed ? '' : out.slice(0, 20000),
-              }, null, 2),
-            }],
-          }
+            const final = collectRunCompletion(runError?.message)
+            await startShellSession()
+            return { content: [{ type: 'text', text: JSON.stringify({ ...final, file: testFile }, null, 2) }] }
+          })
         })
       }
       case 'run_step_by_step': {
-        const { test, timeout = 60000, config: configPath } = args
-        await initCodecept(configPath)
-        return await withSilencedIO(async () => {
-          codecept.loadTests()
-          let testFiles = codecept.testFiles
-          if (test) {
-            const testName = normalizePath(test).toLowerCase()
-            testFiles = codecept.testFiles.filter(f => {
-              const filePath = normalizePath(f).toLowerCase()
-              return filePath.includes(testName) || filePath.endsWith(testName)
-            })
-          }
-          if (!testFiles.length) throw new Error(`No tests found matching: ${test}`)
-          const results = []
-          const currentSteps = {}
-          let currentTestTitle = null
-          const testFile = testFiles[0]
-          const onBefore = (t) => {
-            const traceDir = getTraceDir(t.title, t.file)
-            currentTestTitle = t.title
-            currentSteps[t.title] = []
-            results.push({
-              test: t.title,
-              file: t.file,
-              traceFile: `file://${resolvePath(traceDir, 'trace.md')}`,
-              status: 'running',
-              steps: [],
-            })
+        return await withLock(async () => {
+          if (pausedController) {
+            throw new Error('A previous run is still paused. Call "continue" first.')
           }
+          const { test, timeout = 60000, grep, plugins } = args || {}
+          await initCodecept(undefined, plugins)
+          await endShellSession()
+          applyMochaGrep(grep)
+          return await withSilencedIO(async () => {
+            codecept.loadTests()
+            let testFiles = codecept.testFiles
+            if (test) {
+              const testName = normalizePath(test).toLowerCase()
+              testFiles = codecept.testFiles.filter(f => {
+                const filePath = normalizePath(f).toLowerCase()
+                return filePath.includes(testName) || filePath.endsWith(testName)
+              })
+            }
-          const onAfter = (t) => {
-            const r = results.find(x => x.test === t.title)
-            if (r) {
-              r.status = t.err ? 'failed' : 'completed'
-              if (t.err) r.error = t.err.message
+            if (!testFiles.length) throw new Error(`No tests found matching: ${test}`)
+            const testFile = testFiles[0]
+            pendingRunResults = []
+            pendingTestFile = testFile
+            pendingStepInfo = null
+            let stepIndex = 0
+            const onAfter = t => {
+              const aiTrace = t.artifacts?.aiTrace
+              pendingRunResults.push({
+                title: t.title,
+                file: t.file,
+                status: t.err ? 'failed' : 'passed',
+                error: t.err?.message,
+                duration: t.duration,
+                traceFile: aiTrace ? pathToFileURL(aiTrace).href : null,
+              })
+            }
+            const onStepAfter = step => {
+              stepIndex += 1
+              const idx = stepIndex
+              const name = (() => { try { return step.toString() } catch { return '' } })()
+              recorder.add('mcp pause info', () => {
+                pendingStepInfo = { index: idx, name, status: step.status }
+              })
+              pauseNow()
+            }
+            event.dispatcher.on(event.test.after, onAfter)
+            event.dispatcher.on(event.step.after, onStepAfter)
+            pendingRunCleanup = () => {
+              try { event.dispatcher.removeListener(event.test.after, onAfter) } catch {}
+              try { event.dispatcher.removeListener(event.step.after, onStepAfter) } catch {}
+              pendingRunCleanup = null
             }
-            currentTestTitle = null
-          }
-          const onStepAfter = (step) => {
-            if (!currentTestTitle || !currentSteps[currentTestTitle]) return
-            currentSteps[currentTestTitle].push({
-              step: step.toString(),
-              status: step.status,
-              time: step.endTime - step.startTime,
-            })
-            const r = results.find(x => x.test === currentTestTitle)
-            if (r) r.steps = [...currentSteps[currentTestTitle]]
-          }
+            let runError = null
+            const runPromise = (async () => {
+              try {
+                await ensureBootstrap()
+                await codecept.run(testFile)
+              } catch (err) {
+                runError = err
+                throw err
+              }
+            })()
-          event.dispatcher.on(event.test.before, onBefore)
-          event.dispatcher.on(event.test.after, onAfter)
-          event.dispatcher.on(event.step.after, onStepAfter)
+            const pausedPromise = new Promise(resolve => pauseEvents.once('paused', () => resolve('paused')))
+            const completedPromise = runPromise.then(() => 'completed', () => 'completed')
-          try {
-            await Promise.race([
-              (async () => {
-                await codecept.bootstrap()
-                await codecept.run(testFile)
-              })(),
+            const which = await Promise.race([
+              completedPromise,
+              pausedPromise,
               new Promise((_, reject) => setTimeout(() => reject(new Error(`Timeout after ${timeout}ms`)), timeout)),
             ])
-          } catch (error) {
-            const lastRunning = results.filter(r => r.status === 'running').pop()
-            if (lastRunning) {
-              lastRunning.status = 'failed'
-              lastRunning.error = error.message
+            if (which === 'paused') {
+              pendingRunPromise = runPromise
+              const page = await gatherPageBrief()
+              return {
+                content: [{
+                  type: 'text',
+                  text: JSON.stringify({ ...pausedPayload(), page }, null, 2),
+                }],
+              }
             }
-          } finally {
-            try { event.dispatcher.removeListener(event.test.before, onBefore) } catch {}
-            try { event.dispatcher.removeListener(event.test.after, onAfter) } catch {}
-            try { event.dispatcher.removeListener(event.step.after, onStepAfter) } catch {}
-          }
-          return { content: [{ type: 'text', text: JSON.stringify({ results, stepByStep: true }, null, 2) }] }
+            const final = collectRunCompletion(runError?.message)
+            await startShellSession()
+            return { content: [{ type: 'text', text: JSON.stringify({ ...final, file: testFile }, null, 2) }] }
+          })
         })
       }
@@ -625,6 +1161,7 @@ server.setRequestHandler(CallToolRequestSchema, async (request) => {
 })
 /**
  * Entry point for this script.
  *
  * Calls installShutdownHooks() (defined outside this view), then constructs a
  * StdioServerTransport and awaits server.connect(transport).
  *
  * @returns {Promise<void>} Settles once server.connect(transport) has settled.
  */
 async function main() {
+  installShutdownHooks()
   // NOTE(review): presumably the transport speaks the protocol over stdin/stdout — confirm against the SDK.
   const transport = new StdioServerTransport()
   await server.connect(transport)
 }