npm - @muggleai/works - Versions diffs - 4.4.0 → 4.6.0 - Mend

@muggleai/works 4.4.0 → 4.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30)

package/README.md +31 -13
package/dist/{chunk-PMI2DI3V.js → chunk-TP4T4T2Z.js} +348 -105
package/dist/cli.js +1 -1
package/dist/index.js +1 -1
package/dist/plugin/.claude-plugin/plugin.json +1 -1
package/dist/plugin/.cursor-plugin/plugin.json +1 -1
package/dist/plugin/README.md +1 -0
package/dist/plugin/skills/do/e2e-acceptance.md +6 -3
package/dist/plugin/skills/do/open-prs.md +35 -74
package/dist/plugin/skills/muggle-pr-visual-walkthrough/SKILL.md +181 -0
package/dist/plugin/skills/muggle-test/SKILL.md +146 -121
package/dist/plugin/skills/muggle-test-feature-local/SKILL.md +66 -16
package/dist/plugin/skills/muggle-test-import/SKILL.md +127 -25
package/dist/plugin/skills/muggle-test-regenerate-missing/SKILL.md +201 -0
package/dist/plugin/skills/muggle-test-regenerate-missing/evals/evals.json +58 -0
package/dist/plugin/skills/muggle-test-regenerate-missing/evals/trigger-eval.json +22 -0
package/dist/release-manifest.json +7 -0
package/package.json +7 -7
package/plugin/.claude-plugin/plugin.json +1 -1
package/plugin/.cursor-plugin/plugin.json +1 -1
package/plugin/README.md +1 -0
package/plugin/skills/do/e2e-acceptance.md +6 -3
package/plugin/skills/do/open-prs.md +35 -74
package/plugin/skills/muggle-pr-visual-walkthrough/SKILL.md +181 -0
package/plugin/skills/muggle-test/SKILL.md +146 -121
package/plugin/skills/muggle-test-feature-local/SKILL.md +66 -16
package/plugin/skills/muggle-test-import/SKILL.md +127 -25
package/plugin/skills/muggle-test-regenerate-missing/SKILL.md +201 -0
package/plugin/skills/muggle-test-regenerate-missing/evals/evals.json +58 -0
package/plugin/skills/muggle-test-regenerate-missing/evals/trigger-eval.json +22 -0

package/dist/{chunk-PMI2DI3V.js → chunk-TP4T4T2Z.js} RENAMED

@@ -1,9 +1,9 @@
 import * as fs3 from 'fs';
-import { readFileSync, existsSync, rmSync, mkdirSync, readdirSync, createWriteStream, writeFileSync, statSync } from 'fs';
+import { readFileSync, existsSync, mkdirSync, writeFileSync, rmSync, readdirSync, createWriteStream, statSync } from 'fs';
 import * as os3 from 'os';
 import { platform, arch, homedir } from 'os';
 import * as path2 from 'path';
-import { dirname, resolve, join } from 'path';
+import { join, dirname, resolve } from 'path';
 import { fileURLToPath } from 'url';
 import winston from 'winston';
 import axios, { AxiosError } from 'axios';
@@ -34,6 +34,49 @@ var DATA_DIR_NAME = ".muggle-ai";
 function getDataDir() {
   return path2.join(os3.homedir(), DATA_DIR_NAME);
 }
+var DEV_MANIFEST = {
+  release: "dev",
+  buildId: "dev",
+  commitSha: "dev",
+  buildTime: "1970-01-01T00:00:00Z",
+  serviceName: "muggle-ai-works-mcp"
+};
+var MANIFEST_PATH = (() => {
+  try {
+    return join(dirname(fileURLToPath(import.meta.url)), "release-manifest.json");
+  } catch {
+    return "release-manifest.json";
+  }
+})();
+var cachedManifest;
+function isValidManifest(value) {
+  if (typeof value !== "object" || value === null) return false;
+  const m = value;
+  return typeof m.release === "string" && typeof m.buildId === "string" && typeof m.commitSha === "string" && typeof m.buildTime === "string" && typeof m.serviceName === "string";
+}
+function readReleaseManifest() {
+  if (cachedManifest !== void 0) return cachedManifest;
+  try {
+    const raw = readFileSync(MANIFEST_PATH, "utf8");
+    const parsed = JSON.parse(raw);
+    if (!isValidManifest(parsed)) {
+      cachedManifest = DEV_MANIFEST;
+      return cachedManifest;
+    }
+    cachedManifest = parsed;
+    return cachedManifest;
+  } catch (err) {
+    const code = err.code;
+    if (code !== "ENOENT") {
+      console.warn(
+        "release_manifest: unexpected error reading manifest, using DEV fallback",
+        { error: err.message }
+      );
+    }
+    cachedManifest = DEV_MANIFEST;
+    return cachedManifest;
+  }
+}
 // packages/mcps/src/shared/config.ts
 var DEFAULT_PROMPT_SERVICE_PRODUCTION_URL = "https://promptservice.muggle-ai.com";
@@ -303,9 +346,10 @@ function getConfig() {
   if (configInstance) {
     return configInstance;
   }
+  const manifest = readReleaseManifest();
   configInstance = {
     serverName: "muggle",
-    serverVersion: "1.0.0",
+    serverVersion: manifest.release,
     logLevel: process.env.LOG_LEVEL ?? "info",
     auth0: buildAuth0Config(),
     e2e: buildE2eConfig(),
@@ -425,6 +469,14 @@ __export(e2e_exports2, {
   ApiKeyRevokeInputSchema: () => ApiKeyRevokeInputSchema,
   AuthLoginInputSchema: () => AuthLoginInputSchema,
   AuthPollInputSchema: () => AuthPollInputSchema,
+  BulkPreviewJobCancelInputSchema: () => BulkPreviewJobCancelInputSchema,
+  BulkPreviewJobGetInputSchema: () => BulkPreviewJobGetInputSchema,
+  BulkPreviewJobKindSchema: () => BulkPreviewJobKindSchema,
+  BulkPreviewJobListInputSchema: () => BulkPreviewJobListInputSchema,
+  BulkPreviewJobStatusSchema: () => BulkPreviewJobStatusSchema,
+  BulkPreviewPromptSchema: () => BulkPreviewPromptSchema,
+  BulkPreviewSubmitTestCaseInputSchema: () => BulkPreviewSubmitTestCaseInputSchema,
+  BulkPreviewSubmitUseCaseInputSchema: () => BulkPreviewSubmitUseCaseInputSchema,
   EmptyInputSchema: () => EmptyInputSchema,
   GatewayError: () => GatewayError,
   IdSchema: () => IdSchema,
@@ -467,11 +519,11 @@ __export(e2e_exports2, {
   TestCaseListInputSchema: () => TestCaseListInputSchema,
   TestScriptGetInputSchema: () => TestScriptGetInputSchema,
   TestScriptListInputSchema: () => TestScriptListInputSchema,
-  TestScriptListPaginatedInputSchema: () => TestScriptListPaginatedInputSchema,
   TokenPackageIdSchema: () => TokenPackageIdSchema,
   TokenUsageFilterTypeSchema: () => TokenUsageFilterTypeSchema,
   UseCaseCandidatesApproveInputSchema: () => UseCaseCandidatesApproveInputSchema,
   UseCaseCreateFromPromptsInputSchema: () => UseCaseCreateFromPromptsInputSchema,
+  UseCaseCreateInputSchema: () => UseCaseCreateInputSchema,
   UseCaseDiscoveryMemoryGetInputSchema: () => UseCaseDiscoveryMemoryGetInputSchema,
   UseCaseGetInputSchema: () => UseCaseGetInputSchema,
   UseCaseListInputSchema: () => UseCaseListInputSchema,
@@ -671,8 +723,9 @@ var AuthService = class {
   }
   /**
    * Start the device code flow.
+   * @param options.forceNewSession - Clear existing Auth0 browser session before login to allow account switching.
    */
-  async startDeviceCodeFlow() {
+  async startDeviceCodeFlow(options) {
     const logger14 = getLogger();
     const config = getConfig();
     const { domain, clientId, audience, scopes } = config.localQa.auth0;
@@ -709,15 +762,25 @@ var AuthService = class {
       userCode: data.user_code,
       expiresAt: new Date(Date.now() + data.expires_in * 1e3).toISOString()
     });
+    let browserUrl = data.verification_uri_complete;
+    if (options?.forceNewSession) {
+      const logoutUrl = new URL(`https://${domain}/v2/logout`);
+      logoutUrl.searchParams.set("client_id", clientId);
+      logoutUrl.searchParams.set("returnTo", data.verification_uri_complete);
+      browserUrl = logoutUrl.toString();
+      logger14.info("Force new session: opening logout-redirect URL", {
+        logoutUrl: browserUrl
+      });
+    }
     const browserOpenResult = await openBrowserUrl({
-      url: data.verification_uri_complete
+      url: browserUrl
     });
     if (browserOpenResult.opened) {
       logger14.info("Browser opened for device code login");
     } else {
       logger14.warn("Failed to open browser for device code login", {
         error: browserOpenResult.error,
-        verificationUriComplete: data.verification_uri_complete
+        url: browserUrl
       });
     }
     return {
@@ -2504,7 +2567,7 @@ var getCredentialsFilePath = getApiKeyFilePath;
 // packages/mcps/src/shared/auth.ts
 var logger4 = getLogger();
-async function startDeviceCodeFlow(config) {
+async function startDeviceCodeFlow(config, options) {
   const deviceCodeUrl = `https://${config.domain}/oauth/device/code`;
   try {
     logger4.info("[Auth] Starting device code flow", {
@@ -2529,8 +2592,16 @@ async function startDeviceCodeFlow(config) {
       userCode: data.user_code,
       expiresIn: data.expires_in
     });
+    let browserUrl = data.verification_uri_complete;
+    if (options?.forceNewSession) {
+      const logoutUrl = new URL(`https://${config.domain}/v2/logout`);
+      logoutUrl.searchParams.set("client_id", config.clientId);
+      logoutUrl.searchParams.set("returnTo", data.verification_uri_complete);
+      browserUrl = logoutUrl.toString();
+      logger4.info("[Auth] Force new session: opening logout-redirect URL");
+    }
     const browserOpenResult = await openBrowserUrl({
-      url: data.verification_uri_complete
+      url: browserUrl
     });
     if (browserOpenResult.opened) {
       logger4.info("[Auth] Browser opened for device code login");
@@ -2854,8 +2925,10 @@ var LocalRunUploadInputSchema = z.object({
 // packages/mcps/src/mcp/e2e/contracts/index.ts
 var PaginationInputSchema = z.object({
-  page: z.number().int().positive().optional().describe("Page number (1-based)"),
-  pageSize: z.number().int().positive().max(100).optional().describe("Number of items per page")
+  page: z.number().int().positive().default(1).describe("Page number, 1-based. Defaults to 1 (the first page)."),
+  pageSize: z.number().int().positive().max(100).default(10).describe("Number of items per page. Defaults to 10, max 100."),
+  sortBy: z.enum(["createdAt", "updatedAt"]).default("createdAt").describe("Field to sort by. Defaults to createdAt (stable under concurrent writes)."),
+  sortOrder: z.enum(["asc", "desc"]).default("desc").describe("Sort direction. Defaults to desc (newest first).")
 });
 var IdSchema = MuggleEntityIdSchema;
 var RunBatchIdSchema = MuggleEntityIdSchema.describe("Bulk replay run batch ID (UUID)");
@@ -2961,15 +3034,67 @@ var UseCasePromptPreviewInputSchema = z.object({
 });
 var UseCaseCreateFromPromptsInputSchema = z.object({
   projectId: IdSchema.describe("Project ID (UUID) to create use cases for"),
-  prompts: z.array(z.object({
-    instruction: z.string().min(1).describe("Natural language instruction describing the use case")
-  })).min(1).describe("Array of prompts to generate use cases from")
+  instructions: z.array(z.string().min(1)).min(1).describe('Natural-language instructions \u2014 one use case is generated per string (e.g., ["As a user, I can log in"])')
 });
 var UseCaseUpdateFromPromptInputSchema = z.object({
   projectId: IdSchema.describe("Project ID (UUID)"),
   useCaseId: IdSchema.describe("Use case ID (UUID) to update"),
   instruction: z.string().min(1).describe("Natural language instruction to regenerate the use case from")
 });
+var UseCaseCreateInputSchema = z.object({
+  projectId: IdSchema.describe("Project ID (UUID) the use case belongs to"),
+  title: z.string().min(1).describe("Use case title"),
+  description: z.string().min(1).describe("Description of the use case, including actor and preconditions"),
+  userStory: z.string().min(1).describe("One-line user story from the end-user point of view"),
+  url: z.string().url().optional().describe("URL where the use case takes place (defaults to project URL)"),
+  useCaseBreakdown: z.array(z.object({
+    requirement: z.string().min(1).describe("One requirement of the use case"),
+    acceptanceCriteria: z.string().min(1).describe("Concrete, measurable acceptance criteria for the requirement")
+  })).describe("Main/alternative/error flows broken down as requirement + acceptance criteria pairs"),
+  status: z.enum(["DRAFT", "IN_REVIEW", "APPROVED", "IMPLEMENTED", "ARCHIVED"]).describe("Use case status"),
+  priority: z.enum(["LOW", "MEDIUM", "HIGH", "CRITICAL"]).describe("Use case priority"),
+  source: z.enum(["PRD_FILE", "SITEMAP", "CRAWLER", "PROMPT", "MANUAL"]).describe("How this use case was produced"),
+  category: z.string().optional().describe("Optional category")
+});
+var BulkPreviewPromptSchema = z.object({
+  clientRef: z.string().max(128).optional().describe("Optional caller-supplied reference echoed back on results"),
+  instruction: z.string().min(1).max(4e3).describe("Natural language instruction (max 4000 chars)")
+});
+var BulkPreviewSubmitUseCaseInputSchema = z.object({
+  projectId: IdSchema.describe("Project ID (UUID) the use cases belong to"),
+  prompts: z.array(BulkPreviewPromptSchema).min(1).max(100).describe("Prompts to generate use cases from (max 100 per request)")
+});
+var BulkPreviewSubmitTestCaseInputSchema = z.object({
+  projectId: IdSchema.describe("Project ID (UUID)"),
+  useCaseId: IdSchema.describe("Parent use case ID (UUID) the test cases will belong to"),
+  prompts: z.array(BulkPreviewPromptSchema).min(1).max(100).describe("Prompts to generate test cases from (max 100 per request)")
+});
+var BulkPreviewJobStatusSchema = z.enum([
+  "queued",
+  "submitted",
+  "running",
+  "succeeded",
+  "partial",
+  "failed",
+  "cancelled",
+  "expired"
+]);
+var BulkPreviewJobKindSchema = z.enum(["useCase", "testCase"]);
+var BulkPreviewJobGetInputSchema = z.object({
+  projectId: IdSchema.describe("Project ID (UUID)"),
+  jobId: IdSchema.describe("Bulk-preview job ID (UUID)")
+});
+var BulkPreviewJobCancelInputSchema = z.object({
+  projectId: IdSchema.describe("Project ID (UUID)"),
+  jobId: IdSchema.describe("Bulk-preview job ID (UUID) to cancel")
+});
+var BulkPreviewJobListInputSchema = z.object({
+  projectId: IdSchema.describe("Project ID (UUID) to list bulk-preview jobs for"),
+  status: z.array(BulkPreviewJobStatusSchema).optional().describe("Optional filter \u2014 only return jobs matching any of these statuses"),
+  kind: BulkPreviewJobKindSchema.optional().describe("Optional filter \u2014 only return jobs of this kind"),
+  limit: z.number().int().min(1).max(100).optional().describe("Max jobs to return (default 20, max 100)"),
+  cursor: z.string().optional().describe("Pagination cursor returned by a previous call")
+});
 var TestCaseListInputSchema = z.object({
   projectId: IdSchema.describe("Project ID (UUID) to list test cases for")
 }).merge(PaginationInputSchema);
@@ -3006,9 +3131,6 @@ var TestScriptListInputSchema = z.object({
 var TestScriptGetInputSchema = z.object({
   testScriptId: IdSchema.describe("Test script ID (UUID) to retrieve")
 });
-var TestScriptListPaginatedInputSchema = z.object({
-  projectId: IdSchema.describe("Project ID (UUID) to list test scripts for")
-}).merge(PaginationInputSchema);
 var ActionScriptGetInputSchema = z.object({
   actionScriptId: IdSchema.describe("Action script ID (UUID) to retrieve")
 });
@@ -3148,7 +3270,8 @@ var ApiKeyRevokeInputSchema = z.object({
 });
 var AuthLoginInputSchema = z.object({
   waitForCompletion: z.boolean().optional().describe("Whether to wait for browser login completion before returning. Default: true"),
-  timeoutMs: z.number().int().positive().min(1e3).max(9e5).optional().describe("Maximum time to wait for login completion in milliseconds. Default: 120000")
+  timeoutMs: z.number().int().positive().min(1e3).max(9e5).optional().describe("Maximum time to wait for login completion in milliseconds. Default: 120000"),
+  forceNewSession: z.boolean().optional().describe("Force a fresh login by clearing any existing Auth0 browser session before redirecting to the device activation page. Use this to switch accounts. Default: false")
 });
 var AuthPollInputSchema = z.object({
   deviceCode: z.string().optional().describe("Device code from the login response. Optional if a login was recently started.")
@@ -3180,6 +3303,61 @@ var GatewayError = class extends Error {
     this.details = params.details;
   }
 };
+// packages/mcps/src/shared/host_detection.ts
+function detectMcpHost(env = process.env) {
+  if (env.CLAUDE_CODE || env.CLAUDECODE || env.CLAUDE_CODE_SSE_PORT) {
+    return "claude-code";
+  }
+  if (env.CURSOR_TRACE_ID || env.CURSOR_MCP) {
+    return "cursor";
+  }
+  if (env.CODEX || env.OPENAI_CODEX) {
+    return "codex";
+  }
+  if (env.WINDSURF_MCP || env.WINDSURF || env.CODEIUM_API_KEY) {
+    return "windsurf";
+  }
+  return "unknown";
+}
+var INSTALL_ID_FILENAME = "install-id.json";
+var cachedInstallId;
+function installIdFilePath() {
+  return join(getDataDir(), INSTALL_ID_FILENAME);
+}
+function generateAndPersist(filePath) {
+  const installId = randomUUID();
+  const contents = { installId };
+  mkdirSync(dirname(filePath), { recursive: true });
+  writeFileSync(filePath, JSON.stringify(contents, null, 2) + "\n", "utf8");
+  return installId;
+}
+function isValid(value) {
+  return typeof value === "object" && value !== null && typeof value.installId === "string" && value.installId.length > 0;
+}
+function getInstallId() {
+  if (cachedInstallId !== void 0) return cachedInstallId;
+  const filePath = installIdFilePath();
+  if (!existsSync(filePath)) {
+    cachedInstallId = generateAndPersist(filePath);
+    return cachedInstallId;
+  }
+  try {
+    const raw = readFileSync(filePath, "utf8");
+    const parsed = JSON.parse(raw);
+    if (isValid(parsed)) {
+      cachedInstallId = parsed.installId;
+      return cachedInstallId;
+    }
+    cachedInstallId = generateAndPersist(filePath);
+    return cachedInstallId;
+  } catch {
+    cachedInstallId = generateAndPersist(filePath);
+    return cachedInstallId;
+  }
+}
+// packages/mcps/src/mcp/e2e/upstream-client.ts
 var ALLOWED_UPSTREAM_PREFIXES = [
   "/v1/protected/muggle-test/",
   "/v1/protected/wallet/",
@@ -3226,8 +3404,17 @@ var PromptServiceClient = class {
    * @returns Headers object.
    */
   buildHeaders(credentials, correlationId) {
+    const manifest = readReleaseManifest();
+    const installId = getInstallId();
+    const host = detectMcpHost();
     const headers = {
-      "X-Correlation-Id": correlationId
+      "X-Correlation-Id": correlationId,
+      "X-Client-Service-Name": manifest.serviceName,
+      "X-Client-Release": manifest.release,
+      "X-Client-Build-Id": manifest.buildId,
+      "X-Client-Commit-Sha": manifest.commitSha,
+      "X-Client-Install-Id": installId,
+      "X-Client-Host": host
     };
     if (credentials.bearerToken) {
       headers["Authorization"] = credentials.bearerToken.startsWith("Bearer ") ? credentials.bearerToken : `Bearer ${credentials.bearerToken}`;
@@ -3476,14 +3663,19 @@ var projectTools = [
   },
   {
     name: "muggle-remote-project-list",
-    description: "List all projects accessible to the authenticated user.",
+    description: "List projects accessible to the authenticated user. Returns up to 10 items per page by default (max 100). Response includes pagination metadata (totalCount, totalPages, hasMore) \u2014 check `hasMore` to decide whether to fetch additional pages.",
     inputSchema: ProjectListInputSchema,
     mapToUpstream: (input) => {
       const data = input;
       return {
         method: "GET",
         path: `${MUGGLE_TEST_PREFIX}/projects`,
-        queryParams: { page: data.page, pageSize: data.pageSize }
+        queryParams: {
+          page: data.page,
+          pageSize: data.pageSize,
+          sortBy: data.sortBy,
+          sortOrder: data.sortOrder
+        }
       };
     }
   },
@@ -3528,14 +3720,20 @@ var useCaseTools = [
   },
   {
     name: "muggle-remote-use-case-list",
-    description: "List all use cases for a project.",
+    description: "List use cases for a project. Returns up to 10 items per page by default (max 100). Response includes pagination metadata (totalCount, totalPages, hasMore) \u2014 check `hasMore` to decide whether to fetch additional pages.",
     inputSchema: UseCaseListInputSchema,
     mapToUpstream: (input) => {
       const data = input;
       return {
         method: "GET",
         path: `${MUGGLE_TEST_PREFIX}/use-cases`,
-        queryParams: { projectId: data.projectId, page: data.page, pageSize: data.pageSize }
+        queryParams: {
+          projectId: data.projectId,
+          page: data.page,
+          pageSize: data.pageSize,
+          sortBy: data.sortBy,
+          sortOrder: data.sortOrder
+        }
       };
     }
   },
@@ -3573,7 +3771,10 @@ var useCaseTools = [
       return {
         method: "POST",
         path: `${MUGGLE_TEST_PREFIX}/projects/${data.projectId}/use-cases/prompts/bulk`,
-        body: { projectId: data.projectId, prompts: data.prompts }
+        body: {
+          projectId: data.projectId,
+          prompts: data.instructions.map((instruction) => ({ instruction }))
+        }
       };
     }
   },
@@ -3589,19 +3790,62 @@ var useCaseTools = [
         body: { instruction: data.instruction }
       };
     }
+  },
+  {
+    name: "muggle-remote-use-case-create",
+    description: "Create a single use case from a fully-specified payload. Use this to persist use cases returned by muggle-remote-use-case-bulk-preview-submit \u2014 no LLM is invoked.",
+    inputSchema: UseCaseCreateInputSchema,
+    mapToUpstream: (input) => {
+      const data = input;
+      return {
+        method: "POST",
+        path: `${MUGGLE_TEST_PREFIX}/use-cases`,
+        body: {
+          projectId: data.projectId,
+          title: data.title,
+          description: data.description,
+          userStory: data.userStory,
+          url: data.url,
+          useCaseBreakdown: data.useCaseBreakdown,
+          status: data.status,
+          priority: data.priority,
+          source: data.source,
+          category: data.category
+        }
+      };
+    }
+  },
+  {
+    name: "muggle-remote-use-case-bulk-preview-submit",
+    description: "Submit an async bulk-preview job that uses the OpenAI Batch API to generate use cases from many prompts at ~50% of normal LLM cost. Returns a job ID immediately; poll with muggle-remote-bulk-preview-job-get until the job reaches a terminal status, then persist each successful result via muggle-remote-use-case-create.",
+    inputSchema: BulkPreviewSubmitUseCaseInputSchema,
+    mapToUpstream: (input) => {
+      const data = input;
+      return {
+        method: "POST",
+        path: `${MUGGLE_TEST_PREFIX}/projects/${data.projectId}/use-cases/prompts/bulk-preview`,
+        body: { prompts: data.prompts }
+      };
+    }
   }
 ];
 var testCaseTools = [
   {
     name: "muggle-remote-test-case-list",
-    description: "List test cases for a project.",
+    description: "List test cases for a project. Returns up to 10 items per page by default (max 100). Response includes pagination metadata (totalCount, totalPages, hasMore) \u2014 check `hasMore` to decide whether to fetch additional pages.",
     inputSchema: TestCaseListInputSchema,
     mapToUpstream: (input) => {
       const data = input;
       return {
         method: "GET",
         path: `${MUGGLE_TEST_PREFIX}/test-cases`,
-        queryParams: { projectId: data.projectId, page: data.page, pageSize: data.pageSize }
+        queryParams: {
+          projectId: data.projectId,
+          page: data.page,
+          pageSize: data.pageSize,
+          sortBy: data.sortBy,
+          sortOrder: data.sortOrder
+        }
       };
     }
   },
@@ -3668,44 +3912,95 @@ var testCaseTools = [
         }
       };
     }
+  },
+  {
+    name: "muggle-remote-test-case-bulk-preview-submit",
+    description: "Submit an async bulk-preview job that uses the OpenAI Batch API to generate test cases for a single use case from many prompts at ~50% of normal LLM cost. Returns a job ID immediately; poll with muggle-remote-bulk-preview-job-get until the job reaches a terminal status, then persist each successful result via muggle-remote-test-case-create. Note: one input prompt may fan out to 1\u20135 test cases.",
+    inputSchema: BulkPreviewSubmitTestCaseInputSchema,
+    mapToUpstream: (input) => {
+      const data = input;
+      return {
+        method: "POST",
+        path: `${MUGGLE_TEST_PREFIX}/projects/${data.projectId}/use-cases/${data.useCaseId}/test-cases/prompts/bulk-preview`,
+        body: { prompts: data.prompts }
+      };
+    }
   }
 ];
-var testScriptTools = [
+var bulkPreviewTools = [
   {
-    name: "muggle-remote-test-script-list",
-    description: "List test scripts for a project, optionally filtered by test case.",
-    inputSchema: TestScriptListInputSchema,
+    name: "muggle-remote-bulk-preview-job-get",
+    description: "Get the current status and (when terminal) results of a bulk-preview job. Poll this after submitting a bulk-preview job \u2014 every 10\u201315 seconds is fine. Terminal statuses: succeeded, partial, failed, cancelled, expired.",
+    inputSchema: BulkPreviewJobGetInputSchema,
     mapToUpstream: (input) => {
       const data = input;
       return {
         method: "GET",
-        path: `${MUGGLE_TEST_PREFIX}/test-scripts`,
-        queryParams: { projectId: data.projectId, testCaseId: data.testCaseId, page: data.page, pageSize: data.pageSize }
+        path: `${MUGGLE_TEST_PREFIX}/projects/${data.projectId}/bulk-preview-jobs/${data.jobId}`
       };
     }
   },
   {
-    name: "muggle-remote-test-script-get",
-    description: "Get details of a specific test script.",
-    inputSchema: TestScriptGetInputSchema,
+    name: "muggle-remote-bulk-preview-job-list",
+    description: "List bulk-preview jobs for a project, optionally filtered by status or kind.",
+    inputSchema: BulkPreviewJobListInputSchema,
     mapToUpstream: (input) => {
       const data = input;
       return {
         method: "GET",
-        path: `${MUGGLE_TEST_PREFIX}/test-scripts/${data.testScriptId}`
+        path: `${MUGGLE_TEST_PREFIX}/projects/${data.projectId}/bulk-preview-jobs`,
+        queryParams: {
+          status: data.status?.join(","),
+          kind: data.kind,
+          limit: data.limit,
+          cursor: data.cursor
+        }
+      };
+    }
+  },
+  {
+    name: "muggle-remote-bulk-preview-job-cancel",
+    description: "Request cancellation of a bulk-preview job. Cancellation is cooperative \u2014 the harvester picks it up on its next tick and moves the job to status=cancelled.",
+    inputSchema: BulkPreviewJobCancelInputSchema,
+    mapToUpstream: (input) => {
+      const data = input;
+      return {
+        method: "DELETE",
+        path: `${MUGGLE_TEST_PREFIX}/projects/${data.projectId}/bulk-preview-jobs/${data.jobId}`
+      };
+    }
+  }
+];
+var testScriptTools = [
+  {
+    name: "muggle-remote-test-script-list",
+    description: "List test scripts for a project, optionally filtered by test case. Returns up to 10 items per page by default (max 100). Response includes pagination metadata (totalCount, totalPages, hasMore) \u2014 check `hasMore` to decide whether to fetch additional pages.",
+    inputSchema: TestScriptListInputSchema,
+    mapToUpstream: (input) => {
+      const data = input;
+      return {
+        method: "GET",
+        path: `${MUGGLE_TEST_PREFIX}/test-scripts`,
+        queryParams: {
+          projectId: data.projectId,
+          testCaseId: data.testCaseId,
+          page: data.page,
+          pageSize: data.pageSize,
+          sortBy: data.sortBy,
+          sortOrder: data.sortOrder
+        }
       };
     }
   },
   {
-    name: "muggle-remote-test-script-list-paginated",
-    description: "List test scripts with full pagination support.",
-    inputSchema: TestScriptListPaginatedInputSchema,
+    name: "muggle-remote-test-script-get",
+    description: "Get details of a specific test script.",
+    inputSchema: TestScriptGetInputSchema,
     mapToUpstream: (input) => {
       const data = input;
       return {
         method: "GET",
-        path: `${MUGGLE_TEST_PREFIX}/test-scripts/paginated`,
-        queryParams: { projectId: data.projectId, page: data.page, pageSize: data.pageSize }
+        path: `${MUGGLE_TEST_PREFIX}/test-scripts/${data.testScriptId}`
       };
     }
   }
@@ -4605,7 +4900,9 @@ var authTools = [
     localHandler: async (input) => {
       const data = input;
       const authService = getAuthService();
-      const deviceCodeResponse = await authService.startDeviceCodeFlow();
+      const deviceCodeResponse = await authService.startDeviceCodeFlow({
+        forceNewSession: data.forceNewSession
+      });
       const waitForCompletion = data.waitForCompletion ?? true;
       if (!waitForCompletion) {
         return {
@@ -4691,6 +4988,7 @@ var allQaToolDefinitions = [
   ...projectTools,
   ...useCaseTools,
   ...testCaseTools,
+  ...bulkPreviewTools,
   ...testScriptTools,
   ...actionScriptTools,
   ...workflowTools,
@@ -4897,12 +5195,10 @@ var ExecuteTestGenerationInputSchema = z.object({
   testCase: TestCaseDetailsSchema.describe("Test case details obtained from muggle-remote-test-case-get"),
   /** Local URL to test against. */
   localUrl: z.string().url().describe("Local URL to test against (e.g., http://localhost:3000)"),
-  /** Explicit approval to launch electron-app. */
-  approveElectronAppLaunch: z.boolean().describe("Set to true after the user explicitly approves launching electron-app"),
   /** Optional timeout. */
   timeoutMs: z.number().int().positive().optional().describe("Timeout in milliseconds (default: 300000 = 5 min)"),
-  /** Show the electron-app UI during execution. Ask the user before approving; true = visible window, false or omit = headless. */
-  showUi: z.boolean().optional().describe("Show the electron-app UI during generation. Ask the user: true to watch the window, false or omit for headless.")
+  /** Show the electron-app UI during execution. Default: visible window. Pass false to run headless. */
+  showUi: z.boolean().optional().describe("Show the electron-app UI during generation. Defaults to visible; pass false to run headless.")
 });
 var ExecuteReplayInputSchema = z.object({
   /** Test script metadata from muggle-remote-test-script-get. */
@@ -4911,12 +5207,10 @@ var ExecuteReplayInputSchema = z.object({
   actionScript: z.array(z.unknown()).describe("Action script steps from muggle-remote-action-script-get"),
   /** Local URL to test against. */
   localUrl: z.string().url().describe("Local URL to test against (e.g., http://localhost:3000)"),
-  /** Explicit approval to launch electron-app. */
-  approveElectronAppLaunch: z.boolean().describe("Set to true after the user explicitly approves launching electron-app"),
   /** Optional timeout. */
   timeoutMs: z.number().int().positive().optional().describe("Timeout in milliseconds (default: 180000 = 3 min)"),
-  /** Show the electron-app UI during execution. Ask the user before approving; true = visible window, false or omit = headless. */
-  showUi: z.boolean().optional().describe("Show the electron-app UI during replay. Ask the user: true to watch the window, false or omit for headless.")
+  /** Show the electron-app UI during execution. Default: visible window. Pass false to run headless. */
+  showUi: z.boolean().optional().describe("Show the electron-app UI during replay. Defaults to visible; pass false to run headless.")
 });
 var CancelExecutionInputSchema = z.object({
   runId: MuggleEntityIdSchema.describe("Run ID (UUID) to cancel")
@@ -5156,38 +5450,13 @@ var testScriptGetTool = {
 };
 var executeTestGenerationTool = {
   name: "muggle-local-execute-test-generation",
-  description: "Generate an end-to-end (E2E) acceptance test script by launching a real browser against your web app. The browser navigates your app, executes the test case steps (like signing up, filling forms, clicking through flows), and produces a replayable test script with screenshots. Use this to create new browser tests for any user flow. Requires a test case (from muggle-remote-test-case-get) and a localhost URL. Launches an Electron browser \u2014 requires explicit approval via approveElectronAppLaunch. Before approving, ask the user whether they want a visible GUI; pass showUi: true to watch the window or showUi: false for headless (default when omitted).",
+  description: "Generate an end-to-end (E2E) acceptance test script by launching a real browser against your web app. The browser navigates your app, executes the test case steps (like signing up, filling forms, clicking through flows), and produces a replayable test script with screenshots. Use this to create new browser tests for any user flow. Requires a test case (from muggle-remote-test-case-get) and a localhost URL. Launches an Electron browser \u2014 defaults to a visible window; pass showUi: false to run headless.",
   inputSchema: ExecuteTestGenerationInputSchema,
   execute: async (ctx) => {
     const logger14 = createChildLogger2(ctx.correlationId);
     logger14.info("Executing muggle-local-execute-test-generation");
     const input = ExecuteTestGenerationInputSchema.parse(ctx.input);
-    if (!input.approveElectronAppLaunch) {
-      const showUiExplicit = input.showUi !== void 0;
-      const uiMode = input.showUi === true ? "visible GUI (showUi: true)" : "headless (showUi: false or omitted)";
-      return {
-        content: [
-          "## Electron App Launch Required",
-          "",
-          "This tool will launch the electron-app to generate a test script.",
-          "Please set `approveElectronAppLaunch: true` to proceed.",
-          "",
-          "**Visible GUI:** Ask the user whether they want to watch the Electron window during generation.",
-          "- If **yes** \u2192 when approving, pass `showUi: true`.",
-          "- If **no** \u2192 when approving, pass `showUi: false` (or omit `showUi`; generation runs headless).",
-          "",
-          showUiExplicit ? `**Current choice:** ${uiMode}` : "**Current choice:** not set \u2014 default on approval is headless unless you pass `showUi: true`.",
-          "",
-          `**Test Case:** ${input.testCase.title}`,
-          `**Local URL:** ${input.localUrl}`,
-          "",
-          "**Note:** The electron-app will navigate your test URL and record steps."
-        ].join("\n"),
-        isError: false,
-        data: { requiresApproval: true }
-      };
-    }
-    const showUi = input.showUi === true;
+    const showUi = input.showUi !== false;
     try {
       const result = await executeTestGeneration({
         testCase: input.testCase,
@@ -5219,39 +5488,13 @@ var executeTestGenerationTool = {
 };
 var executeReplayTool = {
   name: "muggle-local-execute-replay",
-  description: "Replay an existing E2E acceptance test script in a real browser to verify your app still works correctly \u2014 use this for regression testing after code changes. The browser executes each saved step and captures screenshots so you can see what happened. Requires: (1) test script metadata from muggle-remote-test-script-get, (2) actionScript content from muggle-remote-action-script-get using the testScript.actionScriptId, and (3) a localhost URL. Launches an Electron browser \u2014 requires explicit approval via approveElectronAppLaunch. Before approving, ask the user whether they want a visible GUI; pass showUi: true to watch the window or showUi: false for headless (default when omitted).",
+  description: "Replay an existing E2E acceptance test script in a real browser to verify your app still works correctly \u2014 use this for regression testing after code changes. The browser executes each saved step and captures screenshots so you can see what happened. Requires: (1) test script metadata from muggle-remote-test-script-get, (2) actionScript content from muggle-remote-action-script-get using the testScript.actionScriptId, and (3) a localhost URL. Launches an Electron browser \u2014 defaults to a visible window; pass showUi: false to run headless.",
   inputSchema: ExecuteReplayInputSchema,
   execute: async (ctx) => {
     const logger14 = createChildLogger2(ctx.correlationId);
     logger14.info("Executing muggle-local-execute-replay");
     const input = ExecuteReplayInputSchema.parse(ctx.input);
-    if (!input.approveElectronAppLaunch) {
-      const showUiExplicit = input.showUi !== void 0;
-      const uiMode = input.showUi === true ? "visible GUI (showUi: true)" : "headless (showUi: false or omitted)";
-      return {
-        content: [
-          "## Electron App Launch Required",
-          "",
-          "This tool will launch the electron-app to replay a test script.",
-          "Please set `approveElectronAppLaunch: true` to proceed.",
-          "",
-          "**Visible GUI:** Ask the user whether they want to watch the Electron window during replay.",
-          "- If **yes** \u2192 when approving, pass `showUi: true`.",
-          "- If **no** \u2192 when approving, pass `showUi: false` (or omit `showUi`; replay runs headless).",
-          "",
-          showUiExplicit ? `**Current choice:** ${uiMode}` : "**Current choice:** not set \u2014 default on approval is headless unless you pass `showUi: true`.",
-          "",
-          `**Test Script:** ${input.testScript.name}`,
-          `**Local URL:** ${input.localUrl}`,
-          `**Steps:** ${input.actionScript.length}`,
-          "",
-          "**Note:** The electron-app will execute the test steps against your local URL."
-        ].join("\n"),
-        isError: false,
-        data: { requiresApproval: true }
-      };
-    }
-    const showUi = input.showUi === true;
+    const showUi = input.showUi !== false;
     try {
       const result = await executeReplay({
         testScript: input.testScript,