npm - @gleanwork/mcp-server-tester - Versions diffs - 1.0.0-beta.2 → 1.0.0-beta.3 - Mend

@gleanwork/mcp-server-tester 1.0.0-beta.2 → 1.0.0-beta.3

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (14)

package/README.md +13 -12
package/dist/cli/index.js +5 -2
package/dist/fixtures/mcp.d.ts +8 -0
package/dist/fixtures/mcp.js +5 -2
package/dist/fixtures/mcp.js.map +1 -1
package/dist/index.cjs +6 -5
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +9 -7
package/dist/index.d.ts +9 -7
package/dist/index.js +6 -5
package/dist/index.js.map +1 -1
package/dist/reporters/ui-dist/app.js +4 -4
package/package.json +3 -3
package/src/reporters/ui-dist/app.js +4 -4

package/dist/index.d.cts CHANGED Viewed

@@ -2486,6 +2486,14 @@ declare function toMatchToolPattern(this: {
 /**
  * Creates the toMatchToolSnapshot matcher function
  *
+ * @remarks
+ * **Requires Playwright test context.** This matcher calls `expect(content).toMatchSnapshot()`
+ * internally, which only works inside a Playwright test (i.e., when `testInfo` is available).
+ * Calling it outside a Playwright test will throw a cryptic context error.
+ *
+ * To test sanitizer logic without a Playwright context, use the exported `applySanitizers`
+ * function directly.
+ *
  * Note: This is an async matcher that uses Playwright's snapshot testing.
  */
 declare function toMatchToolSnapshot(this: {
@@ -2896,7 +2904,7 @@ interface EvalCase {
     metadata?: Record<string, unknown>;
     /**
      * Number of times to run this case and compute an accuracy score.
-     * When > 1, `EvalCaseResult.accuracy` is populated and `pass` is determined
+     * When > 1, `EvalCaseResult.assertionPassRate` is populated and `pass` is determined
      * by `accuracyThreshold` rather than a single run.
      * @default 1
      */
@@ -4282,12 +4290,6 @@ interface EvalCaseResult {
      * Only present when the case was run with `iterations > 1`.
      */
     infrastructureErrorRate?: number;
-    /**
-     * Accuracy score (0–1) across all iterations.
-     * Alias for `assertionPassRate`. Only present when the case was run with `iterations > 1`.
-     * @deprecated Use `assertionPassRate` for clarity; this field is kept for backward compatibility.
-     */
-    accuracy?: number;
     /**
      * Per-iteration pass/fail breakdown.
      * Only present when the case was run with `iterations > 1`.

package/dist/index.d.ts CHANGED Viewed

@@ -2486,6 +2486,14 @@ declare function toMatchToolPattern(this: {
 /**
  * Creates the toMatchToolSnapshot matcher function
  *
+ * @remarks
+ * **Requires Playwright test context.** This matcher calls `expect(content).toMatchSnapshot()`
+ * internally, which only works inside a Playwright test (i.e., when `testInfo` is available).
+ * Calling it outside a Playwright test will throw a cryptic context error.
+ *
+ * To test sanitizer logic without a Playwright context, use the exported `applySanitizers`
+ * function directly.
+ *
  * Note: This is an async matcher that uses Playwright's snapshot testing.
  */
 declare function toMatchToolSnapshot(this: {
@@ -2896,7 +2904,7 @@ interface EvalCase {
     metadata?: Record<string, unknown>;
     /**
      * Number of times to run this case and compute an accuracy score.
-     * When > 1, `EvalCaseResult.accuracy` is populated and `pass` is determined
+     * When > 1, `EvalCaseResult.assertionPassRate` is populated and `pass` is determined
      * by `accuracyThreshold` rather than a single run.
      * @default 1
      */
@@ -4282,12 +4290,6 @@ interface EvalCaseResult {
      * Only present when the case was run with `iterations > 1`.
      */
     infrastructureErrorRate?: number;
-    /**
-     * Accuracy score (0–1) across all iterations.
-     * Alias for `assertionPassRate`. Only present when the case was run with `iterations > 1`.
-     * @deprecated Use `assertionPassRate` for clarity; this field is kept for backward compatibility.
-     */
-    accuracy?: number;
     /**
      * Per-iteration pass/fail breakdown.
      * Only present when the case was run with `iterations > 1`.

package/dist/index.js CHANGED Viewed

@@ -4380,7 +4380,7 @@ function escapeHtml(text) {
 // package.json
 var package_default = {
-  version: "1.0.0-beta.2"};
+  version: "1.0.0-beta.3"};
 // src/mcp/clientFactory.ts
 function getRetryAfterDelayMs(err) {
@@ -4471,7 +4471,10 @@ async function createMCPClientForConfig(config, options) {
       validatedConfig.connectTimeoutMs !== void 0 ? { timeout: validatedConfig.connectTimeoutMs } : void 0
     );
   } else if (isHttpConfig(validatedConfig)) {
-    const headers = { ...validatedConfig.headers };
+    const headers = {
+      "User-Agent": `@gleanwork/mcp-server-tester/${package_default.version}`,
+      ...validatedConfig.headers
+    };
     if (validatedConfig.auth?.clientCredentials && !options?.authProvider) {
       const ccConfig = validatedConfig.auth.clientCredentials;
       const clientId = ccConfig.clientId ?? process.env["MCP_CLIENT_ID"];
@@ -6924,7 +6927,6 @@ async function runEvalCase(evalCase, context, options = {}) {
   const passCount = assertionResults.filter((r) => r.pass).length;
   const assertionPassRate = assertionResults.length > 0 ? passCount / assertionResults.length : 0;
   const infrastructureErrorRate = infraErrors.length / iterations;
-  const accuracy = assertionPassRate;
   const threshold = evalCase.accuracyThreshold ?? 1;
   const baseResult = lastResult ?? {
     id: evalCase.id,
@@ -6941,10 +6943,9 @@ async function runEvalCase(evalCase, context, options = {}) {
   };
   return {
     ...baseResult,
-    pass: accuracy >= threshold,
+    pass: assertionPassRate >= threshold,
     assertionPassRate,
     infrastructureErrorRate,
-    accuracy,
     iterationResults,
     infrastructureErrorCount: infraErrors.length,
     durationMs: iterationResults.reduce((sum, r) => sum + r.durationMs, 0)