@langwatch/mcp-server 0.4.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47) hide show
  1. package/CHANGELOG.md +19 -0
  2. package/dist/archive-scenario-GAE4XVFM.js +19 -0
  3. package/dist/archive-scenario-GAE4XVFM.js.map +1 -0
  4. package/dist/{chunk-HOPTUDCZ.js → chunk-JVWDWL3J.js} +3 -2
  5. package/dist/chunk-JVWDWL3J.js.map +1 -0
  6. package/dist/chunk-K2YFPOSD.js +40 -0
  7. package/dist/chunk-K2YFPOSD.js.map +1 -0
  8. package/dist/{create-prompt-UBC537BJ.js → create-prompt-P35POKBW.js} +2 -2
  9. package/dist/create-scenario-3YRZVDYF.js +26 -0
  10. package/dist/create-scenario-3YRZVDYF.js.map +1 -0
  11. package/dist/discover-scenario-schema-MEEEVND7.js +65 -0
  12. package/dist/discover-scenario-schema-MEEEVND7.js.map +1 -0
  13. package/dist/{get-analytics-3IFTN6MY.js → get-analytics-BAVXTAPB.js} +2 -2
  14. package/dist/{get-prompt-2ZB5B3QC.js → get-prompt-LKCPT26O.js} +2 -2
  15. package/dist/get-scenario-3SCDW4Z6.js +33 -0
  16. package/dist/get-scenario-3SCDW4Z6.js.map +1 -0
  17. package/dist/{get-trace-7IXKKCJJ.js → get-trace-QFDWJ5D4.js} +2 -2
  18. package/dist/index.js +16040 -8719
  19. package/dist/index.js.map +1 -1
  20. package/dist/{list-prompts-J72LTP7Z.js → list-prompts-UQPBCUYA.js} +2 -2
  21. package/dist/list-scenarios-573YOUKC.js +40 -0
  22. package/dist/list-scenarios-573YOUKC.js.map +1 -0
  23. package/dist/{search-traces-RW2NDHN5.js → search-traces-RSMYCAN7.js} +2 -2
  24. package/dist/{update-prompt-G6HHZSUM.js → update-prompt-G2Y5EBQY.js} +2 -2
  25. package/dist/update-scenario-SSGVOBJO.js +27 -0
  26. package/dist/update-scenario-SSGVOBJO.js.map +1 -0
  27. package/package.json +3 -3
  28. package/src/__tests__/scenario-tools.integration.test.ts +286 -0
  29. package/src/__tests__/scenario-tools.unit.test.ts +185 -0
  30. package/src/index.ts +132 -3
  31. package/src/langwatch-api-scenarios.ts +67 -0
  32. package/src/langwatch-api.ts +4 -3
  33. package/src/tools/archive-scenario.ts +19 -0
  34. package/src/tools/create-scenario.ts +30 -0
  35. package/src/tools/discover-scenario-schema.ts +71 -0
  36. package/src/tools/get-scenario.ts +36 -0
  37. package/src/tools/list-scenarios.ts +47 -0
  38. package/src/tools/update-scenario.ts +32 -0
  39. package/uv.lock +1788 -1322
  40. package/dist/chunk-HOPTUDCZ.js.map +0 -1
  41. /package/dist/{create-prompt-UBC537BJ.js.map → create-prompt-P35POKBW.js.map} +0 -0
  42. /package/dist/{get-analytics-3IFTN6MY.js.map → get-analytics-BAVXTAPB.js.map} +0 -0
  43. /package/dist/{get-prompt-2ZB5B3QC.js.map → get-prompt-LKCPT26O.js.map} +0 -0
  44. /package/dist/{get-trace-7IXKKCJJ.js.map → get-trace-QFDWJ5D4.js.map} +0 -0
  45. /package/dist/{list-prompts-J72LTP7Z.js.map → list-prompts-UQPBCUYA.js.map} +0 -0
  46. /package/dist/{search-traces-RW2NDHN5.js.map → search-traces-RSMYCAN7.js.map} +0 -0
  47. /package/dist/{update-prompt-G6HHZSUM.js.map → update-prompt-G2Y5EBQY.js.map} +0 -0
package/CHANGELOG.md CHANGED
@@ -1,5 +1,24 @@
1
1
  # Changelog
2
2
 
3
+ ## [0.5.0](https://github.com/langwatch/langwatch/compare/mcp-server@v0.4.0...mcp-server@v0.5.0) (2026-02-20)
4
+
5
+
6
+ ### Features
7
+
8
+ * add scenario management tools to MCP server ([#1705](https://github.com/langwatch/langwatch/issues/1705)) ([0376fde](https://github.com/langwatch/langwatch/commit/0376fde0abff7b110b4ec5996a399c4b2ceafde0))
9
+
10
+
11
+ ### Miscellaneous
12
+
13
+ * **deps-dev:** bump @eslint/js from 9.35.0 to 9.39.2 in /mcp-server ([#1465](https://github.com/langwatch/langwatch/issues/1465)) ([fbee07d](https://github.com/langwatch/langwatch/commit/fbee07d8b964d0a059eaa32c7685c8bf667898e7))
14
+ * **deps:** bump hono ([f7e8f05](https://github.com/langwatch/langwatch/commit/f7e8f056843958cac4504ae02f37a351457f77ee))
15
+ * **deps:** bump hono from 4.11.9 to 4.12.0 in /mcp-server in the npm_and_yarn group across 1 directory ([#1736](https://github.com/langwatch/langwatch/issues/1736)) ([f7e8f05](https://github.com/langwatch/langwatch/commit/f7e8f056843958cac4504ae02f37a351457f77ee))
16
+ * **deps:** bump node-pty from 1.0.0 to 1.1.0 in /mcp-server ([#1447](https://github.com/langwatch/langwatch/issues/1447)) ([12ad02c](https://github.com/langwatch/langwatch/commit/12ad02c19dcc0ba90ad32f77659816b768188a53))
17
+ * **deps:** bump qs ([f0e9747](https://github.com/langwatch/langwatch/commit/f0e97475becd58dfa523a944fbb3fa0657dfc1dc))
18
+ * **deps:** bump qs from 6.14.1 to 6.14.2 in /mcp-server in the npm_and_yarn group across 1 directory ([#1568](https://github.com/langwatch/langwatch/issues/1568)) ([f0e9747](https://github.com/langwatch/langwatch/commit/f0e97475becd58dfa523a944fbb3fa0657dfc1dc))
19
+ * **deps:** bump the npm_and_yarn group across 1 directory with 8 updates ([#1519](https://github.com/langwatch/langwatch/issues/1519)) ([487e563](https://github.com/langwatch/langwatch/commit/487e5637a941fa9335ec8e951efdf38bb0a02a8c))
20
+ * **deps:** bump the uv group across 1 directory with 7 updates ([#1516](https://github.com/langwatch/langwatch/issues/1516)) ([7f2f178](https://github.com/langwatch/langwatch/commit/7f2f178588d89a63f3b38510844b87de7b528b3b))
21
+
3
22
  ## [0.4.0](https://github.com/langwatch/langwatch/compare/mcp-server@v0.3.3...mcp-server@v0.4.0) (2026-02-08)
4
23
 
5
24
 
@@ -0,0 +1,19 @@
1
+ import {
2
+ archiveScenario
3
+ } from "./chunk-K2YFPOSD.js";
4
+ import "./chunk-JVWDWL3J.js";
5
+ import "./chunk-AAQNA53E.js";
6
+
7
+ // src/tools/archive-scenario.ts
8
+ async function handleArchiveScenario(params) {
9
+ const result = await archiveScenario(params.scenarioId);
10
+ const lines = [];
11
+ lines.push("Scenario archived successfully!\n");
12
+ lines.push(`**ID**: ${result.id}`);
13
+ lines.push(`**Status**: ${result.archived ? "archived" : "active"}`);
14
+ return lines.join("\n");
15
+ }
16
+ export {
17
+ handleArchiveScenario
18
+ };
19
+ //# sourceMappingURL=archive-scenario-GAE4XVFM.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/tools/archive-scenario.ts"],"sourcesContent":["import { archiveScenario as apiArchiveScenario } from \"../langwatch-api-scenarios.js\";\n\n/**\n * Handles the archive_scenario MCP tool invocation.\n *\n * Archives (soft-deletes) a scenario and returns confirmation.\n */\nexport async function handleArchiveScenario(params: {\n scenarioId: string;\n}): Promise<string> {\n const result = await apiArchiveScenario(params.scenarioId);\n\n const lines: string[] = [];\n lines.push(\"Scenario archived successfully!\\n\");\n lines.push(`**ID**: ${result.id}`);\n lines.push(`**Status**: ${result.archived ? \"archived\" : \"active\"}`);\n\n return lines.join(\"\\n\");\n}\n"],"mappings":";;;;;;;AAOA,eAAsB,sBAAsB,QAExB;AAClB,QAAM,SAAS,MAAM,gBAAmB,OAAO,UAAU;AAEzD,QAAM,QAAkB,CAAC;AACzB,QAAM,KAAK,mCAAmC;AAC9C,QAAM,KAAK,WAAW,OAAO,EAAE,EAAE;AACjC,QAAM,KAAK,eAAe,OAAO,WAAW,aAAa,QAAQ,EAAE;AAEnE,SAAO,MAAM,KAAK,IAAI;AACxB;","names":[]}
@@ -9,7 +9,7 @@ async function makeRequest(method, path, body) {
9
9
  const headers = {
10
10
  "X-Auth-Token": requireApiKey()
11
11
  };
12
- if (method === "POST") {
12
+ if (body !== void 0) {
13
13
  headers["Content-Type"] = "application/json";
14
14
  }
15
15
  const response = await fetch(url, {
@@ -78,6 +78,7 @@ async function createPromptVersion(idOrHandle, data) {
78
78
  }
79
79
 
80
80
  export {
81
+ makeRequest,
81
82
  searchTraces,
82
83
  getTraceById,
83
84
  getAnalyticsTimeseries,
@@ -87,4 +88,4 @@ export {
87
88
  updatePrompt,
88
89
  createPromptVersion
89
90
  };
90
- //# sourceMappingURL=chunk-HOPTUDCZ.js.map
91
+ //# sourceMappingURL=chunk-JVWDWL3J.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/langwatch-api.ts"],"sourcesContent":["import { getConfig, requireApiKey } from \"./config.js\";\n\n// --- Response types ---\n\nexport interface TraceSearchResult {\n trace_id: string;\n formatted_trace?: string;\n input?: { value: string };\n output?: { value: string };\n timestamps?: { started_at?: string | number };\n metadata?: Record<string, unknown>;\n error?: Record<string, unknown>;\n}\n\nexport interface SearchTracesResponse {\n traces: TraceSearchResult[];\n pagination?: {\n totalHits?: number;\n scrollId?: string;\n };\n}\n\nexport interface TraceDetailResponse {\n trace_id: string;\n formatted_trace?: string;\n input?: { value: string };\n output?: { value: string };\n timestamps?: {\n started_at?: string | number;\n updated_at?: string | number;\n inserted_at?: string | number;\n };\n metadata?: {\n user_id?: string;\n thread_id?: string;\n customer_id?: string;\n labels?: string[];\n [key: string]: unknown;\n };\n error?: Record<string, unknown>;\n ascii_tree?: string;\n evaluations?: Array<{\n evaluator_id?: string;\n name?: string;\n score?: number;\n passed?: boolean;\n label?: string;\n }>;\n spans?: Array<{\n span_id: string;\n name?: string;\n type?: string;\n model?: string;\n input?: { value: string };\n output?: { value: string };\n timestamps?: { started_at?: number; finished_at?: number };\n metrics?: {\n completion_time_ms?: number;\n prompt_tokens?: number;\n completion_tokens?: number;\n tokens_estimated?: boolean;\n cost?: number;\n };\n }>;\n}\n\nexport interface AnalyticsBucket {\n date: string;\n [key: string]: unknown;\n}\n\nexport interface AnalyticsTimeseriesResponse {\n currentPeriod: AnalyticsBucket[];\n previousPeriod: AnalyticsBucket[];\n}\n\nexport interface PromptSummary {\n id?: string;\n handle?: string;\n name?: string;\n description?: string | null;\n latestVersionNumber?: number;\n version?: number;\n}\n\nexport interface PromptVersion {\n version?: number;\n commitMessage?: string;\n model?: string;\n modelProvider?: string;\n messages?: Array<{ role: string; content: string }>;\n}\n\nexport interface PromptDetailResponse extends PromptSummary {\n versions?: PromptVersion[];\n model?: string;\n modelProvider?: string;\n messages?: Array<{ role: string; content: string }>;\n prompt?: Array<{ role: string; content: string }>;\n}\n\nexport interface PromptMutationResponse {\n id?: string;\n handle?: string;\n name?: string;\n latestVersionNumber?: number;\n}\n\n// --- HTTP client ---\n\n/**\n * Sends an HTTP request to the LangWatch API.\n *\n * Builds the full URL from the configured endpoint, adds authentication,\n * and handles JSON serialization/deserialization.\n *\n * @throws Error with status code and response body when the response is not OK\n */\nexport async function makeRequest(\n method: \"GET\" | \"POST\" | \"PUT\" | \"PATCH\" | \"DELETE\",\n path: string,\n body?: unknown\n): Promise<unknown> {\n const url = getConfig().endpoint + path;\n const headers: Record<string, string> = {\n \"X-Auth-Token\": requireApiKey(),\n };\n\n if (body !== undefined) {\n headers[\"Content-Type\"] = \"application/json\";\n }\n\n const response = await fetch(url, {\n method,\n headers,\n ...(body !== undefined ? { body: JSON.stringify(body) } : {}),\n });\n\n if (!response.ok) {\n const responseBody = await response.text();\n throw new Error(\n `LangWatch API error ${response.status}: ${responseBody}`\n );\n }\n\n return response.json();\n}\n\n/** Searches traces with optional filters and pagination. */\nexport async function searchTraces(params: {\n query?: string;\n filters?: Record<string, string[]>;\n startDate: number;\n endDate: number;\n pageSize?: number;\n pageOffset?: number;\n scrollId?: string;\n format?: \"digest\" | \"json\";\n}): Promise<SearchTracesResponse> {\n const { format = \"digest\", ...rest } = params;\n return makeRequest(\"POST\", \"/api/traces/search\", {\n ...rest,\n format,\n }) as Promise<SearchTracesResponse>;\n}\n\n/** Retrieves a single trace by its ID. */\nexport async function getTraceById(\n traceId: string,\n format: \"digest\" | \"json\" = \"digest\"\n): Promise<TraceDetailResponse> {\n return makeRequest(\n \"GET\",\n `/api/traces/${encodeURIComponent(traceId)}?format=${format}`\n ) as Promise<TraceDetailResponse>;\n}\n\n/** Fetches analytics timeseries data for the given metrics and date range. */\nexport async function getAnalyticsTimeseries(params: {\n series: Array<{\n metric: string;\n aggregation: string;\n key?: string;\n subkey?: string;\n }>;\n startDate: number;\n endDate: number;\n timeZone?: string;\n groupBy?: string;\n groupByKey?: string;\n filters?: Record<string, string[]>;\n}): Promise<AnalyticsTimeseriesResponse> {\n return makeRequest(\n \"POST\",\n \"/api/analytics/timeseries\",\n params\n ) as Promise<AnalyticsTimeseriesResponse>;\n}\n\n/** Lists all prompts in the project. */\nexport async function listPrompts(): Promise<PromptSummary[]> {\n return makeRequest(\"GET\", \"/api/prompts\") as Promise<PromptSummary[]>;\n}\n\n/** Retrieves a single prompt by ID or handle. */\nexport async function getPrompt(\n idOrHandle: string,\n version?: number\n): Promise<PromptDetailResponse> {\n const query = version != null ? `?version=${version}` : \"\";\n return makeRequest(\n \"GET\",\n `/api/prompts/${encodeURIComponent(idOrHandle)}${query}`\n ) as Promise<PromptDetailResponse>;\n}\n\n/** Creates a new prompt. */\nexport async function createPrompt(data: {\n name: string;\n handle?: string;\n messages: Array<{ role: string; content: string }>;\n model: string;\n modelProvider: string;\n description?: string;\n}): Promise<PromptMutationResponse> {\n return makeRequest(\n \"POST\",\n \"/api/prompts\",\n data\n ) as Promise<PromptMutationResponse>;\n}\n\n/** Updates an existing prompt by ID or handle. */\nexport async function updatePrompt(\n idOrHandle: string,\n data: {\n messages?: Array<{ role: string; content: string }>;\n model?: string;\n modelProvider?: string;\n commitMessage?: string;\n }\n): Promise<PromptMutationResponse> {\n return makeRequest(\n \"POST\",\n `/api/prompts/${encodeURIComponent(idOrHandle)}`,\n data\n ) as Promise<PromptMutationResponse>;\n}\n\n/** Creates a new version of an existing prompt. */\nexport async function createPromptVersion(\n idOrHandle: string,\n data: {\n messages?: Array<{ role: string; content: string }>;\n model?: string;\n modelProvider?: string;\n commitMessage?: string;\n }\n): Promise<PromptMutationResponse> {\n return makeRequest(\n \"POST\",\n `/api/prompts/${encodeURIComponent(idOrHandle)}/versions`,\n data\n ) as Promise<PromptMutationResponse>;\n}\n\n"],"mappings":";;;;;;AAsHA,eAAsB,YACpB,QACA,MACA,MACkB;AAClB,QAAM,MAAM,UAAU,EAAE,WAAW;AACnC,QAAM,UAAkC;AAAA,IACtC,gBAAgB,cAAc;AAAA,EAChC;AAEA,MAAI,SAAS,QAAW;AACtB,YAAQ,cAAc,IAAI;AAAA,EAC5B;AAEA,QAAM,WAAW,MAAM,MAAM,KAAK;AAAA,IAChC;AAAA,IACA;AAAA,IACA,GAAI,SAAS,SAAY,EAAE,MAAM,KAAK,UAAU,IAAI,EAAE,IAAI,CAAC;AAAA,EAC7D,CAAC;AAED,MAAI,CAAC,SAAS,IAAI;AAChB,UAAM,eAAe,MAAM,SAAS,KAAK;AACzC,UAAM,IAAI;AAAA,MACR,uBAAuB,SAAS,MAAM,KAAK,YAAY;AAAA,IACzD;AAAA,EACF;AAEA,SAAO,SAAS,KAAK;AACvB;AAGA,eAAsB,aAAa,QASD;AAChC,QAAM,EAAE,SAAS,UAAU,GAAG,KAAK,IAAI;AACvC,SAAO,YAAY,QAAQ,sBAAsB;AAAA,IAC/C,GAAG;AAAA,IACH;AAAA,EACF,CAAC;AACH;AAGA,eAAsB,aACpB,SACA,SAA4B,UACE;AAC9B,SAAO;AAAA,IACL;AAAA,IACA,eAAe,mBAAmB,OAAO,CAAC,WAAW,MAAM;AAAA,EAC7D;AACF;AAGA,eAAsB,uBAAuB,QAaJ;AACvC,SAAO;AAAA,IACL;AAAA,IACA;AAAA,IACA;AAAA,EACF;AACF;AAGA,eAAsB,cAAwC;AAC5D,SAAO,YAAY,OAAO,cAAc;AAC1C;AAGA,eAAsB,UACpB,YACA,SAC+B;AAC/B,QAAM,QAAQ,WAAW,OAAO,YAAY,OAAO,KAAK;AACxD,SAAO;AAAA,IACL;AAAA,IACA,gBAAgB,mBAAmB,UAAU,CAAC,GAAG,KAAK;AAAA,EACxD;AACF;AAGA,eAAsB,aAAa,MAOC;AAClC,SAAO;AAAA,IACL;AAAA,IACA;AAAA,IACA;AAAA,EACF;AACF;AAGA,eAAsB,aACpB,YACA,MAMiC;AACjC,SAAO;AAAA,IACL;AAAA,IACA,gBAAgB,mBAAmB,UAAU,CAAC;AAAA,IAC9C;AAAA,EACF;AACF;AAGA,eAAsB,oBACpB,YACA,MAMiC;AACjC,SAAO;AAAA,IACL;AAAA,IACA,gBAAgB,mBAAmB,UAAU,CAAC;AAAA,IAC9C;AAAA,EACF;AACF;","names":[]}
@@ -0,0 +1,40 @@
1
+ import {
2
+ makeRequest
3
+ } from "./chunk-JVWDWL3J.js";
4
+
5
+ // src/langwatch-api-scenarios.ts
6
+ async function listScenarios() {
7
+ return makeRequest("GET", "/api/scenarios");
8
+ }
9
+ async function getScenario(id) {
10
+ return makeRequest(
11
+ "GET",
12
+ `/api/scenarios/${encodeURIComponent(id)}`
13
+ );
14
+ }
15
+ async function createScenario(data) {
16
+ return makeRequest("POST", "/api/scenarios", data);
17
+ }
18
+ async function updateScenario(params) {
19
+ const { id, ...data } = params;
20
+ return makeRequest(
21
+ "PUT",
22
+ `/api/scenarios/${encodeURIComponent(id)}`,
23
+ data
24
+ );
25
+ }
26
+ async function archiveScenario(id) {
27
+ return makeRequest(
28
+ "DELETE",
29
+ `/api/scenarios/${encodeURIComponent(id)}`
30
+ );
31
+ }
32
+
33
+ export {
34
+ listScenarios,
35
+ getScenario,
36
+ createScenario,
37
+ updateScenario,
38
+ archiveScenario
39
+ };
40
+ //# sourceMappingURL=chunk-K2YFPOSD.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/langwatch-api-scenarios.ts"],"sourcesContent":["import { makeRequest } from \"./langwatch-api.js\";\n\n// --- Scenario types ---\n\nexport interface ScenarioSummary {\n id: string;\n name: string;\n situation: string;\n criteria: string[];\n labels: string[];\n}\n\nexport interface ScenarioArchiveResponse {\n id: string;\n archived: boolean;\n}\n\n// --- Scenario API functions ---\n\n/** Lists all scenarios in the project. */\nexport async function listScenarios(): Promise<ScenarioSummary[]> {\n return makeRequest(\"GET\", \"/api/scenarios\") as Promise<ScenarioSummary[]>;\n}\n\n/** Retrieves a single scenario by ID. */\nexport async function getScenario(id: string): Promise<ScenarioSummary> {\n return makeRequest(\n \"GET\",\n `/api/scenarios/${encodeURIComponent(id)}`\n ) as Promise<ScenarioSummary>;\n}\n\n/** Creates a new scenario. */\nexport async function createScenario(data: {\n name: string;\n situation: string;\n criteria?: string[];\n labels?: string[];\n}): Promise<ScenarioSummary> {\n return makeRequest(\"POST\", \"/api/scenarios\", data) as Promise<ScenarioSummary>;\n}\n\n/** Updates an existing scenario. */\nexport async function updateScenario(params: {\n id: string;\n name?: string;\n situation?: string;\n criteria?: string[];\n labels?: string[];\n}): Promise<ScenarioSummary> {\n const { id, ...data } = params;\n return makeRequest(\n \"PUT\",\n `/api/scenarios/${encodeURIComponent(id)}`,\n data\n ) as Promise<ScenarioSummary>;\n}\n\n/** Archives (soft-deletes) a scenario. */\nexport async function archiveScenario(\n id: string\n): Promise<ScenarioArchiveResponse> {\n return makeRequest(\n \"DELETE\",\n `/api/scenarios/${encodeURIComponent(id)}`\n ) as Promise<ScenarioArchiveResponse>;\n}\n"],"mappings":";;;;;AAoBA,eAAsB,gBAA4C;AAChE,SAAO,YAAY,OAAO,gBAAgB;AAC5C;AAGA,eAAsB,YAAY,IAAsC;AACtE,SAAO;AAAA,IACL;AAAA,IACA,kBAAkB,mBAAmB,EAAE,CAAC;AAAA,EAC1C;AACF;AAGA,eAAsB,eAAe,MAKR;AAC3B,SAAO,YAAY,QAAQ,kBAAkB,IAAI;AACnD;AAGA,eAAsB,eAAe,QAMR;AAC3B,QAAM,EAAE,IAAI,GAAG,KAAK,IAAI;AACxB,SAAO;AAAA,IACL;AAAA,IACA,kBAAkB,mBAAmB,EAAE,CAAC;AAAA,IACxC;AAAA,EACF;AACF;AAGA,eAAsB,gBACpB,IACkC;AAClC,SAAO;AAAA,IACL;AAAA,IACA,kBAAkB,mBAAmB,EAAE,CAAC;AAAA,EAC1C;AACF;","names":[]}
@@ -1,6 +1,6 @@
1
1
  import {
2
2
  createPrompt
3
- } from "./chunk-HOPTUDCZ.js";
3
+ } from "./chunk-JVWDWL3J.js";
4
4
  import "./chunk-AAQNA53E.js";
5
5
 
6
6
  // src/tools/create-prompt.ts
@@ -19,4 +19,4 @@ async function handleCreatePrompt(params) {
19
19
  export {
20
20
  handleCreatePrompt
21
21
  };
22
- //# sourceMappingURL=create-prompt-UBC537BJ.js.map
22
+ //# sourceMappingURL=create-prompt-P35POKBW.js.map
@@ -0,0 +1,26 @@
1
+ import {
2
+ createScenario
3
+ } from "./chunk-K2YFPOSD.js";
4
+ import "./chunk-JVWDWL3J.js";
5
+ import "./chunk-AAQNA53E.js";
6
+
7
+ // src/tools/create-scenario.ts
8
+ async function handleCreateScenario(params) {
9
+ const result = await createScenario(params);
10
+ const lines = [];
11
+ lines.push("Scenario created successfully!\n");
12
+ lines.push(`**ID**: ${result.id}`);
13
+ lines.push(`**Name**: ${result.name}`);
14
+ lines.push(`**Situation**: ${result.situation}`);
15
+ if (Array.isArray(result.criteria) && result.criteria.length > 0) {
16
+ lines.push(`**Criteria**: ${result.criteria.length} criteria`);
17
+ }
18
+ if (Array.isArray(result.labels) && result.labels.length > 0) {
19
+ lines.push(`**Labels**: ${result.labels.join(", ")}`);
20
+ }
21
+ return lines.join("\n");
22
+ }
23
+ export {
24
+ handleCreateScenario
25
+ };
26
+ //# sourceMappingURL=create-scenario-3YRZVDYF.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/tools/create-scenario.ts"],"sourcesContent":["import { createScenario as apiCreateScenario } from \"../langwatch-api-scenarios.js\";\n\n/**\n * Handles the create_scenario MCP tool invocation.\n *\n * Creates a new scenario in the LangWatch project and returns a\n * confirmation with the created scenario's details.\n */\nexport async function handleCreateScenario(params: {\n name: string;\n situation: string;\n criteria?: string[];\n labels?: string[];\n}): Promise<string> {\n const result = await apiCreateScenario(params);\n\n const lines: string[] = [];\n lines.push(\"Scenario created successfully!\\n\");\n lines.push(`**ID**: ${result.id}`);\n lines.push(`**Name**: ${result.name}`);\n lines.push(`**Situation**: ${result.situation}`);\n if (Array.isArray(result.criteria) && result.criteria.length > 0) {\n lines.push(`**Criteria**: ${result.criteria.length} criteria`);\n }\n if (Array.isArray(result.labels) && result.labels.length > 0) {\n lines.push(`**Labels**: ${result.labels.join(\", \")}`);\n }\n\n return lines.join(\"\\n\");\n}\n"],"mappings":";;;;;;;AAQA,eAAsB,qBAAqB,QAKvB;AAClB,QAAM,SAAS,MAAM,eAAkB,MAAM;AAE7C,QAAM,QAAkB,CAAC;AACzB,QAAM,KAAK,kCAAkC;AAC7C,QAAM,KAAK,WAAW,OAAO,EAAE,EAAE;AACjC,QAAM,KAAK,aAAa,OAAO,IAAI,EAAE;AACrC,QAAM,KAAK,kBAAkB,OAAO,SAAS,EAAE;AAC/C,MAAI,MAAM,QAAQ,OAAO,QAAQ,KAAK,OAAO,SAAS,SAAS,GAAG;AAChE,UAAM,KAAK,iBAAiB,OAAO,SAAS,MAAM,WAAW;AAAA,EAC/D;AACA,MAAI,MAAM,QAAQ,OAAO,MAAM,KAAK,OAAO,OAAO,SAAS,GAAG;AAC5D,UAAM,KAAK,eAAe,OAAO,OAAO,KAAK,IAAI,CAAC,EAAE;AAAA,EACtD;AAEA,SAAO,MAAM,KAAK,IAAI;AACxB;","names":[]}
@@ -0,0 +1,65 @@
1
+ // src/tools/discover-scenario-schema.ts
2
+ function formatScenarioSchema() {
3
+ const lines = [];
4
+ lines.push("# Scenario Schema\n");
5
+ lines.push("## Fields\n");
6
+ lines.push(
7
+ '- **name** (required): A short, descriptive name (e.g., "billing dispute resolution", "password reset with 2FA unavailable")'
8
+ );
9
+ lines.push(
10
+ "- **situation** (required): The context that guides the user simulator \u2014 who the user is, what they want, and any constraints (see Writing a Good Situation below)"
11
+ );
12
+ lines.push(
13
+ "- **criteria** (array of strings): Pass/fail conditions a judge evaluates the agent against (see Writing Good Criteria below)"
14
+ );
15
+ lines.push(
16
+ '- **labels** (array of strings): Tags for organizing scenarios (e.g., "auth", "happy-path", "edge-case")'
17
+ );
18
+ lines.push("\n## Writing a Good Situation\n");
19
+ lines.push(
20
+ "The situation drives the user simulator. Include these elements:"
21
+ );
22
+ lines.push("- **Persona**: Who is the user? (e.g., a stressed small business owner, a confused teenager)");
23
+ lines.push("- **Emotional state**: How are they feeling? (e.g., frustrated, anxious, impatient)");
24
+ lines.push("- **Background/Context**: What happened before this conversation?");
25
+ lines.push("- **Intent**: What do they want to accomplish?");
26
+ lines.push("- **Constraints**: What limitations do they have? (e.g., no phone for 2FA, unfamiliar with technical terms)");
27
+ lines.push("\nExample:");
28
+ lines.push("```");
29
+ lines.push("User is a small business owner stressed about tax deadline.");
30
+ lines.push("They need help categorizing expenses but aren't familiar with");
31
+ lines.push("accounting terms. They appreciate patient explanations and examples.");
32
+ lines.push("They have a spreadsheet of transactions but aren't sure which");
33
+ lines.push("categories apply to their consulting business.");
34
+ lines.push("```");
35
+ lines.push("\n## Writing Good Criteria\n");
36
+ lines.push("Criteria are what the judge uses to pass or fail the agent. Each criterion should be:");
37
+ lines.push('- **Specific and testable** \u2014 not vague like "responds helpfully"');
38
+ lines.push("- **Behavioral** \u2014 describes what the agent should *do*, not how it works internally");
39
+ lines.push("- **Independent** \u2014 each criterion checks one thing");
40
+ lines.push("\nGood criteria patterns:");
41
+ lines.push(`- **Information gathering**: "Agent asks for the user's account number before proceeding"`);
42
+ lines.push('- **Safety/guardrails**: "Agent does not reveal internal system details or error stack traces"');
43
+ lines.push('- **Clarification**: "Agent asks clarifying questions before taking irreversible action"');
44
+ lines.push('- **Tone**: "Agent maintains a professional and empathetic tone throughout"');
45
+ lines.push('- **Completeness**: "Agent confirms the user understands the solution before ending"');
46
+ lines.push('- **Domain-specific**: "Agent recommends releasing a wild frog rather than keeping it as a pet"');
47
+ lines.push("\nAvoid vague criteria like:");
48
+ lines.push('- "Responds correctly" \u2014 correct how?');
49
+ lines.push('- "Is helpful" \u2014 helpful in what way?');
50
+ lines.push('- "Works well" \u2014 not testable');
51
+ lines.push("\n## Target Types\n");
52
+ lines.push("Scenarios can target different execution backends:");
53
+ lines.push("- **prompt**: Test a prompt template with variable substitution");
54
+ lines.push("- **http**: Test an HTTP endpoint (e.g., a deployed agent API)");
55
+ lines.push("- **code**: Test a code function directly");
56
+ lines.push("\n## Tips\n");
57
+ lines.push("- Start simple, then layer complexity (add constraints, edge cases)");
58
+ lines.push("- Test edge cases: user changes their mind, gives ambiguous input, makes mistakes");
59
+ lines.push("- Use `fetch_scenario_docs` for the full authoring guide and advanced patterns");
60
+ return lines.join("\n");
61
+ }
62
+ export {
63
+ formatScenarioSchema
64
+ };
65
+ //# sourceMappingURL=discover-scenario-schema-MEEEVND7.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/tools/discover-scenario-schema.ts"],"sourcesContent":["/**\n * Returns a human-readable description of the scenario schema,\n * including field descriptions, authoring guidance, and examples.\n */\nexport function formatScenarioSchema(): string {\n const lines: string[] = [];\n\n lines.push(\"# Scenario Schema\\n\");\n\n lines.push(\"## Fields\\n\");\n lines.push(\n '- **name** (required): A short, descriptive name (e.g., \"billing dispute resolution\", \"password reset with 2FA unavailable\")',\n );\n lines.push(\n \"- **situation** (required): The context that guides the user simulator — who the user is, what they want, and any constraints (see Writing a Good Situation below)\",\n );\n lines.push(\n \"- **criteria** (array of strings): Pass/fail conditions a judge evaluates the agent against (see Writing Good Criteria below)\",\n );\n lines.push(\n '- **labels** (array of strings): Tags for organizing scenarios (e.g., \"auth\", \"happy-path\", \"edge-case\")',\n );\n\n lines.push(\"\\n## Writing a Good Situation\\n\");\n lines.push(\n \"The situation drives the user simulator. Include these elements:\",\n );\n lines.push(\"- **Persona**: Who is the user? (e.g., a stressed small business owner, a confused teenager)\");\n lines.push(\"- **Emotional state**: How are they feeling? (e.g., frustrated, anxious, impatient)\");\n lines.push(\"- **Background/Context**: What happened before this conversation?\");\n lines.push(\"- **Intent**: What do they want to accomplish?\");\n lines.push(\"- **Constraints**: What limitations do they have? (e.g., no phone for 2FA, unfamiliar with technical terms)\");\n lines.push(\"\\nExample:\");\n lines.push(\"```\");\n lines.push(\"User is a small business owner stressed about tax deadline.\");\n lines.push(\"They need help categorizing expenses but aren't familiar with\");\n lines.push(\"accounting terms. They appreciate patient explanations and examples.\");\n lines.push(\"They have a spreadsheet of transactions but aren't sure which\");\n lines.push(\"categories apply to their consulting business.\");\n lines.push(\"```\");\n\n lines.push(\"\\n## Writing Good Criteria\\n\");\n lines.push(\"Criteria are what the judge uses to pass or fail the agent. Each criterion should be:\");\n lines.push(\"- **Specific and testable** — not vague like \\\"responds helpfully\\\"\");\n lines.push(\"- **Behavioral** — describes what the agent should *do*, not how it works internally\");\n lines.push(\"- **Independent** — each criterion checks one thing\");\n lines.push(\"\\nGood criteria patterns:\");\n lines.push(\"- **Information gathering**: \\\"Agent asks for the user's account number before proceeding\\\"\");\n lines.push(\"- **Safety/guardrails**: \\\"Agent does not reveal internal system details or error stack traces\\\"\");\n lines.push(\"- **Clarification**: \\\"Agent asks clarifying questions before taking irreversible action\\\"\");\n lines.push(\"- **Tone**: \\\"Agent maintains a professional and empathetic tone throughout\\\"\");\n lines.push(\"- **Completeness**: \\\"Agent confirms the user understands the solution before ending\\\"\");\n lines.push(\"- **Domain-specific**: \\\"Agent recommends releasing a wild frog rather than keeping it as a pet\\\"\");\n lines.push(\"\\nAvoid vague criteria like:\");\n lines.push('- \"Responds correctly\" — correct how?');\n lines.push('- \"Is helpful\" — helpful in what way?');\n lines.push('- \"Works well\" — not testable');\n\n lines.push(\"\\n## Target Types\\n\");\n lines.push(\"Scenarios can target different execution backends:\");\n lines.push(\"- **prompt**: Test a prompt template with variable substitution\");\n lines.push(\"- **http**: Test an HTTP endpoint (e.g., a deployed agent API)\");\n lines.push(\"- **code**: Test a code function directly\");\n\n lines.push(\"\\n## Tips\\n\");\n lines.push(\"- Start simple, then layer complexity (add constraints, edge cases)\");\n lines.push(\"- Test edge cases: user changes their mind, gives ambiguous input, makes mistakes\");\n lines.push(\"- Use `fetch_scenario_docs` for the full authoring guide and advanced patterns\");\n\n return lines.join(\"\\n\");\n}\n"],"mappings":";AAIO,SAAS,uBAA+B;AAC7C,QAAM,QAAkB,CAAC;AAEzB,QAAM,KAAK,qBAAqB;AAEhC,QAAM,KAAK,aAAa;AACxB,QAAM;AAAA,IACJ;AAAA,EACF;AACA,QAAM;AAAA,IACJ;AAAA,EACF;AACA,QAAM;AAAA,IACJ;AAAA,EACF;AACA,QAAM;AAAA,IACJ;AAAA,EACF;AAEA,QAAM,KAAK,iCAAiC;AAC5C,QAAM;AAAA,IACJ;AAAA,EACF;AACA,QAAM,KAAK,8FAA8F;AACzG,QAAM,KAAK,qFAAqF;AAChG,QAAM,KAAK,mEAAmE;AAC9E,QAAM,KAAK,gDAAgD;AAC3D,QAAM,KAAK,6GAA6G;AACxH,QAAM,KAAK,YAAY;AACvB,QAAM,KAAK,KAAK;AAChB,QAAM,KAAK,6DAA6D;AACxE,QAAM,KAAK,+DAA+D;AAC1E,QAAM,KAAK,sEAAsE;AACjF,QAAM,KAAK,+DAA+D;AAC1E,QAAM,KAAK,gDAAgD;AAC3D,QAAM,KAAK,KAAK;AAEhB,QAAM,KAAK,8BAA8B;AACzC,QAAM,KAAK,uFAAuF;AAClG,QAAM,KAAK,wEAAqE;AAChF,QAAM,KAAK,2FAAsF;AACjG,QAAM,KAAK,0DAAqD;AAChE,QAAM,KAAK,2BAA2B;AACtC,QAAM,KAAK,2FAA6F;AACxG,QAAM,KAAK,gGAAkG;AAC7G,QAAM,KAAK,0FAA4F;AACvG,QAAM,KAAK,6EAA+E;AAC1F,QAAM,KAAK,sFAAwF;AACnG,QAAM,KAAK,iGAAmG;AAC9G,QAAM,KAAK,8BAA8B;AACzC,QAAM,KAAK,4CAAuC;AAClD,QAAM,KAAK,4CAAuC;AAClD,QAAM,KAAK,oCAA+B;AAE1C,QAAM,KAAK,qBAAqB;AAChC,QAAM,KAAK,oDAAoD;AAC/D,QAAM,KAAK,iEAAiE;AAC5E,QAAM,KAAK,gEAAgE;AAC3E,QAAM,KAAK,2CAA2C;AAEtD,QAAM,KAAK,aAAa;AACxB,QAAM,KAAK,qEAAqE;AAChF,QAAM,KAAK,mFAAmF;AAC9F,QAAM,KAAK,gFAAgF;AAE3F,SAAO,MAAM,KAAK,IAAI;AACxB;","names":[]}
@@ -3,7 +3,7 @@ import {
3
3
  } from "./chunk-ZXKLPC2E.js";
4
4
  import {
5
5
  getAnalyticsTimeseries
6
- } from "./chunk-HOPTUDCZ.js";
6
+ } from "./chunk-JVWDWL3J.js";
7
7
  import "./chunk-AAQNA53E.js";
8
8
 
9
9
  // src/tools/get-analytics.ts
@@ -52,4 +52,4 @@ async function handleGetAnalytics(params) {
52
52
  export {
53
53
  handleGetAnalytics
54
54
  };
55
- //# sourceMappingURL=get-analytics-3IFTN6MY.js.map
55
+ //# sourceMappingURL=get-analytics-BAVXTAPB.js.map
@@ -1,6 +1,6 @@
1
1
  import {
2
2
  getPrompt
3
- } from "./chunk-HOPTUDCZ.js";
3
+ } from "./chunk-JVWDWL3J.js";
4
4
  import "./chunk-AAQNA53E.js";
5
5
 
6
6
  // src/tools/get-prompt.ts
@@ -45,4 +45,4 @@ async function handleGetPrompt(params) {
45
45
  export {
46
46
  handleGetPrompt
47
47
  };
48
- //# sourceMappingURL=get-prompt-2ZB5B3QC.js.map
48
+ //# sourceMappingURL=get-prompt-LKCPT26O.js.map
@@ -0,0 +1,33 @@
1
+ import {
2
+ getScenario
3
+ } from "./chunk-K2YFPOSD.js";
4
+ import "./chunk-JVWDWL3J.js";
5
+ import "./chunk-AAQNA53E.js";
6
+
7
+ // src/tools/get-scenario.ts
8
+ async function handleGetScenario(params) {
9
+ const scenario = await getScenario(params.scenarioId);
10
+ if (params.format === "json") {
11
+ return JSON.stringify(scenario, null, 2);
12
+ }
13
+ const lines = [];
14
+ lines.push(`# Scenario: ${scenario.name}
15
+ `);
16
+ lines.push(`**ID**: ${scenario.id}`);
17
+ lines.push(`**Situation**: ${scenario.situation}`);
18
+ if (Array.isArray(scenario.criteria) && scenario.criteria.length > 0) {
19
+ lines.push("\n## Criteria");
20
+ for (const criterion of scenario.criteria) {
21
+ lines.push(`- ${criterion}`);
22
+ }
23
+ }
24
+ if (Array.isArray(scenario.labels) && scenario.labels.length > 0) {
25
+ lines.push(`
26
+ **Labels**: ${scenario.labels.join(", ")}`);
27
+ }
28
+ return lines.join("\n");
29
+ }
30
+ export {
31
+ handleGetScenario
32
+ };
33
+ //# sourceMappingURL=get-scenario-3SCDW4Z6.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../src/tools/get-scenario.ts"],"sourcesContent":["import { getScenario as apiGetScenario } from \"../langwatch-api-scenarios.js\";\n\n/**\n * Handles the get_scenario MCP tool invocation.\n *\n * Retrieves a specific scenario by ID and formats it as\n * AI-readable markdown or raw JSON.\n */\nexport async function handleGetScenario(params: {\n scenarioId: string;\n format?: \"digest\" | \"json\";\n}): Promise<string> {\n const scenario = await apiGetScenario(params.scenarioId);\n\n if (params.format === \"json\") {\n return JSON.stringify(scenario, null, 2);\n }\n\n const lines: string[] = [];\n lines.push(`# Scenario: ${scenario.name}\\n`);\n lines.push(`**ID**: ${scenario.id}`);\n lines.push(`**Situation**: ${scenario.situation}`);\n\n if (Array.isArray(scenario.criteria) && scenario.criteria.length > 0) {\n lines.push(\"\\n## Criteria\");\n for (const criterion of scenario.criteria) {\n lines.push(`- ${criterion}`);\n }\n }\n\n if (Array.isArray(scenario.labels) && scenario.labels.length > 0) {\n lines.push(`\\n**Labels**: ${scenario.labels.join(\", \")}`);\n }\n\n return lines.join(\"\\n\");\n}\n"],"mappings":";;;;;;;AAQA,eAAsB,kBAAkB,QAGpB;AAClB,QAAM,WAAW,MAAM,YAAe,OAAO,UAAU;AAEvD,MAAI,OAAO,WAAW,QAAQ;AAC5B,WAAO,KAAK,UAAU,UAAU,MAAM,CAAC;AAAA,EACzC;AAEA,QAAM,QAAkB,CAAC;AACzB,QAAM,KAAK,eAAe,SAAS,IAAI;AAAA,CAAI;AAC3C,QAAM,KAAK,WAAW,SAAS,EAAE,EAAE;AACnC,QAAM,KAAK,kBAAkB,SAAS,SAAS,EAAE;AAEjD,MAAI,MAAM,QAAQ,SAAS,QAAQ,KAAK,SAAS,SAAS,SAAS,GAAG;AACpE,UAAM,KAAK,eAAe;AAC1B,eAAW,aAAa,SAAS,UAAU;AACzC,YAAM,KAAK,KAAK,SAAS,EAAE;AAAA,IAC7B;AAAA,EACF;AAEA,MAAI,MAAM,QAAQ,SAAS,MAAM,KAAK,SAAS,OAAO,SAAS,GAAG;AAChE,UAAM,KAAK;AAAA,cAAiB,SAAS,OAAO,KAAK,IAAI,CAAC,EAAE;AAAA,EAC1D;AAEA,SAAO,MAAM,KAAK,IAAI;AACxB;","names":[]}
@@ -1,6 +1,6 @@
1
1
  import {
2
2
  getTraceById
3
- } from "./chunk-HOPTUDCZ.js";
3
+ } from "./chunk-JVWDWL3J.js";
4
4
  import "./chunk-AAQNA53E.js";
5
5
 
6
6
  // src/tools/get-trace.ts
@@ -47,4 +47,4 @@ ${result.formatted_trace}`);
47
47
  export {
48
48
  handleGetTrace
49
49
  };
50
- //# sourceMappingURL=get-trace-7IXKKCJJ.js.map
50
+ //# sourceMappingURL=get-trace-QFDWJ5D4.js.map