@inkeep/agents-api 0.47.2 → 0.47.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48) hide show
  1. package/dist/.well-known/workflow/v1/flow.cjs +44 -44
  2. package/dist/.well-known/workflow/v1/flow.cjs.debug.json +2 -2
  3. package/dist/.well-known/workflow/v1/step.cjs +180 -134
  4. package/dist/.well-known/workflow/v1/step.cjs.debug.json +2 -2
  5. package/dist/createApp.d.ts +2 -2
  6. package/dist/createApp.js +1 -1
  7. package/dist/domains/evals/routes/evaluationTriggers.js +1 -1
  8. package/dist/domains/evals/services/conversationEvaluation.js +21 -10
  9. package/dist/domains/evals/workflow/routes.d.ts +2 -2
  10. package/dist/domains/manage/routes/availableAgents.d.ts +2 -2
  11. package/dist/domains/manage/routes/conversations.d.ts +2 -2
  12. package/dist/domains/manage/routes/index.d.ts +2 -2
  13. package/dist/domains/manage/routes/invitations.d.ts +2 -2
  14. package/dist/domains/manage/routes/mcp.d.ts +2 -2
  15. package/dist/domains/manage/routes/passwordResetLinks.d.ts +2 -2
  16. package/dist/domains/manage/routes/signoz.d.ts +2 -2
  17. package/dist/domains/manage/routes/triggers.js +110 -1
  18. package/dist/domains/manage/routes/users.d.ts +2 -2
  19. package/dist/domains/mcp/routes/mcp.d.ts +2 -2
  20. package/dist/domains/run/agents/Agent.js +19 -15
  21. package/dist/domains/run/agents/generateTaskHandler.js +1 -1
  22. package/dist/domains/run/agents/relationTools.d.ts +2 -2
  23. package/dist/domains/run/agents/relationTools.js +1 -1
  24. package/dist/domains/run/constants/execution-limits/index.js +5 -1
  25. package/dist/domains/run/handlers/executionHandler.js +6 -6
  26. package/dist/domains/run/routes/chat.js +4 -4
  27. package/dist/domains/run/routes/chatDataStream.js +4 -4
  28. package/dist/domains/run/routes/mcp.js +2 -2
  29. package/dist/domains/run/services/PendingToolApprovalManager.js +1 -1
  30. package/dist/domains/run/services/ToolApprovalUiBus.d.ts +1 -0
  31. package/dist/domains/run/services/ToolApprovalUiBus.js +2 -1
  32. package/dist/domains/run/services/TriggerService.d.ts +16 -2
  33. package/dist/domains/run/services/TriggerService.js +2 -2
  34. package/dist/domains/run/utils/model-context-utils.js +4 -2
  35. package/dist/domains/run/utils/token-estimator.d.ts +2 -2
  36. package/dist/domains/run/utils/tool-result.d.ts +11 -0
  37. package/dist/domains/run/utils/tool-result.js +15 -0
  38. package/dist/factory.d.ts +263 -263
  39. package/dist/index.d.ts +260 -260
  40. package/dist/middleware/evalsAuth.d.ts +2 -2
  41. package/dist/middleware/projectAccess.d.ts +2 -2
  42. package/dist/middleware/projectConfig.d.ts +3 -3
  43. package/dist/middleware/requirePermission.d.ts +2 -2
  44. package/dist/middleware/runAuth.d.ts +4 -4
  45. package/dist/middleware/sessionAuth.d.ts +3 -3
  46. package/dist/middleware/tenantAccess.d.ts +2 -2
  47. package/dist/middleware/tracing.d.ts +3 -3
  48. package/package.json +5 -5
@@ -45157,52 +45157,14 @@ var workflowCode = `globalThis.__private_workflows = new Map();
45157
45157
  var __defProp = Object.defineProperty;
45158
45158
  var __name = (target, value) => __defProp(target, "name", { value, configurable: true });
45159
45159
 
45160
- // src/domains/evals/workflow/functions/evaluateConversation.ts
45161
- var getConversationStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep");
45162
- var getEvaluatorsStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep");
45163
- var executeEvaluatorStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep");
45164
- var logStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep");
45165
- async function _evaluateConversationWorkflow(payload) {
45166
- const { conversationId, evaluatorIds } = payload;
45167
- await logStep("Starting conversation evaluation", payload);
45168
- const conversation = await getConversationStep(payload);
45169
- const evaluators = await getEvaluatorsStep(payload);
45170
- if (evaluators.length === 0) {
45171
- await logStep("No valid evaluators found", {
45172
- conversationId,
45173
- evaluatorIds
45174
- });
45175
- return {
45176
- success: false,
45177
- reason: "No valid evaluators"
45178
- };
45179
- }
45180
- const results = [];
45181
- for (const evaluator of evaluators) {
45182
- const result = await executeEvaluatorStep(payload, evaluator.id, conversation);
45183
- results.push(result);
45184
- }
45185
- return {
45186
- success: true,
45187
- conversationId,
45188
- resultCount: results.length
45189
- };
45190
- }
45191
- __name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
45192
- _evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
45193
- globalThis.__private_workflows.set("workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow", _evaluateConversationWorkflow);
45194
- var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
45195
- workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
45196
- });
45197
-
45198
45160
  // src/domains/evals/workflow/functions/runDatasetItem.ts
45199
45161
  var callChatApiStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep");
45200
45162
  var createRelationStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep");
45201
- var executeEvaluatorStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep");
45202
- var logStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep");
45163
+ var executeEvaluatorStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep");
45164
+ var logStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep");
45203
45165
  async function _runDatasetItemWorkflow(payload) {
45204
45166
  const { datasetItemId, datasetRunId, agentId, evaluatorIds, evaluationRunId } = payload;
45205
- await logStep2("Starting dataset item processing", {
45167
+ await logStep("Starting dataset item processing", {
45206
45168
  datasetItemId,
45207
45169
  datasetRunId,
45208
45170
  agentId,
@@ -45213,11 +45175,11 @@ async function _runDatasetItemWorkflow(payload) {
45213
45175
  await createRelationStep(payload, result.conversationId);
45214
45176
  if (evaluatorIds && evaluatorIds.length > 0 && evaluationRunId) {
45215
45177
  for (const evaluatorId of evaluatorIds) {
45216
- await executeEvaluatorStep2(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);
45178
+ await executeEvaluatorStep(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);
45217
45179
  }
45218
45180
  }
45219
45181
  } else {
45220
- await logStep2("No conversation created", {
45182
+ await logStep("No conversation created", {
45221
45183
  datasetItemId,
45222
45184
  datasetRunId,
45223
45185
  error: result.error
@@ -45237,7 +45199,45 @@ globalThis.__private_workflows.set("workflow//src/domains/evals/workflow/functio
45237
45199
  var runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {
45238
45200
  workflowId: "workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow"
45239
45201
  });
45240
- //# sourceMappingURL=data:application/json;base64,{
  "version": 3,
  "sources": ["src/domains/evals/workflow/functions/evaluateConversation.ts", "src/domains/evals/workflow/functions/runDatasetItem.ts"],
  "sourcesContent": ["/**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"_evaluateConversationWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\"},\"getConversationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\"},\"getEvaluatorsStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\"}}}}*/;\nvar getConversationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\");\nvar getEvaluatorsStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\");\nvar executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\");\n/**\n * Main workflow function - orchestrates the evaluation steps.\n *\n * IMPORTANT: This runs in a deterministic sandbox.\n * - Do NOT call Node.js APIs directly here (no DB, no fs, etc.)\n * - All side effects must happen in step functions\n */ async function _evaluateConversationWorkflow(payload) {\n    const { conversationId, evaluatorIds } = payload;\n    await logStep('Starting conversation evaluation', payload);\n    const conversation = await getConversationStep(payload);\n    const evaluators = await getEvaluatorsStep(payload);\n    if (evaluators.length === 0) {\n        await logStep('No valid evaluators found', {\n            conversationId,\n            evaluatorIds\n        });\n        return {\n            success: false,\n            reason: 'No valid evaluators'\n        };\n    }\n    const results = [];\n    for (const evaluator of evaluators){\n        const result = await executeEvaluatorStep(payload, evaluator.id, conversation);\n        results.push(result);\n    }\n    return {\n        success: true,\n        conversationId,\n        resultCount: results.length\n    };\n}\n_evaluateConversationWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\", _evaluateConversationWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow'\n});\n", "/**\n * Workflow for running dataset items through the chat API.\n *\n * This makes dataset run processing fire-and-forget - each item is queued\n * independently and processed in parallel by the workflow system.\n */ /**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"_runDatasetItemWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"callChatApiStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\"},\"createRelationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\"},\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\"}}}}*/;\n/**\n * Step: Call the chat API to process the dataset item\n */ var callChatApiStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\");\n/**\n * Step: Create conversation relation in database\n */ var createRelationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\");\n/**\n * Step: Execute a single evaluator on a conversation\n */ var executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\");\n/**\n * Main workflow function - processes a single dataset item through the chat API.\n * Optionally runs evaluators on the resulting conversation.\n */ async function _runDatasetItemWorkflow(payload) {\n    const { datasetItemId, datasetRunId, agentId, evaluatorIds, evaluationRunId } = payload;\n    await logStep('Starting dataset item processing', {\n        datasetItemId,\n        datasetRunId,\n        agentId,\n        hasEvaluators: !!(evaluatorIds && evaluatorIds.length > 0)\n    });\n    // Call chat API\n    const result = await callChatApiStep(payload);\n    // Create relation if we got a conversation\n    if (result.conversationId) {\n        await createRelationStep(payload, result.conversationId);\n        // Run evaluations if configured\n        if (evaluatorIds && evaluatorIds.length > 0 && evaluationRunId) {\n            for (const evaluatorId of evaluatorIds){\n                await executeEvaluatorStep(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);\n            }\n        }\n    } else {\n        await logStep('No conversation created', {\n            datasetItemId,\n            datasetRunId,\n            error: result.error\n        });\n    }\n    return {\n        success: !result.error,\n        datasetItemId,\n        datasetRunId,\n        conversationId: result.conversationId || null,\n        error: result.error || null\n    };\n}\n_runDatasetItemWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\", _runDatasetItemWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow'\n});\n"],
  "mappings": ";;;;;AACA,IAAI,sBAAsB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,yFAAyF;AAC/J,IAAI,oBAAoB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uFAAuF;AAC3J,IAAI,uBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,0FAA0F;AAG7J,IAAI,UAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,6EAA6E;AAOvI,eAAe,8BAA8B,SAAS;AACtD,QAAM,EAAE,gBAAgB,aAAa,IAAI;AACzC,QAAM,QAAQ,oCAAoC,OAAO;AACzD,QAAM,eAAe,MAAM,oBAAoB,OAAO;AACtD,QAAM,aAAa,MAAM,kBAAkB,OAAO;AAClD,MAAI,WAAW,WAAW,GAAG;AACzB,UAAM,QAAQ,6BAA6B;AAAA,MACvC;AAAA,MACA;AAAA,IACJ,CAAC;AACD,WAAO;AAAA,MACH,SAAS;AAAA,MACT,QAAQ;AAAA,IACZ;AAAA,EACJ;AACA,QAAM,UAAU,CAAC;AACjB,aAAW,aAAa,YAAW;AAC/B,UAAM,SAAS,MAAM,qBAAqB,SAAS,UAAU,IAAI,YAAY;AAC7E,YAAQ,KAAK,MAAM;AAAA,EACvB;AACA,SAAO;AAAA,IACH,SAAS;AAAA,IACT;AAAA,IACA,aAAa,QAAQ;AAAA,EACzB;AACJ;AAzBmB;AA0BnB,8BAA8B,aAAa;AAC3C,WAAW,oBAAoB,IAAI,yGAAyG,6BAA6B;AAElK,IAAM,+BAA+B,OAAO,OAAO,+BAA+B;AAAA,EACrF,YAAY;AAChB,CAAC;;;ACpCG,IAAI,kBAAkB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,+EAA+E;AAGjJ,IAAI,qBAAqB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,kFAAkF;AAGvJ,IAAIA,wBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,oFAAoF;AAG3J,IAAIC,WAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uEAAuE;AAIjI,eAAe,wBAAwB,SAAS;AAChD,QAAM,EAAE,eAAe,cAAc,SAAS,cAAc,gBAAgB,IAAI;AAChF,QAAMA,SAAQ,oCAAoC;AAAA,IAC9C;AAAA,IACA;AAAA,IACA;AAAA,IACA,eAAe,CAAC,EAAE,gBAAgB,aAAa,SAAS;AAAA,EAC5D,CAAC;AAED,QAAM,SAAS,MAAM,gBAAgB,OAAO;AAE5C,MAAI,OAAO,gBAAgB;AACvB,UAAM,mBAAmB,SAAS,OAAO,cAAc;AAEvD,QAAI,gBAAgB,aAAa,SAAS,KAAK,iBAAiB;AAC5D,iBAAW,eAAe,cAAa;AACnC,cAAMD,sBAAqB,QAAQ,UAAU,QAAQ,WAAW,OAAO,gBAAgB,aAAa,iBAAiB,QAAQ,yBAAyB;AAAA,MAC1J;AAAA,IACJ;AAAA,EACJ,OAAO;AACH,UAAMC,SAAQ,2BAA2B;AAAA,MACrC;AAAA,MACA;AAAA,MACA,OAAO,OAAO;AAAA,IAClB,CAAC;AAAA,EACL;AACA,SAAO;AAAA,IACH,SAAS,CAAC,OAAO;AAAA,IACjB;AAAA,IACA;AAAA,IACA,gBAAgB,OAAO,kBAAkB;AAAA,IACzC,OAAO,OAAO,SAAS;AAAA,EAC3B;AACJ;AAjCmB;AAkCnB,wBAAwB,aAAa;AACrC,WAAW,oBAAoB,IAAI,6FAA6F,uBAAuB;AAEhJ,IAAM,yBAAyB,OAAO,OAAO,yBAAyB;AAAA,EACzE,YAAY;AAChB,CAAC;",
  "names": ["executeEvaluatorStep", "logStep"]
}

45202
+
45203
+ // src/domains/evals/workflow/functions/evaluateConversation.ts
45204
+ var getConversationStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep");
45205
+ var getEvaluatorsStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep");
45206
+ var executeEvaluatorStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep");
45207
+ var logStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep");
45208
+ async function _evaluateConversationWorkflow(payload) {
45209
+ const { conversationId, evaluatorIds } = payload;
45210
+ await logStep2("Starting conversation evaluation", payload);
45211
+ const conversation = await getConversationStep(payload);
45212
+ const evaluators = await getEvaluatorsStep(payload);
45213
+ if (evaluators.length === 0) {
45214
+ await logStep2("No valid evaluators found", {
45215
+ conversationId,
45216
+ evaluatorIds
45217
+ });
45218
+ return {
45219
+ success: false,
45220
+ reason: "No valid evaluators"
45221
+ };
45222
+ }
45223
+ const results = [];
45224
+ for (const evaluator of evaluators) {
45225
+ const result = await executeEvaluatorStep2(payload, evaluator.id, conversation);
45226
+ results.push(result);
45227
+ }
45228
+ return {
45229
+ success: true,
45230
+ conversationId,
45231
+ resultCount: results.length
45232
+ };
45233
+ }
45234
+ __name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
45235
+ _evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
45236
+ globalThis.__private_workflows.set("workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow", _evaluateConversationWorkflow);
45237
+ var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
45238
+ workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
45239
+ });
45240
+ //# sourceMappingURL=data:application/json;base64,{
  "version": 3,
  "sources": ["src/domains/evals/workflow/functions/runDatasetItem.ts", "src/domains/evals/workflow/functions/evaluateConversation.ts"],
  "sourcesContent": ["/**\n * Workflow for running dataset items through the chat API.\n *\n * This makes dataset run processing fire-and-forget - each item is queued\n * independently and processed in parallel by the workflow system.\n */ /**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"_runDatasetItemWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"callChatApiStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\"},\"createRelationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\"},\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\"}}}}*/;\n/**\n * Step: Call the chat API to process the dataset item\n */ var callChatApiStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\");\n/**\n * Step: Create conversation relation in database\n */ var createRelationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\");\n/**\n * Step: Execute a single evaluator on a conversation\n */ var executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\");\n/**\n * Main workflow function - processes a single dataset item through the chat API.\n * Optionally runs evaluators on the resulting conversation.\n */ async function _runDatasetItemWorkflow(payload) {\n    const { datasetItemId, datasetRunId, agentId, evaluatorIds, evaluationRunId } = payload;\n    await logStep('Starting dataset item processing', {\n        datasetItemId,\n        datasetRunId,\n        agentId,\n        hasEvaluators: !!(evaluatorIds && evaluatorIds.length > 0)\n    });\n    // Call chat API\n    const result = await callChatApiStep(payload);\n    // Create relation if we got a conversation\n    if (result.conversationId) {\n        await createRelationStep(payload, result.conversationId);\n        // Run evaluations if configured\n        if (evaluatorIds && evaluatorIds.length > 0 && evaluationRunId) {\n            for (const evaluatorId of evaluatorIds){\n                await executeEvaluatorStep(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);\n            }\n        }\n    } else {\n        await logStep('No conversation created', {\n            datasetItemId,\n            datasetRunId,\n            error: result.error\n        });\n    }\n    return {\n        success: !result.error,\n        datasetItemId,\n        datasetRunId,\n        conversationId: result.conversationId || null,\n        error: result.error || null\n    };\n}\n_runDatasetItemWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\", _runDatasetItemWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow'\n});\n", "/**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"_evaluateConversationWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\"},\"getConversationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\"},\"getEvaluatorsStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\"}}}}*/;\nvar getConversationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\");\nvar getEvaluatorsStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\");\nvar executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\");\n/**\n * Main workflow function - orchestrates the evaluation steps.\n *\n * IMPORTANT: This runs in a deterministic sandbox.\n * - Do NOT call Node.js APIs directly here (no DB, no fs, etc.)\n * - All side effects must happen in step functions\n */ async function _evaluateConversationWorkflow(payload) {\n    const { conversationId, evaluatorIds } = payload;\n    await logStep('Starting conversation evaluation', payload);\n    const conversation = await getConversationStep(payload);\n    const evaluators = await getEvaluatorsStep(payload);\n    if (evaluators.length === 0) {\n        await logStep('No valid evaluators found', {\n            conversationId,\n            evaluatorIds\n        });\n        return {\n            success: false,\n            reason: 'No valid evaluators'\n        };\n    }\n    const results = [];\n    for (const evaluator of evaluators){\n        const result = await executeEvaluatorStep(payload, evaluator.id, conversation);\n        results.push(result);\n    }\n    return {\n        success: true,\n        conversationId,\n        resultCount: results.length\n    };\n}\n_evaluateConversationWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\", _evaluateConversationWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow'\n});\n"],
  "mappings": ";;;;;AAQI,IAAI,kBAAkB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,+EAA+E;AAGjJ,IAAI,qBAAqB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,kFAAkF;AAGvJ,IAAI,uBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,oFAAoF;AAG3J,IAAI,UAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uEAAuE;AAIjI,eAAe,wBAAwB,SAAS;AAChD,QAAM,EAAE,eAAe,cAAc,SAAS,cAAc,gBAAgB,IAAI;AAChF,QAAM,QAAQ,oCAAoC;AAAA,IAC9C;AAAA,IACA;AAAA,IACA;AAAA,IACA,eAAe,CAAC,EAAE,gBAAgB,aAAa,SAAS;AAAA,EAC5D,CAAC;AAED,QAAM,SAAS,MAAM,gBAAgB,OAAO;AAE5C,MAAI,OAAO,gBAAgB;AACvB,UAAM,mBAAmB,SAAS,OAAO,cAAc;AAEvD,QAAI,gBAAgB,aAAa,SAAS,KAAK,iBAAiB;AAC5D,iBAAW,eAAe,cAAa;AACnC,cAAM,qBAAqB,QAAQ,UAAU,QAAQ,WAAW,OAAO,gBAAgB,aAAa,iBAAiB,QAAQ,yBAAyB;AAAA,MAC1J;AAAA,IACJ;AAAA,EACJ,OAAO;AACH,UAAM,QAAQ,2BAA2B;AAAA,MACrC;AAAA,MACA;AAAA,MACA,OAAO,OAAO;AAAA,IAClB,CAAC;AAAA,EACL;AACA,SAAO;AAAA,IACH,SAAS,CAAC,OAAO;AAAA,IACjB;AAAA,IACA;AAAA,IACA,gBAAgB,OAAO,kBAAkB;AAAA,IACzC,OAAO,OAAO,SAAS;AAAA,EAC3B;AACJ;AAjCmB;AAkCnB,wBAAwB,aAAa;AACrC,WAAW,oBAAoB,IAAI,6FAA6F,uBAAuB;AAEhJ,IAAM,yBAAyB,OAAO,OAAO,yBAAyB;AAAA,EACzE,YAAY;AAChB,CAAC;;;AC3DD,IAAI,sBAAsB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,yFAAyF;AAC/J,IAAI,oBAAoB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uFAAuF;AAC3J,IAAIA,wBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,0FAA0F;AAG7J,IAAIC,WAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,6EAA6E;AAOvI,eAAe,8BAA8B,SAAS;AACtD,QAAM,EAAE,gBAAgB,aAAa,IAAI;AACzC,QAAMA,SAAQ,oCAAoC,OAAO;AACzD,QAAM,eAAe,MAAM,oBAAoB,OAAO;AACtD,QAAM,aAAa,MAAM,kBAAkB,OAAO;AAClD,MAAI,WAAW,WAAW,GAAG;AACzB,UAAMA,SAAQ,6BAA6B;AAAA,MACvC;AAAA,MACA;AAAA,IACJ,CAAC;AACD,WAAO;AAAA,MACH,SAAS;AAAA,MACT,QAAQ;AAAA,IACZ;AAAA,EACJ;AACA,QAAM,UAAU,CAAC;AACjB,aAAW,aAAa,YAAW;AAC/B,UAAM,SAAS,MAAMD,sBAAqB,SAAS,UAAU,IAAI,YAAY;AAC7E,YAAQ,KAAK,MAAM;AAAA,EACvB;AACA,SAAO;AAAA,IACH,SAAS;AAAA,IACT;AAAA,IACA,aAAa,QAAQ;AAAA,EACzB;AACJ;AAzBmB;AA0BnB,8BAA8B,aAAa;AAC3C,WAAW,oBAAoB,IAAI,yGAAyG,6BAA6B;AAElK,IAAM,+BAA+B,OAAO,OAAO,+BAA+B;AAAA,EACrF,YAAY;AAChB,CAAC;",
  "names": ["executeEvaluatorStep", "logStep"]
}

45241
45241
  `;
45242
45242
  var POST = workflowEntrypoint(workflowCode);
45243
45243
  // Annotate the CommonJS export names for ESM import in node:
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "workflowFiles": [
3
- "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts",
4
- "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts"
3
+ "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts",
4
+ "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts"
5
5
  ]
6
6
  }
@@ -143310,6 +143310,40 @@ __name(registerFieldSchemas, "registerFieldSchemas");
143310
143310
  // ../packages/agents-core/dist/validation/schemas.js
143311
143311
  var import_parser = __toESM(require_lib(), 1);
143312
143312
  var { AGENT_EXECUTION_TRANSFER_COUNT_MAX, AGENT_EXECUTION_TRANSFER_COUNT_MIN, CONTEXT_FETCHER_HTTP_TIMEOUT_MS_DEFAULT, STATUS_UPDATE_MAX_INTERVAL_SECONDS, STATUS_UPDATE_MAX_NUM_EVENTS, SUB_AGENT_TURN_GENERATION_STEPS_MAX, SUB_AGENT_TURN_GENERATION_STEPS_MIN, VALIDATION_AGENT_PROMPT_MAX_CHARS, VALIDATION_SUB_AGENT_PROMPT_MAX_CHARS } = schemaValidationDefaults;
143313
+ var PartMetadataSchema = external_exports.record(external_exports.string(), external_exports.any()).optional();
143314
+ var TextPartSchema = external_exports.object({
143315
+ kind: external_exports.literal("text"),
143316
+ text: external_exports.string(),
143317
+ metadata: PartMetadataSchema
143318
+ }).openapi("TextPart");
143319
+ var FileWithBytesSchema = external_exports.object({
143320
+ name: external_exports.string().optional(),
143321
+ mimeType: external_exports.string().optional(),
143322
+ bytes: external_exports.string()
143323
+ }).strict();
143324
+ var FileWithUriSchema = external_exports.object({
143325
+ name: external_exports.string().optional(),
143326
+ mimeType: external_exports.string().optional(),
143327
+ uri: external_exports.string()
143328
+ }).strict();
143329
+ var FilePartSchema = external_exports.object({
143330
+ kind: external_exports.literal("file"),
143331
+ file: external_exports.union([
143332
+ FileWithBytesSchema,
143333
+ FileWithUriSchema
143334
+ ]),
143335
+ metadata: PartMetadataSchema
143336
+ }).openapi("FilePart");
143337
+ var DataPartSchema = external_exports.object({
143338
+ kind: external_exports.literal("data"),
143339
+ data: external_exports.record(external_exports.string(), external_exports.any()),
143340
+ metadata: PartMetadataSchema
143341
+ }).openapi("DataPart");
143342
+ var PartSchema = external_exports.discriminatedUnion("kind", [
143343
+ TextPartSchema,
143344
+ FilePartSchema,
143345
+ DataPartSchema
143346
+ ]).openapi("Part");
143313
143347
  var StopWhenSchema = external_exports.object({
143314
143348
  transferCountIs: external_exports.number().min(AGENT_EXECUTION_TRANSFER_COUNT_MIN).max(AGENT_EXECUTION_TRANSFER_COUNT_MAX).optional().describe("The maximum number of transfers to trigger the stop condition."),
143315
143349
  stepCountIs: external_exports.number().min(SUB_AGENT_TURN_GENERATION_STEPS_MIN).max(SUB_AGENT_TURN_GENERATION_STEPS_MAX).optional().describe("The maximum number of steps to trigger the stop condition.")
@@ -143325,7 +143359,7 @@ var MAX_ID_LENGTH = 255;
143325
143359
  var URL_SAFE_ID_PATTERN = /^[a-zA-Z0-9\-_.]+$/;
143326
143360
  var ResourceIdSchema = external_exports.string().min(MIN_ID_LENGTH).max(MAX_ID_LENGTH).regex(URL_SAFE_ID_PATTERN, {
143327
143361
  message: "ID must contain only letters, numbers, hyphens, underscores, and dots"
143328
- }).refine((value) => value !== "new", 'Must not use a reserved name "new"').openapi({
143362
+ }).refine((value) => value !== "new", 'Must not use a reserved name "new"').openapi("ResourceId", {
143329
143363
  description: "Resource identifier",
143330
143364
  example: "resource_789"
143331
143365
  });
@@ -180088,7 +180122,11 @@ function createAgentsManageDatabasePool(config4) {
180088
180122
  if (!connectionString) throw new Error("INKEEP_AGENTS_MANAGE_DATABASE_URL environment variable is required. Please set it to your PostgreSQL connection string.");
180089
180123
  const pool2 = new Pool({
180090
180124
  connectionString,
180091
- max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100
180125
+ max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100,
180126
+ keepAlive: true,
180127
+ keepAliveInitialDelayMillis: 6e4,
180128
+ connectionTimeoutMillis: 1e4,
180129
+ idleTimeoutMillis: 3e4
180092
180130
  });
180093
180131
  pool2.on("error", (err2) => {
180094
180132
  console.error("Unexpected PostgreSQL pool error:", err2);
@@ -180102,7 +180140,11 @@ function createAgentsManageDatabaseClient(config4) {
180102
180140
  if (!connectionString) throw new Error("INKEEP_AGENTS_MANAGE_DATABASE_URL environment variable is required. Please set it to your PostgreSQL connection string.");
180103
180141
  const pool2 = new Pool({
180104
180142
  connectionString,
180105
- max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100
180143
+ max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100,
180144
+ keepAlive: true,
180145
+ keepAliveInitialDelayMillis: 6e4,
180146
+ connectionTimeoutMillis: 1e4,
180147
+ idleTimeoutMillis: 3e4
180106
180148
  });
180107
180149
  pool2.on("error", (err2) => {
180108
180150
  console.error("Unexpected PostgreSQL pool error:", err2);
@@ -180130,7 +180172,11 @@ function createAgentsRunDatabaseClient(config4) {
180130
180172
  if (!connectionString) throw new Error("INKEEP_AGENTS_RUN_DATABASE_URL environment variable is required. Please set it to your PostgreSQL connection string.");
180131
180173
  const pool2 = new Pool({
180132
180174
  connectionString,
180133
- max: config4?.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100
180175
+ max: config4?.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100,
180176
+ keepAlive: true,
180177
+ keepAliveInitialDelayMillis: 6e4,
180178
+ connectionTimeoutMillis: 1e4,
180179
+ idleTimeoutMillis: 3e4
180134
180180
  });
180135
180181
  pool2.on("error", (err2) => {
180136
180182
  console.error("Unexpected PostgreSQL pool error:", err2);
@@ -229788,124 +229834,8 @@ Return your evaluation as a JSON object matching the schema above.`;
229788
229834
  }
229789
229835
  };
229790
229836
 
229791
- // src/domains/evals/workflow/functions/evaluateConversation.ts
229792
- var logger22 = getLogger("workflow-evaluate-conversation");
229793
- async function getConversationStep(payload) {
229794
- const { tenantId, projectId, conversationId } = payload;
229795
- const conv = await getConversation(runDbClient_default)({
229796
- scopes: {
229797
- tenantId,
229798
- projectId
229799
- },
229800
- conversationId
229801
- });
229802
- if (!conv) {
229803
- throw new Error(`Conversation not found: ${conversationId}`);
229804
- }
229805
- return conv;
229806
- }
229807
- __name(getConversationStep, "getConversationStep");
229808
- async function getEvaluatorsStep(payload) {
229809
- const { tenantId, projectId, evaluatorIds } = payload;
229810
- const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
229811
- const evals = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorsByIds(db)({
229812
- scopes: {
229813
- tenantId,
229814
- projectId
229815
- },
229816
- evaluatorIds
229817
- }));
229818
- return evals;
229819
- }
229820
- __name(getEvaluatorsStep, "getEvaluatorsStep");
229821
- async function executeEvaluatorStep(payload, evaluatorId, conversation) {
229822
- const { tenantId, projectId, conversationId, evaluationRunId } = payload;
229823
- const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
229824
- const evaluator2 = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorById(db)({
229825
- scopes: {
229826
- tenantId,
229827
- projectId,
229828
- evaluatorId
229829
- }
229830
- }));
229831
- if (!evaluator2) {
229832
- throw new Error(`Evaluator not found: ${evaluatorId}`);
229833
- }
229834
- const evalResult = await createEvaluationResult(runDbClient_default)({
229835
- id: generateId(),
229836
- tenantId,
229837
- projectId,
229838
- conversationId,
229839
- evaluatorId: evaluator2.id,
229840
- evaluationRunId
229841
- });
229842
- try {
229843
- const evaluationService = new EvaluationService();
229844
- const output = await evaluationService.executeEvaluation({
229845
- conversation,
229846
- evaluator: evaluator2,
229847
- tenantId,
229848
- projectId
229849
- });
229850
- const updated = await updateEvaluationResult(runDbClient_default)({
229851
- scopes: {
229852
- tenantId,
229853
- projectId,
229854
- evaluationResultId: evalResult.id
229855
- },
229856
- data: {
229857
- output
229858
- }
229859
- });
229860
- logger22.info({
229861
- conversationId,
229862
- evaluatorId: evaluator2.id,
229863
- resultId: evalResult.id
229864
- }, "Evaluation completed successfully");
229865
- return updated;
229866
- } catch (error92) {
229867
- const errorMessage = error92 instanceof Error ? error92.message : "Unknown error";
229868
- logger22.error({
229869
- error: error92,
229870
- conversationId,
229871
- evaluatorId: evaluator2.id,
229872
- resultId: evalResult.id
229873
- }, "Evaluation execution failed");
229874
- const failed = await updateEvaluationResult(runDbClient_default)({
229875
- scopes: {
229876
- tenantId,
229877
- projectId,
229878
- evaluationResultId: evalResult.id
229879
- },
229880
- data: {
229881
- output: {
229882
- text: `Evaluation failed: ${errorMessage}`
229883
- }
229884
- }
229885
- });
229886
- return failed;
229887
- }
229888
- }
229889
- __name(executeEvaluatorStep, "executeEvaluatorStep");
229890
- async function logStep(message, data) {
229891
- logger22.info(data, message);
229892
- }
229893
- __name(logStep, "logStep");
229894
- async function _evaluateConversationWorkflow(payload) {
229895
- throw new Error("You attempted to execute workflow _evaluateConversationWorkflow function directly. To start a workflow, use start(_evaluateConversationWorkflow) from workflow/api");
229896
- }
229897
- __name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
229898
- _evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
229899
- var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
229900
- workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
229901
- });
229902
- registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep", getConversationStep);
229903
- registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep", getEvaluatorsStep);
229904
- registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep", executeEvaluatorStep);
229905
- registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep", logStep);
229906
-
229907
229837
  // src/domains/evals/workflow/functions/runDatasetItem.ts
229908
- var logger23 = getLogger("workflow-run-dataset-item");
229838
+ var logger22 = getLogger("workflow-run-dataset-item");
229909
229839
  async function callChatApiStep(payload) {
229910
229840
  const { tenantId, projectId, agentId, datasetItemId, datasetItemInput, datasetItemSimulationAgent, datasetRunId } = payload;
229911
229841
  const evaluationService = new EvaluationService();
@@ -229921,7 +229851,7 @@ async function callChatApiStep(payload) {
229921
229851
  datasetItem: datasetItem2,
229922
229852
  datasetRunId
229923
229853
  });
229924
- logger23.info({
229854
+ logger22.info({
229925
229855
  tenantId,
229926
229856
  projectId,
229927
229857
  datasetItemId,
@@ -229944,7 +229874,7 @@ async function createRelationStep(payload, conversationId) {
229944
229874
  conversationId,
229945
229875
  datasetItemId
229946
229876
  });
229947
- logger23.info({
229877
+ logger22.info({
229948
229878
  tenantId,
229949
229879
  projectId,
229950
229880
  datasetItemId,
@@ -229958,7 +229888,7 @@ async function createRelationStep(payload, conversationId) {
229958
229888
  };
229959
229889
  } catch (error92) {
229960
229890
  if (error92?.cause?.code === "23503" || error92?.code === "23503") {
229961
- logger23.warn({
229891
+ logger22.warn({
229962
229892
  tenantId,
229963
229893
  projectId,
229964
229894
  datasetItemId,
@@ -229975,7 +229905,7 @@ async function createRelationStep(payload, conversationId) {
229975
229905
  }
229976
229906
  }
229977
229907
  __name(createRelationStep, "createRelationStep");
229978
- async function executeEvaluatorStep2(tenantId, projectId, conversationId, evaluatorId, evaluationRunId, expectedOutput) {
229908
+ async function executeEvaluatorStep(tenantId, projectId, conversationId, evaluatorId, evaluationRunId, expectedOutput) {
229979
229909
  const ref = getProjectScopedRef(tenantId, projectId, "main");
229980
229910
  const resolvedRef = await resolveRef2(manageDbClient_default)(ref);
229981
229911
  if (!resolvedRef) {
@@ -229989,7 +229919,7 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
229989
229919
  }
229990
229920
  }));
229991
229921
  if (!evaluator2) {
229992
- logger23.warn({
229922
+ logger22.warn({
229993
229923
  evaluatorId
229994
229924
  }, "Evaluator not found");
229995
229925
  return null;
@@ -230031,7 +229961,7 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
230031
229961
  output
230032
229962
  }
230033
229963
  });
230034
- logger23.info({
229964
+ logger22.info({
230035
229965
  conversationId,
230036
229966
  evaluatorId: evaluator2.id,
230037
229967
  resultId: evalResult.id
@@ -230039,7 +229969,7 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
230039
229969
  return evalResult.id;
230040
229970
  } catch (error92) {
230041
229971
  const errorMessage = error92 instanceof Error ? error92.message : "Unknown error";
230042
- logger23.error({
229972
+ logger22.error({
230043
229973
  error: error92,
230044
229974
  conversationId,
230045
229975
  evaluatorId: evaluator2.id
@@ -230059,11 +229989,11 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
230059
229989
  return evalResult.id;
230060
229990
  }
230061
229991
  }
230062
- __name(executeEvaluatorStep2, "executeEvaluatorStep");
230063
- async function logStep2(message, data) {
230064
- logger23.info(data, message);
229992
+ __name(executeEvaluatorStep, "executeEvaluatorStep");
229993
+ async function logStep(message, data) {
229994
+ logger22.info(data, message);
230065
229995
  }
230066
- __name(logStep2, "logStep");
229996
+ __name(logStep, "logStep");
230067
229997
  async function _runDatasetItemWorkflow(payload) {
230068
229998
  throw new Error("You attempted to execute workflow _runDatasetItemWorkflow function directly. To start a workflow, use start(_runDatasetItemWorkflow) from workflow/api");
230069
229999
  }
@@ -230074,8 +230004,124 @@ var runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {
230074
230004
  });
230075
230005
  registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep", callChatApiStep);
230076
230006
  registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep", createRelationStep);
230077
- registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep", executeEvaluatorStep2);
230078
- registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep", logStep2);
230007
+ registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep", executeEvaluatorStep);
230008
+ registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep", logStep);
230009
+
230010
+ // src/domains/evals/workflow/functions/evaluateConversation.ts
230011
+ var logger23 = getLogger("workflow-evaluate-conversation");
230012
+ async function getConversationStep(payload) {
230013
+ const { tenantId, projectId, conversationId } = payload;
230014
+ const conv = await getConversation(runDbClient_default)({
230015
+ scopes: {
230016
+ tenantId,
230017
+ projectId
230018
+ },
230019
+ conversationId
230020
+ });
230021
+ if (!conv) {
230022
+ throw new Error(`Conversation not found: ${conversationId}`);
230023
+ }
230024
+ return conv;
230025
+ }
230026
+ __name(getConversationStep, "getConversationStep");
230027
+ async function getEvaluatorsStep(payload) {
230028
+ const { tenantId, projectId, evaluatorIds } = payload;
230029
+ const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
230030
+ const evals = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorsByIds(db)({
230031
+ scopes: {
230032
+ tenantId,
230033
+ projectId
230034
+ },
230035
+ evaluatorIds
230036
+ }));
230037
+ return evals;
230038
+ }
230039
+ __name(getEvaluatorsStep, "getEvaluatorsStep");
230040
+ async function executeEvaluatorStep2(payload, evaluatorId, conversation) {
230041
+ const { tenantId, projectId, conversationId, evaluationRunId } = payload;
230042
+ const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
230043
+ const evaluator2 = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorById(db)({
230044
+ scopes: {
230045
+ tenantId,
230046
+ projectId,
230047
+ evaluatorId
230048
+ }
230049
+ }));
230050
+ if (!evaluator2) {
230051
+ throw new Error(`Evaluator not found: ${evaluatorId}`);
230052
+ }
230053
+ const evalResult = await createEvaluationResult(runDbClient_default)({
230054
+ id: generateId(),
230055
+ tenantId,
230056
+ projectId,
230057
+ conversationId,
230058
+ evaluatorId: evaluator2.id,
230059
+ evaluationRunId
230060
+ });
230061
+ try {
230062
+ const evaluationService = new EvaluationService();
230063
+ const output = await evaluationService.executeEvaluation({
230064
+ conversation,
230065
+ evaluator: evaluator2,
230066
+ tenantId,
230067
+ projectId
230068
+ });
230069
+ const updated = await updateEvaluationResult(runDbClient_default)({
230070
+ scopes: {
230071
+ tenantId,
230072
+ projectId,
230073
+ evaluationResultId: evalResult.id
230074
+ },
230075
+ data: {
230076
+ output
230077
+ }
230078
+ });
230079
+ logger23.info({
230080
+ conversationId,
230081
+ evaluatorId: evaluator2.id,
230082
+ resultId: evalResult.id
230083
+ }, "Evaluation completed successfully");
230084
+ return updated;
230085
+ } catch (error92) {
230086
+ const errorMessage = error92 instanceof Error ? error92.message : "Unknown error";
230087
+ logger23.error({
230088
+ error: error92,
230089
+ conversationId,
230090
+ evaluatorId: evaluator2.id,
230091
+ resultId: evalResult.id
230092
+ }, "Evaluation execution failed");
230093
+ const failed = await updateEvaluationResult(runDbClient_default)({
230094
+ scopes: {
230095
+ tenantId,
230096
+ projectId,
230097
+ evaluationResultId: evalResult.id
230098
+ },
230099
+ data: {
230100
+ output: {
230101
+ text: `Evaluation failed: ${errorMessage}`
230102
+ }
230103
+ }
230104
+ });
230105
+ return failed;
230106
+ }
230107
+ }
230108
+ __name(executeEvaluatorStep2, "executeEvaluatorStep");
230109
+ async function logStep2(message, data) {
230110
+ logger23.info(data, message);
230111
+ }
230112
+ __name(logStep2, "logStep");
230113
+ async function _evaluateConversationWorkflow(payload) {
230114
+ throw new Error("You attempted to execute workflow _evaluateConversationWorkflow function directly. To start a workflow, use start(_evaluateConversationWorkflow) from workflow/api");
230115
+ }
230116
+ __name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
230117
+ _evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
230118
+ var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
230119
+ workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
230120
+ });
230121
+ registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep", getConversationStep);
230122
+ registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep", getEvaluatorsStep);
230123
+ registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep", executeEvaluatorStep2);
230124
+ registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep", logStep2);
230079
230125
 
230080
230126
  // ../node_modules/.pnpm/@workflow+utils@4.0.1-beta.7/node_modules/@workflow/utils/dist/index.js
230081
230127
  var import_ms2 = __toESM(require_ms(), 1);
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "stepFiles": [
3
- "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts",
4
- "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts"
3
+ "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts",
4
+ "/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts"
5
5
  ]
6
6
  }
@@ -1,10 +1,10 @@
1
1
  import { AppConfig } from "./types/app.js";
2
2
  import "./types/index.js";
3
3
  import { Hono } from "hono";
4
- import * as hono_types0 from "hono/types";
4
+ import * as hono_types3 from "hono/types";
5
5
 
6
6
  //#region src/createApp.d.ts
7
7
  declare const isWebhookRoute: (path: string) => boolean;
8
- declare function createAgentsHono(config: AppConfig): Hono<hono_types0.BlankEnv, hono_types0.BlankSchema, "/">;
8
+ declare function createAgentsHono(config: AppConfig): Hono<hono_types3.BlankEnv, hono_types3.BlankSchema, "/">;
9
9
  //#endregion
10
10
  export { createAgentsHono, isWebhookRoute };
package/dist/createApp.js CHANGED
@@ -3,9 +3,9 @@ import { env } from "./env.js";
3
3
  import { evalRoutes } from "./domains/evals/index.js";
4
4
  import { workflowRoutes } from "./domains/evals/workflow/routes.js";
5
5
  import { sessionAuth, sessionContext } from "./middleware/sessionAuth.js";
6
+ import { flushBatchProcessor } from "./instrumentation.js";
6
7
  import { manageRoutes } from "./domains/manage/index.js";
7
8
  import mcp_default from "./domains/mcp/routes/mcp.js";
8
- import { flushBatchProcessor } from "./instrumentation.js";
9
9
  import { runRoutes } from "./domains/run/index.js";
10
10
  import { authCorsConfig, defaultCorsConfig, playgroundCorsConfig, runCorsConfig, signozCorsConfig } from "./middleware/cors.js";
11
11
  import { errorHandler } from "./middleware/errorHandler.js";
@@ -43,7 +43,7 @@ app.openapi(createRoute({
43
43
  tenantId,
44
44
  projectId,
45
45
  conversationId
46
- }, "Triggering conversation evaluation (eval-api handling all logic)");
46
+ }, "Triggering conversation evaluation");
47
47
  if (!await getConversation(runDbClient_default)({
48
48
  scopes: {
49
49
  tenantId,