@inkeep/agents-api 0.0.0-dev-20260209225959 → 0.0.0-dev-20260210001219
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/.well-known/workflow/v1/flow.cjs +44 -44
- package/dist/.well-known/workflow/v1/flow.cjs.debug.json +2 -2
- package/dist/.well-known/workflow/v1/manifest.debug.json +16 -16
- package/dist/.well-known/workflow/v1/step.cjs +145 -133
- package/dist/.well-known/workflow/v1/step.cjs.debug.json +2 -2
- package/dist/data/db/manageDbClient.d.ts +2 -2
- package/dist/data/db/runDbClient.d.ts +2 -2
- package/dist/domains/evals/routes/datasetTriggers.d.ts +2 -2
- package/dist/domains/evals/routes/index.d.ts +2 -2
- package/dist/domains/manage/routes/availableAgents.d.ts +2 -2
- package/dist/domains/manage/routes/conversations.d.ts +2 -2
- package/dist/domains/manage/routes/index.d.ts +2 -2
- package/dist/domains/manage/routes/invitations.d.ts +2 -2
- package/dist/domains/manage/routes/passwordResetLinks.d.ts +2 -2
- package/dist/domains/manage/routes/signoz.d.ts +2 -2
- package/dist/domains/mcp/routes/mcp.d.ts +2 -2
- package/dist/domains/run/agents/relationTools.d.ts +2 -2
- package/dist/domains/run/constants/execution-limits/index.js +5 -1
- package/dist/domains/run/utils/model-context-utils.js +4 -2
- package/dist/domains/run/utils/token-estimator.d.ts +2 -2
- package/dist/factory.d.ts +22 -22
- package/dist/index.d.ts +22 -22
- package/dist/middleware/evalsAuth.d.ts +2 -2
- package/dist/middleware/manageAuth.d.ts +2 -2
- package/dist/middleware/projectAccess.d.ts +2 -2
- package/dist/middleware/projectConfig.d.ts +3 -3
- package/dist/middleware/requirePermission.d.ts +2 -2
- package/dist/middleware/runAuth.d.ts +4 -4
- package/dist/middleware/sessionAuth.d.ts +3 -3
- package/dist/middleware/tenantAccess.d.ts +2 -2
- package/dist/middleware/tracing.d.ts +3 -3
- package/package.json +5 -5
|
@@ -45157,52 +45157,14 @@ var workflowCode = `globalThis.__private_workflows = new Map();
|
|
|
45157
45157
|
var __defProp = Object.defineProperty;
|
|
45158
45158
|
var __name = (target, value) => __defProp(target, "name", { value, configurable: true });
|
|
45159
45159
|
|
|
45160
|
-
// src/domains/evals/workflow/functions/evaluateConversation.ts
|
|
45161
|
-
var getConversationStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep");
|
|
45162
|
-
var getEvaluatorsStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep");
|
|
45163
|
-
var executeEvaluatorStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep");
|
|
45164
|
-
var logStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep");
|
|
45165
|
-
async function _evaluateConversationWorkflow(payload) {
|
|
45166
|
-
const { conversationId, evaluatorIds } = payload;
|
|
45167
|
-
await logStep("Starting conversation evaluation", payload);
|
|
45168
|
-
const conversation = await getConversationStep(payload);
|
|
45169
|
-
const evaluators = await getEvaluatorsStep(payload);
|
|
45170
|
-
if (evaluators.length === 0) {
|
|
45171
|
-
await logStep("No valid evaluators found", {
|
|
45172
|
-
conversationId,
|
|
45173
|
-
evaluatorIds
|
|
45174
|
-
});
|
|
45175
|
-
return {
|
|
45176
|
-
success: false,
|
|
45177
|
-
reason: "No valid evaluators"
|
|
45178
|
-
};
|
|
45179
|
-
}
|
|
45180
|
-
const results = [];
|
|
45181
|
-
for (const evaluator of evaluators) {
|
|
45182
|
-
const result = await executeEvaluatorStep(payload, evaluator.id, conversation);
|
|
45183
|
-
results.push(result);
|
|
45184
|
-
}
|
|
45185
|
-
return {
|
|
45186
|
-
success: true,
|
|
45187
|
-
conversationId,
|
|
45188
|
-
resultCount: results.length
|
|
45189
|
-
};
|
|
45190
|
-
}
|
|
45191
|
-
__name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
|
|
45192
|
-
_evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
|
|
45193
|
-
globalThis.__private_workflows.set("workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow", _evaluateConversationWorkflow);
|
|
45194
|
-
var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
|
|
45195
|
-
workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
|
|
45196
|
-
});
|
|
45197
|
-
|
|
45198
45160
|
// src/domains/evals/workflow/functions/runDatasetItem.ts
|
|
45199
45161
|
var callChatApiStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep");
|
|
45200
45162
|
var createRelationStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep");
|
|
45201
|
-
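var executeEvaluatorStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep");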
|
|
45202
|
-
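var logStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep");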
|
|
45163
|
+
var executeEvaluatorStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep");
|
|
45164
|
+
var logStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep");
|
|
45203
45165
|
async function _runDatasetItemWorkflow(payload) {
|
|
45204
45166
|
const { datasetItemId, datasetRunId, agentId, evaluatorIds, evaluationRunId } = payload;
|
|
45205
|
-
await logStep2("Starting dataset item processing", {
|
|
45167
|
+
await logStep("Starting dataset item processing", {
|
|
45206
45168
|
datasetItemId,
|
|
45207
45169
|
datasetRunId,
|
|
45208
45170
|
agentId,
|
|
@@ -45213,11 +45175,11 @@ async function _runDatasetItemWorkflow(payload) {
|
|
|
45213
45175
|
await createRelationStep(payload, result.conversationId);
|
|
45214
45176
|
if (evaluatorIds && evaluatorIds.length > 0 && evaluationRunId) {
|
|
45215
45177
|
for (const evaluatorId of evaluatorIds) {
|
|
45216
|
-
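await executeEvaluatorStep2(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);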
|
|
45178
|
+
await executeEvaluatorStep(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);
|
|
45217
45179
|
}
|
|
45218
45180
|
}
|
|
45219
45181
|
} else {
|
|
45220
|
-
await logStep2("No conversation created", {
|
|
45182
|
+
await logStep("No conversation created", {
|
|
45221
45183
|
datasetItemId,
|
|
45222
45184
|
datasetRunId,
|
|
45223
45185
|
error: result.error
|
|
@@ -45237,7 +45199,45 @@ globalThis.__private_workflows.set("workflow//src/domains/evals/workflow/functio
|
|
|
45237
45199
|
var runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {
|
|
45238
45200
|
workflowId: "workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow"
|
|
45239
45201
|
});
|
|
45240
|
-
//# sourceMappingURL=data:application/json;base64,{
  "version": 3,
  "sources": ["src/domains/evals/workflow/functions/evaluateConversation.ts", "src/domains/evals/workflow/functions/runDatasetItem.ts"],
  "sourcesContent": ["/**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"_evaluateConversationWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\"},\"getConversationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\"},\"getEvaluatorsStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\"}}}}*/;\nvar getConversationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\");\nvar getEvaluatorsStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\");\nvar executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\");\n/**\n * Main workflow function - orchestrates the evaluation steps.\n *\n * IMPORTANT: This runs in a deterministic sandbox.\n * - Do NOT call Node.js APIs directly here (no DB, no fs, etc.)\n * - All side effects must happen in step functions\n */ async function _evaluateConversationWorkflow(payload) {\n    const { conversationId, evaluatorIds } = payload;\n    await logStep('Starting conversation evaluation', payload);\n    const conversation = await 
getConversationStep(payload);\n    const evaluators = await getEvaluatorsStep(payload);\n    if (evaluators.length === 0) {\n        await logStep('No valid evaluators found', {\n            conversationId,\n            evaluatorIds\n        });\n        return {\n            success: false,\n            reason: 'No valid evaluators'\n        };\n    }\n    const results = [];\n    for (const evaluator of evaluators){\n        const result = await executeEvaluatorStep(payload, evaluator.id, conversation);\n        results.push(result);\n    }\n    return {\n        success: true,\n        conversationId,\n        resultCount: results.length\n    };\n}\n_evaluateConversationWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\", _evaluateConversationWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow'\n});\n", "/**\n * Workflow for running dataset items through the chat API.\n *\n * This makes dataset run processing fire-and-forget - each item is queued\n * independently and processed in parallel by the workflow system.\n */ 
/**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"_runDatasetItemWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"callChatApiStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\"},\"createRelationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\"},\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\"}}}}*/;\n/**\n * Step: Call the chat API to process the dataset item\n */ var callChatApiStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\");\n/**\n * Step: Create conversation relation in database\n */ var createRelationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\");\n/**\n * Step: Execute a single evaluator on a conversation\n */ var executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\");\n/**\n * Main workflow function - processes a single dataset item through the chat API.\n * Optionally runs evaluators on the resulting conversation.\n */ async function _runDatasetItemWorkflow(payload) {\n    const { datasetItemId, datasetRunId, agentId, evaluatorIds, evaluationRunId } = payload;\n    await logStep('Starting dataset item processing', {\n        
datasetItemId,\n        datasetRunId,\n        agentId,\n        hasEvaluators: !!(evaluatorIds && evaluatorIds.length > 0)\n    });\n    // Call chat API\n    const result = await callChatApiStep(payload);\n    // Create relation if we got a conversation\n    if (result.conversationId) {\n        await createRelationStep(payload, result.conversationId);\n        // Run evaluations if configured\n        if (evaluatorIds && evaluatorIds.length > 0 && evaluationRunId) {\n            for (const evaluatorId of evaluatorIds){\n                await executeEvaluatorStep(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);\n            }\n        }\n    } else {\n        await logStep('No conversation created', {\n            datasetItemId,\n            datasetRunId,\n            error: result.error\n        });\n    }\n    return {\n        success: !result.error,\n        datasetItemId,\n        datasetRunId,\n        conversationId: result.conversationId || null,\n        error: result.error || null\n    };\n}\n_runDatasetItemWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\", _runDatasetItemWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow'\n});\n"],
  "mappings": ";;;;;AACA,IAAI,sBAAsB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,yFAAyF;AAC/J,IAAI,oBAAoB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uFAAuF;AAC3J,IAAI,uBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,0FAA0F;AAG7J,IAAI,UAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,6EAA6E;AAOvI,eAAe,8BAA8B,SAAS;AACtD,QAAM,EAAE,gBAAgB,aAAa,IAAI;AACzC,QAAM,QAAQ,oCAAoC,OAAO;AACzD,QAAM,eAAe,MAAM,oBAAoB,OAAO;AACtD,QAAM,aAAa,MAAM,kBAAkB,OAAO;AAClD,MAAI,WAAW,WAAW,GAAG;AACzB,UAAM,QAAQ,6BAA6B;AAAA,MACvC;AAAA,MACA;AAAA,IACJ,CAAC;AACD,WAAO;AAAA,MACH,SAAS;AAAA,MACT,QAAQ;AAAA,IACZ;AAAA,EACJ;AACA,QAAM,UAAU,CAAC;AACjB,aAAW,aAAa,YAAW;AAC/B,UAAM,SAAS,MAAM,qBAAqB,SAAS,UAAU,IAAI,YAAY;AAC7E,YAAQ,KAAK,MAAM;AAAA,EACvB;AACA,SAAO;AAAA,IACH,SAAS;AAAA,IACT;AAAA,IACA,aAAa,QAAQ;AAAA,EACzB;AACJ;AAzBmB;AA0BnB,8BAA8B,aAAa;AAC3C,WAAW,oBAAoB,IAAI,yGAAyG,6BAA6B;AAElK,IAAM,+BAA+B,OAAO,OAAO,+BAA+B;AAAA,EACrF,YAAY;AAChB,CAAC;;;ACpCG,IAAI,kBAAkB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,+EAA+E;AAGjJ,IAAI,qBAAqB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,kFAAkF;AAGvJ,IAAIA,wBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,oFAAoF;AAG3J,IAAIC,WAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uEAAuE;AAIjI,eAAe,wBAAwB,SAAS;AAChD,QAAM,EAAE,eAAe,cAAc,SAAS,cAAc,gBAAgB,IAAI;AAChF,QAAMA,SAAQ,oCAAoC;AAAA,IAC9C;AAAA,IACA;AAAA,IACA;AAAA,IACA,eAAe,CAAC,EAAE,gBAAgB,aAAa,SAAS;AAAA,EAC5D,CAAC;AAED,QAAM,SAAS,MAAM,gBAAgB,OAAO;AAE5C,MAAI,OAAO,gBAAgB;AACvB,UAAM,mBAAmB,SAAS,OAAO,cAAc;AAEvD,QAAI,gBAAgB,aAAa,SAAS,KAAK,iBAAiB;AAC5D,iBAAW,eAAe,cAAa;AACnC,cAAMD,sBAAqB,QAAQ,UAAU,QAAQ,WAAW,OAAO,gBAAgB,aAAa,iBAAiB,QAAQ,yBAAyB;AAAA,MAC1J;AAAA,IACJ;AAAA,EACJ,OAAO;AACH,UAAMC,SAAQ,2BAA2B;AAAA,MACrC;AAAA,MACA;AAAA,MACA,OAAO,OAAO;AAAA,IAClB,CAAC;AAAA,EACL;AACA,SAAO;AAAA,IACH,SAAS,CAAC,OAAO;AAAA,IACjB;AAAA,IACA;AAAA,IACA,gBAAgB,OAAO,kBAAkB;AAAA,IACzC,OAAO,OAAO,SAAS;AAAA,EAC3B;AACJ;AAjCmB;AAkCnB,wBAAwB,aAAa;AACrC,WAAW,oBAAoB,IAAI,6FAA6F,uBAAuB;AAEhJ,IAAM,yBAAyB,OAAO,OAAO,yBAAyB;AAAA,EACzE,YAAY;AAChB,CAAC;",
  "names": ["executeEvaluatorStep", "logStep"]
}

|
|
45202
|
+
|
|
45203
|
+
// src/domains/evals/workflow/functions/evaluateConversation.ts
|
|
45204
|
+
var getConversationStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep");
|
|
45205
|
+
var getEvaluatorsStep = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep");
|
|
45206
|
+
var executeEvaluatorStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep");
|
|
45207
|
+
var logStep2 = globalThis[Symbol.for("WORKFLOW_USE_STEP")]("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep");
|
|
45208
|
+
async function _evaluateConversationWorkflow(payload) {
|
|
45209
|
+
const { conversationId, evaluatorIds } = payload;
|
|
45210
|
+
await logStep2("Starting conversation evaluation", payload);
|
|
45211
|
+
const conversation = await getConversationStep(payload);
|
|
45212
|
+
const evaluators = await getEvaluatorsStep(payload);
|
|
45213
|
+
if (evaluators.length === 0) {
|
|
45214
|
+
await logStep2("No valid evaluators found", {
|
|
45215
|
+
conversationId,
|
|
45216
|
+
evaluatorIds
|
|
45217
|
+
});
|
|
45218
|
+
return {
|
|
45219
|
+
success: false,
|
|
45220
|
+
reason: "No valid evaluators"
|
|
45221
|
+
};
|
|
45222
|
+
}
|
|
45223
|
+
const results = [];
|
|
45224
|
+
for (const evaluator of evaluators) {
|
|
45225
|
+
const result = await executeEvaluatorStep2(payload, evaluator.id, conversation);
|
|
45226
|
+
results.push(result);
|
|
45227
|
+
}
|
|
45228
|
+
return {
|
|
45229
|
+
success: true,
|
|
45230
|
+
conversationId,
|
|
45231
|
+
resultCount: results.length
|
|
45232
|
+
};
|
|
45233
|
+
}
|
|
45234
|
+
__name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
|
|
45235
|
+
_evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
|
|
45236
|
+
globalThis.__private_workflows.set("workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow", _evaluateConversationWorkflow);
|
|
45237
|
+
var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
|
|
45238
|
+
workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
|
|
45239
|
+
});
|
|
45240
|
+
//# sourceMappingURL=data:application/json;base64,{
  "version": 3,
  "sources": ["src/domains/evals/workflow/functions/runDatasetItem.ts", "src/domains/evals/workflow/functions/evaluateConversation.ts"],
  "sourcesContent": ["/**\n * Workflow for running dataset items through the chat API.\n *\n * This makes dataset run processing fire-and-forget - each item is queued\n * independently and processed in parallel by the workflow system.\n */ /**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"_runDatasetItemWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/runDatasetItem.ts\":{\"callChatApiStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\"},\"createRelationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\"},\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\"}}}}*/;\n/**\n * Step: Call the chat API to process the dataset item\n */ var callChatApiStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep\");\n/**\n * Step: Create conversation relation in database\n */ var createRelationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep\");\n/**\n * Step: Execute a single evaluator on a conversation\n */ var executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep\");\n/**\n * Main workflow function - processes a single dataset item through the chat API.\n * Optionally runs evaluators on the resulting 
conversation.\n */ async function _runDatasetItemWorkflow(payload) {\n    const { datasetItemId, datasetRunId, agentId, evaluatorIds, evaluationRunId } = payload;\n    await logStep('Starting dataset item processing', {\n        datasetItemId,\n        datasetRunId,\n        agentId,\n        hasEvaluators: !!(evaluatorIds && evaluatorIds.length > 0)\n    });\n    // Call chat API\n    const result = await callChatApiStep(payload);\n    // Create relation if we got a conversation\n    if (result.conversationId) {\n        await createRelationStep(payload, result.conversationId);\n        // Run evaluations if configured\n        if (evaluatorIds && evaluatorIds.length > 0 && evaluationRunId) {\n            for (const evaluatorId of evaluatorIds){\n                await executeEvaluatorStep(payload.tenantId, payload.projectId, result.conversationId, evaluatorId, evaluationRunId, payload.datasetItemExpectedOutput);\n            }\n        }\n    } else {\n        await logStep('No conversation created', {\n            datasetItemId,\n            datasetRunId,\n            error: result.error\n        });\n    }\n    return {\n        success: !result.error,\n        datasetItemId,\n        datasetRunId,\n        conversationId: result.conversationId || null,\n        error: result.error || null\n    };\n}\n_runDatasetItemWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow\", _runDatasetItemWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow'\n});\n", 
"/**__internal_workflows{\"workflows\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"_evaluateConversationWorkflow\":{\"workflowId\":\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\"}}},\"steps\":{\"src/domains/evals/workflow/functions/evaluateConversation.ts\":{\"executeEvaluatorStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\"},\"getConversationStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\"},\"getEvaluatorsStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\"},\"logStep\":{\"stepId\":\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\"}}}}*/;\nvar getConversationStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep\");\nvar getEvaluatorsStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep\");\nvar executeEvaluatorStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep\");\n/**\n * Step: Log workflow progress\n */ var logStep = globalThis[Symbol.for(\"WORKFLOW_USE_STEP\")](\"step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep\");\n/**\n * Main workflow function - orchestrates the evaluation steps.\n *\n * IMPORTANT: This runs in a deterministic sandbox.\n * - Do NOT call Node.js APIs directly here (no DB, no fs, etc.)\n * - All side effects must happen in step functions\n */ async function _evaluateConversationWorkflow(payload) {\n    const { conversationId, evaluatorIds } = payload;\n    await logStep('Starting conversation evaluation', payload);\n    const conversation = await 
getConversationStep(payload);\n    const evaluators = await getEvaluatorsStep(payload);\n    if (evaluators.length === 0) {\n        await logStep('No valid evaluators found', {\n            conversationId,\n            evaluatorIds\n        });\n        return {\n            success: false,\n            reason: 'No valid evaluators'\n        };\n    }\n    const results = [];\n    for (const evaluator of evaluators){\n        const result = await executeEvaluatorStep(payload, evaluator.id, conversation);\n        results.push(result);\n    }\n    return {\n        success: true,\n        conversationId,\n        resultCount: results.length\n    };\n}\n_evaluateConversationWorkflow.workflowId = \"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\";\nglobalThis.__private_workflows.set(\"workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow\", _evaluateConversationWorkflow);\n// This ID must match what workflow:build generates in .well-known/workflow/v1/flow.cjs\nexport const evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {\n    workflowId: 'workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow'\n});\n"],
  "mappings": ";;;;;AAQI,IAAI,kBAAkB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,+EAA+E;AAGjJ,IAAI,qBAAqB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,kFAAkF;AAGvJ,IAAI,uBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,oFAAoF;AAG3J,IAAI,UAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uEAAuE;AAIjI,eAAe,wBAAwB,SAAS;AAChD,QAAM,EAAE,eAAe,cAAc,SAAS,cAAc,gBAAgB,IAAI;AAChF,QAAM,QAAQ,oCAAoC;AAAA,IAC9C;AAAA,IACA;AAAA,IACA;AAAA,IACA,eAAe,CAAC,EAAE,gBAAgB,aAAa,SAAS;AAAA,EAC5D,CAAC;AAED,QAAM,SAAS,MAAM,gBAAgB,OAAO;AAE5C,MAAI,OAAO,gBAAgB;AACvB,UAAM,mBAAmB,SAAS,OAAO,cAAc;AAEvD,QAAI,gBAAgB,aAAa,SAAS,KAAK,iBAAiB;AAC5D,iBAAW,eAAe,cAAa;AACnC,cAAM,qBAAqB,QAAQ,UAAU,QAAQ,WAAW,OAAO,gBAAgB,aAAa,iBAAiB,QAAQ,yBAAyB;AAAA,MAC1J;AAAA,IACJ;AAAA,EACJ,OAAO;AACH,UAAM,QAAQ,2BAA2B;AAAA,MACrC;AAAA,MACA;AAAA,MACA,OAAO,OAAO;AAAA,IAClB,CAAC;AAAA,EACL;AACA,SAAO;AAAA,IACH,SAAS,CAAC,OAAO;AAAA,IACjB;AAAA,IACA;AAAA,IACA,gBAAgB,OAAO,kBAAkB;AAAA,IACzC,OAAO,OAAO,SAAS;AAAA,EAC3B;AACJ;AAjCmB;AAkCnB,wBAAwB,aAAa;AACrC,WAAW,oBAAoB,IAAI,6FAA6F,uBAAuB;AAEhJ,IAAM,yBAAyB,OAAO,OAAO,yBAAyB;AAAA,EACzE,YAAY;AAChB,CAAC;;;AC3DD,IAAI,sBAAsB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,yFAAyF;AAC/J,IAAI,oBAAoB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,uFAAuF;AAC3J,IAAIA,wBAAuB,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,0FAA0F;AAG7J,IAAIC,WAAU,WAAW,OAAO,IAAI,mBAAmB,CAAC,EAAE,6EAA6E;AAOvI,eAAe,8BAA8B,SAAS;AACtD,QAAM,EAAE,gBAAgB,aAAa,IAAI;AACzC,QAAMA,SAAQ,oCAAoC,OAAO;AACzD,QAAM,eAAe,MAAM,oBAAoB,OAAO;AACtD,QAAM,aAAa,MAAM,kBAAkB,OAAO;AAClD,MAAI,WAAW,WAAW,GAAG;AACzB,UAAMA,SAAQ,6BAA6B;AAAA,MACvC;AAAA,MACA;AAAA,IACJ,CAAC;AACD,WAAO;AAAA,MACH,SAAS;AAAA,MACT,QAAQ;AAAA,IACZ;AAAA,EACJ;AACA,QAAM,UAAU,CAAC;AACjB,aAAW,aAAa,YAAW;AAC/B,UAAM,SAAS,MAAMD,sBAAqB,SAAS,UAAU,IAAI,YAAY;AAC7E,YAAQ,KAAK,MAAM;AAAA,EACvB;AACA,SAAO;AAAA,IACH,SAAS;AAAA,IACT;AAAA,IACA,aAAa,QAAQ;AAAA,EACzB;AACJ;AAzBmB;AA0BnB,8BAA8B,aAAa;AAC3C,WAAW,oBAAoB,IAAI,yGAAyG,6BAA6B;AAElK,IAAM,+BAA+B,OAAO,OAAO,+BAA+B;AAAA,EACrF,YAAY;AAChB,CAAC;",
  "names": ["executeEvaluatorStep", "logStep"]
}

|
|
45241
45241
|
`;
|
|
45242
45242
|
var POST = workflowEntrypoint(workflowCode);
|
|
45243
45243
|
// Annotate the CommonJS export names for ESM import in node:
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"workflowFiles": [
|
|
3
|
-
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts",
|
|
4
|
-
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts"
|
|
3
|
+
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts",
|
|
4
|
+
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts"
|
|
5
5
|
]
|
|
6
6
|
}
|
|
@@ -1,5 +1,16 @@
|
|
|
1
1
|
{
|
|
2
2
|
"steps": {
|
|
3
|
+
"node_modules/.pnpm/workflow@4.0.1-beta.33_@aws-sdk+client-sts@3.970.0_@opentelemetry+api@1.9.0_@types+reac_162752afbc89dc886082698201e5b45d/node_modules/workflow/dist/internal/builtins.js": {
|
|
4
|
+
"__builtin_response_array_buffer": {
|
|
5
|
+
"stepId": "__builtin_response_array_buffer"
|
|
6
|
+
},
|
|
7
|
+
"__builtin_response_json": {
|
|
8
|
+
"stepId": "__builtin_response_json"
|
|
9
|
+
},
|
|
10
|
+
"__builtin_response_text": {
|
|
11
|
+
"stepId": "__builtin_response_text"
|
|
12
|
+
}
|
|
13
|
+
},
|
|
3
14
|
"src/domains/evals/workflow/functions/evaluateConversation.ts": {
|
|
4
15
|
"executeEvaluatorStep": {
|
|
5
16
|
"stepId": "step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep"
|
|
@@ -14,17 +25,6 @@
|
|
|
14
25
|
"stepId": "step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep"
|
|
15
26
|
}
|
|
16
27
|
},
|
|
17
|
-
"node_modules/.pnpm/workflow@4.0.1-beta.33_@aws-sdk+client-sts@3.970.0_@opentelemetry+api@1.9.0_@types+reac_162752afbc89dc886082698201e5b45d/node_modules/workflow/dist/internal/builtins.js": {
|
|
18
|
-
"__builtin_response_array_buffer": {
|
|
19
|
-
"stepId": "__builtin_response_array_buffer"
|
|
20
|
-
},
|
|
21
|
-
"__builtin_response_json": {
|
|
22
|
-
"stepId": "__builtin_response_json"
|
|
23
|
-
},
|
|
24
|
-
"__builtin_response_text": {
|
|
25
|
-
"stepId": "__builtin_response_text"
|
|
26
|
-
}
|
|
27
|
-
},
|
|
28
28
|
"src/domains/evals/workflow/functions/runDatasetItem.ts": {
|
|
29
29
|
"callChatApiStep": {
|
|
30
30
|
"stepId": "step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep"
|
|
@@ -41,15 +41,15 @@
|
|
|
41
41
|
}
|
|
42
42
|
},
|
|
43
43
|
"workflows": {
|
|
44
|
-
"src/domains/evals/workflow/functions/runDatasetItem.ts": {
|
|
45
|
-
"_runDatasetItemWorkflow": {
|
|
46
|
-
"workflowId": "workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow"
|
|
47
|
-
}
|
|
48
|
-
},
|
|
49
44
|
"src/domains/evals/workflow/functions/evaluateConversation.ts": {
|
|
50
45
|
"_evaluateConversationWorkflow": {
|
|
51
46
|
"workflowId": "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
|
|
52
47
|
}
|
|
48
|
+
},
|
|
49
|
+
"src/domains/evals/workflow/functions/runDatasetItem.ts": {
|
|
50
|
+
"_runDatasetItemWorkflow": {
|
|
51
|
+
"workflowId": "workflow//src/domains/evals/workflow/functions/runDatasetItem.ts//_runDatasetItemWorkflow"
|
|
52
|
+
}
|
|
53
53
|
}
|
|
54
54
|
}
|
|
55
55
|
}
|
|
@@ -180088,7 +180088,11 @@ function createAgentsManageDatabasePool(config4) {
|
|
|
180088
180088
|
if (!connectionString) throw new Error("INKEEP_AGENTS_MANAGE_DATABASE_URL environment variable is required. Please set it to your PostgreSQL connection string.");
|
|
180089
180089
|
const pool2 = new Pool({
|
|
180090
180090
|
connectionString,
|
|
180091
|
-
max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100
|
|
180091
|
+
max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100,
|
|
180092
|
+
keepAlive: true,
|
|
180093
|
+
keepAliveInitialDelayMillis: 6e4,
|
|
180094
|
+
connectionTimeoutMillis: 1e4,
|
|
180095
|
+
idleTimeoutMillis: 3e4
|
|
180092
180096
|
});
|
|
180093
180097
|
pool2.on("error", (err2) => {
|
|
180094
180098
|
console.error("Unexpected PostgreSQL pool error:", err2);
|
|
@@ -180102,7 +180106,11 @@ function createAgentsManageDatabaseClient(config4) {
|
|
|
180102
180106
|
if (!connectionString) throw new Error("INKEEP_AGENTS_MANAGE_DATABASE_URL environment variable is required. Please set it to your PostgreSQL connection string.");
|
|
180103
180107
|
const pool2 = new Pool({
|
|
180104
180108
|
connectionString,
|
|
180105
|
-
max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100
|
|
180109
|
+
max: config4.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100,
|
|
180110
|
+
keepAlive: true,
|
|
180111
|
+
keepAliveInitialDelayMillis: 6e4,
|
|
180112
|
+
connectionTimeoutMillis: 1e4,
|
|
180113
|
+
idleTimeoutMillis: 3e4
|
|
180106
180114
|
});
|
|
180107
180115
|
pool2.on("error", (err2) => {
|
|
180108
180116
|
console.error("Unexpected PostgreSQL pool error:", err2);
|
|
@@ -180130,7 +180138,11 @@ function createAgentsRunDatabaseClient(config4) {
|
|
|
180130
180138
|
if (!connectionString) throw new Error("INKEEP_AGENTS_RUN_DATABASE_URL environment variable is required. Please set it to your PostgreSQL connection string.");
|
|
180131
180139
|
const pool2 = new Pool({
|
|
180132
180140
|
connectionString,
|
|
180133
|
-
max: config4?.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100
|
|
180141
|
+
max: config4?.poolSize || Number(env.POSTGRES_POOL_SIZE) || 100,
|
|
180142
|
+
keepAlive: true,
|
|
180143
|
+
keepAliveInitialDelayMillis: 6e4,
|
|
180144
|
+
connectionTimeoutMillis: 1e4,
|
|
180145
|
+
idleTimeoutMillis: 3e4
|
|
180134
180146
|
});
|
|
180135
180147
|
pool2.on("error", (err2) => {
|
|
180136
180148
|
console.error("Unexpected PostgreSQL pool error:", err2);
|
|
@@ -229788,124 +229800,8 @@ Return your evaluation as a JSON object matching the schema above.`;
|
|
|
229788
229800
|
}
|
|
229789
229801
|
};
|
|
229790
229802
|
|
|
229791
|
-
// src/domains/evals/workflow/functions/evaluateConversation.ts
|
|
229792
|
-
var logger22 = getLogger("workflow-evaluate-conversation");
|
|
229793
|
-
async function getConversationStep(payload) {
|
|
229794
|
-
const { tenantId, projectId, conversationId } = payload;
|
|
229795
|
-
const conv = await getConversation(runDbClient_default)({
|
|
229796
|
-
scopes: {
|
|
229797
|
-
tenantId,
|
|
229798
|
-
projectId
|
|
229799
|
-
},
|
|
229800
|
-
conversationId
|
|
229801
|
-
});
|
|
229802
|
-
if (!conv) {
|
|
229803
|
-
throw new Error(`Conversation not found: ${conversationId}`);
|
|
229804
|
-
}
|
|
229805
|
-
return conv;
|
|
229806
|
-
}
|
|
229807
|
-
__name(getConversationStep, "getConversationStep");
|
|
229808
|
-
async function getEvaluatorsStep(payload) {
|
|
229809
|
-
const { tenantId, projectId, evaluatorIds } = payload;
|
|
229810
|
-
const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
|
|
229811
|
-
const evals = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorsByIds(db)({
|
|
229812
|
-
scopes: {
|
|
229813
|
-
tenantId,
|
|
229814
|
-
projectId
|
|
229815
|
-
},
|
|
229816
|
-
evaluatorIds
|
|
229817
|
-
}));
|
|
229818
|
-
return evals;
|
|
229819
|
-
}
|
|
229820
|
-
__name(getEvaluatorsStep, "getEvaluatorsStep");
|
|
229821
|
-
async function executeEvaluatorStep(payload, evaluatorId, conversation) {
|
|
229822
|
-
const { tenantId, projectId, conversationId, evaluationRunId } = payload;
|
|
229823
|
-
const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
|
|
229824
|
-
const evaluator2 = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorById(db)({
|
|
229825
|
-
scopes: {
|
|
229826
|
-
tenantId,
|
|
229827
|
-
projectId,
|
|
229828
|
-
evaluatorId
|
|
229829
|
-
}
|
|
229830
|
-
}));
|
|
229831
|
-
if (!evaluator2) {
|
|
229832
|
-
throw new Error(`Evaluator not found: ${evaluatorId}`);
|
|
229833
|
-
}
|
|
229834
|
-
const evalResult = await createEvaluationResult(runDbClient_default)({
|
|
229835
|
-
id: generateId(),
|
|
229836
|
-
tenantId,
|
|
229837
|
-
projectId,
|
|
229838
|
-
conversationId,
|
|
229839
|
-
evaluatorId: evaluator2.id,
|
|
229840
|
-
evaluationRunId
|
|
229841
|
-
});
|
|
229842
|
-
try {
|
|
229843
|
-
const evaluationService = new EvaluationService();
|
|
229844
|
-
const output = await evaluationService.executeEvaluation({
|
|
229845
|
-
conversation,
|
|
229846
|
-
evaluator: evaluator2,
|
|
229847
|
-
tenantId,
|
|
229848
|
-
projectId
|
|
229849
|
-
});
|
|
229850
|
-
const updated = await updateEvaluationResult(runDbClient_default)({
|
|
229851
|
-
scopes: {
|
|
229852
|
-
tenantId,
|
|
229853
|
-
projectId,
|
|
229854
|
-
evaluationResultId: evalResult.id
|
|
229855
|
-
},
|
|
229856
|
-
data: {
|
|
229857
|
-
output
|
|
229858
|
-
}
|
|
229859
|
-
});
|
|
229860
|
-
logger22.info({
|
|
229861
|
-
conversationId,
|
|
229862
|
-
evaluatorId: evaluator2.id,
|
|
229863
|
-
resultId: evalResult.id
|
|
229864
|
-
}, "Evaluation completed successfully");
|
|
229865
|
-
return updated;
|
|
229866
|
-
} catch (error92) {
|
|
229867
|
-
const errorMessage = error92 instanceof Error ? error92.message : "Unknown error";
|
|
229868
|
-
logger22.error({
|
|
229869
|
-
error: error92,
|
|
229870
|
-
conversationId,
|
|
229871
|
-
evaluatorId: evaluator2.id,
|
|
229872
|
-
resultId: evalResult.id
|
|
229873
|
-
}, "Evaluation execution failed");
|
|
229874
|
-
const failed = await updateEvaluationResult(runDbClient_default)({
|
|
229875
|
-
scopes: {
|
|
229876
|
-
tenantId,
|
|
229877
|
-
projectId,
|
|
229878
|
-
evaluationResultId: evalResult.id
|
|
229879
|
-
},
|
|
229880
|
-
data: {
|
|
229881
|
-
output: {
|
|
229882
|
-
text: `Evaluation failed: ${errorMessage}`
|
|
229883
|
-
}
|
|
229884
|
-
}
|
|
229885
|
-
});
|
|
229886
|
-
return failed;
|
|
229887
|
-
}
|
|
229888
|
-
}
|
|
229889
|
-
__name(executeEvaluatorStep, "executeEvaluatorStep");
|
|
229890
|
-
async function logStep(message, data) {
|
|
229891
|
-
logger22.info(data, message);
|
|
229892
|
-
}
|
|
229893
|
-
__name(logStep, "logStep");
|
|
229894
|
-
async function _evaluateConversationWorkflow(payload) {
|
|
229895
|
-
throw new Error("You attempted to execute workflow _evaluateConversationWorkflow function directly. To start a workflow, use start(_evaluateConversationWorkflow) from workflow/api");
|
|
229896
|
-
}
|
|
229897
|
-
__name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
|
|
229898
|
-
_evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
|
|
229899
|
-
var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
|
|
229900
|
-
workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
|
|
229901
|
-
});
|
|
229902
|
-
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep", getConversationStep);
|
|
229903
|
-
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep", getEvaluatorsStep);
|
|
229904
|
-
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep", executeEvaluatorStep);
|
|
229905
|
-
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep", logStep);
|
|
229906
|
-
|
|
229907
229803
|
// src/domains/evals/workflow/functions/runDatasetItem.ts
|
|
229908
|
-
var logger23 = getLogger("workflow-run-dataset-item");
|
|
229804
|
+
var logger22 = getLogger("workflow-run-dataset-item");
|
|
229909
229805
|
async function callChatApiStep(payload) {
|
|
229910
229806
|
const { tenantId, projectId, agentId, datasetItemId, datasetItemInput, datasetItemSimulationAgent, datasetRunId } = payload;
|
|
229911
229807
|
const evaluationService = new EvaluationService();
|
|
@@ -229921,7 +229817,7 @@ async function callChatApiStep(payload) {
|
|
|
229921
229817
|
datasetItem: datasetItem2,
|
|
229922
229818
|
datasetRunId
|
|
229923
229819
|
});
|
|
229924
|
-
|
|
229820
|
+
logger22.info({
|
|
229925
229821
|
tenantId,
|
|
229926
229822
|
projectId,
|
|
229927
229823
|
datasetItemId,
|
|
@@ -229944,7 +229840,7 @@ async function createRelationStep(payload, conversationId) {
|
|
|
229944
229840
|
conversationId,
|
|
229945
229841
|
datasetItemId
|
|
229946
229842
|
});
|
|
229947
|
-
|
|
229843
|
+
logger22.info({
|
|
229948
229844
|
tenantId,
|
|
229949
229845
|
projectId,
|
|
229950
229846
|
datasetItemId,
|
|
@@ -229958,7 +229854,7 @@ async function createRelationStep(payload, conversationId) {
|
|
|
229958
229854
|
};
|
|
229959
229855
|
} catch (error92) {
|
|
229960
229856
|
if (error92?.cause?.code === "23503" || error92?.code === "23503") {
|
|
229961
|
-
|
|
229857
|
+
logger22.warn({
|
|
229962
229858
|
tenantId,
|
|
229963
229859
|
projectId,
|
|
229964
229860
|
datasetItemId,
|
|
@@ -229975,7 +229871,7 @@ async function createRelationStep(payload, conversationId) {
|
|
|
229975
229871
|
}
|
|
229976
229872
|
}
|
|
229977
229873
|
__name(createRelationStep, "createRelationStep");
|
|
229978
|
-
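async function executeEvaluatorStep2(tenantId, projectId, conversationId, evaluatorId, evaluationRunId, expectedOutput) {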
|
|
229874
|
+
async function executeEvaluatorStep(tenantId, projectId, conversationId, evaluatorId, evaluationRunId, expectedOutput) {
|
|
229979
229875
|
const ref = getProjectScopedRef(tenantId, projectId, "main");
|
|
229980
229876
|
const resolvedRef = await resolveRef2(manageDbClient_default)(ref);
|
|
229981
229877
|
if (!resolvedRef) {
|
|
@@ -229989,7 +229885,7 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
|
|
|
229989
229885
|
}
|
|
229990
229886
|
}));
|
|
229991
229887
|
if (!evaluator2) {
|
|
229992
|
-
|
|
229888
|
+
logger22.warn({
|
|
229993
229889
|
evaluatorId
|
|
229994
229890
|
}, "Evaluator not found");
|
|
229995
229891
|
return null;
|
|
@@ -230031,7 +229927,7 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
|
|
|
230031
229927
|
output
|
|
230032
229928
|
}
|
|
230033
229929
|
});
|
|
230034
|
-
|
|
229930
|
+
logger22.info({
|
|
230035
229931
|
conversationId,
|
|
230036
229932
|
evaluatorId: evaluator2.id,
|
|
230037
229933
|
resultId: evalResult.id
|
|
@@ -230039,7 +229935,7 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
|
|
|
230039
229935
|
return evalResult.id;
|
|
230040
229936
|
} catch (error92) {
|
|
230041
229937
|
const errorMessage = error92 instanceof Error ? error92.message : "Unknown error";
|
|
230042
|
-
|
|
229938
|
+
logger22.error({
|
|
230043
229939
|
error: error92,
|
|
230044
229940
|
conversationId,
|
|
230045
229941
|
evaluatorId: evaluator2.id
|
|
@@ -230059,11 +229955,11 @@ async function executeEvaluatorStep2(tenantId, projectId, conversationId, evalua
|
|
|
230059
229955
|
return evalResult.id;
|
|
230060
229956
|
}
|
|
230061
229957
|
}
|
|
230062
|
-
__name(executeEvaluatorStep2, "executeEvaluatorStep");
|
|
230063
|
-
async function logStep2(message, data) {
|
|
230064
|
-
|
|
229958
|
+
__name(executeEvaluatorStep, "executeEvaluatorStep");
|
|
229959
|
+
async function logStep(message, data) {
|
|
229960
|
+
logger22.info(data, message);
|
|
230065
229961
|
}
|
|
230066
|
-
__name(logStep2, "logStep");
|
|
229962
|
+
__name(logStep, "logStep");
|
|
230067
229963
|
async function _runDatasetItemWorkflow(payload) {
|
|
230068
229964
|
throw new Error("You attempted to execute workflow _runDatasetItemWorkflow function directly. To start a workflow, use start(_runDatasetItemWorkflow) from workflow/api");
|
|
230069
229965
|
}
|
|
@@ -230074,8 +229970,124 @@ var runDatasetItemWorkflow = Object.assign(_runDatasetItemWorkflow, {
|
|
|
230074
229970
|
});
|
|
230075
229971
|
registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//callChatApiStep", callChatApiStep);
|
|
230076
229972
|
registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//createRelationStep", createRelationStep);
|
|
230077
|
-
registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep", executeEvaluatorStep2);
|
|
230078
|
-
registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep", logStep2);
|
|
229973
|
+
registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//executeEvaluatorStep", executeEvaluatorStep);
|
|
229974
|
+
registerStepFunction("step//src/domains/evals/workflow/functions/runDatasetItem.ts//logStep", logStep);
|
|
229975
|
+
|
|
229976
|
+
// src/domains/evals/workflow/functions/evaluateConversation.ts
|
|
229977
|
+
var logger23 = getLogger("workflow-evaluate-conversation");
|
|
229978
|
+
async function getConversationStep(payload) {
|
|
229979
|
+
const { tenantId, projectId, conversationId } = payload;
|
|
229980
|
+
const conv = await getConversation(runDbClient_default)({
|
|
229981
|
+
scopes: {
|
|
229982
|
+
tenantId,
|
|
229983
|
+
projectId
|
|
229984
|
+
},
|
|
229985
|
+
conversationId
|
|
229986
|
+
});
|
|
229987
|
+
if (!conv) {
|
|
229988
|
+
throw new Error(`Conversation not found: ${conversationId}`);
|
|
229989
|
+
}
|
|
229990
|
+
return conv;
|
|
229991
|
+
}
|
|
229992
|
+
__name(getConversationStep, "getConversationStep");
|
|
229993
|
+
async function getEvaluatorsStep(payload) {
|
|
229994
|
+
const { tenantId, projectId, evaluatorIds } = payload;
|
|
229995
|
+
const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
|
|
229996
|
+
const evals = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorsByIds(db)({
|
|
229997
|
+
scopes: {
|
|
229998
|
+
tenantId,
|
|
229999
|
+
projectId
|
|
230000
|
+
},
|
|
230001
|
+
evaluatorIds
|
|
230002
|
+
}));
|
|
230003
|
+
return evals;
|
|
230004
|
+
}
|
|
230005
|
+
__name(getEvaluatorsStep, "getEvaluatorsStep");
|
|
230006
|
+
async function executeEvaluatorStep2(payload, evaluatorId, conversation) {
|
|
230007
|
+
const { tenantId, projectId, conversationId, evaluationRunId } = payload;
|
|
230008
|
+
const projectMain = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
|
|
230009
|
+
const evaluator2 = await withRef(manageDbPool_default, projectMain, (db) => getEvaluatorById(db)({
|
|
230010
|
+
scopes: {
|
|
230011
|
+
tenantId,
|
|
230012
|
+
projectId,
|
|
230013
|
+
evaluatorId
|
|
230014
|
+
}
|
|
230015
|
+
}));
|
|
230016
|
+
if (!evaluator2) {
|
|
230017
|
+
throw new Error(`Evaluator not found: ${evaluatorId}`);
|
|
230018
|
+
}
|
|
230019
|
+
const evalResult = await createEvaluationResult(runDbClient_default)({
|
|
230020
|
+
id: generateId(),
|
|
230021
|
+
tenantId,
|
|
230022
|
+
projectId,
|
|
230023
|
+
conversationId,
|
|
230024
|
+
evaluatorId: evaluator2.id,
|
|
230025
|
+
evaluationRunId
|
|
230026
|
+
});
|
|
230027
|
+
try {
|
|
230028
|
+
const evaluationService = new EvaluationService();
|
|
230029
|
+
const output = await evaluationService.executeEvaluation({
|
|
230030
|
+
conversation,
|
|
230031
|
+
evaluator: evaluator2,
|
|
230032
|
+
tenantId,
|
|
230033
|
+
projectId
|
|
230034
|
+
});
|
|
230035
|
+
const updated = await updateEvaluationResult(runDbClient_default)({
|
|
230036
|
+
scopes: {
|
|
230037
|
+
tenantId,
|
|
230038
|
+
projectId,
|
|
230039
|
+
evaluationResultId: evalResult.id
|
|
230040
|
+
},
|
|
230041
|
+
data: {
|
|
230042
|
+
output
|
|
230043
|
+
}
|
|
230044
|
+
});
|
|
230045
|
+
logger23.info({
|
|
230046
|
+
conversationId,
|
|
230047
|
+
evaluatorId: evaluator2.id,
|
|
230048
|
+
resultId: evalResult.id
|
|
230049
|
+
}, "Evaluation completed successfully");
|
|
230050
|
+
return updated;
|
|
230051
|
+
} catch (error92) {
|
|
230052
|
+
const errorMessage = error92 instanceof Error ? error92.message : "Unknown error";
|
|
230053
|
+
logger23.error({
|
|
230054
|
+
error: error92,
|
|
230055
|
+
conversationId,
|
|
230056
|
+
evaluatorId: evaluator2.id,
|
|
230057
|
+
resultId: evalResult.id
|
|
230058
|
+
}, "Evaluation execution failed");
|
|
230059
|
+
const failed = await updateEvaluationResult(runDbClient_default)({
|
|
230060
|
+
scopes: {
|
|
230061
|
+
tenantId,
|
|
230062
|
+
projectId,
|
|
230063
|
+
evaluationResultId: evalResult.id
|
|
230064
|
+
},
|
|
230065
|
+
data: {
|
|
230066
|
+
output: {
|
|
230067
|
+
text: `Evaluation failed: ${errorMessage}`
|
|
230068
|
+
}
|
|
230069
|
+
}
|
|
230070
|
+
});
|
|
230071
|
+
return failed;
|
|
230072
|
+
}
|
|
230073
|
+
}
|
|
230074
|
+
__name(executeEvaluatorStep2, "executeEvaluatorStep");
|
|
230075
|
+
async function logStep2(message, data) {
|
|
230076
|
+
logger23.info(data, message);
|
|
230077
|
+
}
|
|
230078
|
+
__name(logStep2, "logStep");
|
|
230079
|
+
async function _evaluateConversationWorkflow(payload) {
|
|
230080
|
+
throw new Error("You attempted to execute workflow _evaluateConversationWorkflow function directly. To start a workflow, use start(_evaluateConversationWorkflow) from workflow/api");
|
|
230081
|
+
}
|
|
230082
|
+
__name(_evaluateConversationWorkflow, "_evaluateConversationWorkflow");
|
|
230083
|
+
_evaluateConversationWorkflow.workflowId = "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow";
|
|
230084
|
+
var evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
|
|
230085
|
+
workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
|
|
230086
|
+
});
|
|
230087
|
+
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getConversationStep", getConversationStep);
|
|
230088
|
+
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//getEvaluatorsStep", getEvaluatorsStep);
|
|
230089
|
+
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//executeEvaluatorStep", executeEvaluatorStep2);
|
|
230090
|
+
registerStepFunction("step//src/domains/evals/workflow/functions/evaluateConversation.ts//logStep", logStep2);
|
|
230079
230091
|
|
|
230080
230092
|
// ../node_modules/.pnpm/@workflow+utils@4.0.1-beta.7/node_modules/@workflow/utils/dist/index.js
|
|
230081
230093
|
var import_ms2 = __toESM(require_ms(), 1);
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"stepFiles": [
|
|
3
|
-
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts",
|
|
4
|
-
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts"
|
|
3
|
+
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/runDatasetItem.ts",
|
|
4
|
+
"/home/runner/work/agents/agents/agents-api/src/domains/evals/workflow/functions/evaluateConversation.ts"
|
|
5
5
|
]
|
|
6
6
|
}
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
import * as
|
|
1
|
+
import * as _inkeep_agents_core0 from "@inkeep/agents-core";
|
|
2
2
|
|
|
3
3
|
//#region src/data/db/manageDbClient.d.ts
|
|
4
|
-
declare const manageDbClient:
|
|
4
|
+
declare const manageDbClient: _inkeep_agents_core0.AgentsManageDatabaseClient;
|
|
5
5
|
//#endregion
|
|
6
6
|
export { manageDbClient as default };
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
import * as
|
|
1
|
+
import * as _inkeep_agents_core0 from "@inkeep/agents-core";
|
|
2
2
|
|
|
3
3
|
//#region src/data/db/runDbClient.d.ts
|
|
4
|
-
declare const runDbClient:
|
|
4
|
+
declare const runDbClient: _inkeep_agents_core0.AgentsRunDatabaseClient;
|
|
5
5
|
//#endregion
|
|
6
6
|
export { runDbClient as default };
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import { OpenAPIHono } from "@hono/zod-openapi";
|
|
2
|
-
import * as
|
|
2
|
+
import * as hono16 from "hono";
|
|
3
3
|
|
|
4
4
|
//#region src/domains/evals/routes/datasetTriggers.d.ts
|
|
5
|
-
declare const app: OpenAPIHono<
|
|
5
|
+
declare const app: OpenAPIHono<hono16.Env, {}, "/">;
|
|
6
6
|
//#endregion
|
|
7
7
|
export { app as default };
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import { OpenAPIHono } from "@hono/zod-openapi";
|
|
2
|
-
import * as
|
|
2
|
+
import * as hono14 from "hono";
|
|
3
3
|
|
|
4
4
|
//#region src/domains/evals/routes/index.d.ts
|
|
5
|
-
declare const app: OpenAPIHono<
|
|
5
|
+
declare const app: OpenAPIHono<hono14.Env, {}, "/">;
|
|
6
6
|
//#endregion
|
|
7
7
|
export { app as default };
|