@inkeep/agents-api 0.0.0-dev-20260121145510
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE.md +56 -0
- package/SUPPLEMENTAL_TERMS.md +40 -0
- package/dist/.well-known/workflow/v1/flow.cjs +46383 -0
- package/dist/.well-known/workflow/v1/flow.cjs.debug.json +6 -0
- package/dist/.well-known/workflow/v1/manifest.debug.json +55 -0
- package/dist/.well-known/workflow/v1/step.cjs +218683 -0
- package/dist/.well-known/workflow/v1/step.cjs.debug.json +6 -0
- package/dist/.well-known/workflow/v1/webhook.mjs +29 -0
- package/dist/createApp.d.ts +10 -0
- package/dist/createApp.js +170 -0
- package/dist/data/db/index.d.ts +4 -0
- package/dist/data/db/index.js +5 -0
- package/dist/data/db/manageDbClient.d.ts +6 -0
- package/dist/data/db/manageDbClient.js +9 -0
- package/dist/data/db/manageDbPool.d.ts +6 -0
- package/dist/data/db/manageDbPool.js +9 -0
- package/dist/data/db/runDbClient.d.ts +6 -0
- package/dist/data/db/runDbClient.js +9 -0
- package/dist/domains/evals/index.d.ts +13 -0
- package/dist/domains/evals/index.js +13 -0
- package/dist/domains/evals/routes/datasetTriggers.d.ts +7 -0
- package/dist/domains/evals/routes/datasetTriggers.js +65 -0
- package/dist/domains/evals/routes/evaluationTriggers.d.ts +11 -0
- package/dist/domains/evals/routes/evaluationTriggers.js +311 -0
- package/dist/domains/evals/routes/index.d.ts +7 -0
- package/dist/domains/evals/routes/index.js +12 -0
- package/dist/domains/evals/scripts/build-workflow.d.ts +1 -0
- package/dist/domains/evals/scripts/build-workflow.js +31 -0
- package/dist/domains/evals/services/EvaluationService.d.ts +96 -0
- package/dist/domains/evals/services/EvaluationService.js +863 -0
- package/dist/domains/evals/services/conversationEvaluation.d.ts +15 -0
- package/dist/domains/evals/services/conversationEvaluation.js +102 -0
- package/dist/domains/evals/services/datasetRun.d.ts +16 -0
- package/dist/domains/evals/services/datasetRun.js +43 -0
- package/dist/domains/evals/services/evaluationJob.d.ts +17 -0
- package/dist/domains/evals/services/evaluationJob.js +65 -0
- package/dist/domains/evals/services/startEvaluation.d.ts +19 -0
- package/dist/domains/evals/services/startEvaluation.js +18 -0
- package/dist/domains/evals/workflow/functions/evaluateConversation.d.ts +31 -0
- package/dist/domains/evals/workflow/functions/evaluateConversation.js +135 -0
- package/dist/domains/evals/workflow/functions/runDatasetItem.d.ts +39 -0
- package/dist/domains/evals/workflow/functions/runDatasetItem.js +205 -0
- package/dist/domains/evals/workflow/index.d.ts +4 -0
- package/dist/domains/evals/workflow/index.js +5 -0
- package/dist/domains/evals/workflow/routes.d.ts +7 -0
- package/dist/domains/evals/workflow/routes.js +106 -0
- package/dist/domains/evals/workflow/world.d.ts +4 -0
- package/dist/domains/evals/workflow/world.js +36 -0
- package/dist/domains/index.d.ts +4 -0
- package/dist/domains/index.js +5 -0
- package/dist/domains/manage/index.d.ts +12 -0
- package/dist/domains/manage/index.js +31 -0
- package/dist/domains/manage/routes/agent.d.ts +9 -0
- package/dist/domains/manage/routes/agent.js +266 -0
- package/dist/domains/manage/routes/agentFull.d.ts +9 -0
- package/dist/domains/manage/routes/agentFull.js +207 -0
- package/dist/domains/manage/routes/agentToolRelations.d.ts +9 -0
- package/dist/domains/manage/routes/agentToolRelations.js +289 -0
- package/dist/domains/manage/routes/apiKeys.d.ts +9 -0
- package/dist/domains/manage/routes/apiKeys.js +217 -0
- package/dist/domains/manage/routes/artifactComponents.d.ts +9 -0
- package/dist/domains/manage/routes/artifactComponents.js +210 -0
- package/dist/domains/manage/routes/branches.d.ts +9 -0
- package/dist/domains/manage/routes/branches.js +182 -0
- package/dist/domains/manage/routes/cliAuth.d.ts +9 -0
- package/dist/domains/manage/routes/cliAuth.js +60 -0
- package/dist/domains/manage/routes/contextConfigs.d.ts +9 -0
- package/dist/domains/manage/routes/contextConfigs.js +189 -0
- package/dist/domains/manage/routes/conversations.d.ts +7 -0
- package/dist/domains/manage/routes/conversations.js +59 -0
- package/dist/domains/manage/routes/credentialStores.d.ts +9 -0
- package/dist/domains/manage/routes/credentialStores.js +86 -0
- package/dist/domains/manage/routes/credentials.d.ts +9 -0
- package/dist/domains/manage/routes/credentials.js +207 -0
- package/dist/domains/manage/routes/dataComponents.d.ts +9 -0
- package/dist/domains/manage/routes/dataComponents.js +192 -0
- package/dist/domains/manage/routes/evals/datasetItems.d.ts +9 -0
- package/dist/domains/manage/routes/evals/datasetItems.js +310 -0
- package/dist/domains/manage/routes/evals/datasetRunConfigs.d.ts +9 -0
- package/dist/domains/manage/routes/evals/datasetRunConfigs.js +402 -0
- package/dist/domains/manage/routes/evals/datasetRuns.d.ts +9 -0
- package/dist/domains/manage/routes/evals/datasetRuns.js +256 -0
- package/dist/domains/manage/routes/evals/datasets.d.ts +9 -0
- package/dist/domains/manage/routes/evals/datasets.js +238 -0
- package/dist/domains/manage/routes/evals/evaluationJobConfigEvaluatorRelations.d.ts +9 -0
- package/dist/domains/manage/routes/evals/evaluationJobConfigEvaluatorRelations.js +146 -0
- package/dist/domains/manage/routes/evals/evaluationJobConfigs.d.ts +9 -0
- package/dist/domains/manage/routes/evals/evaluationJobConfigs.js +364 -0
- package/dist/domains/manage/routes/evals/evaluationResults.d.ts +7 -0
- package/dist/domains/manage/routes/evals/evaluationResults.js +192 -0
- package/dist/domains/manage/routes/evals/evaluationRunConfigs.d.ts +9 -0
- package/dist/domains/manage/routes/evals/evaluationRunConfigs.js +403 -0
- package/dist/domains/manage/routes/evals/evaluationSuiteConfigEvaluatorRelations.d.ts +9 -0
- package/dist/domains/manage/routes/evals/evaluationSuiteConfigEvaluatorRelations.js +146 -0
- package/dist/domains/manage/routes/evals/evaluationSuiteConfigs.d.ts +9 -0
- package/dist/domains/manage/routes/evals/evaluationSuiteConfigs.js +246 -0
- package/dist/domains/manage/routes/evals/evaluators.d.ts +9 -0
- package/dist/domains/manage/routes/evals/evaluators.js +281 -0
- package/dist/domains/manage/routes/evals/index.d.ts +9 -0
- package/dist/domains/manage/routes/evals/index.js +26 -0
- package/dist/domains/manage/routes/externalAgents.d.ts +9 -0
- package/dist/domains/manage/routes/externalAgents.js +199 -0
- package/dist/domains/manage/routes/functionTools.d.ts +9 -0
- package/dist/domains/manage/routes/functionTools.js +256 -0
- package/dist/domains/manage/routes/functions.d.ts +9 -0
- package/dist/domains/manage/routes/functions.js +285 -0
- package/dist/domains/manage/routes/index.d.ts +7 -0
- package/dist/domains/manage/routes/index.js +68 -0
- package/dist/domains/manage/routes/invitations.d.ts +9 -0
- package/dist/domains/manage/routes/invitations.js +41 -0
- package/dist/domains/manage/routes/mcp.d.ts +7 -0
- package/dist/domains/manage/routes/mcp.js +45 -0
- package/dist/domains/manage/routes/mcpCatalog.d.ts +9 -0
- package/dist/domains/manage/routes/mcpCatalog.js +454 -0
- package/dist/domains/manage/routes/oauth.d.ts +10 -0
- package/dist/domains/manage/routes/oauth.js +327 -0
- package/dist/domains/manage/routes/playgroundToken.d.ts +9 -0
- package/dist/domains/manage/routes/playgroundToken.js +127 -0
- package/dist/domains/manage/routes/projectFull.d.ts +9 -0
- package/dist/domains/manage/routes/projectFull.js +304 -0
- package/dist/domains/manage/routes/projectMembers.d.ts +9 -0
- package/dist/domains/manage/routes/projectMembers.js +201 -0
- package/dist/domains/manage/routes/projectPermissions.d.ts +9 -0
- package/dist/domains/manage/routes/projectPermissions.js +68 -0
- package/dist/domains/manage/routes/projects.d.ts +9 -0
- package/dist/domains/manage/routes/projects.js +279 -0
- package/dist/domains/manage/routes/ref.d.ts +9 -0
- package/dist/domains/manage/routes/ref.js +33 -0
- package/dist/domains/manage/routes/signoz.d.ts +10 -0
- package/dist/domains/manage/routes/signoz.js +159 -0
- package/dist/domains/manage/routes/subAgentArtifactComponents.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentArtifactComponents.js +202 -0
- package/dist/domains/manage/routes/subAgentDataComponents.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentDataComponents.js +201 -0
- package/dist/domains/manage/routes/subAgentExternalAgentRelations.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentExternalAgentRelations.js +216 -0
- package/dist/domains/manage/routes/subAgentFunctionTools.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentFunctionTools.js +205 -0
- package/dist/domains/manage/routes/subAgentRelations.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentRelations.js +263 -0
- package/dist/domains/manage/routes/subAgentTeamAgentRelations.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentTeamAgentRelations.js +216 -0
- package/dist/domains/manage/routes/subAgentToolRelations.d.ts +9 -0
- package/dist/domains/manage/routes/subAgentToolRelations.js +289 -0
- package/dist/domains/manage/routes/subAgents.d.ts +9 -0
- package/dist/domains/manage/routes/subAgents.js +220 -0
- package/dist/domains/manage/routes/thirdPartyMCPServers.d.ts +9 -0
- package/dist/domains/manage/routes/thirdPartyMCPServers.js +72 -0
- package/dist/domains/manage/routes/tools.d.ts +9 -0
- package/dist/domains/manage/routes/tools.js +261 -0
- package/dist/domains/manage/routes/triggers.d.ts +9 -0
- package/dist/domains/manage/routes/triggers.js +455 -0
- package/dist/domains/manage/routes/userOrganizations.d.ts +9 -0
- package/dist/domains/manage/routes/userOrganizations.js +58 -0
- package/dist/domains/run/a2a/client.d.ts +186 -0
- package/dist/domains/run/a2a/client.js +524 -0
- package/dist/domains/run/a2a/handlers.d.ts +7 -0
- package/dist/domains/run/a2a/handlers.js +574 -0
- package/dist/domains/run/a2a/transfer.d.ts +27 -0
- package/dist/domains/run/a2a/transfer.js +50 -0
- package/dist/domains/run/a2a/types.d.ts +75 -0
- package/dist/domains/run/a2a/types.js +22 -0
- package/dist/domains/run/agents/Agent.d.ts +273 -0
- package/dist/domains/run/agents/Agent.js +2104 -0
- package/dist/domains/run/agents/ModelFactory.d.ts +63 -0
- package/dist/domains/run/agents/ModelFactory.js +194 -0
- package/dist/domains/run/agents/SystemPromptBuilder.d.ts +21 -0
- package/dist/domains/run/agents/SystemPromptBuilder.js +48 -0
- package/dist/domains/run/agents/ToolSessionManager.d.ts +63 -0
- package/dist/domains/run/agents/ToolSessionManager.js +146 -0
- package/dist/domains/run/agents/generateTaskHandler.d.ts +44 -0
- package/dist/domains/run/agents/generateTaskHandler.js +396 -0
- package/dist/domains/run/agents/relationTools.d.ts +64 -0
- package/dist/domains/run/agents/relationTools.js +365 -0
- package/dist/domains/run/agents/types.d.ts +31 -0
- package/dist/domains/run/agents/types.js +1 -0
- package/dist/domains/run/agents/versions/v1/Phase1Config.d.ts +29 -0
- package/dist/domains/run/agents/versions/v1/Phase1Config.js +458 -0
- package/dist/domains/run/agents/versions/v1/Phase2Config.d.ts +33 -0
- package/dist/domains/run/agents/versions/v1/Phase2Config.js +341 -0
- package/dist/domains/run/constants/execution-limits/defaults.d.ts +51 -0
- package/dist/domains/run/constants/execution-limits/defaults.js +52 -0
- package/dist/domains/run/constants/execution-limits/index.d.ts +6 -0
- package/dist/domains/run/constants/execution-limits/index.js +21 -0
- package/dist/domains/run/context/ContextFetcher.d.ts +68 -0
- package/dist/domains/run/context/ContextFetcher.js +276 -0
- package/dist/domains/run/context/ContextResolver.d.ts +56 -0
- package/dist/domains/run/context/ContextResolver.js +273 -0
- package/dist/domains/run/context/context.d.ts +19 -0
- package/dist/domains/run/context/context.js +108 -0
- package/dist/domains/run/context/contextCache.d.ts +56 -0
- package/dist/domains/run/context/contextCache.js +174 -0
- package/dist/domains/run/context/index.d.ts +6 -0
- package/dist/domains/run/context/index.js +7 -0
- package/dist/domains/run/context/validation.d.ts +39 -0
- package/dist/domains/run/context/validation.js +255 -0
- package/dist/domains/run/data/agent.d.ts +7 -0
- package/dist/domains/run/data/agent.js +67 -0
- package/dist/domains/run/data/agents.d.ts +34 -0
- package/dist/domains/run/data/agents.js +131 -0
- package/dist/domains/run/data/conversations.d.ts +129 -0
- package/dist/domains/run/data/conversations.js +517 -0
- package/dist/domains/run/handlers/executionHandler.d.ts +44 -0
- package/dist/domains/run/handlers/executionHandler.js +485 -0
- package/dist/domains/run/index.d.ts +13 -0
- package/dist/domains/run/index.js +21 -0
- package/dist/domains/run/routes/agents.d.ts +13 -0
- package/dist/domains/run/routes/agents.js +141 -0
- package/dist/domains/run/routes/chat.d.ts +14 -0
- package/dist/domains/run/routes/chat.js +300 -0
- package/dist/domains/run/routes/chatDataStream.d.ts +14 -0
- package/dist/domains/run/routes/chatDataStream.js +381 -0
- package/dist/domains/run/routes/mcp.d.ts +14 -0
- package/dist/domains/run/routes/mcp.js +483 -0
- package/dist/domains/run/routes/webhooks.d.ts +15 -0
- package/dist/domains/run/routes/webhooks.js +416 -0
- package/dist/domains/run/services/AgentSession.d.ts +354 -0
- package/dist/domains/run/services/AgentSession.js +1203 -0
- package/dist/domains/run/services/ArtifactParser.d.ts +105 -0
- package/dist/domains/run/services/ArtifactParser.js +338 -0
- package/dist/domains/run/services/ArtifactService.d.ts +122 -0
- package/dist/domains/run/services/ArtifactService.js +629 -0
- package/dist/domains/run/services/BaseCompressor.d.ts +183 -0
- package/dist/domains/run/services/BaseCompressor.js +500 -0
- package/dist/domains/run/services/ConversationCompressor.d.ts +32 -0
- package/dist/domains/run/services/ConversationCompressor.js +91 -0
- package/dist/domains/run/services/IncrementalStreamParser.d.ts +98 -0
- package/dist/domains/run/services/IncrementalStreamParser.js +327 -0
- package/dist/domains/run/services/MidGenerationCompressor.d.ts +63 -0
- package/dist/domains/run/services/MidGenerationCompressor.js +104 -0
- package/dist/domains/run/services/PendingToolApprovalManager.d.ts +62 -0
- package/dist/domains/run/services/PendingToolApprovalManager.js +133 -0
- package/dist/domains/run/services/ResponseFormatter.d.ts +39 -0
- package/dist/domains/run/services/ResponseFormatter.js +152 -0
- package/dist/domains/run/services/evaluationRunConfigMatcher.d.ts +4 -0
- package/dist/domains/run/services/evaluationRunConfigMatcher.js +7 -0
- package/dist/domains/run/tools/NativeSandboxExecutor.d.ts +38 -0
- package/dist/domains/run/tools/NativeSandboxExecutor.js +432 -0
- package/dist/domains/run/tools/SandboxExecutorFactory.d.ts +36 -0
- package/dist/domains/run/tools/SandboxExecutorFactory.js +80 -0
- package/dist/domains/run/tools/VercelSandboxExecutor.d.ts +71 -0
- package/dist/domains/run/tools/VercelSandboxExecutor.js +340 -0
- package/dist/domains/run/tools/distill-conversation-history-tool.d.ts +62 -0
- package/dist/domains/run/tools/distill-conversation-history-tool.js +206 -0
- package/dist/domains/run/tools/distill-conversation-tool.d.ts +41 -0
- package/dist/domains/run/tools/distill-conversation-tool.js +141 -0
- package/dist/domains/run/tools/sandbox-utils.d.ts +18 -0
- package/dist/domains/run/tools/sandbox-utils.js +53 -0
- package/dist/domains/run/types/chat.d.ts +27 -0
- package/dist/domains/run/types/chat.js +1 -0
- package/dist/domains/run/types/executionContext.d.ts +40 -0
- package/dist/domains/run/types/executionContext.js +28 -0
- package/dist/domains/run/types/xml.d.ts +5 -0
- package/dist/domains/run/utils/SchemaProcessor.d.ts +52 -0
- package/dist/domains/run/utils/SchemaProcessor.js +182 -0
- package/dist/domains/run/utils/agent-operations.d.ts +62 -0
- package/dist/domains/run/utils/agent-operations.js +53 -0
- package/dist/domains/run/utils/artifact-component-schema.d.ts +42 -0
- package/dist/domains/run/utils/artifact-component-schema.js +186 -0
- package/dist/domains/run/utils/cleanup.d.ts +21 -0
- package/dist/domains/run/utils/cleanup.js +59 -0
- package/dist/domains/run/utils/data-component-schema.d.ts +2 -0
- package/dist/domains/run/utils/data-component-schema.js +3 -0
- package/dist/domains/run/utils/default-status-schemas.d.ts +20 -0
- package/dist/domains/run/utils/default-status-schemas.js +24 -0
- package/dist/domains/run/utils/json-postprocessor.d.ts +13 -0
- package/dist/domains/run/utils/json-postprocessor.js +19 -0
- package/dist/domains/run/utils/model-context-utils.d.ts +39 -0
- package/dist/domains/run/utils/model-context-utils.js +181 -0
- package/dist/domains/run/utils/model-resolver.d.ts +6 -0
- package/dist/domains/run/utils/model-resolver.js +24 -0
- package/dist/domains/run/utils/project.d.ts +207 -0
- package/dist/domains/run/utils/project.js +315 -0
- package/dist/domains/run/utils/schema-validation.d.ts +44 -0
- package/dist/domains/run/utils/schema-validation.js +97 -0
- package/dist/domains/run/utils/stream-helpers.d.ts +193 -0
- package/dist/domains/run/utils/stream-helpers.js +510 -0
- package/dist/domains/run/utils/stream-registry.d.ts +22 -0
- package/dist/domains/run/utils/stream-registry.js +33 -0
- package/dist/domains/run/utils/token-estimator.d.ts +23 -0
- package/dist/domains/run/utils/token-estimator.js +17 -0
- package/dist/domains/run/utils/tracer.d.ts +7 -0
- package/dist/domains/run/utils/tracer.js +7 -0
- package/dist/env.d.ts +89 -0
- package/dist/env.js +69 -0
- package/dist/factory.d.ts +1535 -0
- package/dist/factory.js +42 -0
- package/dist/index.d.ts +1530 -0
- package/dist/index.js +59 -0
- package/dist/initialization.d.ts +6 -0
- package/dist/initialization.js +65 -0
- package/dist/instrumentation.d.ts +17 -0
- package/dist/instrumentation.js +68 -0
- package/dist/logger.d.ts +2 -0
- package/dist/logger.js +3 -0
- package/dist/middleware/branchScopedDb.d.ts +31 -0
- package/dist/middleware/branchScopedDb.js +137 -0
- package/dist/middleware/cors.d.ts +36 -0
- package/dist/middleware/cors.js +131 -0
- package/dist/middleware/errorHandler.d.ts +12 -0
- package/dist/middleware/errorHandler.js +88 -0
- package/dist/middleware/evalsAuth.d.ts +16 -0
- package/dist/middleware/evalsAuth.js +52 -0
- package/dist/middleware/index.d.ts +8 -0
- package/dist/middleware/index.js +9 -0
- package/dist/middleware/manageAuth.d.ts +25 -0
- package/dist/middleware/manageAuth.js +80 -0
- package/dist/middleware/projectAccess.d.ts +31 -0
- package/dist/middleware/projectAccess.js +118 -0
- package/dist/middleware/projectConfig.d.ts +25 -0
- package/dist/middleware/projectConfig.js +89 -0
- package/dist/middleware/ref.d.ts +61 -0
- package/dist/middleware/ref.js +239 -0
- package/dist/middleware/requirePermission.d.ts +14 -0
- package/dist/middleware/requirePermission.js +80 -0
- package/dist/middleware/runAuth.d.ts +29 -0
- package/dist/middleware/runAuth.js +253 -0
- package/dist/middleware/sessionAuth.d.ts +17 -0
- package/dist/middleware/sessionAuth.js +58 -0
- package/dist/middleware/tenantAccess.d.ts +22 -0
- package/dist/middleware/tenantAccess.js +63 -0
- package/dist/middleware/tracing.d.ts +7 -0
- package/dist/middleware/tracing.js +50 -0
- package/dist/openapi.d.ts +7 -0
- package/dist/openapi.js +156 -0
- package/dist/ssoHelpers.d.ts +20 -0
- package/dist/ssoHelpers.js +51 -0
- package/dist/templates/v1/phase1/system-prompt.js +5 -0
- package/dist/templates/v1/phase1/thinking-preparation.js +5 -0
- package/dist/templates/v1/phase1/tool.js +5 -0
- package/dist/templates/v1/phase2/data-component.js +5 -0
- package/dist/templates/v1/phase2/data-components.js +5 -0
- package/dist/templates/v1/phase2/system-prompt.js +5 -0
- package/dist/templates/v1/shared/artifact-retrieval-guidance.js +5 -0
- package/dist/templates/v1/shared/artifact.js +5 -0
- package/dist/types/app.d.ts +64 -0
- package/dist/types/app.js +1 -0
- package/dist/types/index.d.ts +2 -0
- package/dist/types/index.js +1 -0
- package/dist/types/runExecutionContext.d.ts +25 -0
- package/dist/types/runExecutionContext.js +28 -0
- package/dist/utils/oauthService.d.ts +71 -0
- package/dist/utils/oauthService.js +106 -0
- package/dist/utils/signozHelpers.d.ts +9 -0
- package/dist/utils/signozHelpers.js +33 -0
- package/dist/utils/speakeasy.d.ts +93 -0
- package/dist/utils/speakeasy.js +44 -0
- package/dist/utils/tempApiKeys.d.ts +17 -0
- package/dist/utils/tempApiKeys.js +26 -0
- package/dist/utils/workflowApiHelpers.d.ts +1 -0
- package/dist/utils/workflowApiHelpers.js +1 -0
- package/package.json +125 -0
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
import { ResolvedRef } from "@inkeep/agents-core";
|
|
2
|
+
|
|
3
|
+
//#region src/domains/evals/services/conversationEvaluation.d.ts
|
|
4
|
+
/** Arguments accepted by `triggerConversationEvaluation`. */
type TriggerConversationEvaluationParams = {
  /** Tenant half of the scope used for every lookup. */
  tenantId: string;
  /** Project half of the scope used for every lookup. */
  projectId: string;
  /** Conversation that should be evaluated. */
  conversationId: string;
  /** Ref handed to the config lookups performed through `withRef`. */
  resolvedRef: ResolvedRef;
};
/** Value the promise returned by `triggerConversationEvaluation` resolves to. */
type TriggerConversationEvaluationResult = {
  success: boolean;
  /** Human-readable summary of what was (or was not) triggered. */
  message: string;
  /** Number of evaluation workflows that were started. */
  evaluationsTriggered: number;
};
/**
 * Starts evaluation workflows for a single conversation and reports how many were started.
 */
declare const triggerConversationEvaluation: (
  params: TriggerConversationEvaluationParams
) => Promise<TriggerConversationEvaluationResult>;
|
|
14
|
+
//#endregion
|
|
15
|
+
export { triggerConversationEvaluation };
|
|
@@ -0,0 +1,102 @@
|
|
|
1
|
+
import { getLogger as getLogger$1 } from "../../../logger.js";
|
|
2
|
+
import manageDbPool_default from "../../../data/db/manageDbPool.js";
|
|
3
|
+
import runDbClient_default from "../../../data/db/runDbClient.js";
|
|
4
|
+
import { evaluateConversationWorkflow } from "../workflow/functions/evaluateConversation.js";
|
|
5
|
+
import "../workflow/index.js";
|
|
6
|
+
import { createEvaluationRun, generateId, getConversation, getEvaluationSuiteConfigById, getEvaluationSuiteConfigEvaluatorRelations, listEvaluationRunConfigsWithSuiteConfigs, withRef } from "@inkeep/agents-core";
|
|
7
|
+
import { start } from "workflow/api";
|
|
8
|
+
|
|
9
|
+
//#region src/domains/evals/services/conversationEvaluation.ts
|
|
10
|
+
const logger = getLogger$1("ConversationEvaluation");
|
|
11
|
+
/**
 * Starts evaluation workflows for one conversation against every active evaluation run config.
 *
 * For each suite config id referenced by an active run config this:
 *  1. loads the suite config (a missing one is skipped with a warning),
 *  2. applies the suite's optional `sampleRate` as a random sampling gate,
 *  3. resolves the suite's evaluator ids (a suite without evaluators is skipped),
 *  4. creates an evaluation run record and starts `evaluateConversationWorkflow`.
 *
 * @param params - `tenantId` / `projectId` scope, the `conversationId` to evaluate and the
 *   `resolvedRef` passed to `withRef` for the config lookups.
 * @returns `success: true`, a human-readable `message` and the number of workflows started.
 * @throws Error when the conversation is not found or no run config is active; every
 *   failure is logged once and then rethrown unchanged.
 */
const triggerConversationEvaluation = async (params) => {
	const { tenantId, projectId, conversationId, resolvedRef } = params;
	try {
		logger.info({
			tenantId,
			projectId,
			conversationId
		}, "Triggering conversation evaluation (eval-api handling all logic)");
		const conversation = await getConversation(runDbClient_default)({
			scopes: {
				tenantId,
				projectId
			},
			conversationId
		});
		if (!conversation) throw new Error(`Conversation not found: ${conversationId}`);
		const allRunConfigs = await withRef(manageDbPool_default, resolvedRef, (db) => listEvaluationRunConfigsWithSuiteConfigs(db)({ scopes: {
			tenantId,
			projectId
		} }));
		const runConfigs = allRunConfigs.filter((config) => config.isActive);
		if (runConfigs.length === 0) throw new Error("No active evaluation run configs found");
		let evaluationsTriggered = 0;
		for (const runConfig of runConfigs) {
			for (const suiteConfigId of runConfig.suiteConfigIds) {
				const suiteConfig = await withRef(manageDbPool_default, resolvedRef, (db) => getEvaluationSuiteConfigById(db)({ scopes: {
					tenantId,
					projectId,
					evaluationSuiteConfigId: suiteConfigId
				} }));
				if (!suiteConfig) {
					logger.warn({ suiteConfigId }, "Suite config not found, skipping");
					continue;
				}
				if (suiteConfig.sampleRate !== null && suiteConfig.sampleRate !== void 0) {
					const random = Math.random();
					// Math.random() yields values in [0, 1), so `>=` is required for a sample rate
					// of 0 to reject every conversation (with `>` a draw of exactly 0 slipped through),
					// while a sample rate of 1 still accepts every conversation.
					if (random >= suiteConfig.sampleRate) {
						logger.info({
							suiteConfigId: suiteConfig.id,
							sampleRate: suiteConfig.sampleRate,
							random,
							conversationId
						}, "Conversation filtered out by sample rate");
						continue;
					}
				}
				const relations = await withRef(manageDbPool_default, resolvedRef, (db) => getEvaluationSuiteConfigEvaluatorRelations(db)({ scopes: {
					tenantId,
					projectId,
					evaluationSuiteConfigId: suiteConfigId
				} }));
				const evaluatorIds = relations.map((r) => r.evaluatorId);
				if (evaluatorIds.length === 0) continue;
				const evaluationRunId = generateId();
				await createEvaluationRun(runDbClient_default)({
					id: evaluationRunId,
					tenantId,
					projectId,
					evaluationRunConfigId: runConfig.id
				});
				logger.info({
					conversationId,
					runConfigId: runConfig.id,
					evaluationRunId,
					evaluatorCount: evaluatorIds.length,
					sampleRate: suiteConfig.sampleRate
				}, "Created evaluation run, starting workflow");
				await start(evaluateConversationWorkflow, [{
					tenantId,
					projectId,
					conversationId,
					evaluatorIds,
					evaluationRunId
				}]);
				evaluationsTriggered++;
			}
		}
		return {
			success: true,
			message: evaluationsTriggered > 0 ? `Triggered ${evaluationsTriggered} evaluation(s)` : "No evaluations matched (filtered by sample rate or no evaluators)",
			evaluationsTriggered
		};
	} catch (error) {
		// A single structured entry replaces three near-identical ones. Message and stack are
		// passed explicitly so they are present however the logger serializes the `error` key.
		logger.error({
			error,
			errorMessage: error?.message,
			errorStack: error?.stack,
			tenantId,
			projectId,
			conversationId
		}, "Failed to trigger conversation evaluation");
		throw error;
	}
};
|
|
100
|
+
|
|
101
|
+
//#endregion
|
|
102
|
+
export { triggerConversationEvaluation };
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
import { DatasetRunItem } from "@inkeep/agents-core";
|
|
2
|
+
|
|
3
|
+
//#region src/domains/evals/services/datasetRun.d.ts
|
|
4
|
+
/** Arguments accepted by `queueDatasetRunItems`. */
type QueueDatasetRunItemsParams = {
  tenantId: string;
  projectId: string;
  /** Dataset run the items belong to; forwarded to every started workflow. */
  datasetRunId: string;
  /** Items to start a workflow for, one workflow per item. */
  items: DatasetRunItem[];
  /** Optional evaluator ids forwarded unchanged to every started workflow. */
  evaluatorIds?: string[];
  /** Optional evaluation run id forwarded unchanged to every started workflow. */
  evaluationRunId?: string;
};
/** Tally of workflow starts that succeeded (`queued`) and that threw (`failed`). */
type QueueDatasetRunItemsResult = {
  queued: number;
  failed: number;
};
/**
 * Starts one dataset-item workflow per entry of `params.items` and reports the tally.
 */
declare function queueDatasetRunItems(
  params: QueueDatasetRunItemsParams
): Promise<QueueDatasetRunItemsResult>;
|
|
15
|
+
//#endregion
|
|
16
|
+
export { queueDatasetRunItems };
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
import { getLogger } from "../../../logger.js";
|
|
2
|
+
import { runDatasetItemWorkflow } from "../workflow/functions/runDatasetItem.js";
|
|
3
|
+
import { start } from "workflow/api";
|
|
4
|
+
|
|
5
|
+
//#region src/domains/evals/services/datasetRun.ts
|
|
6
|
+
/**
 * Starts `runDatasetItemWorkflow` once per dataset run item, one after another.
 *
 * A failing start is logged and counted; it never aborts the remaining items.
 *
 * @param params - scope ids, the `datasetRunId`, the `items` to process and the optional
 *   `evaluatorIds` / `evaluationRunId` that are forwarded to each workflow.
 * @returns how many workflow starts succeeded (`queued`) and how many threw (`failed`).
 */
async function queueDatasetRunItems(params) {
	const { tenantId, projectId, datasetRunId, items, evaluatorIds, evaluationRunId } = params;
	const log = getLogger("workflow-triggers");
	const tally = {
		queued: 0,
		failed: 0
	};
	for (const entry of items) {
		const workflowInput = {
			tenantId,
			projectId,
			agentId: entry.agentId,
			// An item without an id is still submitted, using an empty string as its id.
			datasetItemId: entry.id ?? "",
			datasetItemInput: entry.input,
			datasetItemExpectedOutput: entry.expectedOutput,
			datasetItemSimulationAgent: entry.simulationAgent,
			datasetRunId,
			evaluatorIds,
			evaluationRunId
		};
		try {
			await start(runDatasetItemWorkflow, [workflowInput]);
			tally.queued += 1;
		} catch (cause) {
			log.error({
				err: cause,
				datasetItemId: entry.id,
				agentId: entry.agentId
			}, "Failed to queue dataset item workflow");
			tally.failed += 1;
		}
	}
	return {
		queued: tally.queued,
		failed: tally.failed
	};
}
|
|
41
|
+
|
|
42
|
+
//#endregion
|
|
43
|
+
export { queueDatasetRunItems };
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import { EvaluationJobFilterCriteria } from "@inkeep/agents-core";
|
|
2
|
+
|
|
3
|
+
//#region src/domains/evals/services/evaluationJob.d.ts
|
|
4
|
+
/** Arguments accepted by `queueEvaluationJobConversations`. */
type QueueEvaluationJobConversationsParams = {
  tenantId: string;
  projectId: string;
  /** Job config the created evaluation run is attached to. */
  evaluationJobConfigId: string;
  /** Evaluator ids forwarded unchanged to every started workflow. */
  evaluatorIds: string[];
  /** Filter criteria used to select the conversations; may be absent. */
  jobFilters: EvaluationJobFilterCriteria | null | undefined;
};
/** Outcome reported by `queueEvaluationJobConversations`. */
type QueueEvaluationJobConversationsResult = {
  /** Number of conversations that matched the filters. */
  conversationCount: number;
  /** Workflow starts that succeeded. */
  queued: number;
  /** Workflow starts that threw. */
  failed: number;
  /** Id of the created evaluation run; an empty string when nothing matched. */
  evaluationRunId: string;
};
/**
 * Selects the conversations matching a job's filters and starts an evaluation workflow for each.
 */
declare function queueEvaluationJobConversations(
  params: QueueEvaluationJobConversationsParams
): Promise<QueueEvaluationJobConversationsResult>;
|
|
16
|
+
//#endregion
|
|
17
|
+
export { queueEvaluationJobConversations };
|
|
@@ -0,0 +1,65 @@
|
|
|
1
|
+
import { getLogger as getLogger$1 } from "../../../logger.js";
|
|
2
|
+
import runDbClient_default from "../../../data/db/runDbClient.js";
|
|
3
|
+
import { evaluateConversationWorkflow } from "../workflow/functions/evaluateConversation.js";
|
|
4
|
+
import "../workflow/index.js";
|
|
5
|
+
import { createEvaluationRun, filterConversationsForJob, generateId } from "@inkeep/agents-core";
|
|
6
|
+
import { start } from "workflow/api";
|
|
7
|
+
|
|
8
|
+
//#region src/domains/evals/services/evaluationJob.ts
|
|
9
|
+
const logger = getLogger$1("evaluation-job");
|
|
10
|
+
/**
 * Starts `evaluateConversationWorkflow` for every conversation selected by a job's filters.
 *
 * When no conversation matches, a warning is logged and an all-zero result with an empty
 * `evaluationRunId` is returned without creating an evaluation run. Otherwise one evaluation
 * run is created and shared by all started workflows; a failing start is logged and counted
 * without stopping the loop.
 *
 * @param params - scope ids, the `evaluationJobConfigId`, the `evaluatorIds` to run and the
 *   `jobFilters` used to select conversations.
 * @returns the number of matched conversations, the success / failure tally and the run id.
 */
async function queueEvaluationJobConversations(params) {
	const { tenantId, projectId, evaluationJobConfigId, evaluatorIds, jobFilters } = params;
	const matches = await filterConversationsForJob(runDbClient_default)({
		scopes: {
			tenantId,
			projectId
		},
		jobFilters
	});
	if (matches.length === 0) {
		logger.warn({
			tenantId,
			projectId,
			evaluationJobConfigId
		}, "No conversations found for job");
		return {
			conversationCount: 0,
			queued: 0,
			failed: 0,
			evaluationRunId: ""
		};
	}
	const run = await createEvaluationRun(runDbClient_default)({
		id: generateId(),
		tenantId,
		projectId,
		evaluationJobConfigId
	});
	const tally = {
		queued: 0,
		failed: 0
	};
	for (const conversation of matches) {
		try {
			await start(evaluateConversationWorkflow, [{
				tenantId,
				projectId,
				conversationId: conversation.id,
				evaluatorIds,
				evaluationRunId: run.id
			}]);
			tally.queued += 1;
		} catch (err) {
			logger.error({
				err,
				conversationId: conversation.id
			}, "Failed to queue conversation evaluation");
			tally.failed += 1;
		}
	}
	return {
		conversationCount: matches.length,
		queued: tally.queued,
		failed: tally.failed,
		evaluationRunId: run.id
	};
}
|
|
63
|
+
|
|
64
|
+
//#endregion
|
|
65
|
+
export { queueEvaluationJobConversations };
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
//#region src/domains/evals/services/startEvaluation.d.ts
|
|
2
|
+
/**
|
|
3
|
+
* Service to start evaluation workflows.
|
|
4
|
+
* This encapsulates the workflow logic so consumers don't need to import workflow packages.
|
|
5
|
+
*/
|
|
6
|
+
/** Argument object for `startConversationEvaluation`; it is passed on to the workflow as-is. */
interface StartEvaluationParams {
  /** Tenant the conversation belongs to. */
  tenantId: string;
  /** Project the conversation belongs to. */
  projectId: string;
  /** Conversation to evaluate. */
  conversationId: string;
  /** Evaluators to run against the conversation. */
  evaluatorIds: string[];
  /** Evaluation run the workflow is associated with. */
  evaluationRunId: string;
}
|
|
13
|
+
/**
 * Starts the conversation-evaluation workflow for one conversation.
 *
 * Thin wrapper around the workflow API so callers do not have to import it themselves.
 *
 * @param params - payload forwarded unchanged as the workflow's single argument.
 * @returns a promise that settles once the workflow start call has completed.
 */
declare function startConversationEvaluation(
  params: StartEvaluationParams
): Promise<void>;
|
|
18
|
+
//#endregion
|
|
19
|
+
export { StartEvaluationParams, startConversationEvaluation };
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
import { evaluateConversationWorkflow } from "../workflow/functions/evaluateConversation.js";
|
|
2
|
+
import { start } from "workflow/api";
|
|
3
|
+
|
|
4
|
+
//#region src/domains/evals/services/startEvaluation.ts
|
|
5
|
+
/**
|
|
6
|
+
* Service to start evaluation workflows.
|
|
7
|
+
* This encapsulates the workflow logic so consumers don't need to import workflow packages.
|
|
8
|
+
*/
|
|
9
|
+
/**
 * Start the conversation-evaluation workflow for one conversation.
 *
 * Forwards `params` unchanged as the single argument of
 * `evaluateConversationWorkflow` and waits for the `start` call to finish.
 * Nothing is returned to the caller.
 *
 * @param params - Evaluation parameters passed straight through to the workflow.
 */
async function startConversationEvaluation(params) {
  // `start` takes the workflow's argument list as an array.
  const workflowArgs = [params];
  await start(evaluateConversationWorkflow, workflowArgs);
}
|
|
16
|
+
|
|
17
|
+
//#endregion
|
|
18
|
+
export { startConversationEvaluation };
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
//#region src/domains/evals/workflow/functions/evaluateConversation.d.ts
|
|
2
|
+
type EvaluationPayload = {
  /** Tenant scope applied to all lookups and writes in the workflow steps. */
  tenantId: string;
  /** Project scope applied together with `tenantId`. */
  projectId: string;
  /** Conversation to load and evaluate. */
  conversationId: string;
  /** Evaluators to resolve and execute against the conversation. */
  evaluatorIds: string[];
  /** Evaluation run that every created evaluation result is recorded under. */
  evaluationRunId: string;
};
|
|
9
|
+
/**
 * Workflow entry point that orchestrates the evaluation steps for one
 * conversation.
 *
 * IMPORTANT: the body executes inside a deterministic sandbox.
 * - Never call Node.js APIs from it directly (no DB access, no fs, ...).
 * - Every side effect has to live in a step function.
 *
 * @param payload - Scope, conversation, evaluators and run to evaluate with.
 * @returns Either a result carrying a `reason` (no `conversationId` /
 *   `resultCount`), or a result carrying `conversationId` and `resultCount`
 *   (no `reason`).
 */
declare function _evaluateConversationWorkflow(
  payload: EvaluationPayload,
): Promise<
  | {
      success: boolean;
      reason: string;
      conversationId?: undefined;
      resultCount?: undefined;
    }
  | {
      success: boolean;
      conversationId: string;
      resultCount: number;
      reason?: undefined;
    }
>;
|
|
27
|
+
/**
 * Exported workflow handle: the workflow function itself, additionally
 * carrying a string `workflowId` property.
 */
declare const evaluateConversationWorkflow: typeof _evaluateConversationWorkflow & {
  workflowId: string;
};
|
|
30
|
+
//#endregion
|
|
31
|
+
export { evaluateConversationWorkflow };
|
|
@@ -0,0 +1,135 @@
|
|
|
1
|
+
import { getLogger as getLogger$1 } from "../../../../logger.js";
|
|
2
|
+
import manageDbClient_default from "../../../../data/db/manageDbClient.js";
|
|
3
|
+
import manageDbPool_default from "../../../../data/db/manageDbPool.js";
|
|
4
|
+
import runDbClient_default from "../../../../data/db/runDbClient.js";
|
|
5
|
+
import "../../../../data/db/index.js";
|
|
6
|
+
import { EvaluationService } from "../../services/EvaluationService.js";
|
|
7
|
+
import { createEvaluationResult, generateId, getConversation, getEvaluatorById, getEvaluatorsByIds, getProjectMainResolvedRef, updateEvaluationResult, withRef } from "@inkeep/agents-core";
|
|
8
|
+
|
|
9
|
+
//#region src/domains/evals/workflow/functions/evaluateConversation.ts
|
|
10
|
+
// Module-scoped logger shared by all step functions in this file.
const logger = getLogger$1("workflow-evaluate-conversation");
|
|
11
|
+
/**
 * Step: load the conversation that is about to be evaluated.
 *
 * The lookup goes through the run database client and is scoped to the tenant
 * and project carried in the payload.
 *
 * @param payload - Workflow payload; `tenantId`, `projectId` and
 *   `conversationId` are read.
 * @returns The conversation returned by `getConversation`.
 * @throws Error when the lookup yields no conversation.
 */
async function getConversationStep(payload) {
  "use step";
  const { tenantId, projectId, conversationId } = payload;
  const findConversation = getConversation(runDbClient_default);
  const conversation = await findConversation({
    scopes: { tenantId, projectId },
    conversationId
  });
  if (conversation) return conversation;
  throw new Error(`Conversation not found: ${conversationId}`);
}
|
|
24
|
+
/**
 * Step: resolve the evaluators requested in the payload.
 *
 * First resolves the project's main ref via the manage database client, then
 * runs `getEvaluatorsByIds` against the database handle that `withRef`
 * provides for that ref.
 *
 * @param payload - Workflow payload; `tenantId`, `projectId` and
 *   `evaluatorIds` are read.
 * @returns Whatever `getEvaluatorsByIds` yields for the given ids.
 */
async function getEvaluatorsStep(payload) {
  "use step";
  const { tenantId, projectId, evaluatorIds } = payload;
  const mainRef = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
  const loadEvaluators = (db) =>
    getEvaluatorsByIds(db)({
      scopes: { tenantId, projectId },
      evaluatorIds
    });
  return await withRef(manageDbPool_default, mainRef, loadEvaluators);
}
|
|
35
|
+
/**
 * Step: run a single evaluator against a conversation and persist the outcome.
 *
 * Flow:
 * 1. Load the evaluator from the project's main ref.
 * 2. Create an evaluation result row up front so that both success and
 *    failure are recorded against the same result id.
 * 3. Execute the evaluation and store its output on that row. If anything in
 *    this phase throws, the failure is logged and the row is updated with an
 *    "Evaluation failed: ..." text instead of the error propagating.
 *
 * @param payload - Workflow payload; `tenantId`, `projectId`,
 *   `conversationId` and `evaluationRunId` are read.
 * @param evaluatorId - Identifier of the evaluator to execute.
 * @param conversation - Conversation handed to the evaluation service.
 * @returns The value returned by `updateEvaluationResult` (success or failure
 *   variant).
 * @throws Error when the evaluator cannot be found. Errors from creating the
 *   result row, or from the failure-path update, also propagate.
 */
async function executeEvaluatorStep(payload, evaluatorId, conversation) {
  "use step";
  const { tenantId, projectId, conversationId, evaluationRunId } = payload;
  const mainRef = await getProjectMainResolvedRef(manageDbClient_default)(tenantId, projectId);
  const evaluator = await withRef(manageDbPool_default, mainRef, (db) =>
    getEvaluatorById(db)({
      scopes: {
        tenantId,
        projectId,
        evaluatorId
      }
    })
  );
  if (!evaluator) throw new Error(`Evaluator not found: ${evaluatorId}`);
  const evalResult = await createEvaluationResult(runDbClient_default)({
    id: generateId(),
    tenantId,
    projectId,
    conversationId,
    evaluatorId: evaluator.id,
    evaluationRunId
  });
  try {
    const output = await new EvaluationService().executeEvaluation({
      conversation,
      evaluator,
      tenantId,
      projectId
    });
    const updated = await updateEvaluationResult(runDbClient_default)({
      scopes: {
        tenantId,
        projectId,
        evaluationResultId: evalResult.id
      },
      data: { output }
    });
    logger.info({
      conversationId,
      evaluatorId: evaluator.id,
      resultId: evalResult.id
    }, "Evaluation completed successfully");
    return updated;
  } catch (error) {
    // Keep the text of thrown strings instead of collapsing them to a generic message.
    let errorMessage = "Unknown error";
    if (error instanceof Error) errorMessage = error.message;
    else if (typeof error === "string") errorMessage = error;
    // Log under `err`, matching the queueing code in this package; that is the
    // key pino-style loggers serialize (message + stack) by default.
    // NOTE(review): assumes the project logger follows pino's default error key — confirm.
    logger.error({
      err: error,
      conversationId,
      evaluatorId: evaluator.id,
      resultId: evalResult.id
    }, "Evaluation execution failed");
    // Record the failure on the pre-created result row rather than failing the step.
    return await updateEvaluationResult(runDbClient_default)({
      scopes: {
        tenantId,
        projectId,
        evaluationResultId: evalResult.id
      },
      data: { output: { text: `Evaluation failed: ${errorMessage}` } }
    });
  }
}
|
|
91
|
+
/**
 * Step: write an info-level log entry for the workflow.
 *
 * Logging is wrapped in a step so the workflow function itself does not touch
 * the logger directly.
 *
 * @param message - Log message.
 * @param data - Structured fields attached to the log entry.
 */
async function logStep(message, data) {
  "use step";
  // The logger takes the structured fields first, then the message.
  logger.info(data, message);
}
|
|
98
|
+
/**
 * Workflow entry point that orchestrates the evaluation steps for one
 * conversation.
 *
 * IMPORTANT: the body executes inside a deterministic sandbox.
 * - Never call Node.js APIs from it directly (no DB access, no fs, ...).
 * - Every side effect has to live in a step function.
 *
 * Sequence: log the start, load the conversation, resolve the evaluators,
 * then run each evaluator one after another.
 *
 * @param payload - Scope, conversation, evaluators and run to evaluate with.
 * @returns `{ success: false, reason }` when no evaluators were resolved,
 *   otherwise `{ success: true, conversationId, resultCount }`.
 */
async function _evaluateConversationWorkflow(payload) {
  "use workflow";
  const { conversationId, evaluatorIds } = payload;
  await logStep("Starting conversation evaluation", payload);
  const conversation = await getConversationStep(payload);
  const evaluators = await getEvaluatorsStep(payload);
  if (evaluators.length !== 0) {
    // Evaluators run sequentially; only the number of completed runs is reported.
    let resultCount = 0;
    for (const { id } of evaluators) {
      await executeEvaluatorStep(payload, id, conversation);
      resultCount += 1;
    }
    return {
      success: true,
      conversationId,
      resultCount
    };
  }
  await logStep("No valid evaluators found", {
    conversationId,
    evaluatorIds
  });
  return {
    success: false,
    reason: "No valid evaluators"
  };
}
|
|
132
|
+
/**
 * Exported workflow handle: the workflow function with a `workflowId`
 * property attached to it.
 */
const evaluateConversationWorkflow = Object.assign(_evaluateConversationWorkflow, {
  workflowId: "workflow//src/domains/evals/workflow/functions/evaluateConversation.ts//_evaluateConversationWorkflow"
});
|
|
133
|
+
|
|
134
|
+
//#endregion
|
|
135
|
+
export { evaluateConversationWorkflow };
|
|
@@ -0,0 +1,39 @@
|
|
|
1
|
+
//#region src/domains/evals/workflow/functions/runDatasetItem.d.ts
|
|
2
|
+
type RunDatasetItemPayload = {
  /** Tenant scope of the run. */
  tenantId: string;
  /** Project scope of the run. */
  projectId: string;
  /** Agent the dataset item is run against — presumably the chat target; confirm against the implementation. */
  agentId: string;
  /** Identifier of the dataset item being processed. */
  datasetItemId: string;
  /** Input of the dataset item; shape is not constrained by this type. */
  datasetItemInput: unknown;
  /** Optional expected output of the dataset item; shape is not constrained by this type. */
  datasetItemExpectedOutput?: unknown;
  /** Optional simulation-agent configuration attached to the dataset item. */
  datasetItemSimulationAgent?: {
    prompt: string;
    model: {
      model: string;
      providerOptions?: Record<string, unknown>;
    };
    /** Optional stop limits — NOTE(review): exact semantics are not visible here; confirm. */
    stopWhen?: {
      transferCountIs?: number;
      stepCountIs?: number;
    };
  };
  /** Identifier of the dataset run this item belongs to. */
  datasetRunId: string;
  /** Optional evaluators — presumably the ones run on the resulting conversation; confirm. */
  evaluatorIds?: string[];
  /** Optional evaluation run identifier — presumably used when evaluators are run; confirm. */
  evaluationRunId?: string;
};
|
|
24
|
+
/**
 * Workflow entry point that processes one dataset item through the chat API
 * and, optionally, runs evaluators on the conversation that results.
 *
 * @param payload - Dataset item, scope and optional evaluation settings.
 * @returns A summary echoing `datasetItemId` and `datasetRunId`, plus a
 *   `success` flag, a nullable `conversationId` and a nullable `error`.
 *   NOTE(review): which of the nullable fields is set in which case is not
 *   visible from this declaration — confirm against the implementation.
 */
declare function _runDatasetItemWorkflow(
  payload: RunDatasetItemPayload,
): Promise<{
  success: boolean;
  datasetItemId: string;
  datasetRunId: string;
  conversationId: string | null;
  error: string | null;
}>;
|
|
35
|
+
/**
 * Exported workflow handle: the dataset-item workflow function, additionally
 * carrying a string `workflowId` property.
 */
declare const runDatasetItemWorkflow: typeof _runDatasetItemWorkflow & {
  workflowId: string;
};
|
|
38
|
+
//#endregion
|
|
39
|
+
export { runDatasetItemWorkflow };
|