@nexus-cortex/core 4.26.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +202 -0
- package/NOTICE +2 -0
- package/README.md +13 -0
- package/dist/adapters/AdapterRegistry.d.ts +118 -0
- package/dist/adapters/AdapterRegistry.d.ts.map +1 -0
- package/dist/adapters/AdapterRegistry.js +195 -0
- package/dist/adapters/AdapterRegistry.js.map +1 -0
- package/dist/adapters/ChatCompletionsAPIAdapter.d.ts +254 -0
- package/dist/adapters/ChatCompletionsAPIAdapter.d.ts.map +1 -0
- package/dist/adapters/ChatCompletionsAPIAdapter.js +531 -0
- package/dist/adapters/ChatCompletionsAPIAdapter.js.map +1 -0
- package/dist/adapters/FormatAdapter.interface.d.ts +66 -0
- package/dist/adapters/FormatAdapter.interface.d.ts.map +1 -0
- package/dist/adapters/FormatAdapter.interface.js +89 -0
- package/dist/adapters/FormatAdapter.interface.js.map +1 -0
- package/dist/adapters/GatewayTranslationLayer.d.ts +222 -0
- package/dist/adapters/GatewayTranslationLayer.d.ts.map +1 -0
- package/dist/adapters/GatewayTranslationLayer.js +679 -0
- package/dist/adapters/GatewayTranslationLayer.js.map +1 -0
- package/dist/adapters/GenerateContentAPIAdapter.d.ts +240 -0
- package/dist/adapters/GenerateContentAPIAdapter.d.ts.map +1 -0
- package/dist/adapters/GenerateContentAPIAdapter.js +489 -0
- package/dist/adapters/GenerateContentAPIAdapter.js.map +1 -0
- package/dist/adapters/GoogleGenAPIAdapter.d.ts +217 -0
- package/dist/adapters/GoogleGenAPIAdapter.d.ts.map +1 -0
- package/dist/adapters/GoogleGenAPIAdapter.js +310 -0
- package/dist/adapters/GoogleGenAPIAdapter.js.map +1 -0
- package/dist/adapters/MessagesAPIAdapter.d.ts +280 -0
- package/dist/adapters/MessagesAPIAdapter.d.ts.map +1 -0
- package/dist/adapters/MessagesAPIAdapter.js +586 -0
- package/dist/adapters/MessagesAPIAdapter.js.map +1 -0
- package/dist/adapters/ResponsesAPIAdapter.d.ts +323 -0
- package/dist/adapters/ResponsesAPIAdapter.d.ts.map +1 -0
- package/dist/adapters/ResponsesAPIAdapter.js +584 -0
- package/dist/adapters/ResponsesAPIAdapter.js.map +1 -0
- package/dist/adapters/ServerSideToolDetection.d.ts +105 -0
- package/dist/adapters/ServerSideToolDetection.d.ts.map +1 -0
- package/dist/adapters/ServerSideToolDetection.js +249 -0
- package/dist/adapters/ServerSideToolDetection.js.map +1 -0
- package/dist/adapters/ToolNamingHandler.d.ts +129 -0
- package/dist/adapters/ToolNamingHandler.d.ts.map +1 -0
- package/dist/adapters/ToolNamingHandler.js +227 -0
- package/dist/adapters/ToolNamingHandler.js.map +1 -0
- package/dist/adapters/index.d.ts +19 -0
- package/dist/adapters/index.d.ts.map +1 -0
- package/dist/adapters/index.js +23 -0
- package/dist/adapters/index.js.map +1 -0
- package/dist/adapters/node/NodeConfigProvider.d.ts +19 -0
- package/dist/adapters/node/NodeConfigProvider.d.ts.map +1 -0
- package/dist/adapters/node/NodeConfigProvider.js +37 -0
- package/dist/adapters/node/NodeConfigProvider.js.map +1 -0
- package/dist/adapters/node/NodeHistoryStoreAdapter.d.ts +26 -0
- package/dist/adapters/node/NodeHistoryStoreAdapter.d.ts.map +1 -0
- package/dist/adapters/node/NodeHistoryStoreAdapter.js +61 -0
- package/dist/adapters/node/NodeHistoryStoreAdapter.js.map +1 -0
- package/dist/adapters/node/NodePermissionAdapter.d.ts +21 -0
- package/dist/adapters/node/NodePermissionAdapter.d.ts.map +1 -0
- package/dist/adapters/node/NodePermissionAdapter.js +39 -0
- package/dist/adapters/node/NodePermissionAdapter.js.map +1 -0
- package/dist/adapters/node/NodeToolExecutorAdapter.d.ts +22 -0
- package/dist/adapters/node/NodeToolExecutorAdapter.d.ts.map +1 -0
- package/dist/adapters/node/NodeToolExecutorAdapter.js +33 -0
- package/dist/adapters/node/NodeToolExecutorAdapter.js.map +1 -0
- package/dist/adapters/node/index.d.ts +18 -0
- package/dist/adapters/node/index.d.ts.map +1 -0
- package/dist/adapters/node/index.js +18 -0
- package/dist/adapters/node/index.js.map +1 -0
- package/dist/agents/AgentStore.d.ts +172 -0
- package/dist/agents/AgentStore.d.ts.map +1 -0
- package/dist/agents/AgentStore.js +649 -0
- package/dist/agents/AgentStore.js.map +1 -0
- package/dist/agents/index.d.ts +9 -0
- package/dist/agents/index.d.ts.map +1 -0
- package/dist/agents/index.js +8 -0
- package/dist/agents/index.js.map +1 -0
- package/dist/agents/projectRoot.d.ts +2 -0
- package/dist/agents/projectRoot.d.ts.map +1 -0
- package/dist/agents/projectRoot.js +37 -0
- package/dist/agents/projectRoot.js.map +1 -0
- package/dist/commands/SlashCommandCompleter.d.ts +116 -0
- package/dist/commands/SlashCommandCompleter.d.ts.map +1 -0
- package/dist/commands/SlashCommandCompleter.js +321 -0
- package/dist/commands/SlashCommandCompleter.js.map +1 -0
- package/dist/commands/SlashCommandParser.d.ts +139 -0
- package/dist/commands/SlashCommandParser.d.ts.map +1 -0
- package/dist/commands/SlashCommandParser.js +338 -0
- package/dist/commands/SlashCommandParser.js.map +1 -0
- package/dist/commands/SlashCommandRegistry.d.ts +92 -0
- package/dist/commands/SlashCommandRegistry.d.ts.map +1 -0
- package/dist/commands/SlashCommandRegistry.js +983 -0
- package/dist/commands/SlashCommandRegistry.js.map +1 -0
- package/dist/commands/index.d.ts +13 -0
- package/dist/commands/index.d.ts.map +1 -0
- package/dist/commands/index.js +15 -0
- package/dist/commands/index.js.map +1 -0
- package/dist/commands/types.d.ts +154 -0
- package/dist/commands/types.d.ts.map +1 -0
- package/dist/commands/types.js +10 -0
- package/dist/commands/types.js.map +1 -0
- package/dist/config/AnthropicCredentialService.d.ts +107 -0
- package/dist/config/AnthropicCredentialService.d.ts.map +1 -0
- package/dist/config/AnthropicCredentialService.js +209 -0
- package/dist/config/AnthropicCredentialService.js.map +1 -0
- package/dist/config/InteractiveConfigurator.d.ts +26 -0
- package/dist/config/InteractiveConfigurator.d.ts.map +1 -0
- package/dist/config/InteractiveConfigurator.js +330 -0
- package/dist/config/InteractiveConfigurator.js.map +1 -0
- package/dist/config/MentorshipConfigService.d.ts +90 -0
- package/dist/config/MentorshipConfigService.d.ts.map +1 -0
- package/dist/config/MentorshipConfigService.js +318 -0
- package/dist/config/MentorshipConfigService.js.map +1 -0
- package/dist/config/RuntimeConfigRegistry.d.ts +20 -0
- package/dist/config/RuntimeConfigRegistry.d.ts.map +1 -0
- package/dist/config/RuntimeConfigRegistry.js +57 -0
- package/dist/config/RuntimeConfigRegistry.js.map +1 -0
- package/dist/config/SettingsLoader.d.ts +128 -0
- package/dist/config/SettingsLoader.d.ts.map +1 -0
- package/dist/config/SettingsLoader.js +487 -0
- package/dist/config/SettingsLoader.js.map +1 -0
- package/dist/config/SettingsSchema.d.ts +219 -0
- package/dist/config/SettingsSchema.d.ts.map +1 -0
- package/dist/config/SettingsSchema.js +855 -0
- package/dist/config/SettingsSchema.js.map +1 -0
- package/dist/config/SettingsWriter.d.ts +83 -0
- package/dist/config/SettingsWriter.d.ts.map +1 -0
- package/dist/config/SettingsWriter.js +256 -0
- package/dist/config/SettingsWriter.js.map +1 -0
- package/dist/config/index.d.ts +13 -0
- package/dist/config/index.d.ts.map +1 -0
- package/dist/config/index.js +13 -0
- package/dist/config/index.js.map +1 -0
- package/dist/conversation/ContextBudgetManager.d.ts +172 -0
- package/dist/conversation/ContextBudgetManager.d.ts.map +1 -0
- package/dist/conversation/ContextBudgetManager.js +445 -0
- package/dist/conversation/ContextBudgetManager.js.map +1 -0
- package/dist/conversation/StoredCompactionManager.d.ts +208 -0
- package/dist/conversation/StoredCompactionManager.d.ts.map +1 -0
- package/dist/conversation/StoredCompactionManager.js +314 -0
- package/dist/conversation/StoredCompactionManager.js.map +1 -0
- package/dist/conversation/SummaryTemplates.d.ts +35 -0
- package/dist/conversation/SummaryTemplates.d.ts.map +1 -0
- package/dist/conversation/SummaryTemplates.js +174 -0
- package/dist/conversation/SummaryTemplates.js.map +1 -0
- package/dist/conversation/index.d.ts +8 -0
- package/dist/conversation/index.d.ts.map +1 -0
- package/dist/conversation/index.js +8 -0
- package/dist/conversation/index.js.map +1 -0
- package/dist/file-tracking/ContentAddressableStore.d.ts +86 -0
- package/dist/file-tracking/ContentAddressableStore.d.ts.map +1 -0
- package/dist/file-tracking/ContentAddressableStore.js +187 -0
- package/dist/file-tracking/ContentAddressableStore.js.map +1 -0
- package/dist/file-tracking/FileCheckpointManager.d.ts +103 -0
- package/dist/file-tracking/FileCheckpointManager.d.ts.map +1 -0
- package/dist/file-tracking/FileCheckpointManager.js +269 -0
- package/dist/file-tracking/FileCheckpointManager.js.map +1 -0
- package/dist/file-tracking/index.d.ts +7 -0
- package/dist/file-tracking/index.d.ts.map +1 -0
- package/dist/file-tracking/index.js +7 -0
- package/dist/file-tracking/index.js.map +1 -0
- package/dist/index.d.ts +54 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +73 -0
- package/dist/index.js.map +1 -0
- package/dist/interfaces/APITransport.d.ts +120 -0
- package/dist/interfaces/APITransport.d.ts.map +1 -0
- package/dist/interfaces/APITransport.js +14 -0
- package/dist/interfaces/APITransport.js.map +1 -0
- package/dist/interfaces/ConfigProvider.d.ts +52 -0
- package/dist/interfaces/ConfigProvider.d.ts.map +1 -0
- package/dist/interfaces/ConfigProvider.js +14 -0
- package/dist/interfaces/ConfigProvider.js.map +1 -0
- package/dist/interfaces/CredentialResolver.d.ts +57 -0
- package/dist/interfaces/CredentialResolver.d.ts.map +1 -0
- package/dist/interfaces/CredentialResolver.js +13 -0
- package/dist/interfaces/CredentialResolver.js.map +1 -0
- package/dist/interfaces/HistoryStore.d.ts +108 -0
- package/dist/interfaces/HistoryStore.d.ts.map +1 -0
- package/dist/interfaces/HistoryStore.js +14 -0
- package/dist/interfaces/HistoryStore.js.map +1 -0
- package/dist/interfaces/PermissionHandler.d.ts +74 -0
- package/dist/interfaces/PermissionHandler.d.ts.map +1 -0
- package/dist/interfaces/PermissionHandler.js +13 -0
- package/dist/interfaces/PermissionHandler.js.map +1 -0
- package/dist/interfaces/ToolExecutorRegistry.d.ts +126 -0
- package/dist/interfaces/ToolExecutorRegistry.d.ts.map +1 -0
- package/dist/interfaces/ToolExecutorRegistry.js +14 -0
- package/dist/interfaces/ToolExecutorRegistry.js.map +1 -0
- package/dist/interfaces/index.d.ts +19 -0
- package/dist/interfaces/index.d.ts.map +1 -0
- package/dist/interfaces/index.js +14 -0
- package/dist/interfaces/index.js.map +1 -0
- package/dist/mcp/McpClient.d.ts +142 -0
- package/dist/mcp/McpClient.d.ts.map +1 -0
- package/dist/mcp/McpClient.js +349 -0
- package/dist/mcp/McpClient.js.map +1 -0
- package/dist/mcp/McpClientManager.d.ts +148 -0
- package/dist/mcp/McpClientManager.d.ts.map +1 -0
- package/dist/mcp/McpClientManager.js +366 -0
- package/dist/mcp/McpClientManager.js.map +1 -0
- package/dist/mcp/McpConfigManager.d.ts +125 -0
- package/dist/mcp/McpConfigManager.d.ts.map +1 -0
- package/dist/mcp/McpConfigManager.js +448 -0
- package/dist/mcp/McpConfigManager.js.map +1 -0
- package/dist/mcp/McpServerRegistry.d.ts +102 -0
- package/dist/mcp/McpServerRegistry.d.ts.map +1 -0
- package/dist/mcp/McpServerRegistry.js +281 -0
- package/dist/mcp/McpServerRegistry.js.map +1 -0
- package/dist/mcp/index.d.ts +11 -0
- package/dist/mcp/index.d.ts.map +1 -0
- package/dist/mcp/index.js +9 -0
- package/dist/mcp/index.js.map +1 -0
- package/dist/mcp/mcpToolNamespacing.d.ts +26 -0
- package/dist/mcp/mcpToolNamespacing.d.ts.map +1 -0
- package/dist/mcp/mcpToolNamespacing.js +36 -0
- package/dist/mcp/mcpToolNamespacing.js.map +1 -0
- package/dist/mcp/test-mcp-integration.d.ts +8 -0
- package/dist/mcp/test-mcp-integration.d.ts.map +1 -0
- package/dist/mcp/test-mcp-integration.js +115 -0
- package/dist/mcp/test-mcp-integration.js.map +1 -0
- package/dist/middleware/ErrorClassificationMiddleware.d.ts +116 -0
- package/dist/middleware/ErrorClassificationMiddleware.d.ts.map +1 -0
- package/dist/middleware/ErrorClassificationMiddleware.js +225 -0
- package/dist/middleware/ErrorClassificationMiddleware.js.map +1 -0
- package/dist/middleware/HelperModelMiddleware.d.ts +337 -0
- package/dist/middleware/HelperModelMiddleware.d.ts.map +1 -0
- package/dist/middleware/HelperModelMiddleware.js +1376 -0
- package/dist/middleware/HelperModelMiddleware.js.map +1 -0
- package/dist/middleware/MentorshipMiddleware.d.ts +210 -0
- package/dist/middleware/MentorshipMiddleware.d.ts.map +1 -0
- package/dist/middleware/MentorshipMiddleware.js +427 -0
- package/dist/middleware/MentorshipMiddleware.js.map +1 -0
- package/dist/middleware/PermissionsMiddleware.d.ts +193 -0
- package/dist/middleware/PermissionsMiddleware.d.ts.map +1 -0
- package/dist/middleware/PermissionsMiddleware.js +344 -0
- package/dist/middleware/PermissionsMiddleware.js.map +1 -0
- package/dist/middleware/RetryMiddleware.d.ts +159 -0
- package/dist/middleware/RetryMiddleware.d.ts.map +1 -0
- package/dist/middleware/RetryMiddleware.js +268 -0
- package/dist/middleware/RetryMiddleware.js.map +1 -0
- package/dist/middleware/SystemMessageMiddleware.d.ts +165 -0
- package/dist/middleware/SystemMessageMiddleware.d.ts.map +1 -0
- package/dist/middleware/SystemMessageMiddleware.js +354 -0
- package/dist/middleware/SystemMessageMiddleware.js.map +1 -0
- package/dist/middleware/contracts/MiddlewareContracts.d.ts +294 -0
- package/dist/middleware/contracts/MiddlewareContracts.d.ts.map +1 -0
- package/dist/middleware/contracts/MiddlewareContracts.js +12 -0
- package/dist/middleware/contracts/MiddlewareContracts.js.map +1 -0
- package/dist/middleware/helpers/HelperMiddlewareAdapter.interface.d.ts +211 -0
- package/dist/middleware/helpers/HelperMiddlewareAdapter.interface.d.ts.map +1 -0
- package/dist/middleware/helpers/HelperMiddlewareAdapter.interface.js +211 -0
- package/dist/middleware/helpers/HelperMiddlewareAdapter.interface.js.map +1 -0
- package/dist/middleware/helpers/HelperModelMiddlewareRegistry.d.ts +106 -0
- package/dist/middleware/helpers/HelperModelMiddlewareRegistry.d.ts.map +1 -0
- package/dist/middleware/helpers/HelperModelMiddlewareRegistry.js +148 -0
- package/dist/middleware/helpers/HelperModelMiddlewareRegistry.js.map +1 -0
- package/dist/middleware/helpers/adapters/ChatCompletionsAPIHelperAdapter.d.ts +76 -0
- package/dist/middleware/helpers/adapters/ChatCompletionsAPIHelperAdapter.d.ts.map +1 -0
- package/dist/middleware/helpers/adapters/ChatCompletionsAPIHelperAdapter.js +277 -0
- package/dist/middleware/helpers/adapters/ChatCompletionsAPIHelperAdapter.js.map +1 -0
- package/dist/middleware/helpers/adapters/GenerateContentAPIHelperAdapter.d.ts +57 -0
- package/dist/middleware/helpers/adapters/GenerateContentAPIHelperAdapter.d.ts.map +1 -0
- package/dist/middleware/helpers/adapters/GenerateContentAPIHelperAdapter.js +155 -0
- package/dist/middleware/helpers/adapters/GenerateContentAPIHelperAdapter.js.map +1 -0
- package/dist/middleware/helpers/adapters/GoogleGenAPIHelperAdapter.d.ts +124 -0
- package/dist/middleware/helpers/adapters/GoogleGenAPIHelperAdapter.d.ts.map +1 -0
- package/dist/middleware/helpers/adapters/GoogleGenAPIHelperAdapter.js +276 -0
- package/dist/middleware/helpers/adapters/GoogleGenAPIHelperAdapter.js.map +1 -0
- package/dist/middleware/helpers/adapters/MessagesAPIHelperAdapter.d.ts +71 -0
- package/dist/middleware/helpers/adapters/MessagesAPIHelperAdapter.d.ts.map +1 -0
- package/dist/middleware/helpers/adapters/MessagesAPIHelperAdapter.js +264 -0
- package/dist/middleware/helpers/adapters/MessagesAPIHelperAdapter.js.map +1 -0
- package/dist/middleware/helpers/adapters/ResponsesAPIHelperAdapter.d.ts +64 -0
- package/dist/middleware/helpers/adapters/ResponsesAPIHelperAdapter.d.ts.map +1 -0
- package/dist/middleware/helpers/adapters/ResponsesAPIHelperAdapter.js +189 -0
- package/dist/middleware/helpers/adapters/ResponsesAPIHelperAdapter.js.map +1 -0
- package/dist/middleware/helpers/adapters/index.d.ts +31 -0
- package/dist/middleware/helpers/adapters/index.d.ts.map +1 -0
- package/dist/middleware/helpers/adapters/index.js +40 -0
- package/dist/middleware/helpers/adapters/index.js.map +1 -0
- package/dist/middleware/helpers/index.d.ts +10 -0
- package/dist/middleware/helpers/index.d.ts.map +1 -0
- package/dist/middleware/helpers/index.js +13 -0
- package/dist/middleware/helpers/index.js.map +1 -0
- package/dist/middleware/index.d.ts +12 -0
- package/dist/middleware/index.d.ts.map +1 -0
- package/dist/middleware/index.js +13 -0
- package/dist/middleware/index.js.map +1 -0
- package/dist/middleware/permissions/ApprovalHandler.d.ts +22 -0
- package/dist/middleware/permissions/ApprovalHandler.d.ts.map +1 -0
- package/dist/middleware/permissions/ApprovalHandler.js +27 -0
- package/dist/middleware/permissions/ApprovalHandler.js.map +1 -0
- package/dist/middleware/permissions/AutoApproveHandler.d.ts +62 -0
- package/dist/middleware/permissions/AutoApproveHandler.d.ts.map +1 -0
- package/dist/middleware/permissions/AutoApproveHandler.js +68 -0
- package/dist/middleware/permissions/AutoApproveHandler.js.map +1 -0
- package/dist/middleware/permissions/BashCommandPolicy.d.ts +134 -0
- package/dist/middleware/permissions/BashCommandPolicy.d.ts.map +1 -0
- package/dist/middleware/permissions/BashCommandPolicy.js +239 -0
- package/dist/middleware/permissions/BashCommandPolicy.js.map +1 -0
- package/dist/middleware/permissions/BlacklistPolicy.d.ts +66 -0
- package/dist/middleware/permissions/BlacklistPolicy.d.ts.map +1 -0
- package/dist/middleware/permissions/BlacklistPolicy.js +82 -0
- package/dist/middleware/permissions/BlacklistPolicy.js.map +1 -0
- package/dist/middleware/permissions/CLIApprovalHandler.d.ts +124 -0
- package/dist/middleware/permissions/CLIApprovalHandler.d.ts.map +1 -0
- package/dist/middleware/permissions/CLIApprovalHandler.js +366 -0
- package/dist/middleware/permissions/CLIApprovalHandler.js.map +1 -0
- package/dist/middleware/permissions/DefaultPolicies.d.ts +53 -0
- package/dist/middleware/permissions/DefaultPolicies.d.ts.map +1 -0
- package/dist/middleware/permissions/DefaultPolicies.js +307 -0
- package/dist/middleware/permissions/DefaultPolicies.js.map +1 -0
- package/dist/middleware/permissions/DenyAllHandler.d.ts +58 -0
- package/dist/middleware/permissions/DenyAllHandler.d.ts.map +1 -0
- package/dist/middleware/permissions/DenyAllHandler.js +59 -0
- package/dist/middleware/permissions/DenyAllHandler.js.map +1 -0
- package/dist/middleware/permissions/FileOperationPolicy.d.ts +117 -0
- package/dist/middleware/permissions/FileOperationPolicy.d.ts.map +1 -0
- package/dist/middleware/permissions/FileOperationPolicy.js +222 -0
- package/dist/middleware/permissions/FileOperationPolicy.js.map +1 -0
- package/dist/middleware/permissions/IPCApprovalHandler.d.ts +94 -0
- package/dist/middleware/permissions/IPCApprovalHandler.d.ts.map +1 -0
- package/dist/middleware/permissions/IPCApprovalHandler.js +178 -0
- package/dist/middleware/permissions/IPCApprovalHandler.js.map +1 -0
- package/dist/middleware/permissions/PermissionAuditLogger.d.ts +169 -0
- package/dist/middleware/permissions/PermissionAuditLogger.d.ts.map +1 -0
- package/dist/middleware/permissions/PermissionAuditLogger.js +267 -0
- package/dist/middleware/permissions/PermissionAuditLogger.js.map +1 -0
- package/dist/middleware/permissions/PermissionConfig.d.ts +181 -0
- package/dist/middleware/permissions/PermissionConfig.d.ts.map +1 -0
- package/dist/middleware/permissions/PermissionConfig.js +110 -0
- package/dist/middleware/permissions/PermissionConfig.js.map +1 -0
- package/dist/middleware/permissions/PermissionConfigLoader.d.ts +89 -0
- package/dist/middleware/permissions/PermissionConfigLoader.d.ts.map +1 -0
- package/dist/middleware/permissions/PermissionConfigLoader.js +296 -0
- package/dist/middleware/permissions/PermissionConfigLoader.js.map +1 -0
- package/dist/middleware/permissions/PermissionEvaluator.d.ts +111 -0
- package/dist/middleware/permissions/PermissionEvaluator.d.ts.map +1 -0
- package/dist/middleware/permissions/PermissionEvaluator.js +196 -0
- package/dist/middleware/permissions/PermissionEvaluator.js.map +1 -0
- package/dist/middleware/permissions/PermissionPolicy.d.ts +59 -0
- package/dist/middleware/permissions/PermissionPolicy.d.ts.map +1 -0
- package/dist/middleware/permissions/PermissionPolicy.js +67 -0
- package/dist/middleware/permissions/PermissionPolicy.js.map +1 -0
- package/dist/middleware/permissions/PermissionProfileStore.d.ts +77 -0
- package/dist/middleware/permissions/PermissionProfileStore.d.ts.map +1 -0
- package/dist/middleware/permissions/PermissionProfileStore.js +167 -0
- package/dist/middleware/permissions/PermissionProfileStore.js.map +1 -0
- package/dist/middleware/permissions/WhitelistPolicy.d.ts +66 -0
- package/dist/middleware/permissions/WhitelistPolicy.d.ts.map +1 -0
- package/dist/middleware/permissions/WhitelistPolicy.js +82 -0
- package/dist/middleware/permissions/WhitelistPolicy.js.map +1 -0
- package/dist/middleware/permissions/index.d.ts +40 -0
- package/dist/middleware/permissions/index.d.ts.map +1 -0
- package/dist/middleware/permissions/index.js +30 -0
- package/dist/middleware/permissions/index.js.map +1 -0
- package/dist/middleware/permissions/profilePath.d.ts +15 -0
- package/dist/middleware/permissions/profilePath.d.ts.map +1 -0
- package/dist/middleware/permissions/profilePath.js +35 -0
- package/dist/middleware/permissions/profilePath.js.map +1 -0
- package/dist/models/ModelConfig.interface.d.ts +18 -0
- package/dist/models/ModelConfig.interface.d.ts.map +1 -0
- package/dist/models/ModelConfig.interface.js +157 -0
- package/dist/models/ModelConfig.interface.js.map +1 -0
- package/dist/models/cards/anthropic/claude-3-5-haiku.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-3-5-haiku.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-3-5-haiku.js +19 -0
- package/dist/models/cards/anthropic/claude-3-5-haiku.js.map +1 -0
- package/dist/models/cards/anthropic/claude-3-5-sonnet.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-3-5-sonnet.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-3-5-sonnet.js +19 -0
- package/dist/models/cards/anthropic/claude-3-5-sonnet.js.map +1 -0
- package/dist/models/cards/anthropic/claude-3-haiku.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-3-haiku.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-3-haiku.js +19 -0
- package/dist/models/cards/anthropic/claude-3-haiku.js.map +1 -0
- package/dist/models/cards/anthropic/claude-4-5-haiku.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-4-5-haiku.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-4-5-haiku.js +26 -0
- package/dist/models/cards/anthropic/claude-4-5-haiku.js.map +1 -0
- package/dist/models/cards/anthropic/claude-fable-5.d.ts +14 -0
- package/dist/models/cards/anthropic/claude-fable-5.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-fable-5.js +30 -0
- package/dist/models/cards/anthropic/claude-fable-5.js.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-1.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-opus-4-1.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-1.js +19 -0
- package/dist/models/cards/anthropic/claude-opus-4-1.js.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-5.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-opus-4-5.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-5.js +27 -0
- package/dist/models/cards/anthropic/claude-opus-4-5.js.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-6.d.ts +10 -0
- package/dist/models/cards/anthropic/claude-opus-4-6.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-6.js +26 -0
- package/dist/models/cards/anthropic/claude-opus-4-6.js.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-7.d.ts +10 -0
- package/dist/models/cards/anthropic/claude-opus-4-7.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-7.js +26 -0
- package/dist/models/cards/anthropic/claude-opus-4-7.js.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-8.d.ts +12 -0
- package/dist/models/cards/anthropic/claude-opus-4-8.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-opus-4-8.js +28 -0
- package/dist/models/cards/anthropic/claude-opus-4-8.js.map +1 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-5.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-5.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-5.js +27 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-5.js.map +1 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-6.d.ts +10 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-6.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-6.js +26 -0
- package/dist/models/cards/anthropic/claude-sonnet-4-6.js.map +1 -0
- package/dist/models/cards/anthropic/claude-sonnet-4.d.ts +11 -0
- package/dist/models/cards/anthropic/claude-sonnet-4.d.ts.map +1 -0
- package/dist/models/cards/anthropic/claude-sonnet-4.js +19 -0
- package/dist/models/cards/anthropic/claude-sonnet-4.js.map +1 -0
- package/dist/models/cards/anthropic/index.d.ts +15 -0
- package/dist/models/cards/anthropic/index.d.ts.map +1 -0
- package/dist/models/cards/anthropic/index.js +15 -0
- package/dist/models/cards/anthropic/index.js.map +1 -0
- package/dist/models/cards/cloudflare/gemma-4-26b.d.ts +3 -0
- package/dist/models/cards/cloudflare/gemma-4-26b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/gemma-4-26b.js +17 -0
- package/dist/models/cards/cloudflare/gemma-4-26b.js.map +1 -0
- package/dist/models/cards/cloudflare/glm-4-7-flash.d.ts +3 -0
- package/dist/models/cards/cloudflare/glm-4-7-flash.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/glm-4-7-flash.js +18 -0
- package/dist/models/cards/cloudflare/glm-4-7-flash.js.map +1 -0
- package/dist/models/cards/cloudflare/gpt-oss-120b.d.ts +3 -0
- package/dist/models/cards/cloudflare/gpt-oss-120b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/gpt-oss-120b.js +18 -0
- package/dist/models/cards/cloudflare/gpt-oss-120b.js.map +1 -0
- package/dist/models/cards/cloudflare/gpt-oss-20b.d.ts +3 -0
- package/dist/models/cards/cloudflare/gpt-oss-20b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/gpt-oss-20b.js +18 -0
- package/dist/models/cards/cloudflare/gpt-oss-20b.js.map +1 -0
- package/dist/models/cards/cloudflare/granite-4.d.ts +3 -0
- package/dist/models/cards/cloudflare/granite-4.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/granite-4.js +17 -0
- package/dist/models/cards/cloudflare/granite-4.js.map +1 -0
- package/dist/models/cards/cloudflare/index.d.ts +24 -0
- package/dist/models/cards/cloudflare/index.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/index.js +24 -0
- package/dist/models/cards/cloudflare/index.js.map +1 -0
- package/dist/models/cards/cloudflare/kimi-k2-5.d.ts +3 -0
- package/dist/models/cards/cloudflare/kimi-k2-5.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/kimi-k2-5.js +17 -0
- package/dist/models/cards/cloudflare/kimi-k2-5.js.map +1 -0
- package/dist/models/cards/cloudflare/kimi-k2-6.d.ts +3 -0
- package/dist/models/cards/cloudflare/kimi-k2-6.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/kimi-k2-6.js +20 -0
- package/dist/models/cards/cloudflare/kimi-k2-6.js.map +1 -0
- package/dist/models/cards/cloudflare/llama-3-3-70b.d.ts +3 -0
- package/dist/models/cards/cloudflare/llama-3-3-70b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/llama-3-3-70b.js +17 -0
- package/dist/models/cards/cloudflare/llama-3-3-70b.js.map +1 -0
- package/dist/models/cards/cloudflare/llama-4-scout.d.ts +3 -0
- package/dist/models/cards/cloudflare/llama-4-scout.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/llama-4-scout.js +18 -0
- package/dist/models/cards/cloudflare/llama-4-scout.js.map +1 -0
- package/dist/models/cards/cloudflare/mistral-small-3-1.d.ts +3 -0
- package/dist/models/cards/cloudflare/mistral-small-3-1.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/mistral-small-3-1.js +18 -0
- package/dist/models/cards/cloudflare/mistral-small-3-1.js.map +1 -0
- package/dist/models/cards/cloudflare/nemotron-3-120b.d.ts +3 -0
- package/dist/models/cards/cloudflare/nemotron-3-120b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/nemotron-3-120b.js +16 -0
- package/dist/models/cards/cloudflare/nemotron-3-120b.js.map +1 -0
- package/dist/models/cards/cloudflare/qwen3-30b.d.ts +3 -0
- package/dist/models/cards/cloudflare/qwen3-30b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/qwen3-30b.js +17 -0
- package/dist/models/cards/cloudflare/qwen3-30b.js.map +1 -0
- package/dist/models/cards/cloudflare/qwq-32b.d.ts +3 -0
- package/dist/models/cards/cloudflare/qwq-32b.d.ts.map +1 -0
- package/dist/models/cards/cloudflare/qwq-32b.js +18 -0
- package/dist/models/cards/cloudflare/qwq-32b.js.map +1 -0
- package/dist/models/cards/deepseek/deepseek-v4-flash.d.ts +11 -0
- package/dist/models/cards/deepseek/deepseek-v4-flash.d.ts.map +1 -0
- package/dist/models/cards/deepseek/deepseek-v4-flash.js +25 -0
- package/dist/models/cards/deepseek/deepseek-v4-flash.js.map +1 -0
- package/dist/models/cards/deepseek/deepseek-v4-pro.d.ts +11 -0
- package/dist/models/cards/deepseek/deepseek-v4-pro.d.ts.map +1 -0
- package/dist/models/cards/deepseek/deepseek-v4-pro.js +25 -0
- package/dist/models/cards/deepseek/deepseek-v4-pro.js.map +1 -0
- package/dist/models/cards/deepseek/index.d.ts +22 -0
- package/dist/models/cards/deepseek/index.d.ts.map +1 -0
- package/dist/models/cards/deepseek/index.js +22 -0
- package/dist/models/cards/deepseek/index.js.map +1 -0
- package/dist/models/cards/gemma/gemma-3-12b-it.d.ts +10 -0
- package/dist/models/cards/gemma/gemma-3-12b-it.d.ts.map +1 -0
- package/dist/models/cards/gemma/gemma-3-12b-it.js +16 -0
- package/dist/models/cards/gemma/gemma-3-12b-it.js.map +1 -0
- package/dist/models/cards/gemma/gemma-3-1b-it.d.ts +10 -0
- package/dist/models/cards/gemma/gemma-3-1b-it.d.ts.map +1 -0
- package/dist/models/cards/gemma/gemma-3-1b-it.js +16 -0
- package/dist/models/cards/gemma/gemma-3-1b-it.js.map +1 -0
- package/dist/models/cards/gemma/gemma-3-27b-it.d.ts +10 -0
- package/dist/models/cards/gemma/gemma-3-27b-it.d.ts.map +1 -0
- package/dist/models/cards/gemma/gemma-3-27b-it.js +16 -0
- package/dist/models/cards/gemma/gemma-3-27b-it.js.map +1 -0
- package/dist/models/cards/gemma/gemma-3-4b-it.d.ts +10 -0
- package/dist/models/cards/gemma/gemma-3-4b-it.d.ts.map +1 -0
- package/dist/models/cards/gemma/gemma-3-4b-it.js +16 -0
- package/dist/models/cards/gemma/gemma-3-4b-it.js.map +1 -0
- package/dist/models/cards/gemma/index.d.ts +9 -0
- package/dist/models/cards/gemma/index.d.ts.map +1 -0
- package/dist/models/cards/gemma/index.js +9 -0
- package/dist/models/cards/gemma/index.js.map +1 -0
- package/dist/models/cards/glm/glm-4-5-air.d.ts +17 -0
- package/dist/models/cards/glm/glm-4-5-air.d.ts.map +1 -0
- package/dist/models/cards/glm/glm-4-5-air.js +27 -0
- package/dist/models/cards/glm/glm-4-5-air.js.map +1 -0
- package/dist/models/cards/glm/glm-4-5.d.ts +16 -0
- package/dist/models/cards/glm/glm-4-5.d.ts.map +1 -0
- package/dist/models/cards/glm/glm-4-5.js +26 -0
- package/dist/models/cards/glm/glm-4-5.js.map +1 -0
- package/dist/models/cards/glm/glm-4-6.d.ts +17 -0
- package/dist/models/cards/glm/glm-4-6.d.ts.map +1 -0
- package/dist/models/cards/glm/glm-4-6.js +27 -0
- package/dist/models/cards/glm/glm-4-6.js.map +1 -0
- package/dist/models/cards/glm/glm-4-flash.d.ts +12 -0
- package/dist/models/cards/glm/glm-4-flash.d.ts.map +1 -0
- package/dist/models/cards/glm/glm-4-flash.js +20 -0
- package/dist/models/cards/glm/glm-4-flash.js.map +1 -0
- package/dist/models/cards/glm/glm-4.d.ts +12 -0
- package/dist/models/cards/glm/glm-4.d.ts.map +1 -0
- package/dist/models/cards/glm/glm-4.js +21 -0
- package/dist/models/cards/glm/glm-4.js.map +1 -0
- package/dist/models/cards/glm/index.d.ts +13 -0
- package/dist/models/cards/glm/index.d.ts.map +1 -0
- package/dist/models/cards/glm/index.js +13 -0
- package/dist/models/cards/glm/index.js.map +1 -0
- package/dist/models/cards/google/gemini-1-5-flash.d.ts +10 -0
- package/dist/models/cards/google/gemini-1-5-flash.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-1-5-flash.js +18 -0
- package/dist/models/cards/google/gemini-1-5-flash.js.map +1 -0
- package/dist/models/cards/google/gemini-1-5-pro.d.ts +10 -0
- package/dist/models/cards/google/gemini-1-5-pro.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-1-5-pro.js +18 -0
- package/dist/models/cards/google/gemini-1-5-pro.js.map +1 -0
- package/dist/models/cards/google/gemini-2-0-flash-lite.d.ts +10 -0
- package/dist/models/cards/google/gemini-2-0-flash-lite.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-0-flash-lite.js +18 -0
- package/dist/models/cards/google/gemini-2-0-flash-lite.js.map +1 -0
- package/dist/models/cards/google/gemini-2-0-flash.d.ts +10 -0
- package/dist/models/cards/google/gemini-2-0-flash.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-0-flash.js +24 -0
- package/dist/models/cards/google/gemini-2-0-flash.js.map +1 -0
- package/dist/models/cards/google/gemini-2-5-computer-use-preview.d.ts +18 -0
- package/dist/models/cards/google/gemini-2-5-computer-use-preview.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-5-computer-use-preview.js +26 -0
- package/dist/models/cards/google/gemini-2-5-computer-use-preview.js.map +1 -0
- package/dist/models/cards/google/gemini-2-5-flash-lite.d.ts +10 -0
- package/dist/models/cards/google/gemini-2-5-flash-lite.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-5-flash-lite.js +18 -0
- package/dist/models/cards/google/gemini-2-5-flash-lite.js.map +1 -0
- package/dist/models/cards/google/gemini-2-5-flash-sdk.d.ts +11 -0
- package/dist/models/cards/google/gemini-2-5-flash-sdk.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-5-flash-sdk.js +25 -0
- package/dist/models/cards/google/gemini-2-5-flash-sdk.js.map +1 -0
- package/dist/models/cards/google/gemini-2-5-flash.d.ts +10 -0
- package/dist/models/cards/google/gemini-2-5-flash.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-5-flash.js +24 -0
- package/dist/models/cards/google/gemini-2-5-flash.js.map +1 -0
- package/dist/models/cards/google/gemini-2-5-pro.d.ts +10 -0
- package/dist/models/cards/google/gemini-2-5-pro.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-2-5-pro.js +24 -0
- package/dist/models/cards/google/gemini-2-5-pro.js.map +1 -0
- package/dist/models/cards/google/gemini-3-1-flash-lite-preview.d.ts +11 -0
- package/dist/models/cards/google/gemini-3-1-flash-lite-preview.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-3-1-flash-lite-preview.js +20 -0
- package/dist/models/cards/google/gemini-3-1-flash-lite-preview.js.map +1 -0
- package/dist/models/cards/google/gemini-3-1-pro-preview.d.ts +10 -0
- package/dist/models/cards/google/gemini-3-1-pro-preview.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-3-1-pro-preview.js +19 -0
- package/dist/models/cards/google/gemini-3-1-pro-preview.js.map +1 -0
- package/dist/models/cards/google/gemini-3-5-flash.d.ts +10 -0
- package/dist/models/cards/google/gemini-3-5-flash.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-3-5-flash.js +19 -0
- package/dist/models/cards/google/gemini-3-5-flash.js.map +1 -0
- package/dist/models/cards/google/gemini-3-flash-preview.d.ts +11 -0
- package/dist/models/cards/google/gemini-3-flash-preview.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-3-flash-preview.js +20 -0
- package/dist/models/cards/google/gemini-3-flash-preview.js.map +1 -0
- package/dist/models/cards/google/gemini-3.d.ts +11 -0
- package/dist/models/cards/google/gemini-3.d.ts.map +1 -0
- package/dist/models/cards/google/gemini-3.js +20 -0
- package/dist/models/cards/google/gemini-3.js.map +1 -0
- package/dist/models/cards/google/index.d.ts +17 -0
- package/dist/models/cards/google/index.d.ts.map +1 -0
- package/dist/models/cards/google/index.js +17 -0
- package/dist/models/cards/google/index.js.map +1 -0
- package/dist/models/cards/huggingface/index.d.ts +10 -0
- package/dist/models/cards/huggingface/index.d.ts.map +1 -0
- package/dist/models/cards/huggingface/index.js +10 -0
- package/dist/models/cards/huggingface/index.js.map +1 -0
- package/dist/models/cards/huggingface/llama-3-8b-instruct.d.ts +17 -0
- package/dist/models/cards/huggingface/llama-3-8b-instruct.d.ts.map +1 -0
- package/dist/models/cards/huggingface/llama-3-8b-instruct.js +25 -0
- package/dist/models/cards/huggingface/llama-3-8b-instruct.js.map +1 -0
- package/dist/models/cards/huggingface/mistral-7b-instruct.d.ts +10 -0
- package/dist/models/cards/huggingface/mistral-7b-instruct.d.ts.map +1 -0
- package/dist/models/cards/huggingface/mistral-7b-instruct.js +18 -0
- package/dist/models/cards/huggingface/mistral-7b-instruct.js.map +1 -0
- package/dist/models/cards/local/codellama-13b-local.d.ts +19 -0
- package/dist/models/cards/local/codellama-13b-local.d.ts.map +1 -0
- package/dist/models/cards/local/codellama-13b-local.js +28 -0
- package/dist/models/cards/local/codellama-13b-local.js.map +1 -0
- package/dist/models/cards/local/index.d.ts +17 -0
- package/dist/models/cards/local/index.d.ts.map +1 -0
- package/dist/models/cards/local/index.js +17 -0
- package/dist/models/cards/local/index.js.map +1 -0
- package/dist/models/cards/local/llama-3-8b-local.d.ts +25 -0
- package/dist/models/cards/local/llama-3-8b-local.d.ts.map +1 -0
- package/dist/models/cards/local/llama-3-8b-local.js +34 -0
- package/dist/models/cards/local/llama-3-8b-local.js.map +1 -0
- package/dist/models/cards/local/mistral-7b-ollama.d.ts +18 -0
- package/dist/models/cards/local/mistral-7b-ollama.d.ts.map +1 -0
- package/dist/models/cards/local/mistral-7b-ollama.js +27 -0
- package/dist/models/cards/local/mistral-7b-ollama.js.map +1 -0
- package/dist/models/cards/mercury/index.d.ts +10 -0
- package/dist/models/cards/mercury/index.d.ts.map +1 -0
- package/dist/models/cards/mercury/index.js +10 -0
- package/dist/models/cards/mercury/index.js.map +1 -0
- package/dist/models/cards/mercury/mercury-2.d.ts +24 -0
- package/dist/models/cards/mercury/mercury-2.d.ts.map +1 -0
- package/dist/models/cards/mercury/mercury-2.js +33 -0
- package/dist/models/cards/mercury/mercury-2.js.map +1 -0
- package/dist/models/cards/minimax/index.d.ts +10 -0
- package/dist/models/cards/minimax/index.d.ts.map +1 -0
- package/dist/models/cards/minimax/index.js +10 -0
- package/dist/models/cards/minimax/index.js.map +1 -0
- package/dist/models/cards/minimax/minimax-m2-stable.d.ts +21 -0
- package/dist/models/cards/minimax/minimax-m2-stable.d.ts.map +1 -0
- package/dist/models/cards/minimax/minimax-m2-stable.js +31 -0
- package/dist/models/cards/minimax/minimax-m2-stable.js.map +1 -0
- package/dist/models/cards/minimax/minimax-m2.d.ts +20 -0
- package/dist/models/cards/minimax/minimax-m2.d.ts.map +1 -0
- package/dist/models/cards/minimax/minimax-m2.js +30 -0
- package/dist/models/cards/minimax/minimax-m2.js.map +1 -0
- package/dist/models/cards/moonshot/index.d.ts +9 -0
- package/dist/models/cards/moonshot/index.d.ts.map +1 -0
- package/dist/models/cards/moonshot/index.js +9 -0
- package/dist/models/cards/moonshot/index.js.map +1 -0
- package/dist/models/cards/moonshot/kimi-chat-128k.d.ts +10 -0
- package/dist/models/cards/moonshot/kimi-chat-128k.d.ts.map +1 -0
- package/dist/models/cards/moonshot/kimi-chat-128k.js +18 -0
- package/dist/models/cards/moonshot/kimi-chat-128k.js.map +1 -0
- package/dist/models/cards/moonshot/kimi-chat-32k.d.ts +10 -0
- package/dist/models/cards/moonshot/kimi-chat-32k.d.ts.map +1 -0
- package/dist/models/cards/moonshot/kimi-chat-32k.js +18 -0
- package/dist/models/cards/moonshot/kimi-chat-32k.js.map +1 -0
- package/dist/models/cards/moonshot/kimi-chat.d.ts +12 -0
- package/dist/models/cards/moonshot/kimi-chat.d.ts.map +1 -0
- package/dist/models/cards/moonshot/kimi-chat.js +20 -0
- package/dist/models/cards/moonshot/kimi-chat.js.map +1 -0
- package/dist/models/cards/moonshot/kimi-k2-instruct.d.ts +17 -0
- package/dist/models/cards/moonshot/kimi-k2-instruct.d.ts.map +1 -0
- package/dist/models/cards/moonshot/kimi-k2-instruct.js +26 -0
- package/dist/models/cards/moonshot/kimi-k2-instruct.js.map +1 -0
- package/dist/models/cards/moonshot/kimi-k2-thinking.d.ts +18 -0
- package/dist/models/cards/moonshot/kimi-k2-thinking.d.ts.map +1 -0
- package/dist/models/cards/moonshot/kimi-k2-thinking.js +27 -0
- package/dist/models/cards/moonshot/kimi-k2-thinking.js.map +1 -0
- package/dist/models/cards/openai/gpt-4-1-mini.d.ts +10 -0
- package/dist/models/cards/openai/gpt-4-1-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-4-1-mini.js +18 -0
- package/dist/models/cards/openai/gpt-4-1-mini.js.map +1 -0
- package/dist/models/cards/openai/gpt-4-1-nano.d.ts +10 -0
- package/dist/models/cards/openai/gpt-4-1-nano.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-4-1-nano.js +18 -0
- package/dist/models/cards/openai/gpt-4-1-nano.js.map +1 -0
- package/dist/models/cards/openai/gpt-4-1.d.ts +10 -0
- package/dist/models/cards/openai/gpt-4-1.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-4-1.js +18 -0
- package/dist/models/cards/openai/gpt-4-1.js.map +1 -0
- package/dist/models/cards/openai/gpt-4o-mini.d.ts +10 -0
- package/dist/models/cards/openai/gpt-4o-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-4o-mini.js +19 -0
- package/dist/models/cards/openai/gpt-4o-mini.js.map +1 -0
- package/dist/models/cards/openai/gpt-4o.d.ts +10 -0
- package/dist/models/cards/openai/gpt-4o.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-4o.js +19 -0
- package/dist/models/cards/openai/gpt-4o.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-1-reasoning.d.ts +14 -0
- package/dist/models/cards/openai/gpt-5-1-reasoning.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-1-reasoning.js +29 -0
- package/dist/models/cards/openai/gpt-5-1-reasoning.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-1.d.ts +11 -0
- package/dist/models/cards/openai/gpt-5-1.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-1.js +27 -0
- package/dist/models/cards/openai/gpt-5-1.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-2.d.ts +21 -0
- package/dist/models/cards/openai/gpt-5-2.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-2.js +37 -0
- package/dist/models/cards/openai/gpt-5-2.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-4-mini.d.ts +11 -0
- package/dist/models/cards/openai/gpt-5-4-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-4-mini.js +27 -0
- package/dist/models/cards/openai/gpt-5-4-mini.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-4.d.ts +11 -0
- package/dist/models/cards/openai/gpt-5-4.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-4.js +27 -0
- package/dist/models/cards/openai/gpt-5-4.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-5.d.ts +11 -0
- package/dist/models/cards/openai/gpt-5-5.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-5.js +27 -0
- package/dist/models/cards/openai/gpt-5-5.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-chat-latest.d.ts +10 -0
- package/dist/models/cards/openai/gpt-5-chat-latest.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-chat-latest.js +26 -0
- package/dist/models/cards/openai/gpt-5-chat-latest.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-codex.d.ts +11 -0
- package/dist/models/cards/openai/gpt-5-codex.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-codex.js +19 -0
- package/dist/models/cards/openai/gpt-5-codex.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-mini.d.ts +10 -0
- package/dist/models/cards/openai/gpt-5-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-mini.js +26 -0
- package/dist/models/cards/openai/gpt-5-mini.js.map +1 -0
- package/dist/models/cards/openai/gpt-5-nano.d.ts +10 -0
- package/dist/models/cards/openai/gpt-5-nano.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5-nano.js +26 -0
- package/dist/models/cards/openai/gpt-5-nano.js.map +1 -0
- package/dist/models/cards/openai/gpt-5.d.ts +10 -0
- package/dist/models/cards/openai/gpt-5.d.ts.map +1 -0
- package/dist/models/cards/openai/gpt-5.js +26 -0
- package/dist/models/cards/openai/gpt-5.js.map +1 -0
- package/dist/models/cards/openai/index.d.ts +32 -0
- package/dist/models/cards/openai/index.d.ts.map +1 -0
- package/dist/models/cards/openai/index.js +38 -0
- package/dist/models/cards/openai/index.js.map +1 -0
- package/dist/models/cards/openai/o1-mini.d.ts +11 -0
- package/dist/models/cards/openai/o1-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/o1-mini.js +28 -0
- package/dist/models/cards/openai/o1-mini.js.map +1 -0
- package/dist/models/cards/openai/o1-pro.d.ts +11 -0
- package/dist/models/cards/openai/o1-pro.d.ts.map +1 -0
- package/dist/models/cards/openai/o1-pro.js +28 -0
- package/dist/models/cards/openai/o1-pro.js.map +1 -0
- package/dist/models/cards/openai/o1.d.ts +11 -0
- package/dist/models/cards/openai/o1.d.ts.map +1 -0
- package/dist/models/cards/openai/o1.js +28 -0
- package/dist/models/cards/openai/o1.js.map +1 -0
- package/dist/models/cards/openai/o3-mini.d.ts +11 -0
- package/dist/models/cards/openai/o3-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/o3-mini.js +30 -0
- package/dist/models/cards/openai/o3-mini.js.map +1 -0
- package/dist/models/cards/openai/o3-pro.d.ts +11 -0
- package/dist/models/cards/openai/o3-pro.d.ts.map +1 -0
- package/dist/models/cards/openai/o3-pro.js +28 -0
- package/dist/models/cards/openai/o3-pro.js.map +1 -0
- package/dist/models/cards/openai/o3.d.ts +11 -0
- package/dist/models/cards/openai/o3.d.ts.map +1 -0
- package/dist/models/cards/openai/o3.js +28 -0
- package/dist/models/cards/openai/o3.js.map +1 -0
- package/dist/models/cards/openai/o4-mini.d.ts +11 -0
- package/dist/models/cards/openai/o4-mini.d.ts.map +1 -0
- package/dist/models/cards/openai/o4-mini.js +27 -0
- package/dist/models/cards/openai/o4-mini.js.map +1 -0
- package/dist/models/cards/qwen/index.d.ts +13 -0
- package/dist/models/cards/qwen/index.d.ts.map +1 -0
- package/dist/models/cards/qwen/index.js +13 -0
- package/dist/models/cards/qwen/index.js.map +1 -0
- package/dist/models/cards/qwen/qwen-3-coder.d.ts +17 -0
- package/dist/models/cards/qwen/qwen-3-coder.d.ts.map +1 -0
- package/dist/models/cards/qwen/qwen-3-coder.js +27 -0
- package/dist/models/cards/qwen/qwen-3-coder.js.map +1 -0
- package/dist/models/cards/qwen/qwen-3-max-preview.d.ts +17 -0
- package/dist/models/cards/qwen/qwen-3-max-preview.d.ts.map +1 -0
- package/dist/models/cards/qwen/qwen-3-max-preview.js +27 -0
- package/dist/models/cards/qwen/qwen-3-max-preview.js.map +1 -0
- package/dist/models/cards/qwen/qwen-max.d.ts +10 -0
- package/dist/models/cards/qwen/qwen-max.d.ts.map +1 -0
- package/dist/models/cards/qwen/qwen-max.js +18 -0
- package/dist/models/cards/qwen/qwen-max.js.map +1 -0
- package/dist/models/cards/qwen/qwen-plus.d.ts +10 -0
- package/dist/models/cards/qwen/qwen-plus.d.ts.map +1 -0
- package/dist/models/cards/qwen/qwen-plus.js +18 -0
- package/dist/models/cards/qwen/qwen-plus.js.map +1 -0
- package/dist/models/cards/qwen/qwen-turbo.d.ts +10 -0
- package/dist/models/cards/qwen/qwen-turbo.d.ts.map +1 -0
- package/dist/models/cards/qwen/qwen-turbo.js +18 -0
- package/dist/models/cards/qwen/qwen-turbo.js.map +1 -0
- package/dist/models/cards/xai/grok-4-1-fast-non-reasoning.d.ts +15 -0
- package/dist/models/cards/xai/grok-4-1-fast-non-reasoning.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-1-fast-non-reasoning.js +24 -0
- package/dist/models/cards/xai/grok-4-1-fast-non-reasoning.js.map +1 -0
- package/dist/models/cards/xai/grok-4-1.d.ts +14 -0
- package/dist/models/cards/xai/grok-4-1.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-1.js +24 -0
- package/dist/models/cards/xai/grok-4-1.js.map +1 -0
- package/dist/models/cards/xai/grok-4-20-multi-agent.d.ts +13 -0
- package/dist/models/cards/xai/grok-4-20-multi-agent.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-20-multi-agent.js +23 -0
- package/dist/models/cards/xai/grok-4-20-multi-agent.js.map +1 -0
- package/dist/models/cards/xai/grok-4-20-non-reasoning.d.ts +10 -0
- package/dist/models/cards/xai/grok-4-20-non-reasoning.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-20-non-reasoning.js +19 -0
- package/dist/models/cards/xai/grok-4-20-non-reasoning.js.map +1 -0
- package/dist/models/cards/xai/grok-4-20-reasoning.d.ts +10 -0
- package/dist/models/cards/xai/grok-4-20-reasoning.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-20-reasoning.js +20 -0
- package/dist/models/cards/xai/grok-4-20-reasoning.js.map +1 -0
- package/dist/models/cards/xai/grok-4-3.d.ts +11 -0
- package/dist/models/cards/xai/grok-4-3.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-3.js +22 -0
- package/dist/models/cards/xai/grok-4-3.js.map +1 -0
- package/dist/models/cards/xai/grok-4-fast-non-reasoning.d.ts +13 -0
- package/dist/models/cards/xai/grok-4-fast-non-reasoning.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-fast-non-reasoning.js +22 -0
- package/dist/models/cards/xai/grok-4-fast-non-reasoning.js.map +1 -0
- package/dist/models/cards/xai/grok-4-fast.d.ts +12 -0
- package/dist/models/cards/xai/grok-4-fast.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-4-fast.js +21 -0
- package/dist/models/cards/xai/grok-4-fast.js.map +1 -0
- package/dist/models/cards/xai/grok-build-0-1-responses.d.ts +22 -0
- package/dist/models/cards/xai/grok-build-0-1-responses.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-build-0-1-responses.js +39 -0
- package/dist/models/cards/xai/grok-build-0-1-responses.js.map +1 -0
- package/dist/models/cards/xai/grok-build-0-1.d.ts +17 -0
- package/dist/models/cards/xai/grok-build-0-1.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-build-0-1.js +31 -0
- package/dist/models/cards/xai/grok-build-0-1.js.map +1 -0
- package/dist/models/cards/xai/grok-code-fast-1.d.ts +10 -0
- package/dist/models/cards/xai/grok-code-fast-1.d.ts.map +1 -0
- package/dist/models/cards/xai/grok-code-fast-1.js +22 -0
- package/dist/models/cards/xai/grok-code-fast-1.js.map +1 -0
- package/dist/models/cards/xai/index.d.ts +17 -0
- package/dist/models/cards/xai/index.d.ts.map +1 -0
- package/dist/models/cards/xai/index.js +18 -0
- package/dist/models/cards/xai/index.js.map +1 -0
- package/dist/models/configurators/AnthropicConfigurator.d.ts +57 -0
- package/dist/models/configurators/AnthropicConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/AnthropicConfigurator.js +108 -0
- package/dist/models/configurators/AnthropicConfigurator.js.map +1 -0
- package/dist/models/configurators/CloudflareConfigurator.d.ts +46 -0
- package/dist/models/configurators/CloudflareConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/CloudflareConfigurator.js +112 -0
- package/dist/models/configurators/CloudflareConfigurator.js.map +1 -0
- package/dist/models/configurators/DeepSeekConfigurator.d.ts +26 -0
- package/dist/models/configurators/DeepSeekConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/DeepSeekConfigurator.js +81 -0
- package/dist/models/configurators/DeepSeekConfigurator.js.map +1 -0
- package/dist/models/configurators/GLMConfigurator.d.ts +22 -0
- package/dist/models/configurators/GLMConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/GLMConfigurator.js +82 -0
- package/dist/models/configurators/GLMConfigurator.js.map +1 -0
- package/dist/models/configurators/GemmaConfigurator.d.ts +18 -0
- package/dist/models/configurators/GemmaConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/GemmaConfigurator.js +89 -0
- package/dist/models/configurators/GemmaConfigurator.js.map +1 -0
- package/dist/models/configurators/GoogleConfigurator.d.ts +26 -0
- package/dist/models/configurators/GoogleConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/GoogleConfigurator.js +91 -0
- package/dist/models/configurators/GoogleConfigurator.js.map +1 -0
- package/dist/models/configurators/GoogleSDKConfigurator.d.ts +29 -0
- package/dist/models/configurators/GoogleSDKConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/GoogleSDKConfigurator.js +95 -0
- package/dist/models/configurators/GoogleSDKConfigurator.js.map +1 -0
- package/dist/models/configurators/HuggingFaceConfigurator.d.ts +31 -0
- package/dist/models/configurators/HuggingFaceConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/HuggingFaceConfigurator.js +85 -0
- package/dist/models/configurators/HuggingFaceConfigurator.js.map +1 -0
- package/dist/models/configurators/LocalModelConfigurator.d.ts +30 -0
- package/dist/models/configurators/LocalModelConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/LocalModelConfigurator.js +88 -0
- package/dist/models/configurators/LocalModelConfigurator.js.map +1 -0
- package/dist/models/configurators/MercuryConfigurator.d.ts +27 -0
- package/dist/models/configurators/MercuryConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/MercuryConfigurator.js +91 -0
- package/dist/models/configurators/MercuryConfigurator.js.map +1 -0
- package/dist/models/configurators/MiniMaxConfigurator.d.ts +47 -0
- package/dist/models/configurators/MiniMaxConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/MiniMaxConfigurator.js +103 -0
- package/dist/models/configurators/MiniMaxConfigurator.js.map +1 -0
- package/dist/models/configurators/MoonshotConfigurator.d.ts +21 -0
- package/dist/models/configurators/MoonshotConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/MoonshotConfigurator.js +81 -0
- package/dist/models/configurators/MoonshotConfigurator.js.map +1 -0
- package/dist/models/configurators/OpenAIConfigurator.d.ts +52 -0
- package/dist/models/configurators/OpenAIConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/OpenAIConfigurator.js +128 -0
- package/dist/models/configurators/OpenAIConfigurator.js.map +1 -0
- package/dist/models/configurators/OpenAIResponsesConfigurator.d.ts +23 -0
- package/dist/models/configurators/OpenAIResponsesConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/OpenAIResponsesConfigurator.js +113 -0
- package/dist/models/configurators/OpenAIResponsesConfigurator.js.map +1 -0
- package/dist/models/configurators/QwenConfigurator.d.ts +26 -0
- package/dist/models/configurators/QwenConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/QwenConfigurator.js +87 -0
- package/dist/models/configurators/QwenConfigurator.js.map +1 -0
- package/dist/models/configurators/XAIConfigurator.d.ts +52 -0
- package/dist/models/configurators/XAIConfigurator.d.ts.map +1 -0
- package/dist/models/configurators/XAIConfigurator.js +130 -0
- package/dist/models/configurators/XAIConfigurator.js.map +1 -0
- package/dist/models/configurators/index.d.ts +19 -0
- package/dist/models/configurators/index.d.ts.map +1 -0
- package/dist/models/configurators/index.js +19 -0
- package/dist/models/configurators/index.js.map +1 -0
- package/dist/models/index.d.ts +7 -0
- package/dist/models/index.d.ts.map +1 -0
- package/dist/models/index.js +7 -0
- package/dist/models/index.js.map +1 -0
- package/dist/models/registry/ModelAliasResolver.d.ts +109 -0
- package/dist/models/registry/ModelAliasResolver.d.ts.map +1 -0
- package/dist/models/registry/ModelAliasResolver.js +255 -0
- package/dist/models/registry/ModelAliasResolver.js.map +1 -0
- package/dist/models/registry/ModelCardLoader.d.ts +44 -0
- package/dist/models/registry/ModelCardLoader.d.ts.map +1 -0
- package/dist/models/registry/ModelCardLoader.js +124 -0
- package/dist/models/registry/ModelCardLoader.js.map +1 -0
- package/dist/models/registry/ModularModelRegistry.d.ts +86 -0
- package/dist/models/registry/ModularModelRegistry.d.ts.map +1 -0
- package/dist/models/registry/ModularModelRegistry.js +311 -0
- package/dist/models/registry/ModularModelRegistry.js.map +1 -0
- package/dist/models/registry/index.d.ts +8 -0
- package/dist/models/registry/index.d.ts.map +1 -0
- package/dist/models/registry/index.js +9 -0
- package/dist/models/registry/index.js.map +1 -0
- package/dist/orchestrator/APIClient.d.ts +274 -0
- package/dist/orchestrator/APIClient.d.ts.map +1 -0
- package/dist/orchestrator/APIClient.js +2770 -0
- package/dist/orchestrator/APIClient.js.map +1 -0
- package/dist/orchestrator/CortexOrchestrator.d.ts +986 -0
- package/dist/orchestrator/CortexOrchestrator.d.ts.map +1 -0
- package/dist/orchestrator/CortexOrchestrator.js +6374 -0
- package/dist/orchestrator/CortexOrchestrator.js.map +1 -0
- package/dist/orchestrator/OrchestratorFactory.d.ts +81 -0
- package/dist/orchestrator/OrchestratorFactory.d.ts.map +1 -0
- package/dist/orchestrator/OrchestratorFactory.js +433 -0
- package/dist/orchestrator/OrchestratorFactory.js.map +1 -0
- package/dist/orchestrator/PauseController.d.ts +126 -0
- package/dist/orchestrator/PauseController.d.ts.map +1 -0
- package/dist/orchestrator/PauseController.js +248 -0
- package/dist/orchestrator/PauseController.js.map +1 -0
- package/dist/orchestrator/SubAgentEventEmitter.d.ts +152 -0
- package/dist/orchestrator/SubAgentEventEmitter.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentEventEmitter.js +372 -0
- package/dist/orchestrator/SubAgentEventEmitter.js.map +1 -0
- package/dist/orchestrator/SubAgentIPC.d.ts +242 -0
- package/dist/orchestrator/SubAgentIPC.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentIPC.js +85 -0
- package/dist/orchestrator/SubAgentIPC.js.map +1 -0
- package/dist/orchestrator/SubAgentManager.d.ts +215 -0
- package/dist/orchestrator/SubAgentManager.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentManager.js +477 -0
- package/dist/orchestrator/SubAgentManager.js.map +1 -0
- package/dist/orchestrator/SubAgentOrchestrator.d.ts +125 -0
- package/dist/orchestrator/SubAgentOrchestrator.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentOrchestrator.js +395 -0
- package/dist/orchestrator/SubAgentOrchestrator.js.map +1 -0
- package/dist/orchestrator/SubAgentPermissionChecker.d.ts +132 -0
- package/dist/orchestrator/SubAgentPermissionChecker.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentPermissionChecker.js +239 -0
- package/dist/orchestrator/SubAgentPermissionChecker.js.map +1 -0
- package/dist/orchestrator/SubAgentProcessManager.d.ts +228 -0
- package/dist/orchestrator/SubAgentProcessManager.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentProcessManager.js +679 -0
- package/dist/orchestrator/SubAgentProcessManager.js.map +1 -0
- package/dist/orchestrator/SubAgentTypes.d.ts +428 -0
- package/dist/orchestrator/SubAgentTypes.d.ts.map +1 -0
- package/dist/orchestrator/SubAgentTypes.js +12 -0
- package/dist/orchestrator/SubAgentTypes.js.map +1 -0
- package/dist/orchestrator/apiErrorClassifier.d.ts +17 -0
- package/dist/orchestrator/apiErrorClassifier.d.ts.map +1 -0
- package/dist/orchestrator/apiErrorClassifier.js +38 -0
- package/dist/orchestrator/apiErrorClassifier.js.map +1 -0
- package/dist/orchestrator/assistantTextPresence.d.ts +32 -0
- package/dist/orchestrator/assistantTextPresence.d.ts.map +1 -0
- package/dist/orchestrator/assistantTextPresence.js +47 -0
- package/dist/orchestrator/assistantTextPresence.js.map +1 -0
- package/dist/orchestrator/citationVerification.d.ts +32 -0
- package/dist/orchestrator/citationVerification.d.ts.map +1 -0
- package/dist/orchestrator/citationVerification.js +47 -0
- package/dist/orchestrator/citationVerification.js.map +1 -0
- package/dist/orchestrator/coordinateVerification.d.ts +50 -0
- package/dist/orchestrator/coordinateVerification.d.ts.map +1 -0
- package/dist/orchestrator/coordinateVerification.js +114 -0
- package/dist/orchestrator/coordinateVerification.js.map +1 -0
- package/dist/orchestrator/cortexTrainingRecord.d.ts +88 -0
- package/dist/orchestrator/cortexTrainingRecord.d.ts.map +1 -0
- package/dist/orchestrator/cortexTrainingRecord.js +102 -0
- package/dist/orchestrator/cortexTrainingRecord.js.map +1 -0
- package/dist/orchestrator/index.d.ts +20 -0
- package/dist/orchestrator/index.d.ts.map +1 -0
- package/dist/orchestrator/index.js +18 -0
- package/dist/orchestrator/index.js.map +1 -0
- package/dist/orchestrator/mcpAutoInjectPolicy.d.ts +18 -0
- package/dist/orchestrator/mcpAutoInjectPolicy.d.ts.map +1 -0
- package/dist/orchestrator/mcpAutoInjectPolicy.js +24 -0
- package/dist/orchestrator/mcpAutoInjectPolicy.js.map +1 -0
- package/dist/orchestrator/staticSystemPromptPin.d.ts +20 -0
- package/dist/orchestrator/staticSystemPromptPin.d.ts.map +1 -0
- package/dist/orchestrator/staticSystemPromptPin.js +33 -0
- package/dist/orchestrator/staticSystemPromptPin.js.map +1 -0
- package/dist/orchestrator/toolBudgetSignal.d.ts +41 -0
- package/dist/orchestrator/toolBudgetSignal.d.ts.map +1 -0
- package/dist/orchestrator/toolBudgetSignal.js +77 -0
- package/dist/orchestrator/toolBudgetSignal.js.map +1 -0
- package/dist/orchestrator/toolNameMatcher.d.ts +21 -0
- package/dist/orchestrator/toolNameMatcher.d.ts.map +1 -0
- package/dist/orchestrator/toolNameMatcher.js +69 -0
- package/dist/orchestrator/toolNameMatcher.js.map +1 -0
- package/dist/session/CacheMetricsAccumulator.d.ts +72 -0
- package/dist/session/CacheMetricsAccumulator.d.ts.map +1 -0
- package/dist/session/CacheMetricsAccumulator.js +144 -0
- package/dist/session/CacheMetricsAccumulator.js.map +1 -0
- package/dist/session/CheckpointManager.d.ts +106 -0
- package/dist/session/CheckpointManager.d.ts.map +1 -0
- package/dist/session/CheckpointManager.js +223 -0
- package/dist/session/CheckpointManager.js.map +1 -0
- package/dist/session/JSONLHistoryStore.d.ts +154 -0
- package/dist/session/JSONLHistoryStore.d.ts.map +1 -0
- package/dist/session/JSONLHistoryStore.js +393 -0
- package/dist/session/JSONLHistoryStore.js.map +1 -0
- package/dist/session/MessageTypes.d.ts +269 -0
- package/dist/session/MessageTypes.d.ts.map +1 -0
- package/dist/session/MessageTypes.js +38 -0
- package/dist/session/MessageTypes.js.map +1 -0
- package/dist/session/SessionTimeline.d.ts +304 -0
- package/dist/session/SessionTimeline.d.ts.map +1 -0
- package/dist/session/SessionTimeline.js +396 -0
- package/dist/session/SessionTimeline.js.map +1 -0
- package/dist/session/index.d.ts +10 -0
- package/dist/session/index.d.ts.map +1 -0
- package/dist/session/index.js +10 -0
- package/dist/session/index.js.map +1 -0
- package/dist/system-messages/MessageValidator.d.ts +71 -0
- package/dist/system-messages/MessageValidator.d.ts.map +1 -0
- package/dist/system-messages/MessageValidator.js +305 -0
- package/dist/system-messages/MessageValidator.js.map +1 -0
- package/dist/system-messages/SystemMessageLoader.d.ts +154 -0
- package/dist/system-messages/SystemMessageLoader.d.ts.map +1 -0
- package/dist/system-messages/SystemMessageLoader.js +695 -0
- package/dist/system-messages/SystemMessageLoader.js.map +1 -0
- package/dist/system-messages/SystemMessageRegistry.d.ts +67 -0
- package/dist/system-messages/SystemMessageRegistry.d.ts.map +1 -0
- package/dist/system-messages/SystemMessageRegistry.interface.d.ts +166 -0
- package/dist/system-messages/SystemMessageRegistry.interface.d.ts.map +1 -0
- package/dist/system-messages/SystemMessageRegistry.interface.js +6 -0
- package/dist/system-messages/SystemMessageRegistry.interface.js.map +1 -0
- package/dist/system-messages/SystemMessageRegistry.js +164 -0
- package/dist/system-messages/SystemMessageRegistry.js.map +1 -0
- package/dist/system-messages/SystemMessageStore.d.ts +207 -0
- package/dist/system-messages/SystemMessageStore.d.ts.map +1 -0
- package/dist/system-messages/SystemMessageStore.js +748 -0
- package/dist/system-messages/SystemMessageStore.js.map +1 -0
- package/dist/system-messages/SystemReminderInjector.d.ts +148 -0
- package/dist/system-messages/SystemReminderInjector.d.ts.map +1 -0
- package/dist/system-messages/SystemReminderInjector.js +331 -0
- package/dist/system-messages/SystemReminderInjector.js.map +1 -0
- package/dist/system-messages/docTruncation.d.ts +31 -0
- package/dist/system-messages/docTruncation.d.ts.map +1 -0
- package/dist/system-messages/docTruncation.js +26 -0
- package/dist/system-messages/docTruncation.js.map +1 -0
- package/dist/system-messages/index.d.ts +12 -0
- package/dist/system-messages/index.d.ts.map +1 -0
- package/dist/system-messages/index.js +15 -0
- package/dist/system-messages/index.js.map +1 -0
- package/dist/system-messages/messages/ACTIVE_DISCOVERY.md +26 -0
- package/dist/system-messages/messages/EXAMPLES.md +73 -0
- package/dist/system-messages/messages/PERIODIC_REMINDER.md +6 -0
- package/dist/system-messages/messages/REASONING_GUIDE.md +12 -0
- package/dist/system-messages/messages/SYSTEM_PROMPT.md +47 -0
- package/dist/system-messages/messages/TASK_AGENT_GUIDE.md +5 -0
- package/dist/system-messages/messages/TOOL_USAGE_GUIDE.md +131 -0
- package/dist/system-messages/system-message-registry.json +233 -0
- package/dist/system-messages/turnVaryingClassifier.d.ts +20 -0
- package/dist/system-messages/turnVaryingClassifier.d.ts.map +1 -0
- package/dist/system-messages/turnVaryingClassifier.js +27 -0
- package/dist/system-messages/turnVaryingClassifier.js.map +1 -0
- package/dist/system-messages/types.d.ts +184 -0
- package/dist/system-messages/types.d.ts.map +1 -0
- package/dist/system-messages/types.js +7 -0
- package/dist/system-messages/types.js.map +1 -0
- package/dist/tools/ClientSideToolFilter.d.ts +35 -0
- package/dist/tools/ClientSideToolFilter.d.ts.map +1 -0
- package/dist/tools/ClientSideToolFilter.js +74 -0
- package/dist/tools/ClientSideToolFilter.js.map +1 -0
- package/dist/tools/ServerSideTools.d.ts +181 -0
- package/dist/tools/ServerSideTools.d.ts.map +1 -0
- package/dist/tools/ServerSideTools.js +309 -0
- package/dist/tools/ServerSideTools.js.map +1 -0
- package/dist/tools/ToolFactory.d.ts +88 -0
- package/dist/tools/ToolFactory.d.ts.map +1 -0
- package/dist/tools/ToolFactory.js +153 -0
- package/dist/tools/ToolFactory.js.map +1 -0
- package/dist/tools/context-management/InitCortexContext.d.ts +184 -0
- package/dist/tools/context-management/InitCortexContext.d.ts.map +1 -0
- package/dist/tools/context-management/InitCortexContext.js +1063 -0
- package/dist/tools/context-management/InitCortexContext.js.map +1 -0
- package/dist/tools/context-management/index.d.ts +8 -0
- package/dist/tools/context-management/index.d.ts.map +1 -0
- package/dist/tools/context-management/index.js +7 -0
- package/dist/tools/context-management/index.js.map +1 -0
- package/dist/tools/historical/GetConversationSegment.d.ts +131 -0
- package/dist/tools/historical/GetConversationSegment.d.ts.map +1 -0
- package/dist/tools/historical/GetConversationSegment.js +306 -0
- package/dist/tools/historical/GetConversationSegment.js.map +1 -0
- package/dist/tools/historical/HistoricalContextService.d.ts +229 -0
- package/dist/tools/historical/HistoricalContextService.d.ts.map +1 -0
- package/dist/tools/historical/HistoricalContextService.js +206 -0
- package/dist/tools/historical/HistoricalContextService.js.map +1 -0
- package/dist/tools/historical/ListCompactionBoundaries.d.ts +107 -0
- package/dist/tools/historical/ListCompactionBoundaries.d.ts.map +1 -0
- package/dist/tools/historical/ListCompactionBoundaries.js +175 -0
- package/dist/tools/historical/ListCompactionBoundaries.js.map +1 -0
- package/dist/tools/historical/ListSessions.d.ts +50 -0
- package/dist/tools/historical/ListSessions.d.ts.map +1 -0
- package/dist/tools/historical/ListSessions.js +93 -0
- package/dist/tools/historical/ListSessions.js.map +1 -0
- package/dist/tools/historical/LoadSession.d.ts +51 -0
- package/dist/tools/historical/LoadSession.d.ts.map +1 -0
- package/dist/tools/historical/LoadSession.js +89 -0
- package/dist/tools/historical/LoadSession.js.map +1 -0
- package/dist/tools/historical/RequestHistoricalContext.d.ts +122 -0
- package/dist/tools/historical/RequestHistoricalContext.d.ts.map +1 -0
- package/dist/tools/historical/RequestHistoricalContext.js +250 -0
- package/dist/tools/historical/RequestHistoricalContext.js.map +1 -0
- package/dist/tools/historical/SearchConversationHistory.d.ts +117 -0
- package/dist/tools/historical/SearchConversationHistory.d.ts.map +1 -0
- package/dist/tools/historical/SearchConversationHistory.js +239 -0
- package/dist/tools/historical/SearchConversationHistory.js.map +1 -0
- package/dist/tools/historical/index.d.ts +14 -0
- package/dist/tools/historical/index.d.ts.map +1 -0
- package/dist/tools/historical/index.js +14 -0
- package/dist/tools/historical/index.js.map +1 -0
- package/dist/tools/index.d.ts +15 -0
- package/dist/tools/index.d.ts.map +1 -0
- package/dist/tools/index.js +21 -0
- package/dist/tools/index.js.map +1 -0
- package/dist/tools/mcp-management/ConfigureMcpServer.d.ts +41 -0
- package/dist/tools/mcp-management/ConfigureMcpServer.d.ts.map +1 -0
- package/dist/tools/mcp-management/ConfigureMcpServer.js +147 -0
- package/dist/tools/mcp-management/ConfigureMcpServer.js.map +1 -0
- package/dist/tools/mcp-management/DisableMcpServer.d.ts +39 -0
- package/dist/tools/mcp-management/DisableMcpServer.d.ts.map +1 -0
- package/dist/tools/mcp-management/DisableMcpServer.js +108 -0
- package/dist/tools/mcp-management/DisableMcpServer.js.map +1 -0
- package/dist/tools/mcp-management/EnableMcpServer.d.ts +49 -0
- package/dist/tools/mcp-management/EnableMcpServer.d.ts.map +1 -0
- package/dist/tools/mcp-management/EnableMcpServer.js +134 -0
- package/dist/tools/mcp-management/EnableMcpServer.js.map +1 -0
- package/dist/tools/mcp-management/GetMcpConfig.d.ts +52 -0
- package/dist/tools/mcp-management/GetMcpConfig.d.ts.map +1 -0
- package/dist/tools/mcp-management/GetMcpConfig.js +95 -0
- package/dist/tools/mcp-management/GetMcpConfig.js.map +1 -0
- package/dist/tools/mcp-management/InitMcpConfig.d.ts +113 -0
- package/dist/tools/mcp-management/InitMcpConfig.d.ts.map +1 -0
- package/dist/tools/mcp-management/InitMcpConfig.js +421 -0
- package/dist/tools/mcp-management/InitMcpConfig.js.map +1 -0
- package/dist/tools/mcp-management/ListAvailableMcpServers.d.ts +50 -0
- package/dist/tools/mcp-management/ListAvailableMcpServers.d.ts.map +1 -0
- package/dist/tools/mcp-management/ListAvailableMcpServers.js +92 -0
- package/dist/tools/mcp-management/ListAvailableMcpServers.js.map +1 -0
- package/dist/tools/mcp-management/SearchMcpServers.d.ts +44 -0
- package/dist/tools/mcp-management/SearchMcpServers.d.ts.map +1 -0
- package/dist/tools/mcp-management/SearchMcpServers.js +96 -0
- package/dist/tools/mcp-management/SearchMcpServers.js.map +1 -0
- package/dist/tools/mcp-management/index.d.ts +23 -0
- package/dist/tools/mcp-management/index.d.ts.map +1 -0
- package/dist/tools/mcp-management/index.js +16 -0
- package/dist/tools/mcp-management/index.js.map +1 -0
- package/dist/tools/registries/AddonToolRegistry.d.ts +70 -0
- package/dist/tools/registries/AddonToolRegistry.d.ts.map +1 -0
- package/dist/tools/registries/AddonToolRegistry.js +138 -0
- package/dist/tools/registries/AddonToolRegistry.js.map +1 -0
- package/dist/tools/registries/BaseToolRegistry.d.ts +38 -0
- package/dist/tools/registries/BaseToolRegistry.d.ts.map +1 -0
- package/dist/tools/registries/BaseToolRegistry.js +2058 -0
- package/dist/tools/registries/BaseToolRegistry.js.map +1 -0
- package/dist/tools/registries/index.d.ts +8 -0
- package/dist/tools/registries/index.d.ts.map +1 -0
- package/dist/tools/registries/index.js +8 -0
- package/dist/tools/registries/index.js.map +1 -0
- package/dist/tools/types/CanonicalTool.d.ts +130 -0
- package/dist/tools/types/CanonicalTool.d.ts.map +1 -0
- package/dist/tools/types/CanonicalTool.js +10 -0
- package/dist/tools/types/CanonicalTool.js.map +1 -0
- package/dist/tools/types/index.d.ts +7 -0
- package/dist/tools/types/index.d.ts.map +1 -0
- package/dist/tools/types/index.js +7 -0
- package/dist/tools/types/index.js.map +1 -0
- package/dist/training/AutoResearchGate.d.ts +64 -0
- package/dist/training/AutoResearchGate.d.ts.map +1 -0
- package/dist/training/AutoResearchGate.js +94 -0
- package/dist/training/AutoResearchGate.js.map +1 -0
- package/dist/training/AutoResearchStats.d.ts +128 -0
- package/dist/training/AutoResearchStats.d.ts.map +1 -0
- package/dist/training/AutoResearchStats.js +210 -0
- package/dist/training/AutoResearchStats.js.map +1 -0
- package/dist/training/BenchRunner.d.ts +177 -0
- package/dist/training/BenchRunner.d.ts.map +1 -0
- package/dist/training/BenchRunner.js +211 -0
- package/dist/training/BenchRunner.js.map +1 -0
- package/dist/training/DecisionPriorInjector.d.ts +18 -0
- package/dist/training/DecisionPriorInjector.d.ts.map +1 -0
- package/dist/training/DecisionPriorInjector.js +34 -0
- package/dist/training/DecisionPriorInjector.js.map +1 -0
- package/dist/training/DecisionStore.d.ts +78 -0
- package/dist/training/DecisionStore.d.ts.map +1 -0
- package/dist/training/DecisionStore.js +171 -0
- package/dist/training/DecisionStore.js.map +1 -0
- package/dist/training/ExperimentLedger.d.ts +138 -0
- package/dist/training/ExperimentLedger.d.ts.map +1 -0
- package/dist/training/ExperimentLedger.js +160 -0
- package/dist/training/ExperimentLedger.js.map +1 -0
- package/dist/training/ExperimentRunner.d.ts +88 -0
- package/dist/training/ExperimentRunner.d.ts.map +1 -0
- package/dist/training/ExperimentRunner.js +97 -0
- package/dist/training/ExperimentRunner.js.map +1 -0
- package/dist/training/ModelRouterMatrix.d.ts +197 -0
- package/dist/training/ModelRouterMatrix.d.ts.map +1 -0
- package/dist/training/ModelRouterMatrix.js +0 -0
- package/dist/training/ModelRouterMatrix.js.map +1 -0
- package/dist/training/ResearchBacklog.d.ts +102 -0
- package/dist/training/ResearchBacklog.d.ts.map +1 -0
- package/dist/training/ResearchBacklog.js +149 -0
- package/dist/training/ResearchBacklog.js.map +1 -0
- package/dist/training/TaskClassifier.d.ts +16 -0
- package/dist/training/TaskClassifier.d.ts.map +1 -0
- package/dist/training/TaskClassifier.js +70 -0
- package/dist/training/TaskClassifier.js.map +1 -0
- package/dist/training/ThompsonRouter.d.ts +53 -0
- package/dist/training/ThompsonRouter.d.ts.map +1 -0
- package/dist/training/ThompsonRouter.js +73 -0
- package/dist/training/ThompsonRouter.js.map +1 -0
- package/dist/training/VersionComparison.d.ts +90 -0
- package/dist/training/VersionComparison.d.ts.map +1 -0
- package/dist/training/VersionComparison.js +117 -0
- package/dist/training/VersionComparison.js.map +1 -0
- package/dist/ui/index.d.ts +13 -0
- package/dist/ui/index.d.ts.map +1 -0
- package/dist/ui/index.js +15 -0
- package/dist/ui/index.js.map +1 -0
- package/dist/ui/menu-types.d.ts +314 -0
- package/dist/ui/menu-types.d.ts.map +1 -0
- package/dist/ui/menu-types.js +138 -0
- package/dist/ui/menu-types.js.map +1 -0
- package/dist/ui/types.d.ts +86 -0
- package/dist/ui/types.d.ts.map +1 -0
- package/dist/ui/types.js +12 -0
- package/dist/ui/types.js.map +1 -0
- package/dist/utils/ContextResolver.d.ts +132 -0
- package/dist/utils/ContextResolver.d.ts.map +1 -0
- package/dist/utils/ContextResolver.js +269 -0
- package/dist/utils/ContextResolver.js.map +1 -0
- package/dist/utils/DiffParser.d.ts +101 -0
- package/dist/utils/DiffParser.d.ts.map +1 -0
- package/dist/utils/DiffParser.js +193 -0
- package/dist/utils/DiffParser.js.map +1 -0
- package/dist/utils/ErrorDetector.d.ts +99 -0
- package/dist/utils/ErrorDetector.d.ts.map +1 -0
- package/dist/utils/ErrorDetector.js +258 -0
- package/dist/utils/ErrorDetector.js.map +1 -0
- package/dist/utils/TokenCounter.d.ts +97 -0
- package/dist/utils/TokenCounter.d.ts.map +1 -0
- package/dist/utils/TokenCounter.js +193 -0
- package/dist/utils/TokenCounter.js.map +1 -0
- package/dist/utils/agentDiscovery.d.ts +12 -0
- package/dist/utils/agentDiscovery.d.ts.map +1 -0
- package/dist/utils/agentDiscovery.js +72 -0
- package/dist/utils/agentDiscovery.js.map +1 -0
- package/dist/utils/ids.d.ts +5 -0
- package/dist/utils/ids.d.ts.map +1 -0
- package/dist/utils/ids.js +14 -0
- package/dist/utils/ids.js.map +1 -0
- package/dist/utils/index.d.ts +14 -0
- package/dist/utils/index.d.ts.map +1 -0
- package/dist/utils/index.js +14 -0
- package/dist/utils/index.js.map +1 -0
- package/dist/utils/logger.d.ts +22 -0
- package/dist/utils/logger.d.ts.map +1 -0
- package/dist/utils/logger.js +44 -0
- package/dist/utils/logger.js.map +1 -0
- package/package.json +87 -0
|
@@ -0,0 +1,210 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* AutoResearchStats — the Monte-Carlo keep/discard gate.
|
|
3
|
+
*
|
|
4
|
+
* This is the statistical immune system of the recursive auto-research loop. A
|
|
5
|
+
* raw `delta > 0` WILL fool a self-improvement loop: with enough parallel
|
|
6
|
+
* experiments, some "win" on noise alone, the loop merges the noise, and it
|
|
7
|
+
* compounds. This module replaces raw deltas with three rigorous tests:
|
|
8
|
+
*
|
|
9
|
+
* 1. BOOTSTRAP CI on the aggregate score delta — keep only if the CI excludes 0.
|
|
10
|
+
* 2. PERMUTATION TEST — a one-sided p-value for "candidate is better", computed
|
|
11
|
+
* under the exchangeability null (base/candidate labels are swappable).
|
|
12
|
+
* 3. N-AWARE FWER — when N experiments run in parallel (a swarm), the keep bar
|
|
13
|
+
* tightens to control the family-wise error rate. Without this a swarm
|
|
14
|
+
* confidently merges noise (multiple-comparisons trap).
|
|
15
|
+
*
|
|
16
|
+
* REPRODUCIBILITY: every test is driven by a SEEDED PRNG (mulberry32). Same data
|
|
17
|
+
* + same seed → same p-value and CI. This is deliberate: the auto-research record
|
|
18
|
+
* is meant to be public + verifiable (Layer 3), so a decision must be
|
|
19
|
+
* reproducible by anyone re-running the gate on the same records.
|
|
20
|
+
*
|
|
21
|
+
* STRUCTURE: resampling is done at the RUN level WITHIN each task, then averaged
|
|
22
|
+
* across tasks. This respects the per-task structure (a task with more runs
|
|
23
|
+
* doesn't dominate; within-task noise is captured) — the correct unit for "did
|
|
24
|
+
* the harness version improve the eval".
|
|
25
|
+
*
|
|
26
|
+
* Pure functions, no I/O. The caller (VersionComparison → ExperimentLedger)
|
|
27
|
+
* feeds per-task score arrays and writes the returned verdict via
|
|
28
|
+
* `ExperimentLedger.decide()`.
|
|
29
|
+
*/
|
|
30
|
+
/**
 * mulberry32 — a compact seeded pseudo-random number generator.
 *
 * The seed is coerced to an unsigned 32-bit integer. The returned closure
 * advances that hidden state on every call and yields a float in [0, 1).
 * The same seed always produces the same sequence.
 *
 * @param seed Integer seed (coerced with `>>> 0`).
 * @returns A zero-argument function that produces the next value in [0, 1).
 */
export function mulberry32(seed) {
    let state = seed >>> 0;
    return function () {
        // Advance the 32-bit state by the fixed increment, wrapping on overflow.
        state = ((state | 0) + 0x6d2b79f5) | 0;
        // Two rounds of xor-shift / multiply mixing on the new state.
        let mixed = Math.imul(state ^ (state >>> 15), 1 | state);
        mixed = (mixed + Math.imul(mixed ^ (mixed >>> 7), 61 | mixed)) ^ mixed;
        // Reinterpret the final word as unsigned and scale by 2^32.
        const word = (mixed ^ (mixed >>> 14)) >>> 0;
        return word / 4294967296;
    };
}
|
|
41
|
+
const DEFAULT_SEED = 0x9e3779b9;
|
|
42
|
+
/**
 * Arithmetic mean of `xs`.
 *
 * @param xs Array of numbers.
 * @returns The average, or 0 for an empty array (instead of NaN).
 */
function mean(xs) {
    const count = xs.length;
    if (count === 0) {
        return 0;
    }
    let total = 0;
    xs.forEach((value) => {
        total += value;
    });
    return total / count;
}
|
|
47
|
+
/** Rounds `n` to four decimal places using `Math.round`. */
function round4(n) {
    const scale = 10000;
    const scaled = Math.round(n * scale);
    return scaled / scale;
}
|
|
48
|
+
/**
 * Bootstrap draw: builds a new array with the same length as `xs` by picking
 * elements at random, with replacement.
 *
 * @param xs  Source values (not modified).
 * @param rng Random source, expected to return a float in [0, 1); it is
 *            called exactly once per output element.
 * @returns A fresh array of `xs.length` sampled values.
 */
function resample(xs, rng) {
    const size = xs.length;
    return Array.from({ length: size }, () => {
        // `| 0` truncates the scaled draw to an integer index.
        const pick = (rng() * size) | 0;
        return xs[pick];
    });
}
|
|
56
|
+
/** Fisher-Yates shuffle (in place) using the seeded RNG. */
|
|
57
|
+
function shuffle(xs, rng) {
|
|
58
|
+
for (let i = xs.length - 1; i > 0; i--) {
|
|
59
|
+
const j = (rng() * (i + 1)) | 0;
|
|
60
|
+
const tmp = xs[i];
|
|
61
|
+
xs[i] = xs[j];
|
|
62
|
+
xs[j] = tmp;
|
|
63
|
+
}
|
|
64
|
+
}
|
|
65
|
+
/**
 * Nearest-rank quantile lookup on an already-sorted array.
 *
 * @param sorted Values in ascending order (the function does not sort).
 * @param q      Quantile; `q * (length - 1)` is rounded to the nearest index
 *               and clamped into the valid index range.
 * @returns The element at that index, or 0 when `sorted` is empty.
 */
function percentile(sorted, q) {
    if (sorted.length === 0) {
        return 0;
    }
    const lastIndex = sorted.length - 1;
    const nearest = Math.round(q * lastIndex);
    const clamped = Math.min(lastIndex, Math.max(0, nearest));
    return sorted[clamped];
}
|
|
71
|
+
/**
 * Observed aggregate effect of the candidate over the base.
 *
 * For every task the difference `mean(candScores) - mean(baseScores)` is
 * taken, and those per-task differences are then averaged, so each task
 * carries equal weight regardless of how many runs it has.
 *
 * @param tasks Array of objects exposing `baseScores` and `candScores` arrays.
 * @returns The mean per-task delta, or 0 when `tasks` is empty.
 */
export function aggregateEffect(tasks) {
    if (tasks.length === 0) {
        return 0;
    }
    const perTaskDeltas = tasks.map((task) => {
        const candMean = mean(task.candScores);
        const baseMean = mean(task.baseScores);
        return candMean - baseMean;
    });
    return mean(perTaskDeltas);
}
|
|
77
|
+
/**
 * Percentile-bootstrap confidence interval for the aggregate effect.
 *
 * Each iteration resamples the runs of both arms of every task (candidate
 * first, then base, so the RNG stream is consumed in a fixed order), averages
 * the per-task deltas, and records that replicate. The interval bounds are
 * read from the sorted replicates at the two tail quantiles.
 *
 * @param tasks Array of objects exposing `baseScores` and `candScores` arrays.
 * @param opts  `rng` (random source passed to `resample`), optional
 *              `iterations` (default 2000) and optional `ci` level
 *              (default 0.95).
 * @returns `{ ciLow, ciHigh, effect }`, each rounded to four decimals;
 *          `effect` is the observed (non-resampled) aggregate effect.
 */
export function bootstrapCI(tasks, opts) {
    const iterations = opts.iterations ?? 2000;
    const ci = opts.ci ?? 0.95;
    const replicates = [];
    for (let b = 0; b < iterations; b += 1) {
        const deltas = tasks.map((task) => {
            const candMean = mean(resample(task.candScores, opts.rng));
            const baseMean = mean(resample(task.baseScores, opts.rng));
            return candMean - baseMean;
        });
        replicates.push(mean(deltas));
    }
    replicates.sort((lhs, rhs) => lhs - rhs);
    // Split the excluded probability mass evenly between the two tails.
    const tail = (1 - ci) / 2;
    const ciLow = round4(percentile(replicates, tail));
    const ciHigh = round4(percentile(replicates, 1 - tail));
    const effect = round4(aggregateEffect(tasks));
    return { ciLow, ciHigh, effect };
}
|
|
97
|
+
/**
 * One-sided permutation p-value for "candidate > base". Within each task, pools
 * the two arms and relabels at random into the original arm sizes (the
 * exchangeability null), recomputes the aggregate effect, and measures how often
 * the permuted effect meets or beats the observed one. Add-one estimator
 * (never returns exactly 0 — a permutation p-value can't certify impossibility).
 *
 * The "meets or beats" comparison uses a small tolerance: a relabelling that
 * reproduces the observed split, but sums the same scores in a different
 * order, can differ from `observed` by floating-point rounding alone. An exact
 * `>=` would miss such ties and bias the p-value downward (anti-conservative).
 * The tolerance is scaled to the largest score magnitude, so it stays many
 * orders of magnitude below any genuine difference between splits.
 *
 * @param tasks Array of objects exposing `baseScores` and `candScores` arrays.
 * @param opts  `rng` (random source passed to `shuffle`) and optional
 *              `iterations` (default 2000).
 * @returns The p-value rounded to four decimals.
 */
export function permutationPValue(tasks, opts) {
    const iterations = opts.iterations ?? 2000;
    const observed = aggregateEffect(tasks);
    // Rounding error in a mean grows with the magnitude of the summed values,
    // not with the size of the (possibly tiny) effect, so scale by the data.
    let magnitude = Math.abs(observed);
    for (const t of tasks) {
        for (const s of t.baseScores) {
            magnitude = Math.max(magnitude, Math.abs(s));
        }
        for (const s of t.candScores) {
            magnitude = Math.max(magnitude, Math.abs(s));
        }
    }
    const tolerance = magnitude * Number.EPSILON * 100;
    let atLeastAsExtreme = 0;
    for (let p = 0; p < iterations; p++) {
        const permDeltas = tasks.map(t => {
            const pooled = [...t.baseScores, ...t.candScores];
            shuffle(pooled, opts.rng);
            // The first `nb` shuffled scores become the permuted base arm,
            // the remainder the permuted candidate arm.
            const nb = t.baseScores.length;
            const permBase = pooled.slice(0, nb);
            const permCand = pooled.slice(nb);
            return mean(permCand) - mean(permBase);
        });
        if (mean(permDeltas) >= observed - tolerance)
            atLeastAsExtreme++;
    }
    // Add-one estimator: the observed labelling counts as one permutation.
    return round4((atLeastAsExtreme + 1) / (iterations + 1));
}
|
|
122
|
+
/**
 * Šidák family-wise threshold: the per-experiment alpha that holds the
 * family-wise error at `alpha` across N independent experiments.
 * `1 - (1 - alpha)^(1/N)`. Tighter than alpha, slightly looser than Bonferroni.
 *
 * The value is returned at full precision. Rounding it to four decimals (as
 * an earlier revision did) can round the cutoff UP — e.g. alpha=0.05, N=1000
 * gave 0.0001 instead of ~0.0000513, nearly doubling the per-test bar and
 * breaking the family-wise guarantee — or to exactly 0 for very large N,
 * making the bar unreachable. Round only when formatting for display.
 *
 * Computed as `-expm1(log1p(-alpha) / N)`, which is algebraically the same
 * expression but keeps precision when the result is tiny.
 *
 * @param alpha        Target family-wise error rate.
 * @param nExperiments Family size; values below 1 are treated as 1.
 * @returns The per-experiment significance cutoff (`alpha` itself when N is 1).
 */
export function sidakThreshold(alpha, nExperiments) {
    const n = Math.max(1, nExperiments);
    // A single experiment needs no adjustment; return alpha untouched rather
    // than a value that differs from it by floating-point rounding.
    if (n === 1)
        return alpha;
    return -Math.expm1(Math.log1p(-alpha) / n);
}
|
|
131
|
+
/**
 * Monte-Carlo FWER threshold. Simulates the joint null of N experiments and
 * returns the per-experiment p-value cutoff that controls the family-wise error
 * at `alpha` (the alpha-quantile of the family minimum p-value). With independent
 * experiments this reproduces Šidák — and that's the point: it VALIDATES the
 * analytic bar and is the extension point for correlated experiments (shared
 * tasks), where the true threshold is less conservative than Bonferroni/Šidák.
 * A `correlation` hook can later inject a copula; for now experiments are modeled
 * independent (conservative, correct).
 *
 * @param alpha        Target family-wise error rate.
 * @param nExperiments Family size; values below 1 are treated as 1.
 * @param opts         `rng` (random source, one draw per simulated experiment)
 *                     and optional `iterations` (default 5000).
 * @returns The cutoff rounded to four decimals; `alpha` (rounded) when N is 1.
 * @throws {RangeError} When the family size is not a finite number. A NaN
 *         size would otherwise skip the simulation loop and yield a cutoff of
 *         1 (every p-value "significant"), and an infinite size would never
 *         finish simulating.
 */
export function mcFwerThreshold(alpha, nExperiments, opts) {
    const n = Math.max(1, nExperiments);
    if (!Number.isFinite(n)) {
        throw new RangeError(`nExperiments must be a finite number, got ${nExperiments}`);
    }
    if (n === 1)
        return round4(alpha);
    const iterations = opts.iterations ?? 5000;
    const minPs = [];
    for (let i = 0; i < iterations; i++) {
        // Smallest p-value across one simulated family of n null experiments.
        let minP = 1;
        for (let j = 0; j < n; j++) {
            const u = opts.rng(); // null p-value ~ Uniform(0,1)
            if (u < minP)
                minP = u;
        }
        minPs.push(minP);
    }
    minPs.sort((a, b) => a - b);
    // cutoff = alpha-quantile of the family-minimum-p distribution
    return round4(percentile(minPs, alpha));
}
|
|
160
|
+
/**
 * The full gate. Produces the keep/discard/pending verdict for one experiment,
 * tested against the FWER-adjusted threshold for a family of
 * `nFamilyExperiments`. Decision rule:
 *   - PENDING  if no task has >= minRunsPerArm in both arms (not enough data).
 *   - KEEP     if ciLow > 0 AND pValue <= alphaAdjusted (real, significant gain).
 *   - DISCARD  otherwise.
 *
 * The returned object maps directly onto ExperimentLedger.decide()'s
 * DecisionUpdate (decision/pValue/ciLow/ciHigh/fwerAdjusted/nRuns/reason).
 *
 * Notes on the returned counts: `nRuns` totals the runs of EVERY task passed
 * in, including tasks filtered out for having too few runs; `nTasks` is the
 * number of usable tasks (or of all tasks in the PENDING case).
 *
 * @param tasks Array of objects exposing `baseScores` and `candScores` arrays.
 * @param opts  Optional settings: `alpha` (default 0.05), `nFamilyExperiments`
 *              (default 1), `minRunsPerArm` (default 2), `rng` or `seed` for
 *              the random source (a seeded mulberry32 by default), `ci`,
 *              `bootstrapIterations`, `permutationIterations`.
 * @returns The verdict object described above.
 */
export function decideExperiment(tasks, opts = {}) {
    const alpha = opts.alpha ?? 0.05;
    const nFamily = opts.nFamilyExperiments ?? 1;
    const minRuns = opts.minRunsPerArm ?? 2;
    const rng = opts.rng ?? mulberry32(opts.seed ?? DEFAULT_SEED);
    const usable = tasks.filter(t => t.baseScores.length >= minRuns && t.candScores.length >= minRuns);
    const nRuns = tasks.reduce((s, t) => s + t.baseScores.length + t.candScores.length, 0);
    if (usable.length === 0) {
        return {
            decision: 'pending',
            effect: round4(aggregateEffect(tasks)),
            fwerAdjusted: false,
            nRuns,
            nTasks: tasks.length,
            reason: `insufficient data: no task has >= ${minRuns} runs in both arms`,
        };
    }
    // All three tests share one RNG stream and run in a fixed order
    // (bootstrap, permutation, FWER simulation) so a given seed reproduces
    // the same verdict.
    const { ciLow, ciHigh, effect } = bootstrapCI(usable, { iterations: opts.bootstrapIterations, ci: opts.ci, rng });
    const pValue = permutationPValue(usable, { iterations: opts.permutationIterations, rng });
    const alphaAdjusted = mcFwerThreshold(alpha, nFamily, { rng });
    const ciExcludesZero = ciLow > 0;
    const significant = pValue <= alphaAdjusted;
    const keep = ciExcludesZero && significant;
    // Report the CI level actually used (bootstrapCI defaults to 0.95) rather
    // than a hard-coded "95%", which was wrong whenever `opts.ci` was set.
    const ciPercent = round4((opts.ci ?? 0.95) * 100);
    const reason = keep
        ? `keep: effect +${effect} (${ciPercent}% CI [${ciLow}, ${ciHigh}] excludes 0), p=${pValue} <= alpha_adj=${alphaAdjusted} (N=${nFamily})`
        : `discard: ${!ciExcludesZero ? `CI [${ciLow}, ${ciHigh}] includes 0` : `p=${pValue} > alpha_adj=${alphaAdjusted} (N=${nFamily})`}`;
    return {
        decision: keep ? 'keep' : 'discard',
        effect,
        pValue,
        ciLow,
        ciHigh,
        fwerAdjusted: true,
        alphaAdjusted,
        nRuns,
        nTasks: usable.length,
        reason,
    };
}
|
|
210
|
+
//# sourceMappingURL=AutoResearchStats.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"AutoResearchStats.js","sourceRoot":"","sources":["../../src/training/AutoResearchStats.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA4BG;AAKH,4EAA4E;AAC5E,MAAM,UAAU,UAAU,CAAC,IAAY;IACrC,IAAI,CAAC,GAAG,IAAI,KAAK,CAAC,CAAC;IACnB,OAAO;QACL,CAAC,IAAI,CAAC,CAAC;QAAC,CAAC,GAAG,CAAC,CAAC,GAAG,UAAU,CAAC,GAAG,CAAC,CAAC;QACjC,IAAI,CAAC,GAAG,IAAI,CAAC,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,EAAE,CAAC,GAAG,CAAC,CAAC,CAAC;QACzC,CAAC,GAAG,CAAC,CAAC,GAAG,IAAI,CAAC,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;QAC/C,OAAO,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,CAAC,KAAK,CAAC,CAAC,GAAG,UAAU,CAAC;IAC/C,CAAC,CAAC;AACJ,CAAC;AAyCD,MAAM,YAAY,GAAG,UAAU,CAAC;AAEhC,SAAS,IAAI,CAAC,EAAY;IACxB,IAAI,EAAE,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IAC9B,OAAO,EAAE,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC,GAAG,EAAE,CAAC,MAAM,CAAC;AACnD,CAAC;AAED,SAAS,MAAM,CAAC,CAAS,IAAY,OAAO,IAAI,CAAC,KAAK,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,KAAK,CAAC,CAAC,CAAC;AAE5E,sDAAsD;AACtD,SAAS,QAAQ,CAAC,EAAY,EAAE,GAAQ;IACtC,MAAM,CAAC,GAAG,EAAE,CAAC,MAAM,CAAC;IACpB,MAAM,GAAG,GAAG,IAAI,KAAK,CAAS,CAAC,CAAC,CAAC;IACjC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,EAAE;QAAE,GAAG,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,GAAG,EAAE,GAAG,CAAC,CAAC,GAAG,CAAC,CAAE,CAAC;IAC1D,OAAO,GAAG,CAAC;AACb,CAAC;AAED,4DAA4D;AAC5D,SAAS,OAAO,CAAI,EAAO,EAAE,GAAQ;IACnC,KAAK,IAAI,CAAC,GAAG,EAAE,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;QACvC,MAAM,CAAC,GAAG,CAAC,GAAG,EAAE,GAAG,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;QAChC,MAAM,GAAG,GAAG,EAAE,CAAC,CAAC,CAAE,CAAC;QAAC,EAAE,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,CAAE,CAAC;QAAC,EAAE,CAAC,CAAC,CAAC,GAAG,GAAG,CAAC;IAClD,CAAC;AACH,CAAC;AAED,SAAS,UAAU,CAAC,MAAgB,EAAE,CAAS;IAC7C,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IAClC,MAAM,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,MAAM
,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;IAC1F,OAAO,MAAM,CAAC,GAAG,CAAE,CAAC;AACtB,CAAC;AAED,6EAA6E;AAC7E,MAAM,UAAU,eAAe,CAAC,KAAiB;IAC/C,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IACjC,OAAO,IAAI,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC,CAAC,UAAU,CAAC,GAAG,IAAI,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;AACvE,CAAC;AAED;;;GAGG;AACH,MAAM,UAAU,WAAW,CACzB,KAAiB,EACjB,IAAoD;IAEpD,MAAM,UAAU,GAAG,IAAI,CAAC,UAAU,IAAI,IAAI,CAAC;IAC3C,MAAM,EAAE,GAAG,IAAI,CAAC,EAAE,IAAI,IAAI,CAAC;IAC3B,MAAM,KAAK,GAAa,EAAE,CAAC;IAC3B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,UAAU,EAAE,CAAC,EAAE,EAAE,CAAC;QACpC,MAAM,UAAU,GAAG,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC,UAAU,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,GAAG,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC,UAAU,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QACnH,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC,CAAC;IAC/B,CAAC;IACD,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;IAC5B,MAAM,IAAI,GAAG,CAAC,CAAC,GAAG,EAAE,CAAC,GAAG,CAAC,CAAC;IAC1B,OAAO;QACL,KAAK,EAAE,MAAM,CAAC,UAAU,CAAC,KAAK,EAAE,IAAI,CAAC,CAAC;QACtC,MAAM,EAAE,MAAM,CAAC,UAAU,CAAC,KAAK,EAAE,CAAC,GAAG,IAAI,CAAC,CAAC;QAC3C,MAAM,EAAE,MAAM,CAAC,eAAe,CAAC,KAAK,CAAC,CAAC;KACvC,CAAC;AACJ,CAAC;AAED;;;;;;GAMG;AACH,MAAM,UAAU,iBAAiB,CAC/B,KAAiB,EACjB,IAAuC;IAEvC,MAAM,UAAU,GAAG,IAAI,CAAC,UAAU,IAAI,IAAI,CAAC;IAC3C,MAAM,QAAQ,GAAG,eAAe,CAAC,KAAK,CAAC,CAAC;IACxC,IAAI,gBAAgB,GAAG,CAAC,CAAC;IACzB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,UAAU,EAAE,CAAC,EAAE,EAAE,CAAC;QACpC,MAAM,UAAU,GAAG,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE;YAC/B,MAAM,MAAM,GAAG,CAAC,GAAG,CAAC,CAAC,UAAU,EAAE,GAAG,CAAC,CAAC,UAAU,CAAC,CAAC;YAClD,OAAO,CAAC,MAAM,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC;YAC1B,MAAM,EAAE,GAAG,CAAC,CAAC,UAAU,CAAC,MAAM,CAAC;YAC/B,MAAM,QAAQ,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;YACrC,MAAM,QAAQ,GAAG,MAAM,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC;YAClC,OAAO,IAAI,CAAC,QAAQ,CAAC,GAAG,IAAI,CAAC,QAAQ,CAAC,CAAC;QACzC,CAAC,CAAC,CAAC;QACH,IAAI,IAAI,CAAC,UAAU,CAAC,IAAI,QAAQ;YAAE,gB
AAgB,EAAE,CAAC;IACvD,CAAC;IACD,OAAO,MAAM,CAAC,CAAC,gBAAgB,GAAG,CAAC,CAAC,GAAG,CAAC,UAAU,GAAG,CAAC,CAAC,CAAC,CAAC;AAC3D,CAAC;AAED;;;;GAIG;AACH,MAAM,UAAU,cAAc,CAAC,KAAa,EAAE,YAAoB;IAChE,MAAM,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,YAAY,CAAC,CAAC;IACpC,OAAO,MAAM,CAAC,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,GAAG,KAAK,EAAE,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;AAChD,CAAC;AAED;;;;;;;;;GASG;AACH,MAAM,UAAU,eAAe,CAC7B,KAAa,EACb,YAAoB,EACpB,IAAuC;IAEvC,MAAM,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,YAAY,CAAC,CAAC;IACpC,IAAI,CAAC,KAAK,CAAC;QAAE,OAAO,MAAM,CAAC,KAAK,CAAC,CAAC;IAClC,MAAM,UAAU,GAAG,IAAI,CAAC,UAAU,IAAI,IAAI,CAAC;IAC3C,MAAM,KAAK,GAAa,EAAE,CAAC;IAC3B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,UAAU,EAAE,CAAC,EAAE,EAAE,CAAC;QACpC,IAAI,IAAI,GAAG,CAAC,CAAC;QACb,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;YAC3B,MAAM,CAAC,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC,CAAC,8BAA8B;YACpD,IAAI,CAAC,GAAG,IAAI;gBAAE,IAAI,GAAG,CAAC,CAAC;QACzB,CAAC;QACD,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IACnB,CAAC;IACD,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;IAC5B,+DAA+D;IAC/D,OAAO,MAAM,CAAC,UAAU,CAAC,KAAK,EAAE,KAAK,CAAC,CAAC,CAAC;AAC1C,CAAC;AAED;;;;;;;;;;GAUG;AACH,MAAM,UAAU,gBAAgB,CAAC,KAAiB,EAAE,OAAoB,EAAE;IACxE,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,IAAI,IAAI,CAAC;IACjC,MAAM,OAAO,GAAG,IAAI,CAAC,kBAAkB,IAAI,CAAC,CAAC;IAC7C,MAAM,OAAO,GAAG,IAAI,CAAC,aAAa,IAAI,CAAC,CAAC;IACxC,MAAM,GAAG,GAAG,IAAI,CAAC,GAAG,IAAI,UAAU,CAAC,IAAI,CAAC,IAAI,IAAI,YAAY,CAAC,CAAC;IAE9D,MAAM,MAAM,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,UAAU,CAAC,MAAM,IAAI,OAAO,IAAI,CAAC,CAAC,UAAU,CAAC,MAAM,IAAI,OAAO,CAAC,CAAC;IACnG,MAAM,KAAK,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,UAAU,CAAC,MAAM,GAAG,CAAC,CAAC,UAAU,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;IAEvF,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QACxB,OAAO;YACL,QAAQ,EAAE,SAAS;YACnB,MAAM,EAAE,MAAM,CAAC,eAAe,CAAC,KAAK,CAAC,CAAC;YACtC,YAAY,EAAE,KAAK;YACnB,KAAK;YACL,MAAM,EAAE,KAAK,CAAC,MAAM;YACpB,MAAM,EAAE,qCAAqC,OAAO,oBAAo
B;SACzE,CAAC;IACJ,CAAC;IAED,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,MAAM,EAAE,GAAG,WAAW,CAAC,MAAM,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,mBAAmB,EAAE,EAAE,EAAE,IAAI,CAAC,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;IAClH,MAAM,MAAM,GAAG,iBAAiB,CAAC,MAAM,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,qBAAqB,EAAE,GAAG,EAAE,CAAC,CAAC;IAC1F,MAAM,aAAa,GAAG,eAAe,CAAC,KAAK,EAAE,OAAO,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;IAE/D,MAAM,cAAc,GAAG,KAAK,GAAG,CAAC,CAAC;IACjC,MAAM,WAAW,GAAG,MAAM,IAAI,aAAa,CAAC;IAC5C,MAAM,IAAI,GAAG,cAAc,IAAI,WAAW,CAAC;IAE3C,MAAM,MAAM,GAAG,IAAI;QACjB,CAAC,CAAC,iBAAiB,MAAM,aAAa,KAAK,KAAK,MAAM,oBAAoB,MAAM,iBAAiB,aAAa,OAAO,OAAO,GAAG;QAC/H,CAAC,CAAC,YAAY,CAAC,cAAc,CAAC,CAAC,CAAC,OAAO,KAAK,KAAK,MAAM,cAAc,CAAC,CAAC,CAAC,KAAK,MAAM,gBAAgB,aAAa,OAAO,OAAO,GAAG,EAAE,CAAC;IAEtI,OAAO;QACL,QAAQ,EAAE,IAAI,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,SAAS;QACnC,MAAM;QACN,MAAM;QACN,KAAK;QACL,MAAM;QACN,YAAY,EAAE,IAAI;QAClB,aAAa;QACb,KAAK;QACL,MAAM,EAAE,MAAM,CAAC,MAAM;QACrB,MAAM;KACP,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1,177 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* BenchRunner — the missing GRADER that produces REAL scored matrix records.
|
|
3
|
+
*
|
|
4
|
+
* The orchestrator's auto-record (MODEL_ROUTER_RECORD) writes a liveness STUB
|
|
5
|
+
* (`qualitativeScore = hasText ? 75 : 0`) — fine for "is the model alive", useless
|
|
6
|
+
* for "did the candidate harness get better". The auto-research decision layer
|
|
7
|
+
* consumes `qualitativeScore` as the per-run signal, so without a real grader
|
|
8
|
+
* every base/candidate comparison is a flat tie → the gate always says discard.
|
|
9
|
+
*
|
|
10
|
+
* This module runs a TASK SET through the harness and grades each run with a
|
|
11
|
+
* deterministic (or LLM-judge) verifier, writing the REAL pass/qualitativeScore
|
|
12
|
+
* to `router-matrix.jsonl` under a given experimentTag/split. The CLI
|
|
13
|
+
* (`cortex autoresearch bench`) wires a concrete HarnessRunner; here everything
|
|
14
|
+
* is pure + injectable so it unit-tests with no network.
|
|
15
|
+
*
|
|
16
|
+
* FLOW: orchestrator (nexus side) runs this in the base worktree (→ records under
|
|
17
|
+
* harnessRef=base) and the candidate worktree (→ harnessRef=candidate), then calls
|
|
18
|
+
* `cortex autoresearch evaluate --base … --candidate …` which compares them.
|
|
19
|
+
* One bench run = one harness build; the base/candidate axis is the git ref the
|
|
20
|
+
* record is auto-stamped with (override via opts.harnessRef for single-box tests).
|
|
21
|
+
*/
|
|
22
|
+
import { ModelRouterMatrix } from './ModelRouterMatrix.js';
|
|
23
|
+
import type { NewDeficiency } from './ResearchBacklog.js';
|
|
24
|
+
export type Verifier =
|
|
25
|
+
/** output, normalized, must equal `expected` exactly. */
|
|
26
|
+
{
|
|
27
|
+
type: 'exact';
|
|
28
|
+
expected: string;
|
|
29
|
+
normalize?: boolean;
|
|
30
|
+
}
|
|
31
|
+
/** `pattern` (RegExp) must match somewhere in the output. */
|
|
32
|
+
| {
|
|
33
|
+
type: 'regex';
|
|
34
|
+
pattern: string;
|
|
35
|
+
flags?: string;
|
|
36
|
+
}
|
|
37
|
+
/** every string in `all` must appear — PARTIAL CREDIT: score = found/total×100.
|
|
38
|
+
* This is the workhorse: graded continuous scores (not just pass/fail) give the
|
|
39
|
+
* bootstrap/permutation gate real signal to separate base from candidate. */
|
|
40
|
+
| {
|
|
41
|
+
type: 'contains';
|
|
42
|
+
all: string[];
|
|
43
|
+
caseInsensitive?: boolean;
|
|
44
|
+
}
|
|
45
|
+
/** delegated to an injected judge fn (e.g. the deepseek helper). */
|
|
46
|
+
| {
|
|
47
|
+
type: 'llm-judge';
|
|
48
|
+
rubric: string;
|
|
49
|
+
}
|
|
50
|
+
/** Extract a NUMBER from the output and score it — the continuous-metric path for
|
|
51
|
+
* non-cortex targets (ROI, latency, accuracy, tour length, …). `extract` is a regex
|
|
52
|
+
* whose capture group 1 (or whole match) is the number; default = the LAST number in
|
|
53
|
+
* the output (evals usually print the metric last). `direction` orients "better".
|
|
54
|
+
* `best`/`worst` linearly map value→0-100 (omit → the raw oriented value is the score;
|
|
55
|
+
* the gate is relative either way). `target` sets the pass threshold (>= for maximize,
|
|
56
|
+
* <= for minimize); omit → any extracted number passes, so a crashed/non-numeric run
|
|
57
|
+
* fails (score 0) and seeds the backlog. */
|
|
58
|
+
| {
|
|
59
|
+
type: 'numeric';
|
|
60
|
+
direction: 'maximize' | 'minimize';
|
|
61
|
+
extract?: string;
|
|
62
|
+
best?: number;
|
|
63
|
+
worst?: number;
|
|
64
|
+
target?: number;
|
|
65
|
+
};
|
|
66
|
+
export interface TaskSpec {
|
|
67
|
+
id: string;
|
|
68
|
+
prompt: string;
|
|
69
|
+
verifier: Verifier;
|
|
70
|
+
/** T1–T5; if omitted, classifyTask(prompt) decides. */
|
|
71
|
+
taskType?: string;
|
|
72
|
+
}
|
|
73
|
+
/** Optional LLM judge — injected so core stays network-free. */
|
|
74
|
+
export type JudgeFn = (output: string, rubric: string) => Promise<{
|
|
75
|
+
pass: boolean;
|
|
76
|
+
qualitativeScore: number;
|
|
77
|
+
}>;
|
|
78
|
+
export interface GradeResult {
|
|
79
|
+
pass: boolean;
|
|
80
|
+
/** 0–100. Continuous where possible (partial credit) so the gate can separate arms. */
|
|
81
|
+
qualitativeScore: number;
|
|
82
|
+
detail?: string;
|
|
83
|
+
}
|
|
84
|
+
/**
|
|
85
|
+
* Grade one model output against a verifier. Pure for the deterministic types;
|
|
86
|
+
* `contains` gives partial credit. `llm-judge` requires an injected judge.
|
|
87
|
+
*/
|
|
88
|
+
export declare function gradeRun(output: string, verifier: Verifier, judge?: JudgeFn): Promise<GradeResult>;
|
|
89
|
+
export interface HarnessRunResult {
|
|
90
|
+
text: string;
|
|
91
|
+
modelId?: string;
|
|
92
|
+
inputTokens: number;
|
|
93
|
+
outputTokens: number;
|
|
94
|
+
toolCallCount: number;
|
|
95
|
+
latencyMs: number;
|
|
96
|
+
}
|
|
97
|
+
export interface HarnessRunner {
|
|
98
|
+
run(prompt: string, opts?: {
|
|
99
|
+
model?: string;
|
|
100
|
+
}): Promise<HarnessRunResult>;
|
|
101
|
+
}
|
|
102
|
+
/**
|
|
103
|
+
* Deterministic backlog seeding sink. `ResearchBacklog` satisfies this directly
|
|
104
|
+
* (its `add(d: NewDeficiency)`); injected (not imported) so `runBench` stays pure
|
|
105
|
+
* and fs/network-free for unit tests.
|
|
106
|
+
*/
|
|
107
|
+
export interface DeficiencySink {
|
|
108
|
+
add(d: NewDeficiency): unknown;
|
|
109
|
+
}
|
|
110
|
+
export interface RunBenchOptions {
|
|
111
|
+
experimentTag: string;
|
|
112
|
+
runs?: number;
|
|
113
|
+
split?: 'train' | 'holdout';
|
|
114
|
+
modelId?: string;
|
|
115
|
+
benchmarkSource?: string;
|
|
116
|
+
/** override the auto-stamped git SHA (single-box base/candidate simulation). */
|
|
117
|
+
harnessRef?: string;
|
|
118
|
+
judge?: JudgeFn;
|
|
119
|
+
/** progress callback (one per graded run). */
|
|
120
|
+
onRun?: (info: {
|
|
121
|
+
taskId: string;
|
|
122
|
+
run: number;
|
|
123
|
+
pass: boolean;
|
|
124
|
+
qualitativeScore: number;
|
|
125
|
+
}) => void;
|
|
126
|
+
/**
|
|
127
|
+
* Deterministic backlog seeding. When provided, any task whose pass-rate < 1 across
|
|
128
|
+
* its runs idempotently seeds a deficiency here — so a failing verifier records a
|
|
129
|
+
* harness weakness even if the model never calls the ResearchBacklog tool. Confidence
|
|
130
|
+
* scales with failure consistency × run count, so a flaky one-off lands low-priority
|
|
131
|
+
* (and triage's confidence weighting sinks it) rather than as a false positive. Omit
|
|
132
|
+
* the sink ⇒ no seeding (unchanged behavior). Only the `train` split seeds — a holdout
|
|
133
|
+
* failure is verification signal for a specific fix, not a newly-discovered deficiency.
|
|
134
|
+
*/
|
|
135
|
+
backlog?: DeficiencySink;
|
|
136
|
+
/** Provenance stamped onto seeded deficiencies (e.g. the bench round / harness SHA). */
|
|
137
|
+
discoveredRound?: string;
|
|
138
|
+
discoveredRef?: string;
|
|
139
|
+
/** Harness area for seeded deficiencies (ResearchBacklog `bugClass`; default 'Other'). */
|
|
140
|
+
deficiencyBugClass?: string;
|
|
141
|
+
/**
|
|
142
|
+
* Effectiveness-layer arm identity. When the auto-research PM dispatches a varied
|
|
143
|
+
* arm (a distinct persona/strategy at a chosen temperature), pass them here so each
|
|
144
|
+
* scored record carries the arm — getStrategyScores/recommendStrategy then rank the
|
|
145
|
+
* (model × temperature × strategy) combinations, not just models. Both optional and
|
|
146
|
+
* back-compatible; omit them and records score exactly as before.
|
|
147
|
+
*/
|
|
148
|
+
temperature?: number;
|
|
149
|
+
strategy?: string;
|
|
150
|
+
}
|
|
151
|
+
export interface BenchTaskSummary {
|
|
152
|
+
taskId: string;
|
|
153
|
+
taskFingerprint: string;
|
|
154
|
+
taskType: string;
|
|
155
|
+
runs: number;
|
|
156
|
+
passRate: number;
|
|
157
|
+
meanScore: number;
|
|
158
|
+
}
|
|
159
|
+
export interface BenchSummary {
|
|
160
|
+
experimentTag: string;
|
|
161
|
+
split: 'train' | 'holdout';
|
|
162
|
+
harnessRef?: string;
|
|
163
|
+
totalRuns: number;
|
|
164
|
+
tasks: BenchTaskSummary[];
|
|
165
|
+
/** Number of deficiencies seeded into `opts.backlog` this run (0 when no sink). */
|
|
166
|
+
seededDeficiencies: number;
|
|
167
|
+
}
|
|
168
|
+
/**
|
|
169
|
+
* Run each task `runs` times through `runner`, grade each output, and write a
|
|
170
|
+
* REAL scored BenchmarkRecord to the matrix (harnessRef auto-stamped unless
|
|
171
|
+
* overridden; taskFingerprint = hash of prompt+verifier so it's the stable
|
|
172
|
+
* comparability key the gate joins on).
|
|
173
|
+
*/
|
|
174
|
+
export declare function runBench(tasks: TaskSpec[], runner: HarnessRunner, matrix: ModelRouterMatrix, opts: RunBenchOptions): Promise<BenchSummary>;
|
|
175
|
+
/** Validate a parsed task-set JSON value, throwing on malformed entries. */
|
|
176
|
+
export declare function parseTaskSet(raw: unknown, source?: string): TaskSpec[];
|
|
177
|
+
//# sourceMappingURL=BenchRunner.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"BenchRunner.d.ts","sourceRoot":"","sources":["../../src/training/BenchRunner.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;GAoBG;AAEH,OAAO,EAAE,iBAAiB,EAAE,MAAM,wBAAwB,CAAC;AAE3D,OAAO,KAAK,EAAE,aAAa,EAAY,MAAM,sBAAsB,CAAC;AAMpE,MAAM,MAAM,QAAQ;AAClB,yDAAyD;AACvD;IAAE,IAAI,EAAE,OAAO,CAAC;IAAC,QAAQ,EAAE,MAAM,CAAC;IAAC,SAAS,CAAC,EAAE,OAAO,CAAA;CAAE;AAC1D,6DAA6D;GAC3D;IAAE,IAAI,EAAE,OAAO,CAAC;IAAC,OAAO,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAE;AACpD;;8EAE8E;GAC5E;IAAE,IAAI,EAAE,UAAU,CAAC;IAAC,GAAG,EAAE,MAAM,EAAE,CAAC;IAAC,eAAe,CAAC,EAAE,OAAO,CAAA;CAAE;AAChE,oEAAoE;GAClE;IAAE,IAAI,EAAE,WAAW,CAAC;IAAC,MAAM,EAAE,MAAM,CAAA;CAAE;AACvC;;;;;;;6CAO6C;GAC3C;IAAE,IAAI,EAAE,SAAS,CAAC;IAAC,SAAS,EAAE,UAAU,GAAG,UAAU,CAAC;IAAC,OAAO,CAAC,EAAE,MAAM,CAAC;IAAC,IAAI,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAC;IAAC,MAAM,CAAC,EAAE,MAAM,CAAA;CAAE,CAAC;AAE9H,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,MAAM,CAAC;IACf,QAAQ,EAAE,QAAQ,CAAC;IACnB,uDAAuD;IACvD,QAAQ,CAAC,EAAE,MAAM,CAAC;CACnB;AAED,gEAAgE;AAChE,MAAM,MAAM,OAAO,GAAG,CAAC,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,KAAK,OAAO,CAAC;IAAE,IAAI,EAAE,OAAO,CAAC;IAAC,gBAAgB,EAAE,MAAM,CAAA;CAAE,CAAC,CAAC;AAE/G,MAAM,WAAW,WAAW;IAC1B,IAAI,EAAE,OAAO,CAAC;IACd,uFAAuF;IACvF,gBAAgB,EAAE,MAAM,CAAC;IACzB,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAMD;;;GAGG;AACH,wBAAsB,QAAQ,CAAC,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,KAAK,CAAC,EAAE,OAAO,GAAG,OAAO,CAAC,WAAW,CAAC,CA2DxG;AAMD,MAAM,WAAW,gBAAgB;IAC/B,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,WAAW,EAAE,MAAM,CAAC;IACpB,YAAY,EAAE,MAAM,CAAC;IACrB,aAAa,EAAE,MAAM,CAAC;IACtB,SAAS,EAAE,MAAM,CAAC;CACnB;AAED,MAAM,WAAW,aAAa;IAC5B,GAAG,CAAC,MAAM,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE;QAAE,KAAK,CAAC,EAAE,MAAM,CAAA;KAAE,GAAG,OAAO,CAAC,gBAAgB,CAAC,CAAC;CAC3E;AAED;;;;GAIG;AACH,MAAM,WAAW,cAAc;IAC7B,GAAG,CAAC,CAAC,EAAE,aAAa,GAAG,OAAO,CAAC;CAChC;AAMD,MAAM,WAAW,eAAe;IAC9B,aAAa,EAAE,MAAM,CAAC;IACtB,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,KAAK,CAAC,EAAE,OAAO,GAAG,SAAS,CAAC;IAC5B,OAAO,CAAC,EAAE,MAAM,CAAC;IA
CjB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,gFAAgF;IAChF,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,KAAK,CAAC,EAAE,OAAO,CAAC;IAChB,8CAA8C;IAC9C,KAAK,CAAC,EAAE,CAAC,IAAI,EAAE;QAAE,MAAM,EAAE,MAAM,CAAC;QAAC,GAAG,EAAE,MAAM,CAAC;QAAC,IAAI,EAAE,OAAO,CAAC;QAAC,gBAAgB,EAAE,MAAM,CAAA;KAAE,KAAK,IAAI,CAAC;IACjG;;;;;;;;OAQG;IACH,OAAO,CAAC,EAAE,cAAc,CAAC;IACzB,wFAAwF;IACxF,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,0FAA0F;IAC1F,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAC5B;;;;;;OAMG;IACH,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,QAAQ,CAAC,EAAE,MAAM,CAAC;CACnB;AAED,MAAM,WAAW,gBAAgB;IAC/B,MAAM,EAAE,MAAM,CAAC;IACf,eAAe,EAAE,MAAM,CAAC;IACxB,QAAQ,EAAE,MAAM,CAAC;IACjB,IAAI,EAAE,MAAM,CAAC;IACb,QAAQ,EAAE,MAAM,CAAC;IACjB,SAAS,EAAE,MAAM,CAAC;CACnB;AAED,MAAM,WAAW,YAAY;IAC3B,aAAa,EAAE,MAAM,CAAC;IACtB,KAAK,EAAE,OAAO,GAAG,SAAS,CAAC;IAC3B,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,SAAS,EAAE,MAAM,CAAC;IAClB,KAAK,EAAE,gBAAgB,EAAE,CAAC;IAC1B,mFAAmF;IACnF,kBAAkB,EAAE,MAAM,CAAC;CAC5B;AAED;;;;;GAKG;AACH,wBAAsB,QAAQ,CAC5B,KAAK,EAAE,QAAQ,EAAE,EACjB,MAAM,EAAE,aAAa,EACrB,MAAM,EAAE,iBAAiB,EACzB,IAAI,EAAE,eAAe,GACpB,OAAO,CAAC,YAAY,CAAC,CA8FvB;AAED,4EAA4E;AAC5E,wBAAgB,YAAY,CAAC,GAAG,EAAE,OAAO,EAAE,MAAM,SAAe,GAAG,QAAQ,EAAE,CAe5E"}
|
|
@@ -0,0 +1,211 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* BenchRunner — the missing GRADER that produces REAL scored matrix records.
|
|
3
|
+
*
|
|
4
|
+
* The orchestrator's auto-record (MODEL_ROUTER_RECORD) writes a liveness STUB
|
|
5
|
+
* (`qualitativeScore = hasText ? 75 : 0`) — fine for "is the model alive", useless
|
|
6
|
+
* for "did the candidate harness get better". The auto-research decision layer
|
|
7
|
+
* consumes `qualitativeScore` as the per-run signal, so without a real grader
|
|
8
|
+
* every base/candidate comparison is a flat tie → the gate always says discard.
|
|
9
|
+
*
|
|
10
|
+
* This module runs a TASK SET through the harness and grades each run with a
|
|
11
|
+
* deterministic (or LLM-judge) verifier, writing the REAL pass/qualitativeScore
|
|
12
|
+
* to `router-matrix.jsonl` under a given experimentTag/split. The CLI
|
|
13
|
+
* (`cortex autoresearch bench`) wires a concrete HarnessRunner; here everything
|
|
14
|
+
* is pure + injectable so it unit-tests with no network.
|
|
15
|
+
*
|
|
16
|
+
* FLOW: orchestrator (nexus side) runs this in the base worktree (→ records under
|
|
17
|
+
* harnessRef=base) and the candidate worktree (→ harnessRef=candidate), then calls
|
|
18
|
+
* `cortex autoresearch evaluate --base … --candidate …` which compares them.
|
|
19
|
+
* One bench run = one harness build; the base/candidate axis is the git ref the
|
|
20
|
+
* record is auto-stamped with (override via opts.harnessRef for single-box tests).
|
|
21
|
+
*/
|
|
22
|
+
import { ModelRouterMatrix } from './ModelRouterMatrix.js';
|
|
23
|
+
import { classifyTask } from './TaskClassifier.js';
|
|
24
|
+
/**
 * Canonicalize text for lenient comparison: every run of whitespace becomes a
 * single space, the ends are trimmed, and the result is lower-cased.
 */
function normalizeWs(s) {
    // Splitting on whitespace runs and re-joining with one space is the same
    // as replacing each run with a single space.
    const collapsed = s.split(/\s+/).join(' ');
    const trimmed = collapsed.trim();
    return trimmed.toLowerCase();
}
|
|
27
|
+
/**
 * Grade one model output against a verifier.
 *
 * Verifier behavior:
 * - `exact`: trimmed equality with `expected` (with `normalize`, both sides go
 *   through `normalizeWs` first). Score is 100 or 0.
 * - `regex`: `pattern`/`flags` must match somewhere in the output. Score is 100 or 0.
 * - `contains`: partial credit, score = found/total×100; passes only when every
 *   needle is present. An empty `all` list is vacuously satisfied and scores
 *   100, so `pass` and `qualitativeScore` never disagree.
 * - `llm-judge`: delegated to the injected `judge`; its result is returned as-is.
 * - `numeric`: extracts a number (capture group 1 or whole match of `extract`,
 *   otherwise the LAST number in the output), orients it so higher is better,
 *   and either maps [worst, best] linearly onto [0, 100] or uses the raw
 *   oriented value as the score. `target` (when set) decides `pass`.
 *
 * @param output   Text produced by the run being graded.
 * @param verifier Verifier spec; `verifier.type` selects the grading rule.
 * @param judge    Optional judge function, required only for `llm-judge`.
 * @returns `{ pass, qualitativeScore, detail? }`.
 * @throws Error when `llm-judge` is used without a judge or the verifier type
 *   is unknown; `new RegExp` throws SyntaxError for an invalid pattern/flags.
 */
export async function gradeRun(output, verifier, judge) {
    switch (verifier.type) {
        case 'exact': {
            const a = verifier.normalize ? normalizeWs(output) : output.trim();
            const b = verifier.normalize ? normalizeWs(verifier.expected) : verifier.expected.trim();
            const pass = a === b;
            return { pass, qualitativeScore: pass ? 100 : 0 };
        }
        case 'regex': {
            // A fresh RegExp per call means `g`/`y` flags cannot leak lastIndex between runs.
            const re = new RegExp(verifier.pattern, verifier.flags);
            const pass = re.test(output);
            return { pass, qualitativeScore: pass ? 100 : 0 };
        }
        case 'contains': {
            const hay = verifier.caseInsensitive ? output.toLowerCase() : output;
            const needles = verifier.all.map(n => (verifier.caseInsensitive ? n.toLowerCase() : n));
            const found = needles.filter(n => hay.includes(n)).length;
            const total = needles.length;
            // No needles: nothing can be missing, so the run passes with full
            // credit (previously this reported pass=true alongside a score of 0).
            const qualitativeScore = total === 0 ? 100 : Math.round((found / total) * 100);
            return { pass: found === total, qualitativeScore, detail: `${found}/${total} matched` };
        }
        case 'llm-judge': {
            if (!judge)
                throw new Error("gradeRun: verifier type 'llm-judge' requires an injected JudgeFn");
            return judge(output, verifier.rubric);
        }
        case 'numeric': {
            let value = NaN;
            if (verifier.extract) {
                const m = output.match(new RegExp(verifier.extract));
                if (m)
                    value = parseFloat(m[1] ?? m[0]);
            }
            else {
                // Default: the last number printed in the output.
                const all = output.match(/-?\d+(?:\.\d+)?(?:[eE][-+]?\d+)?/g);
                if (all && all.length)
                    value = parseFloat(all[all.length - 1]);
            }
            if (!Number.isFinite(value)) {
                return { pass: false, qualitativeScore: 0, detail: 'numeric: no number extracted' };
            }
            // Orient so higher = better, then optionally linear-map [worst,best] → [0,100].
            const minimize = verifier.direction === 'minimize';
            const oriented = minimize ? -value : value;
            let score;
            if (verifier.best != null && verifier.worst != null) {
                const bestO = minimize ? -verifier.best : verifier.best;
                const worstO = minimize ? -verifier.worst : verifier.worst;
                score = bestO === worstO
                    ? (oriented >= bestO ? 100 : 0) // degenerate range: step function at `best`
                    : Math.max(0, Math.min(100, ((oriented - worstO) / (bestO - worstO)) * 100));
            }
            else {
                score = oriented; // raw oriented value; the gate compares base vs candidate relatively
            }
            const pass = verifier.target == null
                ? true
                : (minimize ? value <= verifier.target : value >= verifier.target);
            // `+ 0` turns a negative zero (e.g. minimize with value 0) into plain 0.
            const qualitativeScore = Math.round(score * 100) / 100 + 0;
            return { pass, qualitativeScore, detail: `value=${value}` };
        }
        default: {
            const _exhaustive = verifier;
            throw new Error(`gradeRun: unknown verifier ${JSON.stringify(_exhaustive)}`);
        }
    }
}
|
|
96
|
+
/**
 * Run each task `runs` times through `runner`, grade each output, and write a
 * REAL scored BenchmarkRecord to the matrix (harnessRef auto-stamped unless
 * overridden; taskFingerprint = hash of prompt+verifier so it's the stable
 * comparability key the gate joins on).
 *
 * Per-task aggregates are computed over the runs that actually executed, so a
 * zero, fractional, or NaN `opts.runs` can never yield NaN or a pass-rate above
 * 1; a task with no executed runs reports passRate/meanScore 0 and seeds nothing.
 *
 * @param tasks  Task specs to benchmark (prompt + verifier, optional taskType).
 * @param runner Harness runner; `run(prompt, { model })` is awaited once per run.
 * @param matrix Matrix receiving one `record(...)` call per graded run.
 * @param opts   Bench options: `experimentTag`, `runs` (default 2), `split`
 *   (default 'train'), optional `judge`, `onRun` progress callback, `backlog`
 *   sink, and provenance/arm fields copied onto records and deficiencies.
 * @returns Summary with per-task pass-rate/mean-score, total run count and the
 *   number of deficiencies seeded into `opts.backlog`.
 * @throws Whatever `runner.run`, `gradeRun`, `matrix.record` or `opts.onRun`
 *   throw; only errors from `opts.backlog.add` are suppressed.
 */
export async function runBench(tasks, runner, matrix, opts) {
    const runs = opts.runs ?? 2;
    const split = opts.split ?? 'train';
    const taskSummaries = [];
    let totalRuns = 0;
    let seededDeficiencies = 0;
    // Truncate long text for backlog entries (loop-invariant, so defined once).
    const clip = (s, n) => (s.length > n ? s.slice(0, n) + '…' : s);
    for (const task of tasks) {
        const taskType = task.taskType ?? classifyTask(task.prompt).taskType;
        const taskFingerprint = ModelRouterMatrix.fingerprintTask(task.prompt, JSON.stringify(task.verifier));
        let passes = 0;
        let scoreSum = 0;
        let executed = 0; // runs that actually completed for this task
        let sampleFailure;
        let observedModelId = opts.modelId;
        for (let i = 0; i < runs; i++) {
            const res = await runner.run(task.prompt, { model: opts.modelId });
            const grade = await gradeRun(res.text, task.verifier, opts.judge);
            // Keep the first failing output as evidence for the backlog entry.
            if (!grade.pass && sampleFailure === undefined)
                sampleFailure = res.text;
            observedModelId = res.modelId ?? observedModelId;
            passes += grade.pass ? 1 : 0;
            scoreSum += grade.qualitativeScore;
            executed++;
            totalRuns++;
            matrix.record({
                modelId: res.modelId ?? opts.modelId ?? 'unknown',
                taskType,
                toolCallCount: res.toolCallCount,
                inputTokens: res.inputTokens,
                outputTokens: res.outputTokens,
                latencyMs: res.latencyMs,
                pass: grade.pass,
                qualitativeScore: grade.qualitativeScore,
                taskFingerprint,
                experimentTag: opts.experimentTag,
                split,
                benchmarkSource: opts.benchmarkSource,
                ...(opts.harnessRef ? { harnessRef: opts.harnessRef } : {}),
                ...(opts.temperature !== undefined ? { temperature: opts.temperature } : {}),
                ...(opts.strategy ? { strategy: opts.strategy } : {}),
            });
            opts.onRun?.({ taskId: task.id, run: i + 1, pass: grade.pass, qualitativeScore: grade.qualitativeScore });
        }
        // Divide by the executed count, not the requested one, so a zero,
        // fractional or NaN `runs` cannot produce NaN or a rate above 1.
        const passRate = executed > 0 ? Math.round((passes / executed) * 1000) / 1000 : 0;
        const meanScore = executed > 0 ? Math.round((scoreSum / executed) * 100) / 100 : 0;
        // Deterministic backlog seeding: a sub-100% pass-rate is direct evidence of a
        // harness weakness, so seed it here rather than relying on the model to call the
        // ResearchBacklog tool. Idempotent by title (`Bench failure: <taskId>`), so a
        // re-run updates the same record. Confidence = how consistently it failed × how
        // many runs back it, so a flaky one-off (or a possibly-too-strict verifier on a
        // near-miss) sinks in triage instead of registering as a confident false positive.
        // The gate compares raw counts: the rounded passRate can reach 1.0 with a
        // failure still present once the run count is large.
        if (opts.backlog && split !== 'holdout' && passes < executed) {
            const failRate = 1 - passRate;
            const sampleWeight = Math.min(1, executed / 3); // 1 run = weak evidence; ~3+ = solid
            const confidence = Math.round(Math.min(0.9, Math.max(0.25, 0.3 + 0.6 * failRate * sampleWeight)) * 100) / 100;
            const severity = meanScore <= 10 ? 'high' : meanScore < 60 ? 'medium' : 'low';
            try {
                opts.backlog.add({
                    title: `Bench failure: ${task.id}`,
                    description: `Harness failed benchmark task "${task.id}" (${task.verifier.type} verifier). ` +
                        `passRate=${passes}/${executed}, meanScore=${meanScore}. Prompt: ${clip(task.prompt, 200)}`,
                    bugClass: opts.deficiencyBugClass ?? 'Other',
                    severity,
                    impact: 3,
                    effort: 3,
                    confidence,
                    discoveredRound: opts.discoveredRound,
                    discoveredRef: opts.discoveredRef,
                    affectedModels: observedModelId ? [observedModelId] : undefined,
                    affectedTaskFingerprints: [taskFingerprint],
                    // `||` (not `??`) so an empty-string output gets the placeholder too.
                    notes: `taskType=${taskType}; split=${split}; sample output: ${clip(sampleFailure || '(empty output)', 300)}`,
                });
                seededDeficiencies++;
            }
            catch {
                // A backlog write error must never fail the benchmark itself.
            }
        }
        taskSummaries.push({ taskId: task.id, taskFingerprint, taskType, runs: executed, passRate, meanScore });
    }
    return {
        experimentTag: opts.experimentTag,
        split,
        harnessRef: opts.harnessRef,
        totalRuns,
        tasks: taskSummaries,
        seededDeficiencies,
    };
}
|
|
190
|
+
/**
 * Validate a parsed task-set JSON value, throwing on malformed entries.
 *
 * Accepts either an array of task objects or a single task object. Beyond the
 * basic `id` / `prompt` / `verifier.type` checks, the fields each verifier type
 * needs at grading time are validated here, so a broken task set fails at load
 * time with a located message instead of crashing (or silently mis-grading)
 * in the middle of a bench run.
 *
 * @param raw    Parsed JSON value (array of tasks, or one task).
 * @param source Label used as the prefix of error messages (e.g. the file name).
 * @returns One `{ id, prompt, verifier, taskType }` object per entry.
 * @throws Error naming `source[index]` (and the task id once known) for the
 *   first malformed entry.
 */
export function parseTaskSet(raw, source = '<task-set>') {
    const entries = Array.isArray(raw) ? raw : [raw];
    const validTypes = ['exact', 'regex', 'contains', 'llm-judge', 'numeric'];
    return entries.map((t, i) => {
        if (!t || typeof t !== 'object')
            throw new Error(`${source}[${i}]: not an object`);
        const o = t;
        if (typeof o.id !== 'string' || !o.id)
            throw new Error(`${source}[${i}]: missing 'id'`);
        const where = `${source}[${i}] (${o.id})`;
        if (typeof o.prompt !== 'string' || !o.prompt)
            throw new Error(`${where}: missing 'prompt'`);
        if (!o.verifier || typeof o.verifier !== 'object')
            throw new Error(`${where}: missing 'verifier'`);
        const v = o.verifier;
        if (typeof v.type !== 'string' || !validTypes.includes(v.type)) {
            throw new Error(`${where}: verifier.type must be one of ${validTypes.join('|')}`);
        }
        // Compile a user-supplied regex now so a bad pattern is reported with its location.
        const checkRegExp = (field, pattern, flags) => {
            try {
                new RegExp(pattern, flags);
            }
            catch (e) {
                const reason = e instanceof Error ? e.message : String(e);
                throw new Error(`${where}: verifier.${field} is not a valid RegExp (${reason})`);
            }
        };
        switch (v.type) {
            case 'exact':
                if (typeof v.expected !== 'string')
                    throw new Error(`${where}: verifier.expected must be a string`);
                break;
            case 'regex':
                if (typeof v.pattern !== 'string')
                    throw new Error(`${where}: verifier.pattern must be a string`);
                if (v.flags !== undefined && typeof v.flags !== 'string')
                    throw new Error(`${where}: verifier.flags must be a string when present`);
                checkRegExp('pattern', v.pattern, v.flags);
                break;
            case 'contains':
                if (!Array.isArray(v.all) || !v.all.every(n => typeof n === 'string'))
                    throw new Error(`${where}: verifier.all must be an array of strings`);
                break;
            case 'llm-judge':
                if (typeof v.rubric !== 'string')
                    throw new Error(`${where}: verifier.rubric must be a string`);
                break;
            case 'numeric':
                if (v.direction !== 'maximize' && v.direction !== 'minimize')
                    throw new Error(`${where}: verifier.direction must be 'maximize' or 'minimize'`);
                // null is tolerated for the optional fields: grading treats null like "omitted".
                if (v.extract != null) {
                    if (typeof v.extract !== 'string')
                        throw new Error(`${where}: verifier.extract must be a string when present`);
                    checkRegExp('extract', v.extract, undefined);
                }
                for (const key of ['best', 'worst', 'target']) {
                    if (v[key] != null && !(typeof v[key] === 'number' && Number.isFinite(v[key])))
                        throw new Error(`${where}: verifier.${key} must be a finite number when present`);
                }
                break;
        }
        if (o.taskType != null && typeof o.taskType !== 'string')
            throw new Error(`${where}: 'taskType' must be a string when present`);
        return { id: o.id, prompt: o.prompt, verifier: o.verifier, taskType: o.taskType };
    });
}
|
|
211
|
+
//# sourceMappingURL=BenchRunner.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"BenchRunner.js","sourceRoot":"","sources":["../../src/training/BenchRunner.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;GAoBG;AAEH,OAAO,EAAE,iBAAiB,EAAE,MAAM,wBAAwB,CAAC;AAC3D,OAAO,EAAE,YAAY,EAAE,MAAM,qBAAqB,CAAC;AA8CnD,SAAS,WAAW,CAAC,CAAS;IAC5B,OAAO,CAAC,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;AACrD,CAAC;AAED;;;GAGG;AACH,MAAM,CAAC,KAAK,UAAU,QAAQ,CAAC,MAAc,EAAE,QAAkB,EAAE,KAAe;IAChF,QAAQ,QAAQ,CAAC,IAAI,EAAE,CAAC;QACtB,KAAK,OAAO,CAAC,CAAC,CAAC;YACb,MAAM,CAAC,GAAG,QAAQ,CAAC,SAAS,CAAC,CAAC,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,IAAI,EAAE,CAAC;YACnE,MAAM,CAAC,GAAG,QAAQ,CAAC,SAAS,CAAC,CAAC,CAAC,WAAW,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;YACzF,MAAM,IAAI,GAAG,CAAC,KAAK,CAAC,CAAC;YACrB,OAAO,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;QACpD,CAAC;QACD,KAAK,OAAO,CAAC,CAAC,CAAC;YACb,MAAM,EAAE,GAAG,IAAI,MAAM,CAAC,QAAQ,CAAC,OAAO,EAAE,QAAQ,CAAC,KAAK,CAAC,CAAC;YACxD,MAAM,IAAI,GAAG,EAAE,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;YAC7B,OAAO,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;QACpD,CAAC;QACD,KAAK,UAAU,CAAC,CAAC,CAAC;YAChB,MAAM,GAAG,GAAG,QAAQ,CAAC,eAAe,CAAC,CAAC,CAAC,MAAM,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,MAAM,CAAC;YACrE,MAAM,OAAO,GAAG,QAAQ,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,QAAQ,CAAC,eAAe,CAAC,CAAC,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YACxF,MAAM,KAAK,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC;YAC1D,MAAM,KAAK,GAAG,OAAO,CAAC,MAAM,IAAI,CAAC,CAAC;YAClC,MAAM,gBAAgB,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,KAAK,GAAG,KAAK,CAAC,GAAG,GAAG,CAAC,CAAC;YAC3D,OAAO,EAAE,IAAI,EAAE,KAAK,KAAK,OAAO,CAAC,MAAM,EAAE,gBAAgB,EAAE,MAAM,EAAE,GAAG,KAAK,IAAI,OAAO,CAAC,MAAM,UAAU,EAAE,CAAC;QAC5G,CAAC;QACD,KAAK,WAAW,CAAC,CAAC,CAAC;YACjB,IAAI,CAAC,KAAK;gBAAE,MAAM,IAAI,KAAK,CAAC,kEAAkE,CAAC,CAAC;YAChG,OAAO,KAAK,CAAC,MAAM,EAAE,QAAQ,CAAC,MAAM,CAAC,CAAC;QACxC,CAAC;QACD,KA
AK,SAAS,CAAC,CAAC,CAAC;YACf,IAAI,KAAK,GAAG,GAAG,CAAC;YAChB,IAAI,QAAQ,CAAC,OAAO,EAAE,CAAC;gBACrB,MAAM,CAAC,GAAG,MAAM,CAAC,KAAK,CAAC,IAAI,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;gBACrD,IAAI,CAAC;oBAAE,KAAK,GAAG,UAAU,CAAC,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAC1C,CAAC;iBAAM,CAAC;gBACN,MAAM,GAAG,GAAG,MAAM,CAAC,KAAK,CAAC,mCAAmC,CAAC,CAAC;gBAC9D,IAAI,GAAG,IAAI,GAAG,CAAC,MAAM;oBAAE,KAAK,GAAG,UAAU,CAAC,GAAG,CAAC,GAAG,CAAC,MAAM,GAAG,CAAC,CAAE,CAAC,CAAC;YAClE,CAAC;YACD,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;gBAC5B,OAAO,EAAE,IAAI,EAAE,KAAK,EAAE,gBAAgB,EAAE,CAAC,EAAE,MAAM,EAAE,8BAA8B,EAAE,CAAC;YACtF,CAAC;YACD,gFAAgF;YAChF,MAAM,QAAQ,GAAG,QAAQ,CAAC,SAAS,KAAK,UAAU,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC;YACpE,IAAI,KAAa,CAAC;YAClB,IAAI,QAAQ,CAAC,IAAI,IAAI,IAAI,IAAI,QAAQ,CAAC,KAAK,IAAI,IAAI,EAAE,CAAC;gBACpD,MAAM,KAAK,GAAG,QAAQ,CAAC,SAAS,KAAK,UAAU,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC;gBACjF,MAAM,MAAM,GAAG,QAAQ,CAAC,SAAS,KAAK,UAAU,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,CAAC,QAAQ,CAAC,KAAK,CAAC;gBACpF,KAAK,GAAG,KAAK,KAAK,MAAM;oBACtB,CAAC,CAAC,CAAC,QAAQ,IAAI,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;oBAC/B,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,GAAG,EAAE,CAAC,CAAC,QAAQ,GAAG,MAAM,CAAC,GAAG,CAAC,KAAK,GAAG,MAAM,CAAC,CAAC,GAAG,GAAG,CAAC,CAAC,CAAC;YACjF,CAAC;iBAAM,CAAC;gBACN,KAAK,GAAG,QAAQ,CAAC,CAAC,qEAAqE;YACzF,CAAC;YACD,MAAM,IAAI,GAAG,QAAQ,CAAC,MAAM,IAAI,IAAI;gBAClC,CAAC,CAAC,IAAI;gBACN,CAAC,CAAC,CAAC,QAAQ,CAAC,SAAS,KAAK,UAAU,CAAC,CAAC,CAAC,KAAK,IAAI,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,KAAK,IAAI,QAAQ,CAAC,MAAM,CAAC,CAAC;YAC9F,OAAO,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,KAAK,CAAC,KAAK,GAAG,GAAG,CAAC,GAAG,GAAG,EAAE,MAAM,EAAE,SAAS,KAAK,EAAE,EAAE,CAAC;QAC7F,CAAC;QACD,OAAO,CAAC,CAAC,CAAC;YACR,MAAM,WAAW,GAAU,QAAQ,CAAC;YACpC,MAAM,IAAI,KAAK,CAAC,8BAA8B,IAAI,CAAC,SAAS,CAAC,WAAW,CAAC,EAAE,CAAC,CAAC;QAC/E,CAAC;IACH,CAAC;AACH,CAAC;AAwFD;;;;;GAKG;AACH,MAAM,CAAC,KAAK,UAAU,QAAQ,CAC5B,KAAiB,EACjB,MAAqB,EACr
B,MAAyB,EACzB,IAAqB;IAErB,MAAM,IAAI,GAAG,IAAI,CAAC,IAAI,IAAI,CAAC,CAAC;IAC5B,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,IAAI,OAAO,CAAC;IACpC,MAAM,aAAa,GAAuB,EAAE,CAAC;IAC7C,IAAI,SAAS,GAAG,CAAC,CAAC;IAClB,IAAI,kBAAkB,GAAG,CAAC,CAAC;IAE3B,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,MAAM,QAAQ,GAAG,IAAI,CAAC,QAAQ,IAAI,YAAY,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,QAAQ,CAAC;QACrE,MAAM,eAAe,GAAG,iBAAiB,CAAC,eAAe,CAAC,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC;QACtG,IAAI,MAAM,GAAG,CAAC,CAAC;QACf,IAAI,QAAQ,GAAG,CAAC,CAAC;QACjB,IAAI,aAAiC,CAAC;QACtC,IAAI,eAAe,GAAuB,IAAI,CAAC,OAAO,CAAC;QAEvD,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,IAAI,EAAE,CAAC,EAAE,EAAE,CAAC;YAC9B,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,GAAG,CAAC,IAAI,CAAC,MAAM,EAAE,EAAE,KAAK,EAAE,IAAI,CAAC,OAAO,EAAE,CAAC,CAAC;YACnE,MAAM,KAAK,GAAG,MAAM,QAAQ,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,QAAQ,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC;YAClE,IAAI,CAAC,KAAK,CAAC,IAAI,IAAI,aAAa,KAAK,SAAS;gBAAE,aAAa,GAAG,GAAG,CAAC,IAAI,CAAC;YACzE,eAAe,GAAG,GAAG,CAAC,OAAO,IAAI,eAAe,CAAC;YACjD,MAAM,IAAI,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAC7B,QAAQ,IAAI,KAAK,CAAC,gBAAgB,CAAC;YACnC,SAAS,EAAE,CAAC;YAEZ,MAAM,CAAC,MAAM,CAAC;gBACZ,OAAO,EAAE,GAAG,CAAC,OAAO,IAAI,IAAI,CAAC,OAAO,IAAI,SAAS;gBACjD,QAAQ;gBACR,aAAa,EAAE,GAAG,CAAC,aAAa;gBAChC,WAAW,EAAE,GAAG,CAAC,WAAW;gBAC5B,YAAY,EAAE,GAAG,CAAC,YAAY;gBAC9B,SAAS,EAAE,GAAG,CAAC,SAAS;gBACxB,IAAI,EAAE,KAAK,CAAC,IAAI;gBAChB,gBAAgB,EAAE,KAAK,CAAC,gBAAgB;gBACxC,eAAe;gBACf,aAAa,EAAE,IAAI,CAAC,aAAa;gBACjC,KAAK;gBACL,eAAe,EAAE,IAAI,CAAC,eAAe;gBACrC,GAAG,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC,CAAC,EAAE,UAAU,EAAE,IAAI,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBAC3D,GAAG,CAAC,IAAI,CAAC,WAAW,KAAK,SAAS,CAAC,CAAC,CAAC,EAAE,WAAW,EAAE,IAAI,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBAC5E,GAAG,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC,EAAE,QAAQ,EAAE,IAAI,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;aACtD,CAAC,CAAC;YAEH,IAAI,CAAC,KAAK,EAAE,CAAC,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,EAAE,GAAG,EAAE,CAAC,GAAG,CAAC,EAAE,IAAI,EAAE,KAAK,CAAC,IAAI,EAAE,gBAAgB,EAA
E,KAAK,CAAC,gBAAgB,EAAE,CAAC,CAAC;QAC5G,CAAC;QAED,MAAM,QAAQ,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,MAAM,GAAG,IAAI,CAAC,GAAG,IAAI,CAAC,GAAG,IAAI,CAAC;QAC3D,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,QAAQ,GAAG,IAAI,CAAC,GAAG,GAAG,CAAC,GAAG,GAAG,CAAC;QAE5D,8EAA8E;QAC9E,iFAAiF;QACjF,8EAA8E;QAC9E,gFAAgF;QAChF,gFAAgF;QAChF,mFAAmF;QACnF,IAAI,IAAI,CAAC,OAAO,IAAI,KAAK,KAAK,SAAS,IAAI,QAAQ,GAAG,CAAC,EAAE,CAAC;YACxD,MAAM,QAAQ,GAAG,CAAC,GAAG,QAAQ,CAAC;YAC9B,MAAM,YAAY,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC,qCAAqC;YACjF,MAAM,UAAU,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,GAAG,EAAE,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,GAAG,GAAG,GAAG,GAAG,QAAQ,GAAG,YAAY,CAAC,CAAC,GAAG,GAAG,CAAC,GAAG,GAAG,CAAC;YAC9G,MAAM,QAAQ,GAAa,SAAS,IAAI,EAAE,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,SAAS,GAAG,EAAE,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC;YACxF,MAAM,IAAI,GAAG,CAAC,CAAS,EAAE,CAAS,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAChF,IAAI,CAAC;gBACH,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC;oBACf,KAAK,EAAE,kBAAkB,IAAI,CAAC,EAAE,EAAE;oBAClC,WAAW,EACT,kCAAkC,IAAI,CAAC,EAAE,MAAM,IAAI,CAAC,QAAQ,CAAC,IAAI,cAAc;wBAC/E,YAAY,MAAM,IAAI,IAAI,eAAe,SAAS,aAAa,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE;oBACzF,QAAQ,EAAE,IAAI,CAAC,kBAAkB,IAAI,OAAO;oBAC5C,QAAQ;oBACR,MAAM,EAAE,CAAC;oBACT,MAAM,EAAE,CAAC;oBACT,UAAU;oBACV,eAAe,EAAE,IAAI,CAAC,eAAe;oBACrC,aAAa,EAAE,IAAI,CAAC,aAAa;oBACjC,cAAc,EAAE,eAAe,CAAC,CAAC,CAAC,CAAC,eAAe,CAAC,CAAC,CAAC,CAAC,SAAS;oBAC/D,wBAAwB,EAAE,CAAC,eAAe,CAAC;oBAC3C,KAAK,EAAE,YAAY,QAAQ,WAAW,KAAK,oBAAoB,IAAI,CAAC,aAAa,IAAI,gBAAgB,EAAE,GAAG,CAAC,EAAE;iBAC9G,CAAC,CAAC;gBACH,kBAAkB,EAAE,CAAC;YACvB,CAAC;YAAC,MAAM,CAAC;gBACP,8DAA8D;YAChE,CAAC;QACH,CAAC;QAED,aAAa,CAAC,IAAI,CAAC,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,EAAE,eAAe,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,EAAE,SAAS,EAAE,CAAC,CAAC;IAChG,CAAC;IAED,OAAO;QACL,aAAa,EAAE,IAAI,CAAC,aAAa;QACjC,KAAK;QACL,UAAU,EAAE,IAAI,CAAC,UAAU;QAC3B,SAAS;QACT,KAAK,EAAE,aAAa;QACpB,kBAAkB;KACnB,CAAC;A
ACJ,CAAC;AAED,4EAA4E;AAC5E,MAAM,UAAU,YAAY,CAAC,GAAY,EAAE,MAAM,GAAG,YAAY;IAC9D,MAAM,GAAG,GAAG,KAAK,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAC7C,OAAO,GAAG,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE;QACtB,IAAI,CAAC,CAAC,IAAI,OAAO,CAAC,KAAK,QAAQ;YAAE,MAAM,IAAI,KAAK,CAAC,GAAG,MAAM,IAAI,CAAC,kBAAkB,CAAC,CAAC;QACnF,MAAM,CAAC,GAAG,CAA4B,CAAC;QACvC,IAAI,OAAO,CAAC,CAAC,EAAE,KAAK,QAAQ,IAAI,CAAC,CAAC,CAAC,EAAE;YAAE,MAAM,IAAI,KAAK,CAAC,GAAG,MAAM,IAAI,CAAC,iBAAiB,CAAC,CAAC;QACxF,IAAI,OAAO,CAAC,CAAC,MAAM,KAAK,QAAQ,IAAI,CAAC,CAAC,CAAC,MAAM;YAAE,MAAM,IAAI,KAAK,CAAC,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,CAAC,EAAE,qBAAqB,CAAC,CAAC;QAC9G,IAAI,CAAC,CAAC,CAAC,QAAQ,IAAI,OAAO,CAAC,CAAC,QAAQ,KAAK,QAAQ;YAAE,MAAM,IAAI,KAAK,CAAC,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,CAAC,EAAE,uBAAuB,CAAC,CAAC;QACpH,MAAM,CAAC,GAAG,CAAC,CAAC,QAAmC,CAAC;QAChD,MAAM,UAAU,GAAG,CAAC,OAAO,EAAE,OAAO,EAAE,UAAU,EAAE,WAAW,EAAE,SAAS,CAAC,CAAC;QAC1E,IAAI,OAAO,CAAC,CAAC,IAAI,KAAK,QAAQ,IAAI,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC,CAAC,IAAI,CAAC,EAAE,CAAC;YAC/D,MAAM,IAAI,KAAK,CAAC,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,CAAC,EAAE,mCAAmC,UAAU,CAAC,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACrG,CAAC;QACD,OAAO,EAAE,EAAE,EAAE,CAAC,CAAC,EAAE,EAAE,MAAM,EAAE,CAAC,CAAC,MAAM,EAAE,QAAQ,EAAE,CAAC,CAAC,QAAoB,EAAE,QAAQ,EAAE,CAAC,CAAC,QAA8B,EAAE,CAAC;IACtH,CAAC,CAAC,CAAC;AACL,CAAC"}
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* DecisionPriorInjector — formats a <system-reminder> block from past
|
|
3
|
+
* decision stats so the orchestrator can prepend it to the next tool
|
|
4
|
+
* result, giving the model evidence-based priors about how a given
|
|
5
|
+
* (toolName, input) pattern has fared in past sessions.
|
|
6
|
+
*
|
|
7
|
+
* Only emits a reminder when at least one prior FAILED — pure-success
|
|
8
|
+
* histories produce no output (no actionable signal, just noise).
|
|
9
|
+
*
|
|
10
|
+
* When `recent` is supplied, the reminder body includes up to 3 specific
|
|
11
|
+
* recent outcomes (newest first) — matching the
|
|
12
|
+
* "up to 3 prior outcomes" pattern. Specific
|
|
13
|
+
* recent entries give the model far more actionable signal than the
|
|
14
|
+
* aggregate count alone (e.g. "the last 2 attempts both timed out").
|
|
15
|
+
*/
|
|
16
|
+
import type { Decision, DecisionStats } from './DecisionStore.js';
|
|
17
|
+
export declare function formatPriorReminder(toolName: string, stats: DecisionStats, recent?: Decision[]): string | null;
|
|
18
|
+
//# sourceMappingURL=DecisionPriorInjector.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"DecisionPriorInjector.d.ts","sourceRoot":"","sources":["../../src/training/DecisionPriorInjector.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;GAcG;AAEH,OAAO,KAAK,EAAE,QAAQ,EAAE,aAAa,EAAE,MAAM,oBAAoB,CAAC;AAIlE,wBAAgB,mBAAmB,CACjC,QAAQ,EAAE,MAAM,EAChB,KAAK,EAAE,aAAa,EACpB,MAAM,CAAC,EAAE,QAAQ,EAAE,GAClB,MAAM,GAAG,IAAI,CAoBf"}
|