npm - vieval - Versions diffs - 0.0.7 → 0.0.9 - Mend

vieval 0.0.7 → 0.0.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31)

package/README.md +24 -2
package/dist/bin/vieval.mjs +1 -1
package/dist/cli/index.mjs +1 -1
package/dist/{cli-ImxGpoYQ.mjs → cli-Dao25VxV.mjs} +2 -2
package/dist/cli-Dao25VxV.mjs.map +1 -0
package/dist/config.d.mts +1 -1
package/dist/config.mjs +1 -1
package/dist/core/assertions/index.d.mts +1 -1
package/dist/core/inference-executors/index.d.mts +1 -1
package/dist/core/inference-executors/index.mjs +10 -4
package/dist/core/inference-executors/index.mjs.map +1 -1
package/dist/core/processors/results/index.d.mts +1 -1
package/dist/core/runner/index.d.mts +2 -2
package/dist/core/runner/index.mjs +6 -40
package/dist/core/runner/index.mjs.map +1 -1
package/dist/{env-BeHv_5mo.d.mts → env-DfWZy_n4.d.mts} +14 -9
package/dist/env-nV5rVErX.mjs +35 -0
package/dist/env-nV5rVErX.mjs.map +1 -0
package/dist/{index-5R1_k2nv.d.mts → index-BkjyCInx.d.mts} +12 -37
package/dist/index.d.mts +5 -5
package/dist/index.mjs +1 -1
package/dist/{models-DIGdOUpJ.mjs → models-pBSRUZhY.mjs} +1 -1
package/dist/{models-DIGdOUpJ.mjs.map → models-pBSRUZhY.mjs.map} +1 -1
package/dist/plugins/chat-models/index.d.mts +63 -6
package/dist/plugins/chat-models/index.mjs +74 -18
package/dist/plugins/chat-models/index.mjs.map +1 -1
package/dist/registry-BHGMxjpA.mjs.map +1 -1
package/package.json +1 -1
package/dist/cli-ImxGpoYQ.mjs.map +0 -1
package/dist/env--94B0UtW.mjs +0 -41
package/dist/env--94B0UtW.mjs.map +0 -1

package/dist/{index-5R1_k2nv.d.mts → index-BkjyCInx.d.mts} RENAMED Viewed

@@ -495,15 +495,6 @@ interface ModelDefinition {
 declare function resolveModelByName(models: readonly ModelDefinition[], name: string): ModelDefinition | undefined;
 //#endregion
 //#region src/core/runner/task-context.d.ts
-/**
- * Options for selecting a model from the execution context.
- */
-interface TaskModelSelectionOptions {
-  /**
-   * Model id or alias name.
-   */
-  name: string;
-}
 /**
  * Task-scoped execution context exposed to runner executors.
  */
@@ -513,13 +504,9 @@ interface TaskExecutionContext {
    */
   cache: TaskCacheRuntime;
   /**
-   * Resolves model configuration for the current task.
-   *
-   * Use when:
-   * - no arguments are provided to use the model selected by run matrix/inferenceExecutor
-   * - `name` is provided to resolve a specific model id or alias
+   * Configured model registrations available to model plugins.
    */
-  model: (selection?: string | TaskModelSelectionOptions) => ModelDefinition;
+  models: readonly ModelDefinition[];
 }
 /**
  * Inputs used to build task execution context.
@@ -530,14 +517,13 @@ interface CreateTaskExecutionContextOptions {
   task: ScheduledTask;
 }
 /**
- * Creates task-scoped model resolver context for runner execution.
+ * Creates task-scoped context data for runner execution.
  *
  * Call stack:
  *
  * {@link runScheduledTasks}
  *   -> {@link createTaskExecutionContext}
- *     -> {@link resolveModelByName}
- *       -> `task.model()` / `task.model({ name })`
+ *     -> `TaskExecutionContext`
  */
 declare function createTaskExecutionContext(options: CreateTaskExecutionContextOptions): TaskExecutionContext;
 //#endregion
@@ -581,7 +567,7 @@ interface RunScheduledTasksOptions {
    * Creates per-task execution context.
    *
    * Use when:
-   * - executor code needs per-task model resolution or other task-scoped data
+   * - executor code needs per-task models, cache, or other task-scoped data
    */
   createExecutionContext?: (task: ScheduledTask) => TaskExecutionContext;
   /**
@@ -1035,24 +1021,13 @@ interface TaskRunContext {
    */
   task: ScheduledTask;
   /**
-   * Matrix-scoped model resolver.
-   *
-   * Runtime impact:
-   * - `context.model()` uses `context.task.matrix.run.model` first when present
-   * - then falls back to inferenceExecutor-id match
-   * - then falls back to first configured model
+   * Configured model registrations available to model plugins.
    *
-   * @example
-   * ```ts
-   * // matrix.run.model = 'gpt-4.1-mini'
-   * const defaultModel = context.model()
-   * // resolves the configured model whose id/model/alias matches 'gpt-4.1-mini'
-   *
-   * const judgeModel = context.model({ name: 'judge-large' })
-   * // explicit lookup bypasses matrix default
-   * ```
+   * Use when:
+   * - a plugin owns model selection semantics and needs access to registered models
+   * - eval code resolves matrix-selected model axes through plugin helpers
    */
-  model: TaskExecutionContext['model'];
+  models: TaskExecutionContext['models'];
   /**
    * Optional reporter lifecycle hooks for task-local case events.
    *
@@ -1378,5 +1353,5 @@ interface ConfigHookPlugin<TConfig> {
   configVievalResolved?: (config: TConfig) => void | Promise<void>;
 }
 //#endregion
-export { CreateRunnerScheduleOptions as $, RunScheduledTasksOptions as A, resolveModelByName as B, TaskDefinition as C, TaskRunContext as D, TaskReporterHooks as E, CreateTaskExecutionContextOptions as F, createRunnerRuntimeContext as G, collectEvalEntries as H, TaskExecutionContext as I, AggregatedRunSummary as J, AggregatedProviderSummary as K, TaskModelSelectionOptions as L, RunnerTaskState as M, ScheduledTaskExecutor as N, TaskRunOutput as O, runScheduledTasks as P, aggregateRunResults as Q, createTaskExecutionContext as R, TaskConcurrencyConfig as S, TaskReporterEventPayload as T, CreateVievalRunnerRuntimeContextOptions as U, asProjectRelativePath as V, RunnerRuntimeContext as W, RunScore as X, RunResult as Y, RunScoreKind as Z, ScopedMatrices as _, CliOpenTelemetryReportingConfig as a, ScheduledTaskMatrix as at, TaskCaseReporterPayload as b, EvalDefinition as c, CreateFilesystemTaskCacheRuntimeOptions as ct, MatrixAxisValues as d, CacheFileHandle as dt, InferenceExecutor as et, MatrixDefinition as f, CacheFileOptions as ft, MatrixValue as g, MatrixRow as h, Awaitable as i, ScheduledTask as it, RunnerExecutionError as j, TelemetryAttributeValue as k, EvalModule as l, createFilesystemTaskCacheRuntime as lt, MatrixPrimitive as m, TaskCacheRuntime as mt, defineEval as n, RunnerMatrixInput as nt, CliReportingConfig as o, ScheduledTaskMatrixMeta as ot, MatrixLayer as p, CacheNamespace as pt, AggregatedRunResults as q, defineTask as r, RunnerMatrixSelection as rt, CollectedEvalEntry as s, createRunnerSchedule as st, ConfigHookPlugin as t, RunnerMatrixDefinition as tt, EvalModuleMap as u, normalizeCacheFilePathSegments as ut, TaskAutoRetryDelay as v, TaskExecutionPolicy as w, TaskCaseState as x, TaskCaseReporterEndPayload as y, ModelDefinition as z };
-//# sourceMappingURL=index-5R1_k2nv.d.mts.map
+export { InferenceExecutor as $, RunScheduledTasksOptions as A, asProjectRelativePath as B, TaskDefinition as C, TaskRunContext as D, TaskReporterHooks as E, CreateTaskExecutionContextOptions as F, AggregatedProviderSummary as G, CreateVievalRunnerRuntimeContextOptions as H, TaskExecutionContext as I, RunResult as J, AggregatedRunResults as K, createTaskExecutionContext as L, RunnerTaskState as M, ScheduledTaskExecutor as N, TaskRunOutput as O, runScheduledTasks as P, CreateRunnerScheduleOptions as Q, ModelDefinition as R, TaskConcurrencyConfig as S, TaskReporterEventPayload as T, RunnerRuntimeContext as U, collectEvalEntries as V, createRunnerRuntimeContext as W, RunScoreKind as X, RunScore as Y, aggregateRunResults as Z, ScopedMatrices as _, CliOpenTelemetryReportingConfig as a, ScheduledTaskMatrixMeta as at, TaskCaseReporterPayload as b, EvalDefinition as c, createFilesystemTaskCacheRuntime as ct, MatrixAxisValues as d, CacheFileOptions as dt, RunnerMatrixDefinition as et, MatrixDefinition as f, CacheNamespace as ft, MatrixValue as g, MatrixRow as h, Awaitable as i, ScheduledTaskMatrix as it, RunnerExecutionError as j, TelemetryAttributeValue as k, EvalModule as l, normalizeCacheFilePathSegments as lt, MatrixPrimitive as m, defineEval as n, RunnerMatrixSelection as nt, CliReportingConfig as o, createRunnerSchedule as ot, MatrixLayer as p, TaskCacheRuntime as pt, AggregatedRunSummary as q, defineTask as r, ScheduledTask as rt, CollectedEvalEntry as s, CreateFilesystemTaskCacheRuntimeOptions as st, ConfigHookPlugin as t, RunnerMatrixInput as tt, EvalModuleMap as u, CacheFileHandle as ut, TaskAutoRetryDelay as v, TaskExecutionPolicy as w, TaskCaseState as x, TaskCaseReporterEndPayload as y, resolveModelByName as z };
+//# sourceMappingURL=index-BkjyCInx.d.mts.map

package/dist/index.d.mts CHANGED Viewed

@@ -1,5 +1,5 @@
-import { D as TaskRunContext, I as TaskExecutionContext, O as TaskRunOutput, S as TaskConcurrencyConfig, Y as RunResult, Z as RunScoreKind, et as InferenceExecutor, f as MatrixDefinition, it as ScheduledTask, k as TelemetryAttributeValue, o as CliReportingConfig, p as MatrixLayer, t as ConfigHookPlugin, w as TaskExecutionPolicy, z as ModelDefinition } from "./index-5R1_k2nv.mjs";
-import { a as requiredEnvFrom } from "./env-BeHv_5mo.mjs";
+import { $ as InferenceExecutor, D as TaskRunContext, I as TaskExecutionContext, J as RunResult, O as TaskRunOutput, R as ModelDefinition, S as TaskConcurrencyConfig, X as RunScoreKind, f as MatrixDefinition, k as TelemetryAttributeValue, o as CliReportingConfig, p as MatrixLayer, rt as ScheduledTask, t as ConfigHookPlugin, w as TaskExecutionPolicy } from "./index-BkjyCInx.mjs";
+import { a as requiredEnvFrom } from "./env-DfWZy_n4.mjs";
 import { expect } from "./expect.mjs";
 import * as _$c12 from "c12";
@@ -137,7 +137,7 @@ interface CliProjectConfig {
    * Model definitions available to project runtime execution.
    *
    * Inference executors control schedule fan-out, while models provide
-   * runtime lookup metadata for `context.model(...)` during task execution.
+   * runtime lookup metadata for model plugin helpers during task execution.
    *
    * @default inherited from top-level config models
    */
@@ -253,11 +253,11 @@ interface CliComparisonConfig {
  * Execution context exposed to project-level `executor` implementations.
  *
  * Use when:
- * - a project executor needs the task-scoped model resolver plus case reporter hooks
+ * - a project executor needs task-scoped models plus case reporter hooks
  * - custom scheduling logic wants the same hook shape as `TaskRunContext`
  *
  * Expects:
- * - `model` resolves configured models for the current task
+ * - `models` exposes configured model registrations for plugin helpers
  * - `reporterHooks` follows `TaskRunContext['reporterHooks']`
  * - `telemetry` follows `TaskRunContext['telemetry']`
  * - `runtimeConcurrency` follows `TaskRunContext['runtimeConcurrency']`

package/dist/index.mjs CHANGED Viewed

@@ -1,6 +1,6 @@
 import { i as registerEvalDefinition, l as loadEnv, o as createNoopTelemetryRuntime, s as defineConfig } from "./registry-BHGMxjpA.mjs";
 import { t as createSchedulerQueue } from "./queue-DsZQkZO_.mjs";
-import { n as requiredEnvFrom } from "./env--94B0UtW.mjs";
+import { n as requiredEnvFrom } from "./env-nV5rVErX.mjs";
 import { defineEval, defineTask } from "./config.mjs";
 import { expect } from "./expect.mjs";
 import { errorMessageFrom, sleep } from "@moeru/std";

package/dist/{models-DIGdOUpJ.mjs → models-pBSRUZhY.mjs} RENAMED Viewed

@@ -11,4 +11,4 @@ function resolveModelByName(models, name) {
 //#endregion
 export { resolveModelByName as t };
-//# sourceMappingURL=models-DIGdOUpJ.mjs.map
+//# sourceMappingURL=models-pBSRUZhY.mjs.map

package/dist/{models-DIGdOUpJ.mjs.map → models-pBSRUZhY.mjs.map} RENAMED Viewed

@@ -1 +1 @@
-{"version":3,"file":"models-DIGdOUpJ.mjs","names":[],"sources":["../src/config/models.ts"],"sourcesContent":["import type { TaskExecutionPolicy } from './types'\n\n/**\n * Canonical model definition consumed by vieval runtime and config.\n *\n * Use when:\n * - declaring models in `vieval.config.*`\n * - resolving task runtime models by id, alias, or concrete model name\n *\n * Expects:\n * - `id` to be stable and unique within one config\n * - `inferenceExecutorId` to match scheduler/executor identifiers\n *\n * Returns:\n * - one normalized model registration record\n */\nexport interface ModelDefinition {\n  /**\n   * Stable model id.\n   */\n  id: string\n  /**\n   * Inference-executor id used for matching and reporting.\n   */\n  inferenceExecutorId: string\n  /**\n   * Executor reference passed through config.\n   *\n   * `vieval` core treats this as opaque runtime metadata. Builder plugins can\n   * narrow this field with plugin-specific executor input types.\n   */\n  inferenceExecutor: unknown\n  /**\n   * Concrete model name passed to the inference executor.\n   */\n  model: string\n  /**\n   * Alias names that can resolve this model.\n   */\n  aliases: string[]\n  /**\n   * Optional execution policy hints attached to this model.\n   */\n  executionPolicy?: TaskExecutionPolicy\n  /**\n   * Optional model-level call parameters.\n   */\n  parameters?: Record<string, unknown>\n}\n\n/**\n * Resolves one model by id, model name, or alias in registration order.\n *\n * Returns:\n * - the first matching model, or `undefined` when no match exists\n */\nexport function resolveModelByName(\n  models: readonly ModelDefinition[],\n  name: string,\n): ModelDefinition | undefined {\n  return models.find(model => model.id === name || model.model === name || model.aliases.includes(name))\n}\n"],"mappings":";;;;;;;AAwDA,SAAgB,mBACd,QACA,MAC6B;AAC7B,QAAO,OAAO,MAAK,UAAS,MAAM,OAAO,QAAQ,MAAM,UAAU,QAAQ,MAAM,QAAQ,SAAS,KAAK,CAAC"}
+{"version":3,"file":"models-pBSRUZhY.mjs","names":[],"sources":["../src/config/models.ts"],"sourcesContent":["import type { TaskExecutionPolicy } from './types'\n\n/**\n * Canonical model definition consumed by vieval runtime and config.\n *\n * Use when:\n * - declaring models in `vieval.config.*`\n * - resolving task runtime models by id, alias, or concrete model name\n *\n * Expects:\n * - `id` to be stable and unique within one config\n * - `inferenceExecutorId` to match scheduler/executor identifiers\n *\n * Returns:\n * - one normalized model registration record\n */\nexport interface ModelDefinition {\n  /**\n   * Stable model id.\n   */\n  id: string\n  /**\n   * Inference-executor id used for matching and reporting.\n   */\n  inferenceExecutorId: string\n  /**\n   * Executor reference passed through config.\n   *\n   * `vieval` core treats this as opaque runtime metadata. Builder plugins can\n   * narrow this field with plugin-specific executor input types.\n   */\n  inferenceExecutor: unknown\n  /**\n   * Concrete model name passed to the inference executor.\n   */\n  model: string\n  /**\n   * Alias names that can resolve this model.\n   */\n  aliases: string[]\n  /**\n   * Optional execution policy hints attached to this model.\n   */\n  executionPolicy?: TaskExecutionPolicy\n  /**\n   * Optional model-level call parameters.\n   */\n  parameters?: Record<string, unknown>\n}\n\n/**\n * Resolves one model by id, model name, or alias in registration order.\n *\n * Returns:\n * - the first matching model, or `undefined` when no match exists\n */\nexport function resolveModelByName(\n  models: readonly ModelDefinition[],\n  name: string,\n): ModelDefinition | undefined {\n  return models.find(model => model.id === name || model.model === name || model.aliases.includes(name))\n}\n"],"mappings":";;;;;;;AAwDA,SAAgB,mBACd,QACA,MAC6B;AAC7B,QAAO,OAAO,MAAK,UAAS,MAAM,OAAO,QAAQ,MAAM,UAAU,QAAQ,MAAM,QAAQ,SAAS,KAAK,CAAC"}

package/dist/plugins/chat-models/index.d.mts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { D as TaskRunContext, f as MatrixDefinition, t as ConfigHookPlugin, w as TaskExecutionPolicy, z as ModelDefinition } from "../../index-5R1_k2nv.mjs";
+import { D as TaskRunContext, R as ModelDefinition, f as MatrixDefinition, t as ConfigHookPlugin, w as TaskExecutionPolicy } from "../../index-BkjyCInx.mjs";
 //#region src/plugins/chat-models/runtime-config.d.ts
 /**
@@ -80,7 +80,7 @@ type ChatModelRuntimeConfig = OpenAIChatModelRuntimeConfig | OllamaChatModelRunt
  * Normalizes one configured chat model into runtime executor config.
  *
  * Use when:
- * - eval code needs typed provider constructor options from `context.model()`
+ * - eval code needs typed provider constructor options from a resolved model
  * - model parameters should be validated once with clear error messages
  *
  * Expects:
@@ -95,7 +95,7 @@ declare function toChatModelRuntimeConfig(model: ModelDefinition): ChatModelRunt
  * Resolves OpenAI runtime config from one resolved run-context model.
  *
  * Use when:
- * - task execution already has `context.model()` output
+ * - task execution already has a model resolved through chat-model helpers
  * - eval code wants typed OpenAI provider options with a concise helper name
  *
  * Expects:
@@ -109,7 +109,7 @@ declare function openaiFromRunContext(model: ModelDefinition): OpenAIChatModelRu
  * Resolves Ollama runtime config from one resolved run-context model.
  *
  * Use when:
- * - task execution already has `context.model()` output
+ * - task execution already has a model resolved through chat-model helpers
  * - eval code wants typed Ollama provider options with a concise helper name
  *
  * Expects:
@@ -123,7 +123,7 @@ declare function ollamaFromRunContext(model: ModelDefinition): OllamaChatModelRu
  * Resolves OpenRouter runtime config from one resolved run-context model.
  *
  * Use when:
- * - task execution already has `context.model()` output
+ * - task execution already has a model resolved through chat-model helpers
  * - eval code wants typed OpenRouter provider options with a concise helper name
  *
  * Expects:
@@ -540,6 +540,63 @@ interface ChatModelsPluginOptions {
    */
   models: readonly ChatModelDefinition[];
 }
+/**
+ * Matrix scope that can carry a chat model selector.
+ */
+type MatrixModelScope = 'eval' | 'run';
+/**
+ * Options for resolving a chat model from a matrix axis.
+ */
+interface ModelFromMatrixOptions {
+  /**
+   * Matrix axis whose selected value is a model id, model name, or alias.
+   */
+  axis: string;
+}
+type MatrixModelContext = Pick<TaskRunContext, 'models' | 'task'>;
+/**
+ * Resolves a configured chat model from one scoped matrix axis.
+ *
+ * Use when:
+ * - a matrix axis selects the agent, judge, or another chat model role
+ * - eval code should keep model lookup semantics inside the chat-models plugin
+ *
+ * Expects:
+ * - `scope` to identify `context.task.matrix.run` or `context.task.matrix.eval`
+ * - `options.axis` to exist and contain a model id, model name, or alias
+ *
+ * Returns:
+ * - the configured model matching the selected matrix value
+ */
+declare function modelFromMatrix(context: MatrixModelContext, scope: MatrixModelScope, options: ModelFromMatrixOptions): ModelDefinition;
+/**
+ * Resolves a configured chat model from one run-matrix axis.
+ *
+ * Use when:
+ * - run matrix selects the model used by the system under evaluation
+ * - callers want the scoped helper instead of passing `scope: 'run'`
+ *
+ * Expects:
+ * - `options.axis` to exist in `context.task.matrix.run`
+ *
+ * Returns:
+ * - the configured model matching the selected run-matrix value
+ */
+declare function modelFromRun(context: MatrixModelContext, options: ModelFromMatrixOptions): ModelDefinition;
+/**
+ * Resolves a configured chat model from one eval-matrix axis.
+ *
+ * Use when:
+ * - eval matrix selects a judge, rubric, or evaluator model
+ * - callers want the scoped helper instead of passing `scope: 'eval'`
+ *
+ * Expects:
+ * - `options.axis` to exist in `context.task.matrix.eval`
+ *
+ * Returns:
+ * - the configured model matching the selected eval-matrix value
+ */
+declare function modelFromEval(context: MatrixModelContext, options: ModelFromMatrixOptions): ModelDefinition;
 /**
  * Creates a run-matrix `model` axis from configured chat model names.
  *
@@ -571,5 +628,5 @@ declare function ChatProviders(options: ChatProvidersPluginOptions): Plugin;
  */
 declare function ChatModels(options: ChatModelsPluginOptions): Plugin;
 //#endregion
-export { ChatModelDefinition, ChatModelExecutorInput, ChatModelExecutorLike, ChatModelFromBaseOptions, ChatModelFromOptions, ChatModelHeaders, ChatModelInferenceExecutor, ChatModelResolverContext, ChatModelResolverValue, ChatModelRuntimeConfig, ChatModelTelemetryProvider, ChatModelToolCall, ChatModels, ChatModelsPluginOptions, ChatProviderDefinition, ChatProviderFromOptions, ChatProviders, ChatProvidersPluginOptions, EmitChatModelErrorTelemetryOptions, EmitChatModelRequestTelemetryOptions, EmitChatModelResponseTelemetryOptions, GenericChatModelInferenceExecutor, OllamaChatModelInferenceExecutor, OllamaChatModelRuntimeConfig, OpenAIChatModelInferenceExecutor, OpenAIChatModelRuntimeConfig, OpenRouterChatModelInferenceExecutor, OpenRouterChatModelRuntimeConfig, OptionalProviderEnvMap, Plugin, PluginConfig, RequiredProviderEnvMap, chatModelFrom, chatModelMatrix, chatProviderFrom, emitChatModelErrorTelemetry, emitChatModelRequestTelemetry, emitChatModelResponseTelemetry, extractChatModelToolCalls, extractMeteringDimensions, ollamaFromRunContext, openaiFromRunContext, openrouterFromRunContext, toChatModelRuntimeConfig };
+export { ChatModelDefinition, ChatModelExecutorInput, ChatModelExecutorLike, ChatModelFromBaseOptions, ChatModelFromOptions, ChatModelHeaders, ChatModelInferenceExecutor, ChatModelResolverContext, ChatModelResolverValue, ChatModelRuntimeConfig, ChatModelTelemetryProvider, ChatModelToolCall, ChatModels, ChatModelsPluginOptions, ChatProviderDefinition, ChatProviderFromOptions, ChatProviders, ChatProvidersPluginOptions, EmitChatModelErrorTelemetryOptions, EmitChatModelRequestTelemetryOptions, EmitChatModelResponseTelemetryOptions, GenericChatModelInferenceExecutor, MatrixModelScope, ModelFromMatrixOptions, OllamaChatModelInferenceExecutor, OllamaChatModelRuntimeConfig, OpenAIChatModelInferenceExecutor, OpenAIChatModelRuntimeConfig, OpenRouterChatModelInferenceExecutor, OpenRouterChatModelRuntimeConfig, OptionalProviderEnvMap, Plugin, PluginConfig, RequiredProviderEnvMap, chatModelFrom, chatModelMatrix, chatProviderFrom, emitChatModelErrorTelemetry, emitChatModelRequestTelemetry, emitChatModelResponseTelemetry, extractChatModelToolCalls, extractMeteringDimensions, modelFromEval, modelFromMatrix, modelFromRun, ollamaFromRunContext, openaiFromRunContext, openrouterFromRunContext, toChatModelRuntimeConfig };
 //# sourceMappingURL=index.d.mts.map

package/dist/plugins/chat-models/index.mjs CHANGED Viewed

@@ -1,4 +1,5 @@
-import { n as requiredEnvFrom, t as envFrom } from "../../env--94B0UtW.mjs";
+import { n as requiredEnvFrom, t as envFrom } from "../../env-nV5rVErX.mjs";
+import { t as resolveModelByName } from "../../models-pBSRUZhY.mjs";
 import process from "node:process";
 import { errorMessageFrom } from "@moeru/std";
 //#region src/plugins/chat-models/runtime-config.ts
@@ -7,15 +8,19 @@ function getParameters(model) {
 }
 function parseOptionalStringParameter(parameters, key, modelId) {
 	const value = parameters[key];
-	return envFrom(value == null ? void 0 : String(value), {
-		name: `${modelId}.parameters.${key}`,
+	const normalized = value == null ? void 0 : String(value);
+	const name = `${modelId}.parameters.${key}`;
+	return envFrom({ [name]: normalized }, {
+		name,
 		type: "string"
 	});
 }
 function parseRequiredStringParameter(parameters, key, modelId) {
 	const value = parameters[key];
-	return requiredEnvFrom(value == null ? void 0 : String(value), {
-		name: `${modelId}.parameters.${key}`,
+	const normalized = value == null ? void 0 : String(value);
+	const name = `${modelId}.parameters.${key}`;
+	return requiredEnvFrom({ [name]: normalized }, {
+		name,
 		type: "string"
 	});
 }
@@ -41,7 +46,7 @@ function parseHeadersParameter(parameters, modelId) {
 * Normalizes one configured chat model into runtime executor config.
 *
 * Use when:
-* - eval code needs typed provider constructor options from `context.model()`
+* - eval code needs typed provider constructor options from a resolved model
 * - model parameters should be validated once with clear error messages
 *
 * Expects:
@@ -79,7 +84,7 @@ function toChatModelRuntimeConfig(model) {
 * Resolves OpenAI runtime config from one resolved run-context model.
 *
 * Use when:
-* - task execution already has `context.model()` output
+* - task execution already has a model resolved through chat-model helpers
 * - eval code wants typed OpenAI provider options with a concise helper name
 *
 * Expects:
@@ -97,7 +102,7 @@ function openaiFromRunContext(model) {
 * Resolves Ollama runtime config from one resolved run-context model.
 *
 * Use when:
-* - task execution already has `context.model()` output
+* - task execution already has a model resolved through chat-model helpers
 * - eval code wants typed Ollama provider options with a concise helper name
 *
 * Expects:
@@ -115,7 +120,7 @@ function ollamaFromRunContext(model) {
 * Resolves OpenRouter runtime config from one resolved run-context model.
 *
 * Use when:
-* - task execution already has `context.model()` output
+* - task execution already has a model resolved through chat-model helpers
 * - eval code wants typed OpenRouter provider options with a concise helper name
 *
 * Expects:
@@ -332,30 +337,28 @@ async function resolveChatModelResolverValue(value, context) {
 	return value;
 }
 function resolveRequiredStringValue(value, name) {
-	return requiredEnvFrom(value, {
+	return requiredEnvFrom({ [name]: value }, {
 		name,
 		type: "string"
 	});
 }
 function resolveOptionalStringValue(value, name) {
-	return envFrom(value, {
+	return envFrom({ [name]: value }, {
 		name,
 		type: "string"
 	});
 }
 function resolveOptionalEnvValue(env, envKey) {
-	const options = {
+	return envFrom(env, {
 		name: envKey,
 		type: "string"
-	};
-	return envFrom(env[envKey], options);
+	});
 }
 function resolveRequiredEnvValue(env, envKey) {
-	const options = {
+	return requiredEnvFrom(env, {
 		name: envKey,
 		type: "string"
-	};
-	return requiredEnvFrom(env[envKey], options);
+	});
 }
 function resolveProviderParameters(provider, env) {
 	const parameters = { ...provider.parameters };
@@ -479,6 +482,59 @@ function chatProviderFrom(options) {
 	};
 }
 /**
+* Resolves a configured chat model from one scoped matrix axis.
+*
+* Use when:
+* - a matrix axis selects the agent, judge, or another chat model role
+* - eval code should keep model lookup semantics inside the chat-models plugin
+*
+* Expects:
+* - `scope` to identify `context.task.matrix.run` or `context.task.matrix.eval`
+* - `options.axis` to exist and contain a model id, model name, or alias
+*
+* Returns:
+* - the configured model matching the selected matrix value
+*/
+function modelFromMatrix(context, scope, options) {
+	const selectedModelName = context.task.matrix[scope][options.axis];
+	if (selectedModelName == null) throw new Error(`Missing ${scope} matrix axis "${options.axis}".`);
+	const model = resolveModelByName(context.models, selectedModelName);
+	if (model == null) throw new Error(`Unknown configured chat model "${selectedModelName}" from ${scope} matrix axis "${options.axis}".`);
+	return model;
+}
+/**
+* Resolves a configured chat model from one run-matrix axis.
+*
+* Use when:
+* - run matrix selects the model used by the system under evaluation
+* - callers want the scoped helper instead of passing `scope: 'run'`
+*
+* Expects:
+* - `options.axis` to exist in `context.task.matrix.run`
+*
+* Returns:
+* - the configured model matching the selected run-matrix value
+*/
+function modelFromRun(context, options) {
+	return modelFromMatrix(context, "run", options);
+}
+/**
+* Resolves a configured chat model from one eval-matrix axis.
+*
+* Use when:
+* - eval matrix selects a judge, rubric, or evaluator model
+* - callers want the scoped helper instead of passing `scope: 'eval'`
+*
+* Expects:
+* - `options.axis` to exist in `context.task.matrix.eval`
+*
+* Returns:
+* - the configured model matching the selected eval-matrix value
+*/
+function modelFromEval(context, options) {
+	return modelFromMatrix(context, "eval", options);
+}
+/**
 * Creates a run-matrix `model` axis from configured chat model names.
 *
 * Use when:
@@ -534,6 +590,6 @@ function ChatModels(options) {
 	};
 }
 //#endregion
-export { ChatModels, ChatProviders, chatModelFrom, chatModelMatrix, chatProviderFrom, emitChatModelErrorTelemetry, emitChatModelRequestTelemetry, emitChatModelResponseTelemetry, extractChatModelToolCalls, extractMeteringDimensions, ollamaFromRunContext, openaiFromRunContext, openrouterFromRunContext, toChatModelRuntimeConfig };
+export { ChatModels, ChatProviders, chatModelFrom, chatModelMatrix, chatProviderFrom, emitChatModelErrorTelemetry, emitChatModelRequestTelemetry, emitChatModelResponseTelemetry, extractChatModelToolCalls, extractMeteringDimensions, modelFromEval, modelFromMatrix, modelFromRun, ollamaFromRunContext, openaiFromRunContext, openrouterFromRunContext, toChatModelRuntimeConfig };
 //# sourceMappingURL=index.mjs.map