npm - @agentica/benchmark - Versions diffs - 0.8.3 → 0.9.0 - Mend

@agentica/benchmark 0.8.3 → 0.9.0

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (39) hide show

package/README.md +124 -122
package/lib/AgenticaCallBenchmark.d.ts +7 -6
package/lib/AgenticaCallBenchmark.js.map +1 -1
package/lib/AgenticaSelectBenchmark.d.ts +7 -6
package/lib/AgenticaSelectBenchmark.js.map +1 -1
package/lib/index.mjs +46 -1
package/lib/index.mjs.map +1 -1
package/lib/internal/AgenticaBenchmarkPredicator.d.ts +5 -4
package/lib/internal/AgenticaBenchmarkPredicator.js +74 -2
package/lib/internal/AgenticaBenchmarkPredicator.js.map +1 -1
package/lib/internal/AgenticaBenchmarkUtil.d.ts +2 -1
package/lib/internal/AgenticaBenchmarkUtil.js.map +1 -1
package/lib/internal/AgenticaCallBenchmarkReporter.d.ts +2 -1
package/lib/internal/AgenticaCallBenchmarkReporter.js.map +1 -1
package/lib/internal/AgenticaPromptReporter.d.ts +2 -1
package/lib/internal/AgenticaPromptReporter.js.map +1 -1
package/lib/internal/AgenticaSelectBenchmarkReporter.js.map +1 -1
package/lib/structures/IAgenticaBenchmarkExpected.d.ts +10 -9
package/lib/structures/IAgenticaCallBenchmarkEvent.d.ts +8 -7
package/lib/structures/IAgenticaCallBenchmarkResult.d.ts +6 -5
package/lib/structures/IAgenticaCallBenchmarkScenario.d.ts +3 -2
package/lib/structures/IAgenticaSelectBenchmarkEvent.d.ts +9 -8
package/lib/structures/IAgenticaSelectBenchmarkResult.d.ts +6 -5
package/lib/structures/IAgenticaSelectBenchmarkScenario.d.ts +3 -2
package/package.json +5 -5
package/src/AgenticaCallBenchmark.ts +28 -25
package/src/AgenticaSelectBenchmark.ts +32 -30
package/src/internal/AgenticaBenchmarkPredicator.ts +18 -10
package/src/internal/AgenticaBenchmarkUtil.ts +5 -1
package/src/internal/AgenticaCallBenchmarkReporter.ts +15 -12
package/src/internal/AgenticaPromptReporter.ts +4 -1
package/src/internal/AgenticaSelectBenchmarkReporter.ts +11 -8
package/src/structures/IAgenticaBenchmarkExpected.ts +23 -13
package/src/structures/IAgenticaCallBenchmarkEvent.ts +14 -10
package/src/structures/IAgenticaCallBenchmarkResult.ts +6 -5
package/src/structures/IAgenticaCallBenchmarkScenario.ts +6 -2
package/src/structures/IAgenticaSelectBenchmarkEvent.ts +15 -11
package/src/structures/IAgenticaSelectBenchmarkResult.ts +8 -5
package/src/structures/IAgenticaSelectBenchmarkScenario.ts +6 -2

package/src/structures/IAgenticaCallBenchmarkScenario.ts CHANGED Viewed

@@ -1,3 +1,5 @@
+import { ILlmSchema } from "@samchon/openapi";
 import { IAgenticaBenchmarkExpected } from "./IAgenticaBenchmarkExpected";
 /**
@@ -14,7 +16,9 @@ import { IAgenticaBenchmarkExpected } from "./IAgenticaBenchmarkExpected";
  *
  * @author Samchon
  */
-export interface IAgenticaCallBenchmarkScenario {
+export interface IAgenticaCallBenchmarkScenario<
+  Model extends ILlmSchema.Model,
+> {
   /**
    * Name of the scenario.
    *
@@ -35,5 +39,5 @@ export interface IAgenticaCallBenchmarkScenario {
    * the user's {@link text} conversation for the LLM
    * (Large Language Model) function calling.
    */
-  expected: IAgenticaBenchmarkExpected;
+  expected: IAgenticaBenchmarkExpected<Model>;
 }

package/src/structures/IAgenticaSelectBenchmarkEvent.ts CHANGED Viewed

@@ -3,6 +3,7 @@ import {
   IAgenticaPrompt,
   IAgenticaTokenUsage,
 } from "@agentica/core";
+import { ILlmSchema } from "@samchon/openapi";
 import { IAgenticaSelectBenchmarkScenario } from "./IAgenticaSelectBenchmarkScenario";
@@ -28,10 +29,10 @@ import { IAgenticaSelectBenchmarkScenario } from "./IAgenticaSelectBenchmarkScen
  *
  * @author Samchon
  */
-export type IAgenticaSelectBenchmarkEvent =
-  | IAgenticaSelectBenchmarkEvent.ISuccess
-  | IAgenticaSelectBenchmarkEvent.IFailure
-  | IAgenticaSelectBenchmarkEvent.IError;
+export type IAgenticaSelectBenchmarkEvent<Model extends ILlmSchema.Model> =
+  | IAgenticaSelectBenchmarkEvent.ISuccess<Model>
+  | IAgenticaSelectBenchmarkEvent.IFailure<Model>
+  | IAgenticaSelectBenchmarkEvent.IError<Model>;
 export namespace IAgenticaSelectBenchmarkEvent {
   /**
    * Success event type.
@@ -39,7 +40,8 @@ export namespace IAgenticaSelectBenchmarkEvent {
   * The `success` event type indicates that the benchmark test
   * fully met the expected scenario.
    */
-  export interface ISuccess extends IEventBase<"success"> {
+  export interface ISuccess<Model extends ILlmSchema.Model>
+    extends IEventBase<"success", Model> {
     /**
      * Usage of the token during the benchmark.
      */
@@ -48,7 +50,7 @@ export namespace IAgenticaSelectBenchmarkEvent {
     /**
      * Selected operations in the benchmark.
      */
-    selected: IAgenticaOperationSelection[];
+    selected: IAgenticaOperationSelection<Model>[];
     /**
      * Prompt messages from the assistant.
@@ -62,7 +64,8 @@ export namespace IAgenticaSelectBenchmarkEvent {
   * The `failure` event type indicates that the `selector` did not
   * select the expected scenario in the benchmark testing.
    */
-  export interface IFailure extends IEventBase<"failure"> {
+  export interface IFailure<Model extends ILlmSchema.Model>
+    extends IEventBase<"failure", Model> {
     /**
      * Usage of the token during the benchmark.
      */
@@ -71,7 +74,7 @@ export namespace IAgenticaSelectBenchmarkEvent {
     /**
      * Selected operations in the benchmark.
      */
-    selected: IAgenticaOperationSelection[];
+    selected: IAgenticaOperationSelection<Model>[];
     /**
      * Prompt messages from the assistant.
@@ -79,14 +82,15 @@ export namespace IAgenticaSelectBenchmarkEvent {
     assistantPrompts: IAgenticaPrompt.IText<"assistant">[];
   }
-  export interface IError extends IEventBase<"error"> {
+  export interface IError<Model extends ILlmSchema.Model>
+    extends IEventBase<"error", Model> {
     /**
      * Error occurred during the benchmark.
      */
     error: unknown;
   }
-  interface IEventBase<Type extends string> {
+  interface IEventBase<Type extends string, Model extends ILlmSchema.Model> {
     /**
      * Discriminant type.
      */
@@ -95,7 +99,7 @@ export namespace IAgenticaSelectBenchmarkEvent {
     /**
      * Expected scenario.
      */
-    scenario: IAgenticaSelectBenchmarkScenario;
+    scenario: IAgenticaSelectBenchmarkScenario<Model>;
     /**
      * When the benchmark testing started.

package/src/structures/IAgenticaSelectBenchmarkResult.ts CHANGED Viewed

@@ -1,4 +1,5 @@
 import { IAgenticaTokenUsage } from "@agentica/core";
+import { ILlmSchema } from "@samchon/openapi";
 import { IAgenticaSelectBenchmarkEvent } from "./IAgenticaSelectBenchmarkEvent";
 import { IAgenticaSelectBenchmarkScenario } from "./IAgenticaSelectBenchmarkScenario";
@@ -20,11 +21,13 @@ import { IAgenticaSelectBenchmarkScenario } from "./IAgenticaSelectBenchmarkScen
  *
  * @author Samchon
  */
-export interface IAgenticaSelectBenchmarkResult {
+export interface IAgenticaSelectBenchmarkResult<
+  Model extends ILlmSchema.Model,
+> {
   /**
    * Experiments for each scenario.
    */
-  experiments: IAgenticaSelectBenchmarkResult.IExperiment[];
+  experiments: IAgenticaSelectBenchmarkResult.IExperiment<Model>[];
   /**
    * Aggregated token usage information.
@@ -45,11 +48,11 @@ export namespace IAgenticaSelectBenchmarkResult {
   /**
    * Experiment result about a scenario.
    */
-  export interface IExperiment {
+  export interface IExperiment<Model extends ILlmSchema.Model> {
     /**
      * Expected scenario.
      */
-    scenario: IAgenticaSelectBenchmarkScenario;
+    scenario: IAgenticaSelectBenchmarkScenario<Model>;
     /**
      * Events occurred during the benchmark in the scenario.
@@ -59,7 +62,7 @@ export namespace IAgenticaSelectBenchmarkResult {
      * {@link AgenticaSelectBenchmark.IConfig.repeat repeat} count.
      * And the event is one of the repeated benchmark results.
      */
-    events: IAgenticaSelectBenchmarkEvent[];
+    events: IAgenticaSelectBenchmarkEvent<Model>[];
     /**
      * LLM token usage information.

package/src/structures/IAgenticaSelectBenchmarkScenario.ts CHANGED Viewed

@@ -1,3 +1,5 @@
+import { ILlmSchema } from "@samchon/openapi";
 import { IAgenticaBenchmarkExpected } from "./IAgenticaBenchmarkExpected";
 /**
@@ -14,7 +16,9 @@ import { IAgenticaBenchmarkExpected } from "./IAgenticaBenchmarkExpected";
  *
  * @author Samchon
  */
-export interface IAgenticaSelectBenchmarkScenario {
+export interface IAgenticaSelectBenchmarkScenario<
+  Model extends ILlmSchema.Model,
+> {
   /**
    * Name of the scenario.
    *
@@ -35,5 +39,5 @@ export interface IAgenticaSelectBenchmarkScenario {
    * {@link text} conversation for the LLM (Large Language Model)
    * function selection.
    */
-  expected: IAgenticaBenchmarkExpected;
+  expected: IAgenticaBenchmarkExpected<Model>;
 }