@agentica/benchmark 0.12.21 → 0.13.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +39 -33
- package/lib/AgenticaCallBenchmark.d.ts +12 -6
- package/lib/AgenticaCallBenchmark.js +24 -18
- package/lib/AgenticaCallBenchmark.js.map +1 -1
- package/lib/AgenticaSelectBenchmark.d.ts +12 -6
- package/lib/AgenticaSelectBenchmark.js +14 -12
- package/lib/AgenticaSelectBenchmark.js.map +1 -1
- package/lib/index.mjs +315 -236
- package/lib/index.mjs.map +1 -1
- package/lib/internal/AgenticaBenchmarkPredicator.d.ts +38 -29
- package/lib/internal/AgenticaBenchmarkPredicator.js +100 -84
- package/lib/internal/AgenticaBenchmarkPredicator.js.map +1 -1
- package/lib/internal/AgenticaBenchmarkUtil.d.ts +21 -6
- package/lib/internal/AgenticaBenchmarkUtil.js +39 -33
- package/lib/internal/AgenticaBenchmarkUtil.js.map +1 -1
- package/lib/internal/AgenticaCallBenchmarkReporter.d.ts +6 -5
- package/lib/internal/AgenticaCallBenchmarkReporter.js +130 -126
- package/lib/internal/AgenticaCallBenchmarkReporter.js.map +1 -1
- package/lib/internal/AgenticaPromptReporter.d.ts +13 -5
- package/lib/internal/AgenticaPromptReporter.js +45 -41
- package/lib/internal/AgenticaPromptReporter.js.map +1 -1
- package/lib/internal/AgenticaSelectBenchmarkReporter.d.ts +3 -1
- package/lib/internal/AgenticaSelectBenchmarkReporter.js +153 -150
- package/lib/internal/AgenticaSelectBenchmarkReporter.js.map +1 -1
- package/lib/structures/IAgenticaBenchmarkExpected.d.ts +8 -2
- package/lib/structures/IAgenticaCallBenchmarkEvent.d.ts +9 -3
- package/lib/structures/IAgenticaCallBenchmarkResult.d.ts +10 -4
- package/lib/structures/IAgenticaCallBenchmarkScenario.d.ts +8 -2
- package/lib/structures/IAgenticaSelectBenchmarkEvent.d.ts +9 -3
- package/lib/structures/IAgenticaSelectBenchmarkResult.d.ts +10 -4
- package/lib/structures/IAgenticaSelectBenchmarkScenario.d.ts +8 -2
- package/lib/utils/MathUtil.d.ts +15 -3
- package/lib/utils/MathUtil.js +15 -4
- package/lib/utils/MathUtil.js.map +1 -1
- package/package.json +12 -10
- package/src/AgenticaCallBenchmark.ts +64 -45
- package/src/AgenticaSelectBenchmark.ts +42 -30
- package/src/internal/AgenticaBenchmarkPredicator.ts +208 -186
- package/src/internal/AgenticaBenchmarkUtil.ts +58 -40
- package/src/internal/AgenticaCallBenchmarkReporter.ts +180 -182
- package/src/internal/AgenticaPromptReporter.ts +46 -33
- package/src/internal/AgenticaSelectBenchmarkReporter.ts +205 -203
- package/src/structures/IAgenticaBenchmarkExpected.ts +9 -2
- package/src/structures/IAgenticaCallBenchmarkEvent.ts +9 -3
- package/src/structures/IAgenticaCallBenchmarkResult.ts +10 -4
- package/src/structures/IAgenticaCallBenchmarkScenario.ts +8 -2
- package/src/structures/IAgenticaSelectBenchmarkEvent.ts +9 -3
- package/src/structures/IAgenticaSelectBenchmarkResult.ts +10 -4
- package/src/structures/IAgenticaSelectBenchmarkScenario.ts +8 -2
- package/src/utils/MathUtil.ts +16 -3
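
Before the file-by-file diff, a short orientation sketch. The bundled `lib/index.mjs` below shows that `AgenticaCallBenchmark.execute()` runs every scenario `config.repeat` times behind a semaphore and invokes an optional per-event `listener`, and that `report()` throws `"Benchmark is not executed yet."` until `execute()` has resolved, otherwise returning an object that maps relative file paths (e.g. `./README.md`) to markdown documents. The TypeScript sketch below shows one way a consumer might persist that report to disk; the `CallBenchmarkLike` interface, the `saveCallBenchmarkReport` helper, and the `docs/benchmarks/call` output directory are illustrative assumptions, not part of the package.

```ts
import fs from "node:fs/promises";
import path from "node:path";

// Minimal shape of the benchmark as used here; the real class exposes more.
interface CallBenchmarkLike {
  execute(listener?: (event: unknown) => void): Promise<unknown>;
  report(): Record<string, string>; // relative path (e.g. "./README.md") -> markdown
}

// Hypothetical helper: run the benchmark once and write every generated
// markdown document under the given root directory.
export async function saveCallBenchmarkReport(
  benchmark: CallBenchmarkLike,
  root: string = "docs/benchmarks/call",
): Promise<void> {
  await benchmark.execute((event) => console.log("benchmark event:", event));
  const files = benchmark.report(); // throws if execute() has not finished
  for (const [relative, markdown] of Object.entries(files)) {
    const target = path.join(root, relative);
    await fs.mkdir(path.dirname(target), { recursive: true });
    await fs.writeFile(target, markdown, "utf8");
  }
}
```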
package/lib/index.mjs
CHANGED
@@ -8,254 +8,302 @@ import "typia";
 
 import { ChatGptSelectFunctionAgent } from "@agentica/core/src/chatgpt/ChatGptSelectFunctionAgent";
 
-
+const AgenticaBenchmarkPredicator = {
+isNext,
+success
+};
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-description: "Recommended reply message for the user.\n\nThe message what AI agent wants the user to reply\naccepting the AI agent's next job suggestion.",
-type: "string"
-}
+async function isNext(agent) {
+const last = agent.getPromptHistories().at(-1);
+const llmVendor = agent.getVendor();
+const isTextPrompt = last?.type === "text" && last.role === "assistant";
+if (!isTextPrompt) {
+return null;
+}
+const consent = {
+functions: [ {
+name: "consent",
+parameters: {
+description: "Properties for asking the user's consent",
+type: "object",
+properties: {
+content: {
+description: "Reason of the message implying what the AI agent wants\nto do at the next step after the user's consent.",
+type: "string"
 },
-
-
-
+reply: {
+title: "Recommended reply message for the user",
+description: "Recommended reply message for the user.\n\nThe message what AI agent wants the user to reply\naccepting the AI agent's next job suggestion.",
+type: "string"
+}
 },
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-success: true,
+required: [ "content", "reply" ],
+additionalProperties: false,
+$defs: {}
+},
+description: "Ask user to consent for what the AI agent wants to do next.\n\nIf AI agent wants to do some function calling at next,\nbut it needs the user's consent about the function calling to do,\nthen call this tool function.",
+validate: (() => {
+const _io0 = input => "string" === typeof input.content && "string" === typeof input.reply;
+const _vo0 = (input, _path, _exceptionable = true) => [ "string" === typeof input.content || _report(_exceptionable, {
+path: _path + ".content",
+expected: "string",
+value: input.content
+}), "string" === typeof input.reply || _report(_exceptionable, {
+path: _path + ".reply",
+expected: "string",
+value: input.reply
+}) ].every((flag => flag));
+const __is = input => "object" === typeof input && null !== input && _io0(input);
+let errors;
+let _report;
+return input => {
+if (false === __is(input)) {
+errors = [];
+_report = __typia_transform__validateReport._validateReport(errors);
+((input, _path, _exceptionable = true) => ("object" === typeof input && null !== input || _report(true, {
+path: _path + "",
+expected: "IConsentProps",
+value: input
+})) && _vo0(input, _path + "", true) || _report(true, {
+path: _path + "",
+expected: "IConsentProps",
+value: input
+}))(input, "$input", true);
+const success = 0 === errors.length;
+return success ? {
+success,
+data: input
+} : {
+success,
+errors,
 data: input
 };
+}
+return {
+success: true,
+data: input
+};
+};
+})()
+} ]
+}.functions[0];
+const result = await llmVendor.api.chat.completions.create({
+model: llmVendor.model,
+messages: [ {
+role: "system",
+content: [ "You are an helpful assistant.", "", "If what the assistant said seems like to asking for", "user's consent about some function calling at the next step,", "use the tools appropriately to step to the next." ].join("\n")
+}, {
+role: "assistant",
+content: last.text
+} ],
+tools: [ {
+type: "function",
+function: {
+name: consent.name,
+description: consent.description,
+parameters: consent.parameters
+}
+} ],
+tool_choice: "required",
+parallel_tool_calls: false
+}, llmVendor.options);
+const toolCall = (result.choices[0]?.message.tool_calls ?? []).filter((tc => tc.type === "function" && tc.function.name === consent.name))?.[0];
+if (toolCall === undefined) {
+return null;
+}
+const input = (() => {
+const _io0 = input => "string" === typeof input.content && "string" === typeof input.reply;
+const __is = input => "object" === typeof input && null !== input && _io0(input);
+return input => {
+input = JSON.parse(input);
+return __is(input) ? input : null;
+};
+})()(toolCall.function.arguments);
+return input !== null ? input.reply : null;
+}
+
+function success(props) {
+return successInner(props).result;
+}
+
+function successInner(props) {
+const call = (expected, overrideOperations) => successInner({
+expected,
+operations: overrideOperations ?? props.operations,
+strict: props.strict
+});
+switch (props.expected.type) {
+case "array":
+{
+let take = 0;
+const targetIterator = props.expected.items[Symbol.iterator]();
+let targeted = targetIterator.next();
+while (true) {
+if (targeted.done === true) {
+return {
+result: true,
+take
 };
-})()
-} ]
-}.functions[0];
-const result = await agent["props"].vendor.api.chat.completions.create({
-model: agent["props"].vendor.model,
-messages: [ {
-role: "system",
-content: [ "You are an helpful assistant.", "", "If what the assistant said seems like to asking for", "user's consent about some function calling at the next step,", "use the tools appropriately to step to the next." ].join("\n")
-}, {
-role: "assistant",
-content: last.text
-} ],
-tools: [ {
-type: "function",
-function: {
-name: consent.name,
-description: consent.description,
-parameters: consent.parameters
 }
-
-
-
-
-
-
-
-
-const _io0 = input => "string" === typeof input.content && "string" === typeof input.reply;
-return input => "object" === typeof input && null !== input && _io0(input);
-})()(input) ? input.reply : null;
-};
-AgenticaBenchmarkPredicator.success = props => successInner(props).result;
-const successInner = props => {
-const call = (expected, overrideOperations) => successInner({
-expected,
-operations: overrideOperations ?? props.operations,
-strict: props.strict
-});
-switch (props.expected.type) {
-case "array":
-{
-let take = 0;
-const targetIterator = props.expected.items[Symbol.iterator]();
-let targeted = targetIterator.next();
-while (true) {
-if (targeted.done) {
-return {
-result: true,
-take
-};
-}
-if (take >= props.operations.length) {
-return {
-result: false
-};
-}
-const result = call(targeted.value, props.operations.slice(take));
-if (!result.result) {
-if (!props.strict) {
-take += 1;
-continue;
-}
+if (take >= props.operations.length) {
+return {
+result: false
+};
+}
+const result = call(targeted.value, props.operations.slice(take));
+if (!result.result) {
+if (props.strict === true) {
 return {
 result: false
 };
 }
-take +=
-
+take += 1;
+continue;
 }
+take += result.take;
+targeted = targetIterator.next();
 }
+}
 
-
-
-
-
-
-return {
-result,
-take: 1
-};
-}
+case "standalone":
+{
+const target = props.expected.operation;
+const result = props.operations.some((op => op.name === target.name));
+if (result) {
 return {
-result
+result,
+take: 1
 };
 }
-
-case "anyOf":
-for (const expected of props.expected.anyOf) {
-const callResult = call(expected);
-if (callResult.result) {
-return callResult;
-}
-}
 return {
-result
+result
 };
+}
 
-
-
-
-
-
-
-
-
-
+case "anyOf":
+for (const expected of props.expected.anyOf) {
+const callResult = call(expected);
+if (callResult.result) {
+return callResult;
+}
+}
+return {
+result: false
+};
+
+case "allOf":
+{
+const result = props.expected.allOf.map((expected => call(expected)));
+if (result.every((r => r.result))) {
 return {
-result:
+result: true,
+take: result.reduce(((acc, r) => Math.max(acc, r.take)), 0)
 };
 }
+return {
+result: false
+};
 }
-}
-}
-
-var MathUtil;
+}
+}
 
-
-
-}
+const MathUtil = {
+round: value => Math.floor(value * 100) / 100
+};
 
-
+const AgenticaBenchmarkUtil = {
+errorToJson,
+expectedToJson
+};
 
-
-
-
+function errorToJson(error) {
+if (error instanceof Error) {
+return {
 ...error,
 name: error.name,
 message: error.message,
 stack: error.stack
 };
-
-
-
-
+}
+return error;
+}
+
+function expectedToJson(expected) {
+if (expected.type === "standalone") {
+return {
 type: expected.type,
 operation: {
 name: expected.operation.name,
 description: expected.operation.function.description
 }
-};
+};
+} else if (expected.type === "array") {
+return {
 type: expected.type,
-items: expected.items.map(
-};
+items: expected.items.map(expectedToJson)
+};
+} else if (expected.type === "allOf") {
+return {
 type: expected.type,
-allOf: expected.allOf.map(
-};
+allOf: expected.allOf.map(expectedToJson)
+};
+} else {
+return {
 type: expected.type,
-anyOf: expected.anyOf.map(
+anyOf: expected.anyOf.map(expectedToJson)
 };
-}
-}
+}
+}
 
-
+const AgenticaPromptReporter = {
+markdown: markdown$2
+};
 
-
-
-
-
-
-
+function markdown$2(p) {
+if (p.type === "text") {
+return [ `### Text (${p.role})`, p.text, "" ].join("\n");
+} else if (p.type === "select" || p.type === "cancel") {
+return [ `### ${p.type === "select" ? "Select" : "Cancel"}`, ...p.selections.flatMap((s => {
+const functionDescriptionCount = s.operation.function.description?.length ?? 0;
+return [ `#### ${s.operation.name}`, ` - controller: ${s.operation.controller.name}`, ` - function: ${s.operation.function.name}`, ` - reason: ${s.reason}`, "", ...functionDescriptionCount > 0 ? [ s.operation.function.description, "" ] : [] ];
+})) ].join("\n");
+} else if (p.type === "describe") {
+return [ "### Describe", ...p.executes.map((e => ` - ${e.operation.name}`)), "", ...p.text.split("\n").map((s => `> ${s}`)), "" ].join("\n");
+}
+return [ "### Execute", ` - name: ${p.operation.name}`, ` - controller: ${p.operation.controller.name}`, ` - function: ${p.operation.function.name}`, "", "```json", JSON.stringify(p.arguments, null, 2), "```", "" ].join("\n");
+}
 
-
+const AgenticaCallBenchmarkReporter = {
+markdown: markdown$1
+};
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+function markdown$1(result) {
+return Object.fromEntries([ [ "./README.md", writeIndex$1(result) ], ...result.experiments.map((exp => [ [ `./${exp.scenario.name}/README.md`, writeExperimentIndex$1(exp) ], ...exp.events.map(((event, i) => [ `./${exp.scenario.name}/${i + 1}.${event.type}.md`, writeExperimentEvent$1(event, i) ])) ])).flat() ]);
+}
+
+function writeIndex$1(result) {
+const events = result.experiments.map((r => r.events)).flat();
+const average = events.map((e => e.completed_at.getTime() - e.started_at.getTime())).reduce(((a, b) => a + b), 0) / events.length;
+const aggregate = result.usage.aggregate;
+return [ "# LLM Function Call Benchmark", "## Summary", ` - Aggregation:`, ` - Scenarios: #${result.experiments.length.toLocaleString()}`, ` - Trial: ${events.length}`, ` - Success: ${events.filter((e => e.type === "success")).length}`, ` - Failure: ${events.filter((e => e.type === "failure")).length}`, ` - Average Time: ${MathUtil.round(average).toLocaleString()} ms`, ` - Token Usage`, ` - Total: ${aggregate.total.toLocaleString()}`, ` - Input`, ` - Total: ${aggregate.input.total.toLocaleString()}`, ` - Cached: ${aggregate.input.cached.toLocaleString()}`, ` - Output:`, ` - Total: ${aggregate.output.total.toLocaleString()}`, ` - Reasoning: ${aggregate.output.reasoning.toLocaleString()}`, ` - Accepted Prediction: ${aggregate.output.accepted_prediction.toLocaleString()}`, ` - Rejected Prediction: ${aggregate.output.rejected_prediction.toLocaleString()}`, "", "## Experiments", " Name | Select | Call | Time/Avg ", ":-----|:-------|:-----|----------:", ...result.experiments.map((exp => [ `[${exp.scenario.name}](./${exp.scenario.name}/README.md)`, drawStatus(exp.events, (e => e.type !== "error" && e.select === true)), drawStatus(exp.events, (e => e.type !== "error" && e.call === true)), `${MathUtil.round(exp.events.map((e => e.completed_at.getTime() - e.started_at.getTime())).reduce(((a, b) => a + b), 0) / exp.events.length).toLocaleString()} ms` ].join(" | "))) ].join("\n");
+}
+
+function writeExperimentIndex$1(exp) {
+return [ `# ${exp.scenario.name}`, "## Summary", ` - Scenarios: #${exp.events.length.toLocaleString()}`, ` - Success: ${exp.events.filter((e => e.type === "success")).length}`, ` - Failure: ${exp.events.filter((e => e.type === "failure")).length}`, ` - Average Time: ${MathUtil.round(exp.events.map((e => e.completed_at.getTime() - e.started_at.getTime())).reduce(((a, b) => a + b), 0) / exp.events.length).toLocaleString()} ms`, "", "## Events", " Name | Type | Time", ":-----|:-----|----:", ...exp.events.map(((e, i) => [ `[${i + 1}.](./${i + 1}.${e.type}.md)`, e.type, `${MathUtil.round(e.completed_at.getTime() - e.started_at.getTime())} ms` ].join(" | "))), "", "## Scenario", "### User Prompt", exp.scenario.text, "", "### Expected", "```json", JSON.stringify(AgenticaBenchmarkUtil.expectedToJson(exp.scenario.expected), null, 2), "```" ].join("\n");
+}
+
+function writeExperimentEvent$1(event, index) {
+return [ `# ${index + 1}. ${event.type}`, "## Summary", ` - Name: ${event.scenario.name}`, ` - Type: ${event.type}`, ` - Time: ${MathUtil.round(event.completed_at.getTime() - event.started_at.getTime()).toLocaleString()} ms`, ...event.type !== "error" ? [ ` - Select: ${event.select ? "✅" : "❌"}`, ` - Call: ${event.call ? "✅" : "❌"}` ] : [], ` - Token Usage:`, ` - Total: ${JSON.stringify(event.usage.aggregate.total)}`, ` - Input`, ` - Total: ${event.usage.aggregate.input.total}`, ` - Cached: ${event.usage.aggregate.input.cached}`, ` - Output:`, ` - Total: ${event.usage.aggregate.output.total}`, ` - Accepted Prediction: ${event.usage.aggregate.output.accepted_prediction}`, ` - Reasoning: ${event.usage.aggregate.output.reasoning}`, ` - Rejected Prediction: ${event.usage.aggregate.output.rejected_prediction}`, "", "## Scenario", "### User Prompt", event.scenario.text, "", "### Expected", "```json", JSON.stringify(AgenticaBenchmarkUtil.expectedToJson(event.scenario.expected), null, 2), "```", "", "## Prompt Histories", ...event.prompts.map(AgenticaPromptReporter.markdown), "", ...event.type === "error" ? [ "## Error", "```json", JSON.stringify(AgenticaBenchmarkUtil.errorToJson(event.error), null, 2), "```" ] : [] ].join("\n");
+}
+
+function drawStatus(events, success) {
+const count = Math.floor(events.filter(success).length / events.length * 10);
+return Array.from({
+length: count
+}).fill("■").join("") + Array.from({
+length: 10 - count
+}).fill("□").join("");
+}
 
 class AgenticaCallBenchmark {
 constructor(props) {
@@ -271,29 +319,36 @@ class AgenticaCallBenchmark {
 async execute(listener) {
 const started_at = new Date;
 const semaphore = new Semaphore(this.config_.simultaneous);
-const
-const events = await Promise.all(
+const task = this.scenarios_.map((async scenario => {
+const events = await Promise.all(Array.from({
+length: this.config_.repeat
+}).map((async () => {
 await semaphore.acquire();
 const e = await this.step(scenario);
 await semaphore.release();
-if (listener !== undefined)
+if (listener !== undefined) {
+listener(e);
+}
 return e;
 })));
 return {
 scenario,
 events,
-usage: events.filter((e => e.type !== "error")).map((e => e.usage)).reduce(AgenticaTokenUsage.plus, AgenticaTokenUsage.zero())
+usage: events.filter((e => e.type !== "error")).map((e => e.usage)).reduce(((acc, cur) => AgenticaTokenUsage.plus(acc, cur)), AgenticaTokenUsage.zero())
 };
-}))
+}));
+const experiments = await Promise.all(task);
 return this.result_ = {
 experiments,
 started_at,
 completed_at: new Date,
-usage: experiments.map((p => p.usage)).reduce(AgenticaTokenUsage.plus, AgenticaTokenUsage.zero())
+usage: experiments.map((p => p.usage)).reduce(((acc, cur) => AgenticaTokenUsage.plus(acc, cur)), AgenticaTokenUsage.zero())
 };
 }
 report() {
-if (this.result_ === null)
+if (this.result_ === null) {
+throw new Error("Benchmark is not executed yet.");
+}
 return AgenticaCallBenchmarkReporter.markdown(this.result_);
 }
 async step(scenario) {
@@ -324,12 +379,18 @@ class AgenticaCallBenchmark {
 };
 try {
 await agent.conversate(scenario.text);
-if (success())
+if (success()) {
+return out();
+}
 for (let i = 0; i < this.config_.consent; ++i) {
 const next = await AgenticaBenchmarkPredicator.isNext(agent);
-if (next === null)
+if (next === null) {
+break;
+}
 await agent.conversate(next);
-if (success())
+if (success()) {
+return out();
+}
 }
 return out();
 } catch (error) {
@@ -346,25 +407,37 @@ class AgenticaCallBenchmark {
 }
 }
 
-
+const AgenticaSelectBenchmarkReporter = {
+markdown
+};
+
+function markdown(result) {
+const iterator = [ [ "./README.md", writeIndex(result) ], ...result.experiments.map((exp => [ [ `./${exp.scenario.name}/README.md`, writeExperimentIndex(exp) ], ...exp.events.map(((event, i) => [ `./${exp.scenario.name}/${i + 1}.${event.type}.md`, writeExperimentEvent(event, i) ])) ])).flat() ];
+return Object.fromEntries(iterator);
+}
+
+function writeIndex(result) {
+const events = result.experiments.map((r => r.events)).flat();
+const average = events.map((e => e.completed_at.getTime() - e.started_at.getTime())).reduce(((a, b) => a + b), 0) / events.length;
+const aggregate = result.usage.aggregate;
+return [ "# LLM Function Selection Benchmark", "## Summary", ` - Aggregation:`, ` - Scenarios: #${result.experiments.length.toLocaleString()}`, ` - Trial: ${events.length}`, ` - Success: ${events.filter((e => e.type === "success")).length}`, ` - Failure: ${events.filter((e => e.type === "failure")).length}`, ` - Average Time: ${MathUtil.round(average).toLocaleString()} ms`, ` - Token Usage`, ` - Total: ${aggregate.total.toLocaleString()}`, ` - Input`, ` - Total: ${aggregate.input.total.toLocaleString()}`, ` - Cached: ${aggregate.input.cached.toLocaleString()}`, ` - Output:`, ` - Total: ${aggregate.output.total.toLocaleString()}`, ` - Accepted Prediction: ${aggregate.output.accepted_prediction.toLocaleString()}`, ` - Reasoning: ${aggregate.output.reasoning.toLocaleString()}`, ` - Rejected Prediction: ${aggregate.output.rejected_prediction.toLocaleString()}`, "", "## Experiments", " Name | Status | Time/Avg ", ":-----|:-------|----------:", ...result.experiments.map((exp => [ `[${exp.scenario.name}](./${exp.scenario.name}/README.md)`, (() => {
+const success = Math.floor(exp.events.filter((e => e.type === "success")).length / exp.events.length * 10);
+return Array.from({
+length: success
+}).fill("■").join("") + Array.from({
+length: 10 - success
+}).fill("□").join("");
+})(), `${MathUtil.round(exp.events.map((event => event.completed_at.getTime() - event.started_at.getTime())).reduce(((a, b) => a + b), 0) / exp.events.length).toLocaleString()} ms` ].join(" | "))) ].join("\n");
+}
+
+function writeExperimentIndex(exp) {
+const aggregate = exp.usage.aggregate;
+return [ `# ${exp.scenario.name}`, "## Summary", " - Aggregation:", ` - Trial: ${exp.events.length}`, ` - Success: ${exp.events.filter((e => e.type === "success")).length}`, ` - Failure: ${exp.events.filter((e => e.type === "failure")).length}`, ` - Average Time: ${MathUtil.round(exp.events.map((event => event.completed_at.getTime() - event.started_at.getTime())).reduce(((a, b) => a + b), 0) / exp.events.length).toLocaleString()} ms`, ` - Token Usage`, ` - Total: ${aggregate.total.toLocaleString()}`, ` - Input`, ` - Total: ${aggregate.input.total.toLocaleString()}`, ` - Cached: ${aggregate.input.cached.toLocaleString()}`, ` - Output:`, ` - Total: ${aggregate.output.total.toLocaleString()}`, ` - Accepted Prediction: ${aggregate.output.accepted_prediction.toLocaleString()}`, ` - Reasoning: ${aggregate.output.reasoning.toLocaleString()}`, ` - Rejected Prediction: ${aggregate.output.rejected_prediction.toLocaleString()}`, "", "## Events", " No | Type | Time", "---:|:-----|----:", ...exp.events.map(((e, i) => [ `[${i + 1}.](./${i + 1}.${e.type}.md)`, e.type, `${MathUtil.round(e.completed_at.getTime() - e.started_at.getTime())} ms` ].join(" | "))), "", "## Scenario", "### User Prompt", exp.scenario.text, "", "### Expected", "```json", JSON.stringify(AgenticaBenchmarkUtil.expectedToJson(exp.scenario.expected), null, 2), "```" ].join("\n");
+}
 
-
-
-
-const events = result.experiments.map((r => r.events)).flat();
-const average = events.map((e => e.completed_at.getTime() - e.started_at.getTime())).reduce(((a, b) => a + b), 0) / events.length;
-const aggregate = result.usage.aggregate;
-return [ "# LLM Function Selection Benchmark", "## Summary", ` - Aggregation:`, ` - Scenarios: #${result.experiments.length.toLocaleString()}`, ` - Trial: ${events.length}`, ` - Success: ${events.filter((e => e.type === "success")).length}`, ` - Failure: ${events.filter((e => e.type === "failure")).length}`, ` - Average Time: ${MathUtil.round(average).toLocaleString()} ms`, ` - Token Usage`, ` - Total: ${aggregate.total.toLocaleString()}`, ` - Input`, ` - Total: ${aggregate.input.total.toLocaleString()}`, ` - Cached: ${aggregate.input.cached.toLocaleString()}`, ` - Output:`, ` - Total: ${aggregate.output.total.toLocaleString()}`, ` - Accepted Prediction: ${aggregate.output.accepted_prediction.toLocaleString()}`, ` - Reasoning: ${aggregate.output.reasoning.toLocaleString()}`, ` - Rejected Prediction: ${aggregate.output.rejected_prediction.toLocaleString()}`, "", "## Experiments", " Name | Status | Time/Avg ", ":-----|:-------|----------:", ...result.experiments.map((exp => [ `[${exp.scenario.name}](./${exp.scenario.name}/README.md)`, (() => {
-const success = Math.floor(exp.events.filter((e => e.type === "success")).length / exp.events.length * 10);
-return new Array(success).fill("■").join("") + new Array(10 - success).fill("□").join("");
-})(), MathUtil.round(exp.events.map((event => event.completed_at.getTime() - event.started_at.getTime())).reduce(((a, b) => a + b), 0) / exp.events.length).toLocaleString() + " ms" ].join(" | "))) ].join("\n");
-};
-const writeExperimentIndex = exp => {
-const aggregate = exp.usage.aggregate;
-return [ `# ${exp.scenario.name}`, "## Summary", " - Aggregation:", ` - Trial: ${exp.events.length}`, ` - Success: ${exp.events.filter((e => e.type === "success")).length}`, ` - Failure: ${exp.events.filter((e => e.type === "failure")).length}`, ` - Average Time: ${MathUtil.round(exp.events.map((event => event.completed_at.getTime() - event.started_at.getTime())).reduce(((a, b) => a + b), 0) / exp.events.length).toLocaleString()} ms`, ` - Token Usage`, ` - Total: ${aggregate.total.toLocaleString()}`, ` - Input`, ` - Total: ${aggregate.input.total.toLocaleString()}`, ` - Cached: ${aggregate.input.cached.toLocaleString()}`, ` - Output:`, ` - Total: ${aggregate.output.total.toLocaleString()}`, ` - Accepted Prediction: ${aggregate.output.accepted_prediction.toLocaleString()}`, ` - Reasoning: ${aggregate.output.reasoning.toLocaleString()}`, ` - Rejected Prediction: ${aggregate.output.rejected_prediction.toLocaleString()}`, "", "## Events", " No | Type | Time", "---:|:-----|----:", ...exp.events.map(((e, i) => [ `[${i + 1}.](./${i + 1}.${e.type}.md)`, e.type, MathUtil.round(e.completed_at.getTime() - e.started_at.getTime()) + " ms" ].join(" | "))), "", "## Scenario", "### User Prompt", exp.scenario.text, "", "### Expected", "```json", JSON.stringify(AgenticaBenchmarkUtil.expectedToJson(exp.scenario.expected), null, 2), "```" ].join("\n");
-};
-const writeExperimentEvent = (event, index) => [ `# ${index + 1}. ${event.type}`, `## Summary`, ` - Name: ${event.scenario.name}`, ` - Type: ${event.type}`, ` - Time: ${(event.completed_at.getTime() - event.started_at.getTime()).toLocaleString()} ms`, ...event.type !== "error" ? [ " - Token Usage", ` - Total: ${event.usage.aggregate.toLocaleString()}`, ` - Prompt`, ` - Total: ${event.usage.aggregate.input.total.toLocaleString()}`, ` - Cached: ${event.usage.aggregate.input.cached.toLocaleString()}`, ` - Completion:`, ` - Total: ${event.usage.aggregate.output.total.toLocaleString()}`, ` - Reasoning: ${event.usage.aggregate.output.reasoning.toLocaleString()}`, ` - Accepted Prediction: ${event.usage.aggregate.output.accepted_prediction.toLocaleString()}`, ` - Rejected Prediction: ${event.usage.aggregate.output.rejected_prediction.toLocaleString()}` ] : [], "", "## Scenario", "### User Prompt", event.scenario.text, "", "### Expected", "```json", JSON.stringify(AgenticaBenchmarkUtil.expectedToJson(event.scenario.expected), null, 2), "```", "", ...event.type === "success" || event.type === "failure" ? [ "## Result", ...event.selected.map((s => [ `### ${s.operation.name}`, ` - Controller: \`${s.operation.controller.name}\``, ` - Function: \`${s.operation.function.name}\``, ` - Reason: ${s.reason}`, "", ...s.operation.function.description ? [ s.operation.function.description, "" ] : [] ].join("\n"))) ] : [], ...event.type === "error" ? [ "## Error", "```json", AgenticaBenchmarkUtil.errorToJson(JSON.stringify(event.error, null, 2)), "```", "" ] : [] ].join("\n");
-})(AgenticaSelectBenchmarkReporter || (AgenticaSelectBenchmarkReporter = {}));
+function writeExperimentEvent(event, index) {
+return [ `# ${index + 1}. ${event.type}`, `## Summary`, ` - Name: ${event.scenario.name}`, ` - Type: ${event.type}`, ` - Time: ${(event.completed_at.getTime() - event.started_at.getTime()).toLocaleString()} ms`, ...event.type !== "error" ? [ " - Token Usage", ` - Total: ${event.usage.aggregate.toLocaleString()}`, ` - Prompt`, ` - Total: ${event.usage.aggregate.input.total.toLocaleString()}`, ` - Cached: ${event.usage.aggregate.input.cached.toLocaleString()}`, ` - Completion:`, ` - Total: ${event.usage.aggregate.output.total.toLocaleString()}`, ` - Reasoning: ${event.usage.aggregate.output.reasoning.toLocaleString()}`, ` - Accepted Prediction: ${event.usage.aggregate.output.accepted_prediction.toLocaleString()}`, ` - Rejected Prediction: ${event.usage.aggregate.output.rejected_prediction.toLocaleString()}` ] : [], "", "## Scenario", "### User Prompt", event.scenario.text, "", "### Expected", "```json", JSON.stringify(AgenticaBenchmarkUtil.expectedToJson(event.scenario.expected), null, 2), "```", "", ...event.type === "success" || event.type === "failure" ? [ "## Result", ...event.selected.map((s => [ `### ${s.operation.name}`, ` - Controller: \`${s.operation.controller.name}\``, ` - Function: \`${s.operation.function.name}\``, ` - Reason: ${s.reason}`, "", ...s.operation.function.description !== undefined && s.operation.function.description !== "" ? [ s.operation.function.description, "" ] : [] ].join("\n"))) ] : [], ...event.type === "error" ? [ "## Error", "```json", AgenticaBenchmarkUtil.errorToJson(JSON.stringify(event.error, null, 2)), "```", "" ] : [] ].join("\n");
+}
 
 class AgenticaSelectBenchmark {
 constructor(props) {
@@ -381,28 +454,34 @@ class AgenticaSelectBenchmark {
 const started_at = new Date;
 const semaphore = new Semaphore(this.config_.simultaneous);
 const experiments = await Promise.all(this.scenarios_.map((async scenario => {
-const events = await Promise.all(
+const events = await Promise.all(Array.from({
+length: this.config_.repeat
+}).map((async () => {
 await semaphore.acquire();
 const e = await this.step(scenario);
 await semaphore.release();
-if (listener !== undefined)
+if (listener !== undefined) {
+listener(e);
+}
 return e;
 })));
 return {
 scenario,
 events,
-usage: events.filter((e => e.type !== "error")).map((e => e.usage)).reduce(AgenticaTokenUsage.plus, AgenticaTokenUsage.zero())
+usage: events.filter((e => e.type !== "error")).map((e => e.usage)).reduce(((acc, cur) => AgenticaTokenUsage.plus(acc, cur)), AgenticaTokenUsage.zero())
 };
 })));
 return this.result_ = {
 experiments,
 started_at,
 completed_at: new Date,
-usage: experiments.map((p => p.usage)).reduce(AgenticaTokenUsage.plus, AgenticaTokenUsage.zero())
+usage: experiments.map((p => p.usage)).reduce(((acc, cur) => AgenticaTokenUsage.plus(acc, cur)), AgenticaTokenUsage.zero())
 };
 }
 report() {
-if (this.result_ === null)
+if (this.result_ === null) {
+throw new Error("Benchmark is not executed yet.");
+}
 return AgenticaSelectBenchmarkReporter.markdown(this.result_);
 }
 async step(scenario) {