@autobe/benchmark 0.30.0-dev.20260315 → 0.30.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +661 -661
- package/lib/example/AutoBeExampleLogger.js +16 -16
- package/lib/replay/AutoBeReplayDocumentation.js +39 -39
- package/package.json +4 -4
- package/src/example/AutoBeExampleArchiver.ts +381 -381
- package/src/example/AutoBeExampleBenchmark.ts +190 -190
- package/src/example/AutoBeExampleLogger.ts +85 -85
- package/src/example/AutoBeExampleStorage.ts +289 -289
- package/src/example/index.ts +4 -4
- package/src/index.ts +2 -2
- package/src/replay/AutoBeReplayComputer.ts +183 -183
- package/src/replay/AutoBeReplayDocumentation.ts +176 -176
- package/src/replay/AutoBeReplayStorage.ts +116 -116
- package/src/replay/index.ts +3 -3
- package/src/structures/IAutoBeExampleBenchmarkState.ts +30 -30
- package/src/structures/index.ts +1 -1
- package/README.md +0 -261
|
@@ -8,28 +8,28 @@ const utils_1 = require("@autobe/utils");
|
|
|
8
8
|
const typia_1 = __importDefault(require("typia"));
|
|
9
9
|
var AutoBeExampleLogger;
|
|
10
10
|
(function (AutoBeExampleLogger) {
|
|
11
|
-
AutoBeExampleLogger.markdown = (state) => utils_1.StringUtil.trim `
|
|
12
|
-
# AutoBe Example Benchmark Report
|
|
13
|
-
|
|
14
|
-
${markdownIndex(state)}
|
|
15
|
-
|
|
16
|
-
${state.vendors.map(markdownVendor).join("\n\n")}
|
|
11
|
+
AutoBeExampleLogger.markdown = (state) => utils_1.StringUtil.trim `
|
|
12
|
+
# AutoBe Example Benchmark Report
|
|
13
|
+
|
|
14
|
+
${markdownIndex(state)}
|
|
15
|
+
|
|
16
|
+
${state.vendors.map(markdownVendor).join("\n\n")}
|
|
17
17
|
`;
|
|
18
|
-
const markdownIndex = (state) => utils_1.StringUtil.trim `
|
|
19
|
-
## Table of Contents
|
|
20
|
-
|
|
18
|
+
const markdownIndex = (state) => utils_1.StringUtil.trim `
|
|
19
|
+
## Table of Contents
|
|
20
|
+
|
|
21
21
|
${state.vendors
|
|
22
22
|
.map((vendor) => `- [\`${vendor.name}\`](#${vendor.name
|
|
23
23
|
.replaceAll("/", "")
|
|
24
24
|
.replaceAll(":", "")})`)
|
|
25
|
-
.join("\n")}
|
|
25
|
+
.join("\n")}
|
|
26
26
|
`;
|
|
27
|
-
const markdownVendor = (state) => utils_1.StringUtil.trim `
|
|
28
|
-
## \`${state.name}\`
|
|
29
|
-
|
|
30
|
-
Project | Phase | State | Count | Elapsed Time
|
|
31
|
-
:-------|:------|:------|------:|-------------:
|
|
32
|
-
${state.projects.map(markdownProject).join("\n")}
|
|
27
|
+
const markdownVendor = (state) => utils_1.StringUtil.trim `
|
|
28
|
+
## \`${state.name}\`
|
|
29
|
+
|
|
30
|
+
Project | Phase | State | Count | Elapsed Time
|
|
31
|
+
:-------|:------|:------|------:|-------------:
|
|
32
|
+
${state.projects.map(markdownProject).join("\n")}
|
|
33
33
|
`;
|
|
34
34
|
const markdownProject = (state) => {
|
|
35
35
|
var _a, _b;
|
|
@@ -6,13 +6,13 @@ const AutoBeExampleStorage_1 = require("../example/AutoBeExampleStorage");
|
|
|
6
6
|
var AutoBeReplayDocumentation;
|
|
7
7
|
(function (AutoBeReplayDocumentation) {
|
|
8
8
|
AutoBeReplayDocumentation.readme = (experiments) => {
|
|
9
|
-
return utils_1.StringUtil.trim `
|
|
10
|
-
# AutoBe Generated Examples
|
|
11
|
-
|
|
12
|
-
## Benchmark
|
|
13
|
-
|
|
14
|
-
AI Model | Success | Score | FCSR | Status
|
|
15
|
-
:--------|---------|------:|-----:|:------:
|
|
9
|
+
return utils_1.StringUtil.trim `
|
|
10
|
+
# AutoBe Generated Examples
|
|
11
|
+
|
|
12
|
+
## Benchmark
|
|
13
|
+
|
|
14
|
+
AI Model | Success | Score | FCSR | Status
|
|
15
|
+
:--------|---------|------:|-----:|:------:
|
|
16
16
|
${experiments
|
|
17
17
|
.map((e) => [
|
|
18
18
|
`[\`${AutoBeExampleStorage_1.AutoBeExampleStorage.slugModel(e.vendor, false)}\`](#${AutoBeExampleStorage_1.AutoBeExampleStorage.slugModel(e.vendor, false)
|
|
@@ -29,15 +29,15 @@ var AutoBeReplayDocumentation;
|
|
|
29
29
|
})(),
|
|
30
30
|
e.emoji,
|
|
31
31
|
].join(" | "))
|
|
32
|
-
.join("\n")}
|
|
33
|
-
|
|
34
|
-
- FCSR: Function Calling Success Rate
|
|
35
|
-
- Status:
|
|
36
|
-
- 🟢: All projects completed successfully
|
|
37
|
-
- 🟡: Some projects failed
|
|
38
|
-
- ❌: All projects failed or not executed
|
|
39
|
-
|
|
40
|
-
${experiments.map(vendor).join("\n\n\n")}
|
|
32
|
+
.join("\n")}
|
|
33
|
+
|
|
34
|
+
- FCSR: Function Calling Success Rate
|
|
35
|
+
- Status:
|
|
36
|
+
- 🟢: All projects completed successfully
|
|
37
|
+
- 🟡: Some projects failed
|
|
38
|
+
- ❌: All projects failed or not executed
|
|
39
|
+
|
|
40
|
+
${experiments.map(vendor).join("\n\n\n")}
|
|
41
41
|
`;
|
|
42
42
|
};
|
|
43
43
|
const vendor = (exp) => {
|
|
@@ -64,23 +64,23 @@ var AutoBeReplayDocumentation;
|
|
|
64
64
|
phase(found.realize),
|
|
65
65
|
].join(" | ");
|
|
66
66
|
};
|
|
67
|
-
return utils_1.StringUtil.trim `
|
|
68
|
-
## \`${exp.vendor}\`
|
|
69
|
-
|
|
70
|
-
Project | Score | Analyze | Prisma | Interface | Test | Realize
|
|
71
|
-
:-------|------:|:-------:|:------:|:----------|:----:|:-------:
|
|
72
|
-
${row("todo")}
|
|
73
|
-
${row("bbs")}
|
|
74
|
-
${row("reddit")}
|
|
75
|
-
${row("shopping")}
|
|
76
|
-
|
|
67
|
+
return utils_1.StringUtil.trim `
|
|
68
|
+
## \`${exp.vendor}\`
|
|
69
|
+
|
|
70
|
+
Project | Score | Analyze | Prisma | Interface | Test | Realize
|
|
71
|
+
:-------|------:|:-------:|:------:|:----------|:----:|:-------:
|
|
72
|
+
${row("todo")}
|
|
73
|
+
${row("bbs")}
|
|
74
|
+
${row("reddit")}
|
|
75
|
+
${row("shopping")}
|
|
76
|
+
|
|
77
77
|
${exp.replays
|
|
78
78
|
.map((r) => project({
|
|
79
79
|
replay: r,
|
|
80
80
|
// biome-ignore lint: intended
|
|
81
81
|
score: exp.score[r.project],
|
|
82
82
|
}))
|
|
83
|
-
.join("\n\n\n")}
|
|
83
|
+
.join("\n\n\n")}
|
|
84
84
|
`;
|
|
85
85
|
};
|
|
86
86
|
const project = (props) => {
|
|
@@ -101,22 +101,22 @@ var AutoBeReplayDocumentation;
|
|
|
101
101
|
100) + "%",
|
|
102
102
|
].join(" | ");
|
|
103
103
|
};
|
|
104
|
-
return utils_1.StringUtil.trim `
|
|
105
|
-
### \`${props.replay.vendor}\` - \`${props.replay.project}\`
|
|
106
|
-
|
|
107
|
-
- Source Code: ${`[\`${AutoBeExampleStorage_1.AutoBeExampleStorage.slugModel(props.replay.vendor, false)}/${props.replay.project}\`](./${AutoBeExampleStorage_1.AutoBeExampleStorage.slugModel(props.replay.vendor, false)}/${props.replay.project}/)`}
|
|
108
|
-
- Score: ${props.score}
|
|
109
|
-
- Elapsed Time: ${formatElapsedTime(props.replay.elapsed)}
|
|
110
|
-
- Token Usage: ${formatTokens(props.replay.aggregates.total.tokenUsage.total)}
|
|
104
|
+
return utils_1.StringUtil.trim `
|
|
105
|
+
### \`${props.replay.vendor}\` - \`${props.replay.project}\`
|
|
106
|
+
|
|
107
|
+
- Source Code: ${`[\`${AutoBeExampleStorage_1.AutoBeExampleStorage.slugModel(props.replay.vendor, false)}/${props.replay.project}\`](./${AutoBeExampleStorage_1.AutoBeExampleStorage.slugModel(props.replay.vendor, false)}/${props.replay.project}/)`}
|
|
108
|
+
- Score: ${props.score}
|
|
109
|
+
- Elapsed Time: ${formatElapsedTime(props.replay.elapsed)}
|
|
110
|
+
- Token Usage: ${formatTokens(props.replay.aggregates.total.tokenUsage.total)}
|
|
111
111
|
- Function Calling Success Rate: ${((props.replay.aggregates.total.metric.success /
|
|
112
112
|
props.replay.aggregates.total.metric.attempt) *
|
|
113
|
-
100).toFixed(2)}%
|
|
114
|
-
|
|
115
|
-
Phase | Generated | Token Usage | Elapsed Time | FCSR
|
|
116
|
-
:-----|:----------|------------:|-------------:|------:
|
|
113
|
+
100).toFixed(2)}%
|
|
114
|
+
|
|
115
|
+
Phase | Generated | Token Usage | Elapsed Time | FCSR
|
|
116
|
+
:-----|:----------|------------:|-------------:|------:
|
|
117
117
|
${["analyze", "database", "interface", "test", "realize"]
|
|
118
118
|
.map((key) => phase(key))
|
|
119
|
-
.join("\n")}
|
|
119
|
+
.join("\n")}
|
|
120
120
|
`;
|
|
121
121
|
};
|
|
122
122
|
})(AutoBeReplayDocumentation || (exports.AutoBeReplayDocumentation = AutoBeReplayDocumentation = {}));
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@autobe/benchmark",
|
|
3
|
-
"version": "0.30.0-dev.20260315",
|
|
3
|
+
"version": "0.30.0",
|
|
4
4
|
"description": "AI backend server code generator",
|
|
5
5
|
"main": "lib/index.js",
|
|
6
6
|
"keywords": [],
|
|
@@ -27,9 +27,9 @@
|
|
|
27
27
|
"tstl": "^3.0.0",
|
|
28
28
|
"typia": "^12.0.1",
|
|
29
29
|
"uuid": "^11.1.0",
|
|
30
|
-
"@autobe/filesystem": "^0.30.0-dev.20260315",
|
|
31
|
-
"@autobe/
|
|
32
|
-
"@autobe/
|
|
30
|
+
"@autobe/filesystem": "^0.30.0",
|
|
31
|
+
"@autobe/interface": "^0.30.0",
|
|
32
|
+
"@autobe/utils": "^0.30.0"
|
|
33
33
|
},
|
|
34
34
|
"devDependencies": {
|
|
35
35
|
"@types/uuid": "^10.0.0",
|