peerbench 0.0.11 → 0.0.12
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/benchmarks/examples/echo-basic/schema-sets/echo.v1.d.ts +13 -13
- package/dist/benchmarks/examples/exact-match-scorer/runner.d.ts +1 -1
- package/dist/benchmarks/examples/exact-match-scorer/schema-sets/exact-match.v1.d.ts +13 -13
- package/dist/benchmarks/examples/text-transform/runner.d.ts +2 -2
- package/dist/benchmarks/examples/text-transform/schema-sets/echo.v1.d.ts +13 -13
- package/dist/benchmarks/examples/text-transform/schema-sets/reverse.v1.d.ts +13 -13
- package/dist/benchmarks/index.js +1 -1
- package/dist/benchmarks/peerbench/mcq-runner.d.ts +1 -1
- package/dist/benchmarks/peerbench/qa-runner.d.ts +1 -1
- package/dist/benchmarks/peerbench/schema-sets/mcq.v1.d.ts +13 -13
- package/dist/benchmarks/peerbench/schema-sets/multi-turn.v1.d.ts +13 -13
- package/dist/benchmarks/peerbench/schema-sets/qa.v1.d.ts +13 -13
- package/dist/{chunk-TRNCF2BG.js → chunk-HBGC6BDW.js} +1 -1
- package/dist/chunk-HBGC6BDW.js.map +1 -0
- package/dist/dev.d.ts +22 -0
- package/dist/providers/ai-sdk.d.ts +24 -0
- package/dist/providers/callables/llm.d.ts +3 -0
- package/dist/providers/index.d.ts +1 -0
- package/dist/providers/index.js +116 -0
- package/dist/providers/index.js.map +1 -1
- package/dist/schemas/extensions/index.js +1 -1
- package/dist/schemas/extensions/response/llm.d.ts +17 -0
- package/dist/schemas/llm/simple-system-prompt.d.ts +3 -3
- package/dist/schemas/llm/system-prompt.d.ts +7 -7
- package/dist/schemas/response.d.ts +7 -7
- package/dist/schemas/schema-definer.d.ts +5 -5
- package/dist/schemas/score.d.ts +7 -7
- package/dist/schemas/test-case.d.ts +7 -7
- package/package.json +5 -3
- package/dist/chunk-TRNCF2BG.js.map +0 -1
|
@@ -42,7 +42,7 @@ export declare const EchoBasicTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
42
42
|
schemaVersion: z.ZodNumber;
|
|
43
43
|
kind: z.ZodString;
|
|
44
44
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
45
|
-
}, "kind" | "
|
|
45
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
46
46
|
input: z.ZodString;
|
|
47
47
|
} & {
|
|
48
48
|
namespace: z.ZodLiteral<"example.peerbench.ai">;
|
|
@@ -56,7 +56,7 @@ export declare const EchoBasicTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
56
56
|
kind: "llm/echo-basic.tc";
|
|
57
57
|
schemaVersion: 1;
|
|
58
58
|
metadata?: Record<string, unknown> | undefined;
|
|
59
|
-
}, "kind" | "
|
|
59
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
60
60
|
id: string;
|
|
61
61
|
input: string;
|
|
62
62
|
namespace: "example.peerbench.ai";
|
|
@@ -71,7 +71,7 @@ export declare const EchoBasicTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
71
71
|
kind: "llm/echo-basic.tc";
|
|
72
72
|
schemaVersion: 1;
|
|
73
73
|
metadata?: Record<string, unknown> | undefined;
|
|
74
|
-
}, "
|
|
74
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
75
75
|
id: string;
|
|
76
76
|
input: string;
|
|
77
77
|
namespace: "example.peerbench.ai";
|
|
@@ -90,7 +90,7 @@ export declare const EchoBasicResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
90
90
|
completedAt: z.ZodNumber;
|
|
91
91
|
testCaseId: z.ZodString;
|
|
92
92
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
93
|
-
}, "kind" | "
|
|
93
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
94
94
|
data: z.ZodString;
|
|
95
95
|
modelSlug: z.ZodString;
|
|
96
96
|
provider: z.ZodString;
|
|
@@ -121,7 +121,7 @@ export declare const EchoBasicResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
121
121
|
outputTokensUsed?: number | undefined;
|
|
122
122
|
inputCost?: string | undefined;
|
|
123
123
|
outputCost?: string | undefined;
|
|
124
|
-
}, "kind" | "
|
|
124
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
125
125
|
id: string;
|
|
126
126
|
testCaseId: string;
|
|
127
127
|
startedAt: number;
|
|
@@ -156,7 +156,7 @@ export declare const EchoBasicResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
156
156
|
outputTokensUsed?: number | undefined;
|
|
157
157
|
inputCost?: string | undefined;
|
|
158
158
|
outputCost?: string | undefined;
|
|
159
|
-
}, "
|
|
159
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
160
160
|
id: string;
|
|
161
161
|
testCaseId: string;
|
|
162
162
|
startedAt: number;
|
|
@@ -190,25 +190,25 @@ export declare const EchoBasicScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
190
190
|
readonly human: "human";
|
|
191
191
|
readonly algo: "algo";
|
|
192
192
|
}>;
|
|
193
|
-
}, "kind" | "
|
|
193
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
194
194
|
namespace: z.ZodLiteral<"example.peerbench.ai">;
|
|
195
195
|
kind: z.ZodLiteral<"llm/echo-basic.sc">;
|
|
196
196
|
schemaVersion: z.ZodLiteral<1>;
|
|
197
197
|
}, z.core.$strip> & {
|
|
198
198
|
new: (input: Omit<{
|
|
199
|
-
value: number;
|
|
200
199
|
id: string;
|
|
201
200
|
responseId: string;
|
|
201
|
+
value: number;
|
|
202
202
|
scoringMethod: "ai" | "human" | "algo";
|
|
203
203
|
namespace: "example.peerbench.ai";
|
|
204
204
|
kind: "llm/echo-basic.sc";
|
|
205
205
|
schemaVersion: 1;
|
|
206
206
|
explanation?: string | undefined;
|
|
207
207
|
metadata?: Record<string, unknown> | undefined;
|
|
208
|
-
}, "kind" | "
|
|
209
|
-
value: number;
|
|
208
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
210
209
|
id: string;
|
|
211
210
|
responseId: string;
|
|
211
|
+
value: number;
|
|
212
212
|
scoringMethod: "ai" | "human" | "algo";
|
|
213
213
|
namespace: "example.peerbench.ai";
|
|
214
214
|
kind: "llm/echo-basic.sc";
|
|
@@ -217,19 +217,19 @@ export declare const EchoBasicScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
217
217
|
metadata?: Record<string, unknown> | undefined;
|
|
218
218
|
};
|
|
219
219
|
newWithId(input: Omit<{
|
|
220
|
-
value: number;
|
|
221
220
|
id: string;
|
|
222
221
|
responseId: string;
|
|
222
|
+
value: number;
|
|
223
223
|
scoringMethod: "ai" | "human" | "algo";
|
|
224
224
|
namespace: "example.peerbench.ai";
|
|
225
225
|
kind: "llm/echo-basic.sc";
|
|
226
226
|
schemaVersion: 1;
|
|
227
227
|
explanation?: string | undefined;
|
|
228
228
|
metadata?: Record<string, unknown> | undefined;
|
|
229
|
-
}, "
|
|
230
|
-
value: number;
|
|
229
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
231
230
|
id: string;
|
|
232
231
|
responseId: string;
|
|
232
|
+
value: number;
|
|
233
233
|
scoringMethod: "ai" | "human" | "algo";
|
|
234
234
|
namespace: "example.peerbench.ai";
|
|
235
235
|
kind: "llm/echo-basic.sc";
|
|
@@ -34,9 +34,9 @@ export declare const exactMatchScorerRunner: (params: {
|
|
|
34
34
|
outputCost?: string | undefined;
|
|
35
35
|
};
|
|
36
36
|
score: {
|
|
37
|
-
value: number;
|
|
38
37
|
id: string;
|
|
39
38
|
responseId: string;
|
|
39
|
+
value: number;
|
|
40
40
|
scoringMethod: "ai" | "human" | "algo";
|
|
41
41
|
match: boolean;
|
|
42
42
|
namespace: "example.peerbench.ai";
|
|
@@ -7,7 +7,7 @@ export declare const ExactMatchTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
7
7
|
schemaVersion: z.ZodNumber;
|
|
8
8
|
kind: z.ZodString;
|
|
9
9
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
10
|
-
}, "kind" | "
|
|
10
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
11
11
|
instruction: z.ZodString;
|
|
12
12
|
input: z.ZodString;
|
|
13
13
|
expectedOutput: z.ZodString;
|
|
@@ -27,7 +27,7 @@ export declare const ExactMatchTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
27
27
|
schemaVersion: 1;
|
|
28
28
|
metadata?: Record<string, unknown> | undefined;
|
|
29
29
|
normalize?: boolean | undefined;
|
|
30
|
-
}, "kind" | "
|
|
30
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
31
31
|
id: string;
|
|
32
32
|
instruction: string;
|
|
33
33
|
input: string;
|
|
@@ -48,7 +48,7 @@ export declare const ExactMatchTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
48
48
|
schemaVersion: 1;
|
|
49
49
|
metadata?: Record<string, unknown> | undefined;
|
|
50
50
|
normalize?: boolean | undefined;
|
|
51
|
-
}, "
|
|
51
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
52
52
|
id: string;
|
|
53
53
|
instruction: string;
|
|
54
54
|
input: string;
|
|
@@ -70,7 +70,7 @@ export declare const ExactMatchResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
70
70
|
completedAt: z.ZodNumber;
|
|
71
71
|
testCaseId: z.ZodString;
|
|
72
72
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
73
|
-
}, "kind" | "
|
|
73
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
74
74
|
data: z.ZodString;
|
|
75
75
|
modelSlug: z.ZodString;
|
|
76
76
|
provider: z.ZodString;
|
|
@@ -101,7 +101,7 @@ export declare const ExactMatchResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
101
101
|
outputTokensUsed?: number | undefined;
|
|
102
102
|
inputCost?: string | undefined;
|
|
103
103
|
outputCost?: string | undefined;
|
|
104
|
-
}, "kind" | "
|
|
104
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
105
105
|
id: string;
|
|
106
106
|
testCaseId: string;
|
|
107
107
|
startedAt: number;
|
|
@@ -136,7 +136,7 @@ export declare const ExactMatchResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
136
136
|
outputTokensUsed?: number | undefined;
|
|
137
137
|
inputCost?: string | undefined;
|
|
138
138
|
outputCost?: string | undefined;
|
|
139
|
-
}, "
|
|
139
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
140
140
|
id: string;
|
|
141
141
|
testCaseId: string;
|
|
142
142
|
startedAt: number;
|
|
@@ -170,7 +170,7 @@ export declare const ExactMatchScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
170
170
|
readonly human: "human";
|
|
171
171
|
readonly algo: "algo";
|
|
172
172
|
}>;
|
|
173
|
-
}, "kind" | "
|
|
173
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
174
174
|
match: z.ZodBoolean;
|
|
175
175
|
normalized: z.ZodOptional<z.ZodObject<{
|
|
176
176
|
expected: z.ZodString;
|
|
@@ -190,9 +190,9 @@ export declare const ExactMatchScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
190
190
|
schemaVersion: z.ZodLiteral<1>;
|
|
191
191
|
}, z.core.$strip> & {
|
|
192
192
|
new: (input: Omit<{
|
|
193
|
-
value: number;
|
|
194
193
|
id: string;
|
|
195
194
|
responseId: string;
|
|
195
|
+
value: number;
|
|
196
196
|
scoringMethod: "ai" | "human" | "algo";
|
|
197
197
|
match: boolean;
|
|
198
198
|
namespace: "example.peerbench.ai";
|
|
@@ -212,10 +212,10 @@ export declare const ExactMatchScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
212
212
|
scorerAIOutputTokensUsed?: number | undefined;
|
|
213
213
|
scorerAIInputCost?: string | undefined;
|
|
214
214
|
scorerAIOutputCost?: string | undefined;
|
|
215
|
-
}, "kind" | "
|
|
216
|
-
value: number;
|
|
215
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
217
216
|
id: string;
|
|
218
217
|
responseId: string;
|
|
218
|
+
value: number;
|
|
219
219
|
scoringMethod: "ai" | "human" | "algo";
|
|
220
220
|
match: boolean;
|
|
221
221
|
namespace: "example.peerbench.ai";
|
|
@@ -237,9 +237,9 @@ export declare const ExactMatchScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
237
237
|
scorerAIOutputCost?: string | undefined;
|
|
238
238
|
};
|
|
239
239
|
newWithId(input: Omit<{
|
|
240
|
-
value: number;
|
|
241
240
|
id: string;
|
|
242
241
|
responseId: string;
|
|
242
|
+
value: number;
|
|
243
243
|
scoringMethod: "ai" | "human" | "algo";
|
|
244
244
|
match: boolean;
|
|
245
245
|
namespace: "example.peerbench.ai";
|
|
@@ -259,10 +259,10 @@ export declare const ExactMatchScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
259
259
|
scorerAIOutputTokensUsed?: number | undefined;
|
|
260
260
|
scorerAIInputCost?: string | undefined;
|
|
261
261
|
scorerAIOutputCost?: string | undefined;
|
|
262
|
-
}, "
|
|
263
|
-
value: number;
|
|
262
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
264
263
|
id: string;
|
|
265
264
|
responseId: string;
|
|
265
|
+
value: number;
|
|
266
266
|
scoringMethod: "ai" | "human" | "algo";
|
|
267
267
|
match: boolean;
|
|
268
268
|
namespace: "example.peerbench.ai";
|
|
@@ -30,9 +30,9 @@ export declare const textTransformRunner: (params: {
|
|
|
30
30
|
outputCost?: string | undefined;
|
|
31
31
|
};
|
|
32
32
|
score: {
|
|
33
|
-
value: number;
|
|
34
33
|
id: string;
|
|
35
34
|
responseId: string;
|
|
35
|
+
value: number;
|
|
36
36
|
scoringMethod: "ai" | "human" | "algo";
|
|
37
37
|
match: boolean;
|
|
38
38
|
namespace: "example.peerbench.ai";
|
|
@@ -61,9 +61,9 @@ export declare const textTransformRunner: (params: {
|
|
|
61
61
|
outputCost?: string | undefined;
|
|
62
62
|
};
|
|
63
63
|
score: {
|
|
64
|
-
value: number;
|
|
65
64
|
id: string;
|
|
66
65
|
responseId: string;
|
|
66
|
+
value: number;
|
|
67
67
|
scoringMethod: "ai" | "human" | "algo";
|
|
68
68
|
match: boolean;
|
|
69
69
|
expected: string;
|
|
@@ -6,7 +6,7 @@ export declare const TextTransformEchoTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
6
6
|
schemaVersion: z.ZodNumber;
|
|
7
7
|
kind: z.ZodString;
|
|
8
8
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
9
|
-
}, "kind" | "
|
|
9
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
10
10
|
input: z.ZodString;
|
|
11
11
|
} & {
|
|
12
12
|
namespace: z.ZodLiteral<"example.peerbench.ai">;
|
|
@@ -20,7 +20,7 @@ export declare const TextTransformEchoTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
20
20
|
kind: "llm/text-transform-echo.tc";
|
|
21
21
|
schemaVersion: 1;
|
|
22
22
|
metadata?: Record<string, unknown> | undefined;
|
|
23
|
-
}, "kind" | "
|
|
23
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
24
24
|
id: string;
|
|
25
25
|
input: string;
|
|
26
26
|
namespace: "example.peerbench.ai";
|
|
@@ -35,7 +35,7 @@ export declare const TextTransformEchoTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
35
35
|
kind: "llm/text-transform-echo.tc";
|
|
36
36
|
schemaVersion: 1;
|
|
37
37
|
metadata?: Record<string, unknown> | undefined;
|
|
38
|
-
}, "
|
|
38
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
39
39
|
id: string;
|
|
40
40
|
input: string;
|
|
41
41
|
namespace: "example.peerbench.ai";
|
|
@@ -54,7 +54,7 @@ export declare const TextTransformEchoResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
54
54
|
completedAt: z.ZodNumber;
|
|
55
55
|
testCaseId: z.ZodString;
|
|
56
56
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
57
|
-
}, "kind" | "
|
|
57
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
58
58
|
data: z.ZodString;
|
|
59
59
|
modelSlug: z.ZodString;
|
|
60
60
|
provider: z.ZodString;
|
|
@@ -85,7 +85,7 @@ export declare const TextTransformEchoResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
85
85
|
outputTokensUsed?: number | undefined;
|
|
86
86
|
inputCost?: string | undefined;
|
|
87
87
|
outputCost?: string | undefined;
|
|
88
|
-
}, "kind" | "
|
|
88
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
89
89
|
id: string;
|
|
90
90
|
testCaseId: string;
|
|
91
91
|
startedAt: number;
|
|
@@ -120,7 +120,7 @@ export declare const TextTransformEchoResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
120
120
|
outputTokensUsed?: number | undefined;
|
|
121
121
|
inputCost?: string | undefined;
|
|
122
122
|
outputCost?: string | undefined;
|
|
123
|
-
}, "
|
|
123
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
124
124
|
id: string;
|
|
125
125
|
testCaseId: string;
|
|
126
126
|
startedAt: number;
|
|
@@ -154,7 +154,7 @@ export declare const TextTransformEchoScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
154
154
|
readonly human: "human";
|
|
155
155
|
readonly algo: "algo";
|
|
156
156
|
}>;
|
|
157
|
-
}, "kind" | "
|
|
157
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
158
158
|
match: z.ZodBoolean;
|
|
159
159
|
} & {
|
|
160
160
|
namespace: z.ZodLiteral<"example.peerbench.ai">;
|
|
@@ -162,9 +162,9 @@ export declare const TextTransformEchoScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
162
162
|
schemaVersion: z.ZodLiteral<1>;
|
|
163
163
|
}, z.core.$strip> & {
|
|
164
164
|
new: (input: Omit<{
|
|
165
|
-
value: number;
|
|
166
165
|
id: string;
|
|
167
166
|
responseId: string;
|
|
167
|
+
value: number;
|
|
168
168
|
scoringMethod: "ai" | "human" | "algo";
|
|
169
169
|
match: boolean;
|
|
170
170
|
namespace: "example.peerbench.ai";
|
|
@@ -172,10 +172,10 @@ export declare const TextTransformEchoScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
172
172
|
schemaVersion: 1;
|
|
173
173
|
explanation?: string | undefined;
|
|
174
174
|
metadata?: Record<string, unknown> | undefined;
|
|
175
|
-
}, "kind" | "
|
|
176
|
-
value: number;
|
|
175
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
177
176
|
id: string;
|
|
178
177
|
responseId: string;
|
|
178
|
+
value: number;
|
|
179
179
|
scoringMethod: "ai" | "human" | "algo";
|
|
180
180
|
match: boolean;
|
|
181
181
|
namespace: "example.peerbench.ai";
|
|
@@ -185,9 +185,9 @@ export declare const TextTransformEchoScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
185
185
|
metadata?: Record<string, unknown> | undefined;
|
|
186
186
|
};
|
|
187
187
|
newWithId(input: Omit<{
|
|
188
|
-
value: number;
|
|
189
188
|
id: string;
|
|
190
189
|
responseId: string;
|
|
190
|
+
value: number;
|
|
191
191
|
scoringMethod: "ai" | "human" | "algo";
|
|
192
192
|
match: boolean;
|
|
193
193
|
namespace: "example.peerbench.ai";
|
|
@@ -195,10 +195,10 @@ export declare const TextTransformEchoScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
195
195
|
schemaVersion: 1;
|
|
196
196
|
explanation?: string | undefined;
|
|
197
197
|
metadata?: Record<string, unknown> | undefined;
|
|
198
|
-
}, "
|
|
199
|
-
value: number;
|
|
198
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
200
199
|
id: string;
|
|
201
200
|
responseId: string;
|
|
201
|
+
value: number;
|
|
202
202
|
scoringMethod: "ai" | "human" | "algo";
|
|
203
203
|
match: boolean;
|
|
204
204
|
namespace: "example.peerbench.ai";
|
|
@@ -6,7 +6,7 @@ export declare const TextTransformReverseTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
6
6
|
schemaVersion: z.ZodNumber;
|
|
7
7
|
kind: z.ZodString;
|
|
8
8
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
9
|
-
}, "kind" | "
|
|
9
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
10
10
|
input: z.ZodString;
|
|
11
11
|
} & {
|
|
12
12
|
namespace: z.ZodLiteral<"example.peerbench.ai">;
|
|
@@ -20,7 +20,7 @@ export declare const TextTransformReverseTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
20
20
|
kind: "llm/text-transform-reverse.tc";
|
|
21
21
|
schemaVersion: 1;
|
|
22
22
|
metadata?: Record<string, unknown> | undefined;
|
|
23
|
-
}, "kind" | "
|
|
23
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
24
24
|
id: string;
|
|
25
25
|
input: string;
|
|
26
26
|
namespace: "example.peerbench.ai";
|
|
@@ -35,7 +35,7 @@ export declare const TextTransformReverseTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
35
35
|
kind: "llm/text-transform-reverse.tc";
|
|
36
36
|
schemaVersion: 1;
|
|
37
37
|
metadata?: Record<string, unknown> | undefined;
|
|
38
|
-
}, "
|
|
38
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
39
39
|
id: string;
|
|
40
40
|
input: string;
|
|
41
41
|
namespace: "example.peerbench.ai";
|
|
@@ -54,7 +54,7 @@ export declare const TextTransformReverseResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
54
54
|
completedAt: z.ZodNumber;
|
|
55
55
|
testCaseId: z.ZodString;
|
|
56
56
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
57
|
-
}, "kind" | "
|
|
57
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
58
58
|
data: z.ZodString;
|
|
59
59
|
modelSlug: z.ZodString;
|
|
60
60
|
provider: z.ZodString;
|
|
@@ -85,7 +85,7 @@ export declare const TextTransformReverseResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
85
85
|
outputTokensUsed?: number | undefined;
|
|
86
86
|
inputCost?: string | undefined;
|
|
87
87
|
outputCost?: string | undefined;
|
|
88
|
-
}, "kind" | "
|
|
88
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
89
89
|
id: string;
|
|
90
90
|
testCaseId: string;
|
|
91
91
|
startedAt: number;
|
|
@@ -120,7 +120,7 @@ export declare const TextTransformReverseResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
120
120
|
outputTokensUsed?: number | undefined;
|
|
121
121
|
inputCost?: string | undefined;
|
|
122
122
|
outputCost?: string | undefined;
|
|
123
|
-
}, "
|
|
123
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
124
124
|
id: string;
|
|
125
125
|
testCaseId: string;
|
|
126
126
|
startedAt: number;
|
|
@@ -154,7 +154,7 @@ export declare const TextTransformReverseScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
154
154
|
readonly human: "human";
|
|
155
155
|
readonly algo: "algo";
|
|
156
156
|
}>;
|
|
157
|
-
}, "kind" | "
|
|
157
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
158
158
|
match: z.ZodBoolean;
|
|
159
159
|
expected: z.ZodString;
|
|
160
160
|
} & {
|
|
@@ -163,9 +163,9 @@ export declare const TextTransformReverseScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
163
163
|
schemaVersion: z.ZodLiteral<1>;
|
|
164
164
|
}, z.core.$strip> & {
|
|
165
165
|
new: (input: Omit<{
|
|
166
|
-
value: number;
|
|
167
166
|
id: string;
|
|
168
167
|
responseId: string;
|
|
168
|
+
value: number;
|
|
169
169
|
scoringMethod: "ai" | "human" | "algo";
|
|
170
170
|
match: boolean;
|
|
171
171
|
expected: string;
|
|
@@ -174,10 +174,10 @@ export declare const TextTransformReverseScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
174
174
|
schemaVersion: 1;
|
|
175
175
|
explanation?: string | undefined;
|
|
176
176
|
metadata?: Record<string, unknown> | undefined;
|
|
177
|
-
}, "kind" | "
|
|
178
|
-
value: number;
|
|
177
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
179
178
|
id: string;
|
|
180
179
|
responseId: string;
|
|
180
|
+
value: number;
|
|
181
181
|
scoringMethod: "ai" | "human" | "algo";
|
|
182
182
|
match: boolean;
|
|
183
183
|
expected: string;
|
|
@@ -188,9 +188,9 @@ export declare const TextTransformReverseScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
188
188
|
metadata?: Record<string, unknown> | undefined;
|
|
189
189
|
};
|
|
190
190
|
newWithId(input: Omit<{
|
|
191
|
-
value: number;
|
|
192
191
|
id: string;
|
|
193
192
|
responseId: string;
|
|
193
|
+
value: number;
|
|
194
194
|
scoringMethod: "ai" | "human" | "algo";
|
|
195
195
|
match: boolean;
|
|
196
196
|
expected: string;
|
|
@@ -199,10 +199,10 @@ export declare const TextTransformReverseScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
199
199
|
schemaVersion: 1;
|
|
200
200
|
explanation?: string | undefined;
|
|
201
201
|
metadata?: Record<string, unknown> | undefined;
|
|
202
|
-
}, "
|
|
203
|
-
value: number;
|
|
202
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../../index.js").IdGenerator): Promise<{
|
|
204
203
|
id: string;
|
|
205
204
|
responseId: string;
|
|
205
|
+
value: number;
|
|
206
206
|
scoringMethod: "ai" | "human" | "algo";
|
|
207
207
|
match: boolean;
|
|
208
208
|
expected: string;
|
package/dist/benchmarks/index.js
CHANGED
|
@@ -36,9 +36,9 @@ export declare const mcqRunner: (params: {
|
|
|
36
36
|
outputCost?: string | undefined;
|
|
37
37
|
};
|
|
38
38
|
score: {
|
|
39
|
-
value: number;
|
|
40
39
|
id: string;
|
|
41
40
|
responseId: string;
|
|
41
|
+
value: number;
|
|
42
42
|
scoringMethod: "ai" | "human" | "algo";
|
|
43
43
|
extractedAnswers: string[];
|
|
44
44
|
namespace: "peerbench.ai";
|
|
@@ -36,9 +36,9 @@ export declare const qaRunner: (params: {
|
|
|
36
36
|
outputCost?: string | undefined;
|
|
37
37
|
};
|
|
38
38
|
score: {
|
|
39
|
-
value: number;
|
|
40
39
|
id: string;
|
|
41
40
|
responseId: string;
|
|
41
|
+
value: number;
|
|
42
42
|
scoringMethod: "ai" | "human" | "algo";
|
|
43
43
|
namespace: "peerbench.ai";
|
|
44
44
|
kind: "llm/qa.sc";
|
|
@@ -6,7 +6,7 @@ export declare const MCQTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
6
6
|
schemaVersion: z.ZodNumber;
|
|
7
7
|
kind: z.ZodString;
|
|
8
8
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
9
|
-
}, "kind" | "
|
|
9
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
10
10
|
question: z.ZodString;
|
|
11
11
|
options: z.ZodRecord<z.ZodString, z.ZodString>;
|
|
12
12
|
correctAnswerKeys: z.ZodArray<z.ZodString>;
|
|
@@ -24,7 +24,7 @@ export declare const MCQTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
24
24
|
kind: "llm/mcq.tc";
|
|
25
25
|
schemaVersion: 1;
|
|
26
26
|
metadata?: Record<string, unknown> | undefined;
|
|
27
|
-
}, "kind" | "
|
|
27
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
28
28
|
id: string;
|
|
29
29
|
question: string;
|
|
30
30
|
options: Record<string, string>;
|
|
@@ -43,7 +43,7 @@ export declare const MCQTestCaseSchemaV1: z.ZodObject<Omit<{
|
|
|
43
43
|
kind: "llm/mcq.tc";
|
|
44
44
|
schemaVersion: 1;
|
|
45
45
|
metadata?: Record<string, unknown> | undefined;
|
|
46
|
-
}, "
|
|
46
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../index.js").IdGenerator): Promise<{
|
|
47
47
|
id: string;
|
|
48
48
|
question: string;
|
|
49
49
|
options: Record<string, string>;
|
|
@@ -64,7 +64,7 @@ export declare const MCQResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
64
64
|
completedAt: z.ZodNumber;
|
|
65
65
|
testCaseId: z.ZodString;
|
|
66
66
|
metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
|
|
67
|
-
}, "kind" | "
|
|
67
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
68
68
|
data: z.ZodString;
|
|
69
69
|
modelSlug: z.ZodString;
|
|
70
70
|
provider: z.ZodString;
|
|
@@ -95,7 +95,7 @@ export declare const MCQResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
95
95
|
outputTokensUsed?: number | undefined;
|
|
96
96
|
inputCost?: string | undefined;
|
|
97
97
|
outputCost?: string | undefined;
|
|
98
|
-
}, "kind" | "
|
|
98
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
99
99
|
id: string;
|
|
100
100
|
testCaseId: string;
|
|
101
101
|
startedAt: number;
|
|
@@ -130,7 +130,7 @@ export declare const MCQResponseSchemaV1: z.ZodObject<Omit<{
|
|
|
130
130
|
outputTokensUsed?: number | undefined;
|
|
131
131
|
inputCost?: string | undefined;
|
|
132
132
|
outputCost?: string | undefined;
|
|
133
|
-
}, "
|
|
133
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../index.js").IdGenerator): Promise<{
|
|
134
134
|
id: string;
|
|
135
135
|
testCaseId: string;
|
|
136
136
|
startedAt: number;
|
|
@@ -164,7 +164,7 @@ export declare const MCQScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
164
164
|
readonly human: "human";
|
|
165
165
|
readonly algo: "algo";
|
|
166
166
|
}>;
|
|
167
|
-
}, "kind" | "
|
|
167
|
+
}, "kind" | "schemaVersion" | "namespace"> & {
|
|
168
168
|
extractedAnswers: z.ZodArray<z.ZodString>;
|
|
169
169
|
scorerAISystemPrompt: z.ZodOptional<z.ZodString>;
|
|
170
170
|
scorerAISystemPromptId: z.ZodOptional<z.ZodString>;
|
|
@@ -180,9 +180,9 @@ export declare const MCQScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
180
180
|
schemaVersion: z.ZodLiteral<1>;
|
|
181
181
|
}, z.core.$strip> & {
|
|
182
182
|
new: (input: Omit<{
|
|
183
|
-
value: number;
|
|
184
183
|
id: string;
|
|
185
184
|
responseId: string;
|
|
185
|
+
value: number;
|
|
186
186
|
scoringMethod: "ai" | "human" | "algo";
|
|
187
187
|
extractedAnswers: string[];
|
|
188
188
|
namespace: "peerbench.ai";
|
|
@@ -198,10 +198,10 @@ export declare const MCQScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
198
198
|
scorerAIOutputTokensUsed?: number | undefined;
|
|
199
199
|
scorerAIInputCost?: string | undefined;
|
|
200
200
|
scorerAIOutputCost?: string | undefined;
|
|
201
|
-
}, "kind" | "
|
|
202
|
-
value: number;
|
|
201
|
+
}, "kind" | "schemaVersion" | "namespace">) => {
|
|
203
202
|
id: string;
|
|
204
203
|
responseId: string;
|
|
204
|
+
value: number;
|
|
205
205
|
scoringMethod: "ai" | "human" | "algo";
|
|
206
206
|
extractedAnswers: string[];
|
|
207
207
|
namespace: "peerbench.ai";
|
|
@@ -219,9 +219,9 @@ export declare const MCQScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
219
219
|
scorerAIOutputCost?: string | undefined;
|
|
220
220
|
};
|
|
221
221
|
newWithId(input: Omit<{
|
|
222
|
-
value: number;
|
|
223
222
|
id: string;
|
|
224
223
|
responseId: string;
|
|
224
|
+
value: number;
|
|
225
225
|
scoringMethod: "ai" | "human" | "algo";
|
|
226
226
|
extractedAnswers: string[];
|
|
227
227
|
namespace: "peerbench.ai";
|
|
@@ -237,10 +237,10 @@ export declare const MCQScoreSchemaV1: z.ZodObject<Omit<{
|
|
|
237
237
|
scorerAIOutputTokensUsed?: number | undefined;
|
|
238
238
|
scorerAIInputCost?: string | undefined;
|
|
239
239
|
scorerAIOutputCost?: string | undefined;
|
|
240
|
-
}, "
|
|
241
|
-
value: number;
|
|
240
|
+
}, "id" | "kind" | "schemaVersion" | "namespace">, generator: import("../../../index.js").IdGenerator): Promise<{
|
|
242
241
|
id: string;
|
|
243
242
|
responseId: string;
|
|
243
|
+
value: number;
|
|
244
244
|
scoringMethod: "ai" | "human" | "algo";
|
|
245
245
|
extractedAnswers: string[];
|
|
246
246
|
namespace: "peerbench.ai";
|