@mastra/evals 0.1.0-alpha.5 → 0.1.0-alpha.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (106) hide show
  1. package/CHANGELOG.md +6 -0
  2. package/dist/evals.cjs.development.js +371 -0
  3. package/dist/evals.cjs.development.js.map +1 -0
  4. package/dist/evals.cjs.production.min.js +2 -0
  5. package/dist/evals.cjs.production.min.js.map +1 -0
  6. package/dist/evals.esm.js +367 -0
  7. package/dist/evals.esm.js.map +1 -0
  8. package/dist/evaluation.d.ts +3 -0
  9. package/dist/evaluation.d.ts.map +1 -0
  10. package/dist/index.d.ts +2 -0
  11. package/dist/index.d.ts.map +1 -0
  12. package/dist/index.js +8 -0
  13. package/dist/llm.esm.js +2024 -0
  14. package/dist/llm.esm.js.map +1 -0
  15. package/dist/metrics/index.d.ts +3 -0
  16. package/dist/metrics/index.d.ts.map +1 -0
  17. package/dist/metrics/judge/index.d.ts +6 -0
  18. package/dist/metrics/judge/index.d.ts.map +1 -0
  19. package/dist/metrics/llm/answer-relevancy/index.d.ts +17 -0
  20. package/dist/metrics/llm/answer-relevancy/index.d.ts.map +1 -0
  21. package/dist/metrics/llm/answer-relevancy/metricJudge.d.ts +14 -0
  22. package/dist/metrics/llm/answer-relevancy/metricJudge.d.ts.map +1 -0
  23. package/dist/metrics/llm/answer-relevancy/prompts.d.ts +19 -0
  24. package/dist/metrics/llm/answer-relevancy/prompts.d.ts.map +1 -0
  25. package/dist/metrics/llm/bias/index.d.ts +15 -0
  26. package/dist/metrics/llm/bias/index.d.ts.map +1 -0
  27. package/dist/metrics/llm/bias/metricJudge.d.ts +10 -0
  28. package/dist/metrics/llm/bias/metricJudge.d.ts.map +1 -0
  29. package/dist/metrics/llm/bias/prompts.d.ts +10 -0
  30. package/dist/metrics/llm/bias/prompts.d.ts.map +1 -0
  31. package/dist/metrics/llm/context-position/index.d.ts +16 -0
  32. package/dist/metrics/llm/context-position/index.d.ts.map +1 -0
  33. package/dist/metrics/llm/context-position/metricJudge.d.ts +14 -0
  34. package/dist/metrics/llm/context-position/metricJudge.d.ts.map +1 -0
  35. package/dist/metrics/llm/context-position/prompts.d.ts +17 -0
  36. package/dist/metrics/llm/context-position/prompts.d.ts.map +1 -0
  37. package/dist/metrics/llm/context-precision/index.d.ts +16 -0
  38. package/dist/metrics/llm/context-precision/index.d.ts.map +1 -0
  39. package/dist/metrics/llm/context-precision/metricJudge.d.ts +15 -0
  40. package/dist/metrics/llm/context-precision/metricJudge.d.ts.map +1 -0
  41. package/dist/metrics/llm/context-precision/prompts.d.ts +17 -0
  42. package/dist/metrics/llm/context-precision/prompts.d.ts.map +1 -0
  43. package/dist/metrics/llm/context-relevancy/index.d.ts +16 -0
  44. package/dist/metrics/llm/context-relevancy/index.d.ts.map +1 -0
  45. package/dist/metrics/llm/context-relevancy/metricJudge.d.ts +11 -0
  46. package/dist/metrics/llm/context-relevancy/metricJudge.d.ts.map +1 -0
  47. package/dist/metrics/llm/context-relevancy/prompts.d.ts +7 -0
  48. package/dist/metrics/llm/context-relevancy/prompts.d.ts.map +1 -0
  49. package/dist/metrics/llm/contextual-recall/index.d.ts +16 -0
  50. package/dist/metrics/llm/contextual-recall/index.d.ts.map +1 -0
  51. package/dist/metrics/llm/contextual-recall/metricJudge.d.ts +10 -0
  52. package/dist/metrics/llm/contextual-recall/metricJudge.d.ts.map +1 -0
  53. package/dist/metrics/llm/contextual-recall/prompts.d.ts +7 -0
  54. package/dist/metrics/llm/contextual-recall/prompts.d.ts.map +1 -0
  55. package/dist/metrics/llm/faithfulness/index.d.ts +16 -0
  56. package/dist/metrics/llm/faithfulness/index.d.ts.map +1 -0
  57. package/dist/metrics/llm/faithfulness/metricJudge.d.ts +15 -0
  58. package/dist/metrics/llm/faithfulness/metricJudge.d.ts.map +1 -0
  59. package/dist/metrics/llm/faithfulness/prompts.d.ts +20 -0
  60. package/dist/metrics/llm/faithfulness/prompts.d.ts.map +1 -0
  61. package/dist/metrics/llm/hallucination/index.d.ts +16 -0
  62. package/dist/metrics/llm/hallucination/index.d.ts.map +1 -0
  63. package/dist/metrics/llm/hallucination/metricJudge.d.ts +15 -0
  64. package/dist/metrics/llm/hallucination/metricJudge.d.ts.map +1 -0
  65. package/dist/metrics/llm/hallucination/prompts.d.ts +17 -0
  66. package/dist/metrics/llm/hallucination/prompts.d.ts.map +1 -0
  67. package/dist/metrics/llm/index.d.ts +11 -0
  68. package/dist/metrics/llm/index.d.ts.map +1 -0
  69. package/dist/metrics/llm/prompt-alignment/index.d.ts +17 -0
  70. package/dist/metrics/llm/prompt-alignment/index.d.ts.map +1 -0
  71. package/dist/metrics/llm/prompt-alignment/metricJudge.d.ts +14 -0
  72. package/dist/metrics/llm/prompt-alignment/metricJudge.d.ts.map +1 -0
  73. package/dist/metrics/llm/prompt-alignment/prompts.d.ts +17 -0
  74. package/dist/metrics/llm/prompt-alignment/prompts.d.ts.map +1 -0
  75. package/dist/metrics/llm/summarization/index.d.ts +15 -0
  76. package/dist/metrics/llm/summarization/index.d.ts.map +1 -0
  77. package/dist/metrics/llm/summarization/metricJudge.d.ts +25 -0
  78. package/dist/metrics/llm/summarization/metricJudge.d.ts.map +1 -0
  79. package/dist/metrics/llm/summarization/prompts.d.ts +30 -0
  80. package/dist/metrics/llm/summarization/prompts.d.ts.map +1 -0
  81. package/dist/metrics/llm/toxicity/index.d.ts +15 -0
  82. package/dist/metrics/llm/toxicity/index.d.ts.map +1 -0
  83. package/dist/metrics/llm/toxicity/metricJudge.d.ts +14 -0
  84. package/dist/metrics/llm/toxicity/metricJudge.d.ts.map +1 -0
  85. package/dist/metrics/llm/toxicity/prompts.d.ts +13 -0
  86. package/dist/metrics/llm/toxicity/prompts.d.ts.map +1 -0
  87. package/dist/metrics/llm/utils.d.ts +17 -0
  88. package/dist/metrics/llm/utils.d.ts.map +1 -0
  89. package/dist/metrics/nlp/completeness/index.d.ts +12 -0
  90. package/dist/metrics/nlp/completeness/index.d.ts.map +1 -0
  91. package/dist/metrics/nlp/content-similarity/index.d.ts +11 -0
  92. package/dist/metrics/nlp/content-similarity/index.d.ts.map +1 -0
  93. package/dist/metrics/nlp/index.d.ts +6 -0
  94. package/dist/metrics/nlp/index.d.ts.map +1 -0
  95. package/dist/metrics/nlp/keyword-coverage/index.d.ts +9 -0
  96. package/dist/metrics/nlp/keyword-coverage/index.d.ts.map +1 -0
  97. package/dist/metrics/nlp/textual-difference/index.d.ts +9 -0
  98. package/dist/metrics/nlp/textual-difference/index.d.ts.map +1 -0
  99. package/dist/metrics/nlp/tone/index.d.ts +10 -0
  100. package/dist/metrics/nlp/tone/index.d.ts.map +1 -0
  101. package/dist/metrics/nlp/types.d.ts +12 -0
  102. package/dist/metrics/nlp/types.d.ts.map +1 -0
  103. package/dist/nlp.esm.js +240 -0
  104. package/dist/nlp.esm.js.map +1 -0
  105. package/package.json +6 -12
  106. package/src/metrics/llm/index.ts +2 -1
package/CHANGELOG.md CHANGED
@@ -1,5 +1,11 @@
1
1
  # @mastra/evals
2
2
 
3
+ ## 0.1.0-alpha.6
4
+
5
+ ### Patch Changes
6
+
7
+ - aea3c13: Fix evals export for llm and nlp
8
+
3
9
  ## 0.1.0-alpha.5
4
10
 
5
11
  ### Minor Changes
@@ -0,0 +1,371 @@
1
+ 'use strict';
2
+
3
+ Object.defineProperty(exports, '__esModule', { value: true });
4
+
5
+ var core = require('@mastra/core');
6
+
7
+ function asyncGeneratorStep(n, t, e, r, o, a, c) {
8
+ try {
9
+ var i = n[a](c),
10
+ u = i.value;
11
+ } catch (n) {
12
+ return void e(n);
13
+ }
14
+ i.done ? t(u) : Promise.resolve(u).then(r, o);
15
+ }
16
+ function _asyncToGenerator(n) {
17
+ return function () {
18
+ var t = this,
19
+ e = arguments;
20
+ return new Promise(function (r, o) {
21
+ var a = n.apply(t, e);
22
+ function _next(n) {
23
+ asyncGeneratorStep(a, r, o, _next, _throw, "next", n);
24
+ }
25
+ function _throw(n) {
26
+ asyncGeneratorStep(a, r, o, _next, _throw, "throw", n);
27
+ }
28
+ _next(void 0);
29
+ });
30
+ };
31
+ }
32
+ function _regeneratorRuntime() {
33
+ _regeneratorRuntime = function () {
34
+ return e;
35
+ };
36
+ var t,
37
+ e = {},
38
+ r = Object.prototype,
39
+ n = r.hasOwnProperty,
40
+ o = Object.defineProperty || function (t, e, r) {
41
+ t[e] = r.value;
42
+ },
43
+ i = "function" == typeof Symbol ? Symbol : {},
44
+ a = i.iterator || "@@iterator",
45
+ c = i.asyncIterator || "@@asyncIterator",
46
+ u = i.toStringTag || "@@toStringTag";
47
+ function define(t, e, r) {
48
+ return Object.defineProperty(t, e, {
49
+ value: r,
50
+ enumerable: !0,
51
+ configurable: !0,
52
+ writable: !0
53
+ }), t[e];
54
+ }
55
+ try {
56
+ define({}, "");
57
+ } catch (t) {
58
+ define = function (t, e, r) {
59
+ return t[e] = r;
60
+ };
61
+ }
62
+ function wrap(t, e, r, n) {
63
+ var i = e && e.prototype instanceof Generator ? e : Generator,
64
+ a = Object.create(i.prototype),
65
+ c = new Context(n || []);
66
+ return o(a, "_invoke", {
67
+ value: makeInvokeMethod(t, r, c)
68
+ }), a;
69
+ }
70
+ function tryCatch(t, e, r) {
71
+ try {
72
+ return {
73
+ type: "normal",
74
+ arg: t.call(e, r)
75
+ };
76
+ } catch (t) {
77
+ return {
78
+ type: "throw",
79
+ arg: t
80
+ };
81
+ }
82
+ }
83
+ e.wrap = wrap;
84
+ var h = "suspendedStart",
85
+ l = "suspendedYield",
86
+ f = "executing",
87
+ s = "completed",
88
+ y = {};
89
+ function Generator() {}
90
+ function GeneratorFunction() {}
91
+ function GeneratorFunctionPrototype() {}
92
+ var p = {};
93
+ define(p, a, function () {
94
+ return this;
95
+ });
96
+ var d = Object.getPrototypeOf,
97
+ v = d && d(d(values([])));
98
+ v && v !== r && n.call(v, a) && (p = v);
99
+ var g = GeneratorFunctionPrototype.prototype = Generator.prototype = Object.create(p);
100
+ function defineIteratorMethods(t) {
101
+ ["next", "throw", "return"].forEach(function (e) {
102
+ define(t, e, function (t) {
103
+ return this._invoke(e, t);
104
+ });
105
+ });
106
+ }
107
+ function AsyncIterator(t, e) {
108
+ function invoke(r, o, i, a) {
109
+ var c = tryCatch(t[r], t, o);
110
+ if ("throw" !== c.type) {
111
+ var u = c.arg,
112
+ h = u.value;
113
+ return h && "object" == typeof h && n.call(h, "__await") ? e.resolve(h.__await).then(function (t) {
114
+ invoke("next", t, i, a);
115
+ }, function (t) {
116
+ invoke("throw", t, i, a);
117
+ }) : e.resolve(h).then(function (t) {
118
+ u.value = t, i(u);
119
+ }, function (t) {
120
+ return invoke("throw", t, i, a);
121
+ });
122
+ }
123
+ a(c.arg);
124
+ }
125
+ var r;
126
+ o(this, "_invoke", {
127
+ value: function (t, n) {
128
+ function callInvokeWithMethodAndArg() {
129
+ return new e(function (e, r) {
130
+ invoke(t, n, e, r);
131
+ });
132
+ }
133
+ return r = r ? r.then(callInvokeWithMethodAndArg, callInvokeWithMethodAndArg) : callInvokeWithMethodAndArg();
134
+ }
135
+ });
136
+ }
137
+ function makeInvokeMethod(e, r, n) {
138
+ var o = h;
139
+ return function (i, a) {
140
+ if (o === f) throw Error("Generator is already running");
141
+ if (o === s) {
142
+ if ("throw" === i) throw a;
143
+ return {
144
+ value: t,
145
+ done: !0
146
+ };
147
+ }
148
+ for (n.method = i, n.arg = a;;) {
149
+ var c = n.delegate;
150
+ if (c) {
151
+ var u = maybeInvokeDelegate(c, n);
152
+ if (u) {
153
+ if (u === y) continue;
154
+ return u;
155
+ }
156
+ }
157
+ if ("next" === n.method) n.sent = n._sent = n.arg;else if ("throw" === n.method) {
158
+ if (o === h) throw o = s, n.arg;
159
+ n.dispatchException(n.arg);
160
+ } else "return" === n.method && n.abrupt("return", n.arg);
161
+ o = f;
162
+ var p = tryCatch(e, r, n);
163
+ if ("normal" === p.type) {
164
+ if (o = n.done ? s : l, p.arg === y) continue;
165
+ return {
166
+ value: p.arg,
167
+ done: n.done
168
+ };
169
+ }
170
+ "throw" === p.type && (o = s, n.method = "throw", n.arg = p.arg);
171
+ }
172
+ };
173
+ }
174
+ function maybeInvokeDelegate(e, r) {
175
+ var n = r.method,
176
+ o = e.iterator[n];
177
+ if (o === t) return r.delegate = null, "throw" === n && e.iterator.return && (r.method = "return", r.arg = t, maybeInvokeDelegate(e, r), "throw" === r.method) || "return" !== n && (r.method = "throw", r.arg = new TypeError("The iterator does not provide a '" + n + "' method")), y;
178
+ var i = tryCatch(o, e.iterator, r.arg);
179
+ if ("throw" === i.type) return r.method = "throw", r.arg = i.arg, r.delegate = null, y;
180
+ var a = i.arg;
181
+ return a ? a.done ? (r[e.resultName] = a.value, r.next = e.nextLoc, "return" !== r.method && (r.method = "next", r.arg = t), r.delegate = null, y) : a : (r.method = "throw", r.arg = new TypeError("iterator result is not an object"), r.delegate = null, y);
182
+ }
183
+ function pushTryEntry(t) {
184
+ var e = {
185
+ tryLoc: t[0]
186
+ };
187
+ 1 in t && (e.catchLoc = t[1]), 2 in t && (e.finallyLoc = t[2], e.afterLoc = t[3]), this.tryEntries.push(e);
188
+ }
189
+ function resetTryEntry(t) {
190
+ var e = t.completion || {};
191
+ e.type = "normal", delete e.arg, t.completion = e;
192
+ }
193
+ function Context(t) {
194
+ this.tryEntries = [{
195
+ tryLoc: "root"
196
+ }], t.forEach(pushTryEntry, this), this.reset(!0);
197
+ }
198
+ function values(e) {
199
+ if (e || "" === e) {
200
+ var r = e[a];
201
+ if (r) return r.call(e);
202
+ if ("function" == typeof e.next) return e;
203
+ if (!isNaN(e.length)) {
204
+ var o = -1,
205
+ i = function next() {
206
+ for (; ++o < e.length;) if (n.call(e, o)) return next.value = e[o], next.done = !1, next;
207
+ return next.value = t, next.done = !0, next;
208
+ };
209
+ return i.next = i;
210
+ }
211
+ }
212
+ throw new TypeError(typeof e + " is not iterable");
213
+ }
214
+ return GeneratorFunction.prototype = GeneratorFunctionPrototype, o(g, "constructor", {
215
+ value: GeneratorFunctionPrototype,
216
+ configurable: !0
217
+ }), o(GeneratorFunctionPrototype, "constructor", {
218
+ value: GeneratorFunction,
219
+ configurable: !0
220
+ }), GeneratorFunction.displayName = define(GeneratorFunctionPrototype, u, "GeneratorFunction"), e.isGeneratorFunction = function (t) {
221
+ var e = "function" == typeof t && t.constructor;
222
+ return !!e && (e === GeneratorFunction || "GeneratorFunction" === (e.displayName || e.name));
223
+ }, e.mark = function (t) {
224
+ return Object.setPrototypeOf ? Object.setPrototypeOf(t, GeneratorFunctionPrototype) : (t.__proto__ = GeneratorFunctionPrototype, define(t, u, "GeneratorFunction")), t.prototype = Object.create(g), t;
225
+ }, e.awrap = function (t) {
226
+ return {
227
+ __await: t
228
+ };
229
+ }, defineIteratorMethods(AsyncIterator.prototype), define(AsyncIterator.prototype, c, function () {
230
+ return this;
231
+ }), e.AsyncIterator = AsyncIterator, e.async = function (t, r, n, o, i) {
232
+ void 0 === i && (i = Promise);
233
+ var a = new AsyncIterator(wrap(t, r, n, o), i);
234
+ return e.isGeneratorFunction(r) ? a : a.next().then(function (t) {
235
+ return t.done ? t.value : a.next();
236
+ });
237
+ }, defineIteratorMethods(g), define(g, u, "Generator"), define(g, a, function () {
238
+ return this;
239
+ }), define(g, "toString", function () {
240
+ return "[object Generator]";
241
+ }), e.keys = function (t) {
242
+ var e = Object(t),
243
+ r = [];
244
+ for (var n in e) r.push(n);
245
+ return r.reverse(), function next() {
246
+ for (; r.length;) {
247
+ var t = r.pop();
248
+ if (t in e) return next.value = t, next.done = !1, next;
249
+ }
250
+ return next.done = !0, next;
251
+ };
252
+ }, e.values = values, Context.prototype = {
253
+ constructor: Context,
254
+ reset: function (e) {
255
+ if (this.prev = 0, this.next = 0, this.sent = this._sent = t, this.done = !1, this.delegate = null, this.method = "next", this.arg = t, this.tryEntries.forEach(resetTryEntry), !e) for (var r in this) "t" === r.charAt(0) && n.call(this, r) && !isNaN(+r.slice(1)) && (this[r] = t);
256
+ },
257
+ stop: function () {
258
+ this.done = !0;
259
+ var t = this.tryEntries[0].completion;
260
+ if ("throw" === t.type) throw t.arg;
261
+ return this.rval;
262
+ },
263
+ dispatchException: function (e) {
264
+ if (this.done) throw e;
265
+ var r = this;
266
+ function handle(n, o) {
267
+ return a.type = "throw", a.arg = e, r.next = n, o && (r.method = "next", r.arg = t), !!o;
268
+ }
269
+ for (var o = this.tryEntries.length - 1; o >= 0; --o) {
270
+ var i = this.tryEntries[o],
271
+ a = i.completion;
272
+ if ("root" === i.tryLoc) return handle("end");
273
+ if (i.tryLoc <= this.prev) {
274
+ var c = n.call(i, "catchLoc"),
275
+ u = n.call(i, "finallyLoc");
276
+ if (c && u) {
277
+ if (this.prev < i.catchLoc) return handle(i.catchLoc, !0);
278
+ if (this.prev < i.finallyLoc) return handle(i.finallyLoc);
279
+ } else if (c) {
280
+ if (this.prev < i.catchLoc) return handle(i.catchLoc, !0);
281
+ } else {
282
+ if (!u) throw Error("try statement without catch or finally");
283
+ if (this.prev < i.finallyLoc) return handle(i.finallyLoc);
284
+ }
285
+ }
286
+ }
287
+ },
288
+ abrupt: function (t, e) {
289
+ for (var r = this.tryEntries.length - 1; r >= 0; --r) {
290
+ var o = this.tryEntries[r];
291
+ if (o.tryLoc <= this.prev && n.call(o, "finallyLoc") && this.prev < o.finallyLoc) {
292
+ var i = o;
293
+ break;
294
+ }
295
+ }
296
+ i && ("break" === t || "continue" === t) && i.tryLoc <= e && e <= i.finallyLoc && (i = null);
297
+ var a = i ? i.completion : {};
298
+ return a.type = t, a.arg = e, i ? (this.method = "next", this.next = i.finallyLoc, y) : this.complete(a);
299
+ },
300
+ complete: function (t, e) {
301
+ if ("throw" === t.type) throw t.arg;
302
+ return "break" === t.type || "continue" === t.type ? this.next = t.arg : "return" === t.type ? (this.rval = this.arg = t.arg, this.method = "return", this.next = "end") : "normal" === t.type && e && (this.next = e), y;
303
+ },
304
+ finish: function (t) {
305
+ for (var e = this.tryEntries.length - 1; e >= 0; --e) {
306
+ var r = this.tryEntries[e];
307
+ if (r.finallyLoc === t) return this.complete(r.completion, r.afterLoc), resetTryEntry(r), y;
308
+ }
309
+ },
310
+ catch: function (t) {
311
+ for (var e = this.tryEntries.length - 1; e >= 0; --e) {
312
+ var r = this.tryEntries[e];
313
+ if (r.tryLoc === t) {
314
+ var n = r.completion;
315
+ if ("throw" === n.type) {
316
+ var o = n.arg;
317
+ resetTryEntry(r);
318
+ }
319
+ return o;
320
+ }
321
+ }
322
+ throw Error("illegal catch attempt");
323
+ },
324
+ delegateYield: function (e, r, n) {
325
+ return this.delegate = {
326
+ iterator: values(e),
327
+ resultName: r,
328
+ nextLoc: n
329
+ }, "next" === this.method && (this.arg = t), y;
330
+ }
331
+ }, e;
332
+ }
333
+
334
+ function evaluate(_x, _x2, _x3) {
335
+ return _evaluate.apply(this, arguments);
336
+ }
337
+ function _evaluate() {
338
+ _evaluate = _asyncToGenerator(/*#__PURE__*/_regeneratorRuntime().mark(function _callee(agent, input, metric) {
339
+ var agentOutput, metricResult;
340
+ return _regeneratorRuntime().wrap(function _callee$(_context) {
341
+ while (1) switch (_context.prev = _context.next) {
342
+ case 0:
343
+ _context.next = 2;
344
+ return agent.generate(input);
345
+ case 2:
346
+ agentOutput = _context.sent;
347
+ _context.next = 5;
348
+ return metric.measure({
349
+ input: input.toString(),
350
+ output: agentOutput.text
351
+ });
352
+ case 5:
353
+ metricResult = _context.sent;
354
+ // capture infomration about the evaluation
355
+ core.executeHook(core.AvailableHooks.ON_EVALUATION, {
356
+ input: input.toString(),
357
+ output: agentOutput.text,
358
+ result: metricResult
359
+ });
360
+ return _context.abrupt("return", metricResult);
361
+ case 8:
362
+ case "end":
363
+ return _context.stop();
364
+ }
365
+ }, _callee);
366
+ }));
367
+ return _evaluate.apply(this, arguments);
368
+ }
369
+
370
+ exports.evaluate = evaluate;
371
+ //# sourceMappingURL=evals.cjs.development.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"evals.cjs.development.js","sources":["../src/evaluation.ts"],"sourcesContent":["import { AvailableHooks, executeHook } from '@mastra/core';\nimport { type Agent, type Metric } from '@mastra/core';\n\nexport async function evaluate<T extends Agent>(agent: T, input: Parameters<T['generate']>[0], metric: Metric) {\n const agentOutput = await agent.generate(input);\n\n const metricResult = await metric.measure({\n input: input.toString(),\n output: agentOutput.text,\n });\n\n // capture infomration about the evaluation\n executeHook(AvailableHooks.ON_EVALUATION, {\n input: input.toString(),\n output: agentOutput.text,\n result: metricResult,\n });\n\n return metricResult;\n}\n"],"names":["evaluate","_x","_x2","_x3","_evaluate","apply","arguments","_asyncToGenerator","_regeneratorRuntime","mark","_callee","agent","input","metric","agentOutput","metricResult","wrap","_callee$","_context","prev","next","generate","sent","measure","toString","output","text","executeHook","AvailableHooks","ON_EVALUATION","result","abrupt","stop"],"mappings":";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAGA,SAAsBA,QAAQA,CAAAC,EAAA,EAAAC,GAAA,EAAAC,GAAA,EAAA;AAAA,EAAA,OAAAC,SAAA,CAAAC,KAAA,CAAA,IAAA,EAAAC,SAAA,CAAA,CAAA;AAAA,CAAA;AAgB7B,SAAAF,SAAA,GAAA;AAAAA,EAAAA,SAAA,GAAAG,iBAAA,cAAAC,mBAAA,EAAAC,CAAAA,IAAA,CAhBM,SAAAC,OAAyCC,CAAAA,KAAQ,EAAEC,KAAmC,EAAEC,MAAc,EAAA;IAAA,IAAAC,WAAA,EAAAC,YAAA,CAAA;AAAA,IAAA,OAAAP,mBAAA,EAAA,CAAAQ,IAAA,CAAA,SAAAC,SAAAC,QAAA,EAAA;AAAA,MAAA,OAAA,CAAA,EAAA,QAAAA,QAAA,CAAAC,IAAA,GAAAD,QAAA,CAAAE,IAAA;AAAA,QAAA,KAAA,CAAA;AAAAF,UAAAA,QAAA,CAAAE,IAAA,GAAA,CAAA,CAAA;AAAA,UAAA,OACjFT,KAAK,CAACU,QAAQ,CAACT,KAAK,CAAC,CAAA;AAAA,QAAA,KAAA,CAAA;UAAzCE,WAAW,GAAAI,QAAA,CAAAI,IAAA,CAAA;AAAAJ,UAAAA,QAAA,CAAAE,IAAA,GAAA,CAAA,CAAA;UAAA,OAEUP,MAAM,CAACU,OAAO,CAAC;AACxCX,YAAAA,KAAK,EAAEA,KAAK,CAACY,QAAQ,EAAE;YACvBC,MAAM,EAAEX,WAAW,CAACY,IAAAA;AACrB,WAAA,CAAC,CAAA;AAAA,QAAA,KAAA,CAAA;UAHIX,YAAY,GAAAG,QAAA,CAAAI,IAAA,CAAA;AAKlB;AACAK,UAAAA,gBAAW,CAACC,mBAAc,CAACC,aAAa,EAAE;AACxCjB,YAAAA,KAAK,EAAEA,KAAK,CAACY,QAAQ,EAAE;YACvBC,MAAM,EAAEX,WAAW,CAACY,IAAI;AACxBI,YAAAA,MAAM,EAAEf,YAAAA;AACT,WAAA,CAAC,CAAA;AAAC,UAAA,OAAAG,QAAA,CAAAa,MAAA,CAAA,QAAA,EAEIhB,YAAY,CAAA,CAAA;AAAA,QAAA,KAAA,CAAA,CAAA;AAAA,QAAA,KAAA,KAAA;UAAA,OAAAG,QAAA,CAAAc,IAAA,EAAA,CAAA;AAAA,OAAA;AAAA,KAAA,EAAAtB,OAAA,CAAA,CAAA;GACpB,CAAA,CAAA,CAAA;AAAA,EAAA,OAAAN,SAAA,CAAAC,KAAA,CAAA,IAAA,EAAAC,SAAA,CAAA,CAAA;AAAA;;;;"}
@@ -0,0 +1,2 @@
1
+ "use strict";Object.defineProperty(exports,"__esModule",{value:!0});var t=require("@mastra/core");function r(t,r,e,n,o,i,a){try{var u=t[i](a),c=u.value}catch(t){return void e(t)}u.done?r(c):Promise.resolve(c).then(n,o)}function e(){e=function(){return r};var t,r={},n=Object.prototype,o=n.hasOwnProperty,i=Object.defineProperty||function(t,r,e){t[r]=e.value},a="function"==typeof Symbol?Symbol:{},u=a.iterator||"@@iterator",c=a.asyncIterator||"@@asyncIterator",s=a.toStringTag||"@@toStringTag";function f(t,r,e){return Object.defineProperty(t,r,{value:e,enumerable:!0,configurable:!0,writable:!0}),t[r]}try{f({},"")}catch(t){f=function(t,r,e){return t[r]=e}}function h(t,r,e,n){var o=Object.create((r&&r.prototype instanceof m?r:m).prototype),a=new S(n||[]);return i(o,"_invoke",{value:k(t,e,a)}),o}function l(t,r,e){try{return{type:"normal",arg:t.call(r,e)}}catch(t){return{type:"throw",arg:t}}}r.wrap=h;var p="suspendedStart",v="suspendedYield",y="executing",d="completed",g={};function m(){}function w(){}function x(){}var b={};f(b,u,(function(){return this}));var L=Object.getPrototypeOf,E=L&&L(L(T([])));E&&E!==n&&o.call(E,u)&&(b=E);var _=x.prototype=m.prototype=Object.create(b);function O(t){["next","throw","return"].forEach((function(r){f(t,r,(function(t){return this._invoke(r,t)}))}))}function j(t,r){function e(n,i,a,u){var c=l(t[n],t,i);if("throw"!==c.type){var s=c.arg,f=s.value;return f&&"object"==typeof f&&o.call(f,"__await")?r.resolve(f.__await).then((function(t){e("next",t,a,u)}),(function(t){e("throw",t,a,u)})):r.resolve(f).then((function(t){s.value=t,a(s)}),(function(t){return e("throw",t,a,u)}))}u(c.arg)}var n;i(this,"_invoke",{value:function(t,o){function i(){return new r((function(r,n){e(t,o,r,n)}))}return n=n?n.then(i,i):i()}})}function k(r,e,n){var o=p;return function(i,a){if(o===y)throw Error("Generator is already running");if(o===d){if("throw"===i)throw a;return{value:t,done:!0}}for(n.method=i,n.arg=a;;){var u=n.delegate;if(u){var c=N(u,n);if(c){if(c===g)continue;return c}}if("next"===n.method)n.sent=n._sent=n.arg;else if("throw"===n.method){if(o===p)throw o=d,n.arg;n.dispatchException(n.arg)}else"return"===n.method&&n.abrupt("return",n.arg);o=y;var s=l(r,e,n);if("normal"===s.type){if(o=n.done?d:v,s.arg===g)continue;return{value:s.arg,done:n.done}}"throw"===s.type&&(o=d,n.method="throw",n.arg=s.arg)}}}function N(r,e){var n=e.method,o=r.iterator[n];if(o===t)return e.delegate=null,"throw"===n&&r.iterator.return&&(e.method="return",e.arg=t,N(r,e),"throw"===e.method)||"return"!==n&&(e.method="throw",e.arg=new TypeError("The iterator does not provide a '"+n+"' method")),g;var i=l(o,r.iterator,e.arg);if("throw"===i.type)return e.method="throw",e.arg=i.arg,e.delegate=null,g;var a=i.arg;return a?a.done?(e[r.resultName]=a.value,e.next=r.nextLoc,"return"!==e.method&&(e.method="next",e.arg=t),e.delegate=null,g):a:(e.method="throw",e.arg=new TypeError("iterator result is not an object"),e.delegate=null,g)}function P(t){var r={tryLoc:t[0]};1 in t&&(r.catchLoc=t[1]),2 in t&&(r.finallyLoc=t[2],r.afterLoc=t[3]),this.tryEntries.push(r)}function G(t){var r=t.completion||{};r.type="normal",delete r.arg,t.completion=r}function S(t){this.tryEntries=[{tryLoc:"root"}],t.forEach(P,this),this.reset(!0)}function T(r){if(r||""===r){var e=r[u];if(e)return e.call(r);if("function"==typeof r.next)return r;if(!isNaN(r.length)){var n=-1,i=function e(){for(;++n<r.length;)if(o.call(r,n))return e.value=r[n],e.done=!1,e;return e.value=t,e.done=!0,e};return i.next=i}}throw new TypeError(typeof r+" is not iterable")}return w.prototype=x,i(_,"constructor",{value:x,configurable:!0}),i(x,"constructor",{value:w,configurable:!0}),w.displayName=f(x,s,"GeneratorFunction"),r.isGeneratorFunction=function(t){var r="function"==typeof t&&t.constructor;return!!r&&(r===w||"GeneratorFunction"===(r.displayName||r.name))},r.mark=function(t){return Object.setPrototypeOf?Object.setPrototypeOf(t,x):(t.__proto__=x,f(t,s,"GeneratorFunction")),t.prototype=Object.create(_),t},r.awrap=function(t){return{__await:t}},O(j.prototype),f(j.prototype,c,(function(){return this})),r.AsyncIterator=j,r.async=function(t,e,n,o,i){void 0===i&&(i=Promise);var a=new j(h(t,e,n,o),i);return r.isGeneratorFunction(e)?a:a.next().then((function(t){return t.done?t.value:a.next()}))},O(_),f(_,s,"Generator"),f(_,u,(function(){return this})),f(_,"toString",(function(){return"[object Generator]"})),r.keys=function(t){var r=Object(t),e=[];for(var n in r)e.push(n);return e.reverse(),function t(){for(;e.length;){var n=e.pop();if(n in r)return t.value=n,t.done=!1,t}return t.done=!0,t}},r.values=T,S.prototype={constructor:S,reset:function(r){if(this.prev=0,this.next=0,this.sent=this._sent=t,this.done=!1,this.delegate=null,this.method="next",this.arg=t,this.tryEntries.forEach(G),!r)for(var e in this)"t"===e.charAt(0)&&o.call(this,e)&&!isNaN(+e.slice(1))&&(this[e]=t)},stop:function(){this.done=!0;var t=this.tryEntries[0].completion;if("throw"===t.type)throw t.arg;return this.rval},dispatchException:function(r){if(this.done)throw r;var e=this;function n(n,o){return u.type="throw",u.arg=r,e.next=n,o&&(e.method="next",e.arg=t),!!o}for(var i=this.tryEntries.length-1;i>=0;--i){var a=this.tryEntries[i],u=a.completion;if("root"===a.tryLoc)return n("end");if(a.tryLoc<=this.prev){var c=o.call(a,"catchLoc"),s=o.call(a,"finallyLoc");if(c&&s){if(this.prev<a.catchLoc)return n(a.catchLoc,!0);if(this.prev<a.finallyLoc)return n(a.finallyLoc)}else if(c){if(this.prev<a.catchLoc)return n(a.catchLoc,!0)}else{if(!s)throw Error("try statement without catch or finally");if(this.prev<a.finallyLoc)return n(a.finallyLoc)}}}},abrupt:function(t,r){for(var e=this.tryEntries.length-1;e>=0;--e){var n=this.tryEntries[e];if(n.tryLoc<=this.prev&&o.call(n,"finallyLoc")&&this.prev<n.finallyLoc){var i=n;break}}i&&("break"===t||"continue"===t)&&i.tryLoc<=r&&r<=i.finallyLoc&&(i=null);var a=i?i.completion:{};return a.type=t,a.arg=r,i?(this.method="next",this.next=i.finallyLoc,g):this.complete(a)},complete:function(t,r){if("throw"===t.type)throw t.arg;return"break"===t.type||"continue"===t.type?this.next=t.arg:"return"===t.type?(this.rval=this.arg=t.arg,this.method="return",this.next="end"):"normal"===t.type&&r&&(this.next=r),g},finish:function(t){for(var r=this.tryEntries.length-1;r>=0;--r){var e=this.tryEntries[r];if(e.finallyLoc===t)return this.complete(e.completion,e.afterLoc),G(e),g}},catch:function(t){for(var r=this.tryEntries.length-1;r>=0;--r){var e=this.tryEntries[r];if(e.tryLoc===t){var n=e.completion;if("throw"===n.type){var o=n.arg;G(e)}return o}}throw Error("illegal catch attempt")},delegateYield:function(r,e,n){return this.delegate={iterator:T(r),resultName:e,nextLoc:n},"next"===this.method&&(this.arg=t),g}},r}function n(){var o;return o=e().mark((function r(n,o,i){var a,u;return e().wrap((function(r){for(;;)switch(r.prev=r.next){case 0:return r.next=2,n.generate(o);case 2:return a=r.sent,r.next=5,i.measure({input:o.toString(),output:a.text});case 5:return u=r.sent,t.executeHook(t.AvailableHooks.ON_EVALUATION,{input:o.toString(),output:a.text,result:u}),r.abrupt("return",u);case 8:case"end":return r.stop()}}),r)})),n=function(){var t=this,e=arguments;return new Promise((function(n,i){var a=o.apply(t,e);function u(t){r(a,n,i,u,c,"next",t)}function c(t){r(a,n,i,u,c,"throw",t)}u(void 0)}))},n.apply(this,arguments)}exports.evaluate=function(t,r,e){return n.apply(this,arguments)};
2
+ //# sourceMappingURL=evals.cjs.production.min.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"evals.cjs.production.min.js","sources":["../src/evaluation.ts"],"sourcesContent":["import { AvailableHooks, executeHook } from '@mastra/core';\nimport { type Agent, type Metric } from '@mastra/core';\n\nexport async function evaluate<T extends Agent>(agent: T, input: Parameters<T['generate']>[0], metric: Metric) {\n const agentOutput = await agent.generate(input);\n\n const metricResult = await metric.measure({\n input: input.toString(),\n output: agentOutput.text,\n });\n\n // capture infomration about the evaluation\n executeHook(AvailableHooks.ON_EVALUATION, {\n input: input.toString(),\n output: agentOutput.text,\n result: metricResult,\n });\n\n return metricResult;\n}\n"],"names":["_evaluate","_regeneratorRuntime","mark","_callee","agent","input","metric","agentOutput","metricResult","wrap","_context","prev","next","generate","sent","measure","toString","output","text","executeHook","AvailableHooks","ON_EVALUATION","result","abrupt","stop","apply","this","arguments","_x","_x2","_x3"],"mappings":"+jNAmBC,SAAAA,UAAA,SAAAC,IAAAC,MAhBM,SAAAC,EAAyCC,EAAUC,EAAqCC,GAAc,IAAAC,EAAAC,EAAA,OAAAP,IAAAQ,MAAA,SAAAC,GAAA,cAAAA,EAAAC,KAAAD,EAAAE,MAAA,KAAA,EAAA,OAAAF,EAAAE,KAAA,EACjFR,EAAMS,SAASR,GAAM,KAAA,EAA9B,OAAXE,EAAWG,EAAAI,KAAAJ,EAAAE,KAAA,EAEUN,EAAOS,QAAQ,CACxCV,MAAOA,EAAMW,WACbC,OAAQV,EAAYW,OACpB,KAAA,EAOC,OAVGV,EAAYE,EAAAI,KAMlBK,EAAWA,YAACC,EAAcA,eAACC,cAAe,CACxChB,MAAOA,EAAMW,WACbC,OAAQV,EAAYW,KACpBI,OAAQd,IACPE,EAAAa,OAAA,SAEIf,GAAY,KAAA,EAAA,IAAA,MAAA,OAAAE,EAAAc,OAAA,GAAArB,EACpB,IAAAH,gLAAAA,EAAAyB,MAAAC,KAAAC,UAAA,kBAhBD,SAA8BC,EAAAC,EAAAC,GAAA,OAAA9B,EAAAyB,MAAAC,KAAAC,UAAA"}