promptfoo 0.91.3 → 0.92.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (181)
  1. package/dist/drizzle/0006_harsh_caretaker.sql +42 -0
  2. package/dist/drizzle/0007_cloudy_wong.sql +1 -0
  3. package/dist/drizzle/meta/0006_snapshot.json +721 -0
  4. package/dist/drizzle/meta/0007_snapshot.json +723 -0
  5. package/dist/drizzle/meta/_journal.json +14 -0
  6. package/dist/package.json +10 -8
  7. package/dist/src/app/assets/{index-C6z1nbLN.js → index-CMDD1oSm.js} +233 -231
  8. package/dist/src/app/assets/{index.es-oqbvfIxR.js → index.es-D8cSwMq4.js} +1 -1
  9. package/dist/src/app/assets/{sync-D2s75VlC.js → sync-DJZvzYiS.js} +1 -1
  10. package/dist/src/app/index.html +1 -1
  11. package/dist/src/assertions.js +2 -2
  12. package/dist/src/assertions.js.map +1 -1
  13. package/dist/src/commands/cache.d.ts.map +1 -1
  14. package/dist/src/commands/cache.js +0 -2
  15. package/dist/src/commands/cache.js.map +1 -1
  16. package/dist/src/commands/eval.d.ts.map +1 -1
  17. package/dist/src/commands/eval.js +19 -16
  18. package/dist/src/commands/eval.js.map +1 -1
  19. package/dist/src/commands/export.d.ts.map +1 -1
  20. package/dist/src/commands/export.js +8 -31
  21. package/dist/src/commands/export.js.map +1 -1
  22. package/dist/src/commands/import.d.ts.map +1 -1
  23. package/dist/src/commands/import.js +52 -13
  24. package/dist/src/commands/import.js.map +1 -1
  25. package/dist/src/commands/list.d.ts.map +1 -1
  26. package/dist/src/commands/list.js +35 -7
  27. package/dist/src/commands/list.js.map +1 -1
  28. package/dist/src/commands/share.d.ts +2 -2
  29. package/dist/src/commands/share.d.ts.map +1 -1
  30. package/dist/src/commands/share.js +12 -13
  31. package/dist/src/commands/share.js.map +1 -1
  32. package/dist/src/commands/show.d.ts.map +1 -1
  33. package/dist/src/commands/show.js +10 -6
  34. package/dist/src/commands/show.js.map +1 -1
  35. package/dist/src/constants.d.ts +1 -0
  36. package/dist/src/constants.d.ts.map +1 -1
  37. package/dist/src/constants.js +2 -1
  38. package/dist/src/constants.js.map +1 -1
  39. package/dist/src/database/index.js +1 -1
  40. package/dist/src/database/index.js.map +1 -1
  41. package/dist/src/database/tables.d.ts +602 -4
  42. package/dist/src/database/tables.d.ts.map +1 -1
  43. package/dist/src/database/tables.js +67 -8
  44. package/dist/src/database/tables.js.map +1 -1
  45. package/dist/src/database/types.d.ts +3 -3
  46. package/dist/src/database/types.d.ts.map +1 -1
  47. package/dist/src/evaluator.d.ts +3 -2
  48. package/dist/src/evaluator.d.ts.map +1 -1
  49. package/dist/src/evaluator.js +75 -104
  50. package/dist/src/evaluator.js.map +1 -1
  51. package/dist/src/evaluatorHelpers.d.ts.map +1 -1
  52. package/dist/src/evaluatorHelpers.js +2 -1
  53. package/dist/src/evaluatorHelpers.js.map +1 -1
  54. package/dist/src/index.d.ts +2 -1
  55. package/dist/src/index.d.ts.map +1 -1
  56. package/dist/src/index.js +12 -9
  57. package/dist/src/index.js.map +1 -1
  58. package/dist/src/models/eval.d.ts +95 -0
  59. package/dist/src/models/eval.d.ts.map +1 -0
  60. package/dist/src/models/eval.js +390 -0
  61. package/dist/src/models/eval.js.map +1 -0
  62. package/dist/src/models/evalResult.d.ts +50 -0
  63. package/dist/src/models/evalResult.d.ts.map +1 -0
  64. package/dist/src/models/evalResult.js +122 -0
  65. package/dist/src/models/evalResult.js.map +1 -0
  66. package/dist/src/models/provider.d.ts +9 -0
  67. package/dist/src/models/provider.d.ts.map +1 -0
  68. package/dist/src/models/provider.js +47 -0
  69. package/dist/src/models/provider.js.map +1 -0
  70. package/dist/src/prompts/index.d.ts.map +1 -1
  71. package/dist/src/prompts/index.js +2 -1
  72. package/dist/src/prompts/index.js.map +1 -1
  73. package/dist/src/prompts/utils.d.ts +1 -0
  74. package/dist/src/prompts/utils.d.ts.map +1 -1
  75. package/dist/src/prompts/utils.js +7 -0
  76. package/dist/src/prompts/utils.js.map +1 -1
  77. package/dist/src/providers/http.js +2 -2
  78. package/dist/src/providers/http.js.map +1 -1
  79. package/dist/src/providers.js +5 -5
  80. package/dist/src/providers.js.map +1 -1
  81. package/dist/src/redteam/eval/excessive-agency/llm_rubric-20240617.json +10 -0
  82. package/dist/src/redteam/eval/excessive-agency/llm_rubric-20240618.json +10 -0
  83. package/dist/src/redteam/eval/harmful/llm_rubric-20240723.json +10 -0
  84. package/dist/src/redteam/eval/harmful/llm_rubric-20240724.json +10 -0
  85. package/dist/src/server/routes/evalRoutes.d.ts +1 -0
  86. package/dist/src/server/routes/evalRoutes.d.ts.map +1 -0
  87. package/dist/src/server/routes/evalRoutes.js +2 -0
  88. package/dist/src/server/routes/evalRoutes.js.map +1 -0
  89. package/dist/src/server/server.d.ts +1 -0
  90. package/dist/src/server/server.d.ts.map +1 -1
  91. package/dist/src/server/server.js +70 -31
  92. package/dist/src/server/server.js.map +1 -1
  93. package/dist/src/share.d.ts +2 -2
  94. package/dist/src/share.d.ts.map +1 -1
  95. package/dist/src/share.js +93 -34
  96. package/dist/src/share.js.map +1 -1
  97. package/dist/src/table.d.ts +2 -2
  98. package/dist/src/table.d.ts.map +1 -1
  99. package/dist/src/table.js +3 -3
  100. package/dist/src/table.js.map +1 -1
  101. package/dist/src/types/index.d.ts +163 -11
  102. package/dist/src/types/index.d.ts.map +1 -1
  103. package/dist/src/types/index.js +21 -1
  104. package/dist/src/types/index.js.map +1 -1
  105. package/dist/src/util/config/load.d.ts.map +1 -1
  106. package/dist/src/util/config/load.js +2 -1
  107. package/dist/src/util/config/load.js.map +1 -1
  108. package/dist/src/util/config/manage.d.ts.map +1 -1
  109. package/dist/src/util/config/manage.js.map +1 -1
  110. package/dist/src/util/convertEvalResultsToTable.d.ts +16 -0
  111. package/dist/src/util/convertEvalResultsToTable.d.ts.map +1 -0
  112. package/dist/src/util/convertEvalResultsToTable.js +137 -0
  113. package/dist/src/util/convertEvalResultsToTable.js.map +1 -0
  114. package/dist/src/util/createHash.d.ts +1 -0
  115. package/dist/src/util/createHash.d.ts.map +1 -1
  116. package/dist/src/util/createHash.js +9 -0
  117. package/dist/src/util/createHash.js.map +1 -1
  118. package/dist/src/util/file.d.ts +8 -0
  119. package/dist/src/util/file.d.ts.map +1 -0
  120. package/dist/src/util/file.js +13 -0
  121. package/dist/src/util/file.js.map +1 -0
  122. package/dist/src/util/index.d.ts +9 -14
  123. package/dist/src/util/index.d.ts.map +1 -1
  124. package/dist/src/util/index.js +87 -223
  125. package/dist/src/util/index.js.map +1 -1
  126. package/dist/src/util/time.d.ts +2 -0
  127. package/dist/src/util/time.d.ts.map +1 -0
  128. package/dist/src/util/time.js +7 -0
  129. package/dist/src/util/time.js.map +1 -0
  130. package/dist/src/util/transform.js +2 -2
  131. package/dist/src/util/transform.js.map +1 -1
  132. package/dist/src/validators/providers.d.ts +6 -0
  133. package/dist/src/validators/providers.d.ts.map +1 -1
  134. package/dist/src/validators/providers.js +1 -0
  135. package/dist/src/validators/providers.js.map +1 -1
  136. package/dist/src/validators/redteam.d.ts +6 -0
  137. package/dist/src/validators/redteam.d.ts.map +1 -1
  138. package/dist/test/commands/eval/filterFailingTests.test.js +24 -2
  139. package/dist/test/commands/eval/filterFailingTests.test.js.map +1 -1
  140. package/dist/test/evaluator.test.js +153 -74
  141. package/dist/test/evaluator.test.js.map +1 -1
  142. package/dist/test/factories/data/eval/database_records.d.ts +142 -0
  143. package/dist/test/factories/data/eval/database_records.d.ts.map +1 -0
  144. package/dist/test/factories/data/eval/database_records.js +251 -0
  145. package/dist/test/factories/data/eval/database_records.js.map +1 -0
  146. package/dist/test/factories/evalFactory.d.ts +768 -0
  147. package/dist/test/factories/evalFactory.d.ts.map +1 -0
  148. package/dist/test/factories/evalFactory.js +121 -0
  149. package/dist/test/factories/evalFactory.js.map +1 -0
  150. package/dist/test/factories/index.d.ts +1 -0
  151. package/dist/test/factories/index.d.ts.map +1 -0
  152. package/dist/test/factories/index.js +2 -0
  153. package/dist/test/factories/index.js.map +1 -0
  154. package/dist/test/index.test.js +17 -33
  155. package/dist/test/index.test.js.map +1 -1
  156. package/dist/test/models/eval.test.d.ts +2 -0
  157. package/dist/test/models/eval.test.d.ts.map +1 -0
  158. package/dist/test/models/eval.test.js +34 -0
  159. package/dist/test/models/eval.test.js.map +1 -0
  160. package/dist/test/providers.test.js +3 -3
  161. package/dist/test/providers.test.js.map +1 -1
  162. package/dist/test/server/share.test.d.ts +2 -0
  163. package/dist/test/server/share.test.d.ts.map +1 -0
  164. package/dist/test/server/share.test.js +36 -0
  165. package/dist/test/server/share.test.js.map +1 -0
  166. package/dist/test/server/v3evalToShare.json +507 -0
  167. package/dist/test/server/v4evalToShare.json +421 -0
  168. package/dist/test/types.test.js +58 -0
  169. package/dist/test/types.test.js.map +1 -1
  170. package/dist/test/util.file.test.d.ts +2 -0
  171. package/dist/test/util.file.test.d.ts.map +1 -0
  172. package/dist/test/util.file.test.js +32 -0
  173. package/dist/test/util.file.test.js.map +1 -0
  174. package/dist/test/util.listPrevious.test.d.ts +2 -0
  175. package/dist/test/util.listPrevious.test.d.ts.map +1 -0
  176. package/dist/test/util.listPrevious.test.js +37 -0
  177. package/dist/test/util.listPrevious.test.js.map +1 -0
  178. package/dist/test/util.test.js +38 -311
  179. package/dist/test/util.test.js.map +1 -1
  180. package/dist/tsconfig.tsbuildinfo +1 -0
  181. package/package.json +10 -8
@@ -0,0 +1,42 @@
1
-- Creates the `eval_results` table.
--   * `id` is the text primary key.
--   * Required (NOT NULL) columns: created_at, updated_at, eval_id, prompt_idx,
--     test_case_idx, test_case, prompt, provider, success, score.
--   * Nullable columns: prompt_id, provider_id, latency_ms, cost, response,
--     error, grading_result, named_scores, metadata.
--   * Foreign keys: eval_id -> evals(id), prompt_id -> prompts(id),
--     provider_id -> providers(id); all use NO ACTION on update and delete.
-- NOTE(review): `created_at`/`updated_at` are declared `integer` but default to
--   CURRENT_TIMESTAMP. If this targets SQLite (backticks and type names suggest
--   so), that default yields a 'YYYY-MM-DD HH:MM:SS' text value, not an epoch
--   number -- confirm the intended storage format.
-- NOTE(review): `providers` is only created further down in this hunk, and
--   `evals`/`prompts` are not created here at all -- presumably they exist from
--   earlier migrations; verify before running against an empty database.
-- NOTE(review): test_case, prompt, provider, response, grading_result,
--   named_scores and metadata are plain `text`; presumably serialized
--   structures -- TODO confirm against the writer.
+ CREATE TABLE `eval_results` (
2
+ `id` text PRIMARY KEY NOT NULL,
3
+ `created_at` integer DEFAULT CURRENT_TIMESTAMP NOT NULL,
4
+ `updated_at` integer DEFAULT CURRENT_TIMESTAMP NOT NULL,
5
+ `eval_id` text NOT NULL,
6
+ `prompt_idx` integer NOT NULL,
7
+ `test_case_idx` integer NOT NULL,
8
+ `test_case` text NOT NULL,
9
+ `prompt` text NOT NULL,
10
+ `prompt_id` text,
11
+ `provider` text NOT NULL,
12
+ `provider_id` text,
13
+ `latency_ms` integer,
14
+ `cost` real,
15
+ `response` text,
16
+ `error` text,
17
+ `success` integer NOT NULL,
18
+ `score` real NOT NULL,
19
+ `grading_result` text,
20
+ `named_scores` text,
21
+ `metadata` text,
22
+ FOREIGN KEY (`eval_id`) REFERENCES `evals`(`id`) ON UPDATE no action ON DELETE no action,
23
+ FOREIGN KEY (`prompt_id`) REFERENCES `prompts`(`id`) ON UPDATE no action ON DELETE no action,
24
+ FOREIGN KEY (`provider_id`) REFERENCES `providers`(`id`) ON UPDATE no action ON DELETE no action
25
+ );
26
+ --> statement-breakpoint
27
-- Creates `evals_to_providers`, which pairs a provider with an eval.
--   * Both columns are required text values.
--   * The primary key is the composite (provider_id, eval_id), so a given
--     pair can appear at most once.
--   * provider_id -> providers(id) and eval_id -> evals(id), both with
--     NO ACTION on update and delete.
-- NOTE(review): `providers` is created by a later statement in this hunk and
--   `evals` is not created here -- presumably from an earlier migration; verify.
+ CREATE TABLE `evals_to_providers` (
28
+ `provider_id` text NOT NULL,
29
+ `eval_id` text NOT NULL,
30
+ PRIMARY KEY(`provider_id`, `eval_id`),
31
+ FOREIGN KEY (`provider_id`) REFERENCES `providers`(`id`) ON UPDATE no action ON DELETE no action,
32
+ FOREIGN KEY (`eval_id`) REFERENCES `evals`(`id`) ON UPDATE no action ON DELETE no action
33
+ );
34
+ --> statement-breakpoint
35
-- Creates the `providers` table referenced by the foreign keys declared on
-- `eval_results` and `evals_to_providers` earlier in this hunk.
--   * `id` is the text primary key (the target of those foreign keys).
--   * `provider_id` is a separate required text column with no constraint
--     beyond NOT NULL.
--   * `options` is required text.
-- NOTE(review): `options` is presumably a serialized configuration blob and
--   `provider_id` presumably the provider's external identifier -- TODO confirm.
+ CREATE TABLE `providers` (
36
+ `id` text PRIMARY KEY NOT NULL,
37
+ `provider_id` text NOT NULL,
38
+ `options` text NOT NULL
39
+ );
40
+ --> statement-breakpoint
41
-- Adds a nullable `prompts` text column to the existing `evals` table; no
-- default is given, so rows that already exist will hold NULL for it.
-- Then creates a non-unique index on eval_results(eval_id).
-- NOTE(review): the index name uses the singular `eval_result_...` while the
--   table is `eval_results` -- harmless, but confirm it matches the naming
--   used elsewhere.
+ ALTER TABLE `evals` ADD `prompts` text;--> statement-breakpoint
42
+ CREATE INDEX `eval_result_eval_id_idx` ON `eval_results` (`eval_id`);
@@ -0,0 +1 @@
1
-- Renames eval_results.test_case_idx to test_idx; the column definition is
-- otherwise untouched.
-- NOTE(review): this single-statement hunk presumably belongs to the follow-up
--   migration in the file list (0007) -- confirm. RENAME COLUMN needs engine
--   support (SQLite 3.25+ if this targets SQLite).
+ ALTER TABLE `eval_results` RENAME COLUMN `test_case_idx` TO `test_idx`;