llama-stack-client 0.3.4-rc3 → 0.4.0-rc1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (573) hide show
  1. package/CHANGELOG.md +153 -0
  2. package/README.md +19 -21
  3. package/error.d.ts.map +1 -1
  4. package/error.js +1 -0
  5. package/error.js.map +1 -1
  6. package/error.mjs.map +1 -1
  7. package/index.d.mts +23 -50
  8. package/index.d.ts +23 -50
  9. package/index.d.ts.map +1 -1
  10. package/index.js +20 -29
  11. package/index.js.map +1 -1
  12. package/index.mjs +18 -28
  13. package/index.mjs.map +1 -1
  14. package/lib/response-helpers.d.ts +23 -0
  15. package/lib/response-helpers.d.ts.map +1 -0
  16. package/lib/response-helpers.js +53 -0
  17. package/lib/response-helpers.js.map +1 -0
  18. package/lib/response-helpers.mjs +49 -0
  19. package/lib/response-helpers.mjs.map +1 -0
  20. package/package.json +1 -1
  21. package/pagination.d.ts.map +1 -1
  22. package/pagination.js +2 -4
  23. package/pagination.js.map +1 -1
  24. package/pagination.mjs +1 -4
  25. package/pagination.mjs.map +1 -1
  26. package/resource.d.ts.map +1 -1
  27. package/resource.js.map +1 -1
  28. package/resource.mjs.map +1 -1
  29. package/resources/alpha/alpha.d.ts +22 -0
  30. package/resources/alpha/alpha.d.ts.map +1 -0
  31. package/resources/alpha/alpha.js +57 -0
  32. package/resources/alpha/alpha.js.map +1 -0
  33. package/resources/alpha/alpha.mjs +30 -0
  34. package/resources/alpha/alpha.mjs.map +1 -0
  35. package/resources/{benchmarks.d.ts → alpha/benchmarks.d.ts} +25 -35
  36. package/resources/alpha/benchmarks.d.ts.map +1 -0
  37. package/resources/{benchmarks.js → alpha/benchmarks.js} +18 -4
  38. package/resources/alpha/benchmarks.js.map +1 -0
  39. package/resources/alpha/benchmarks.mjs +44 -0
  40. package/resources/alpha/benchmarks.mjs.map +1 -0
  41. package/resources/alpha/eval/eval.d.ts +160 -0
  42. package/resources/alpha/eval/eval.d.ts.map +1 -0
  43. package/resources/{eval → alpha/eval}/eval.js +7 -6
  44. package/resources/alpha/eval/eval.js.map +1 -0
  45. package/resources/{eval → alpha/eval}/eval.mjs +7 -5
  46. package/resources/alpha/eval/eval.mjs.map +1 -0
  47. package/resources/alpha/eval/index.d.ts +3 -0
  48. package/resources/alpha/eval/index.d.ts.map +1 -0
  49. package/resources/{eval → alpha/eval}/index.js +2 -1
  50. package/resources/alpha/eval/index.js.map +1 -0
  51. package/resources/{eval → alpha/eval}/index.mjs +2 -0
  52. package/resources/alpha/eval/index.mjs.map +1 -0
  53. package/resources/{eval → alpha/eval}/jobs.d.ts +2 -2
  54. package/resources/alpha/eval/jobs.d.ts.map +1 -0
  55. package/resources/{eval → alpha/eval}/jobs.js +6 -5
  56. package/resources/alpha/eval/jobs.js.map +1 -0
  57. package/resources/{eval → alpha/eval}/jobs.mjs +6 -4
  58. package/resources/alpha/eval/jobs.mjs.map +1 -0
  59. package/resources/alpha/eval.d.ts.map +1 -0
  60. package/resources/{eval.js → alpha/eval.js} +1 -0
  61. package/resources/alpha/eval.js.map +1 -0
  62. package/resources/alpha/eval.mjs.map +1 -0
  63. package/resources/alpha/index.d.ts +6 -0
  64. package/resources/alpha/index.d.ts.map +1 -0
  65. package/resources/alpha/index.js +21 -0
  66. package/resources/alpha/index.js.map +1 -0
  67. package/resources/alpha/index.mjs +13 -0
  68. package/resources/alpha/index.mjs.map +1 -0
  69. package/resources/alpha/inference.d.ts +85 -0
  70. package/resources/alpha/inference.d.ts.map +1 -0
  71. package/resources/{agents/steps.js → alpha/inference.js} +9 -8
  72. package/resources/alpha/inference.js.map +1 -0
  73. package/resources/alpha/inference.mjs +17 -0
  74. package/resources/alpha/inference.mjs.map +1 -0
  75. package/resources/alpha/post-training/index.d.ts +3 -0
  76. package/resources/alpha/post-training/index.d.ts.map +1 -0
  77. package/resources/{post-training → alpha/post-training}/index.js +2 -1
  78. package/resources/alpha/post-training/index.js.map +1 -0
  79. package/resources/{post-training → alpha/post-training}/index.mjs +2 -0
  80. package/resources/alpha/post-training/index.mjs.map +1 -0
  81. package/resources/alpha/post-training/job.d.ts +116 -0
  82. package/resources/alpha/post-training/job.d.ts.map +1 -0
  83. package/resources/{post-training → alpha/post-training}/job.js +7 -6
  84. package/resources/alpha/post-training/job.js.map +1 -0
  85. package/resources/{post-training → alpha/post-training}/job.mjs +7 -5
  86. package/resources/alpha/post-training/job.mjs.map +1 -0
  87. package/resources/alpha/post-training/post-training.d.ts +242 -0
  88. package/resources/alpha/post-training/post-training.d.ts.map +1 -0
  89. package/resources/{post-training → alpha/post-training}/post-training.js +5 -4
  90. package/resources/alpha/post-training/post-training.js.map +1 -0
  91. package/resources/{post-training → alpha/post-training}/post-training.mjs +5 -3
  92. package/resources/alpha/post-training/post-training.mjs.map +1 -0
  93. package/resources/alpha/post-training.d.ts.map +1 -0
  94. package/resources/{post-training.js → alpha/post-training.js} +2 -1
  95. package/resources/alpha/post-training.js.map +1 -0
  96. package/resources/{post-training.mjs → alpha/post-training.mjs} +2 -0
  97. package/resources/alpha/post-training.mjs.map +1 -0
  98. package/resources/alpha.d.ts +2 -0
  99. package/resources/alpha.d.ts.map +1 -0
  100. package/resources/alpha.js +25 -0
  101. package/resources/alpha.js.map +1 -0
  102. package/resources/alpha.mjs +9 -0
  103. package/resources/alpha.mjs.map +1 -0
  104. package/resources/batches.d.ts +322 -0
  105. package/resources/batches.d.ts.map +1 -0
  106. package/resources/batches.js +45 -0
  107. package/resources/batches.js.map +1 -0
  108. package/resources/batches.mjs +40 -0
  109. package/resources/batches.mjs.map +1 -0
  110. package/resources/beta/beta.d.ts +10 -0
  111. package/resources/beta/beta.d.ts.map +1 -0
  112. package/resources/{tool-runtime/tool-runtime.js → beta/beta.js} +10 -22
  113. package/resources/beta/beta.js.map +1 -0
  114. package/resources/beta/beta.mjs +18 -0
  115. package/resources/beta/beta.mjs.map +1 -0
  116. package/resources/beta/datasets.d.ts +257 -0
  117. package/resources/beta/datasets.d.ts.map +1 -0
  118. package/resources/{datasets.js → beta/datasets.js} +14 -9
  119. package/resources/beta/datasets.js.map +1 -0
  120. package/resources/{datasets.mjs → beta/datasets.mjs} +14 -8
  121. package/resources/beta/datasets.mjs.map +1 -0
  122. package/resources/beta/index.d.ts +3 -0
  123. package/resources/beta/index.d.ts.map +1 -0
  124. package/resources/beta/index.js +15 -0
  125. package/resources/beta/index.js.map +1 -0
  126. package/resources/beta/index.mjs +10 -0
  127. package/resources/beta/index.mjs.map +1 -0
  128. package/resources/beta.d.ts +2 -0
  129. package/resources/beta.d.ts.map +1 -0
  130. package/resources/{agents.js → beta.js} +4 -3
  131. package/resources/beta.js.map +1 -0
  132. package/resources/beta.mjs +9 -0
  133. package/resources/beta.mjs.map +1 -0
  134. package/resources/chat/chat.d.ts +73 -78
  135. package/resources/chat/chat.d.ts.map +1 -1
  136. package/resources/chat/chat.js +2 -2
  137. package/resources/chat/chat.js.map +1 -1
  138. package/resources/chat/chat.mjs +3 -2
  139. package/resources/chat/chat.mjs.map +1 -1
  140. package/resources/chat/completions.d.ts +756 -1402
  141. package/resources/chat/completions.d.ts.map +1 -1
  142. package/resources/chat/completions.js +8 -14
  143. package/resources/chat/completions.js.map +1 -1
  144. package/resources/chat/completions.mjs +7 -11
  145. package/resources/chat/completions.mjs.map +1 -1
  146. package/resources/chat/index.d.ts +1 -1
  147. package/resources/chat/index.d.ts.map +1 -1
  148. package/resources/chat/index.js +3 -3
  149. package/resources/chat/index.js.map +1 -1
  150. package/resources/chat/index.mjs +3 -1
  151. package/resources/chat/index.mjs.map +1 -1
  152. package/resources/chat.js +2 -1
  153. package/resources/chat.js.map +1 -1
  154. package/resources/chat.mjs +2 -0
  155. package/resources/chat.mjs.map +1 -1
  156. package/resources/completions.d.ts +52 -95
  157. package/resources/completions.d.ts.map +1 -1
  158. package/resources/completions.js +3 -6
  159. package/resources/completions.js.map +1 -1
  160. package/resources/completions.mjs +3 -5
  161. package/resources/completions.mjs.map +1 -1
  162. package/resources/conversations/conversations.d.ts +292 -0
  163. package/resources/conversations/conversations.d.ts.map +1 -0
  164. package/resources/conversations/conversations.js +78 -0
  165. package/resources/conversations/conversations.js.map +1 -0
  166. package/resources/conversations/conversations.mjs +51 -0
  167. package/resources/conversations/conversations.mjs.map +1 -0
  168. package/resources/conversations/index.d.ts +3 -0
  169. package/resources/conversations/index.d.ts.map +1 -0
  170. package/resources/conversations/index.js +16 -0
  171. package/resources/conversations/index.js.map +1 -0
  172. package/resources/conversations/index.mjs +10 -0
  173. package/resources/conversations/index.mjs.map +1 -0
  174. package/resources/conversations/items.d.ts +762 -0
  175. package/resources/conversations/items.d.ts.map +1 -0
  176. package/resources/conversations/items.js +51 -0
  177. package/resources/conversations/items.js.map +1 -0
  178. package/resources/conversations/items.mjs +46 -0
  179. package/resources/conversations/items.mjs.map +1 -0
  180. package/resources/conversations.d.ts +2 -0
  181. package/resources/conversations.d.ts.map +1 -0
  182. package/resources/conversations.js +25 -0
  183. package/resources/conversations.js.map +1 -0
  184. package/resources/conversations.mjs +9 -0
  185. package/resources/conversations.mjs.map +1 -0
  186. package/resources/embeddings.d.ts +10 -52
  187. package/resources/embeddings.d.ts.map +1 -1
  188. package/resources/embeddings.js +5 -2
  189. package/resources/embeddings.js.map +1 -1
  190. package/resources/embeddings.mjs +5 -1
  191. package/resources/embeddings.mjs.map +1 -1
  192. package/resources/files.d.ts +44 -54
  193. package/resources/files.d.ts.map +1 -1
  194. package/resources/files.js +18 -9
  195. package/resources/files.js.map +1 -1
  196. package/resources/files.mjs +18 -8
  197. package/resources/files.mjs.map +1 -1
  198. package/resources/index.d.ts +9 -13
  199. package/resources/index.d.ts.map +1 -1
  200. package/resources/index.js +15 -21
  201. package/resources/index.js.map +1 -1
  202. package/resources/index.mjs +9 -11
  203. package/resources/index.mjs.map +1 -1
  204. package/resources/inspect.d.ts +6 -32
  205. package/resources/inspect.d.ts.map +1 -1
  206. package/resources/inspect.js +6 -1
  207. package/resources/inspect.js.map +1 -1
  208. package/resources/inspect.mjs +6 -0
  209. package/resources/inspect.mjs.map +1 -1
  210. package/resources/models/index.d.ts +2 -2
  211. package/resources/models/index.d.ts.map +1 -1
  212. package/resources/models/index.js +2 -1
  213. package/resources/models/index.js.map +1 -1
  214. package/resources/models/index.mjs +2 -0
  215. package/resources/models/index.mjs.map +1 -1
  216. package/resources/models/models.d.ts +71 -31
  217. package/resources/models/models.d.ts.map +1 -1
  218. package/resources/models/models.js +13 -2
  219. package/resources/models/models.js.map +1 -1
  220. package/resources/models/models.mjs +13 -1
  221. package/resources/models/models.mjs.map +1 -1
  222. package/resources/models/openai.d.ts +2 -16
  223. package/resources/models/openai.d.ts.map +1 -1
  224. package/resources/models/openai.js +3 -2
  225. package/resources/models/openai.js.map +1 -1
  226. package/resources/models/openai.mjs +3 -1
  227. package/resources/models/openai.mjs.map +1 -1
  228. package/resources/models.js +2 -1
  229. package/resources/models.js.map +1 -1
  230. package/resources/models.mjs +2 -0
  231. package/resources/models.mjs.map +1 -1
  232. package/resources/moderations.d.ts +9 -35
  233. package/resources/moderations.d.ts.map +1 -1
  234. package/resources/moderations.js +5 -2
  235. package/resources/moderations.js.map +1 -1
  236. package/resources/moderations.mjs +5 -1
  237. package/resources/moderations.mjs.map +1 -1
  238. package/resources/prompts/index.d.ts +3 -0
  239. package/resources/prompts/index.d.ts.map +1 -0
  240. package/resources/prompts/index.js +15 -0
  241. package/resources/prompts/index.js.map +1 -0
  242. package/resources/prompts/index.mjs +10 -0
  243. package/resources/prompts/index.mjs.map +1 -0
  244. package/resources/prompts/prompts.d.ts +96 -0
  245. package/resources/prompts/prompts.d.ts.map +1 -0
  246. package/resources/{agents/agents.js → prompts/prompts.js} +43 -30
  247. package/resources/prompts/prompts.js.map +1 -0
  248. package/resources/prompts/prompts.mjs +66 -0
  249. package/resources/prompts/prompts.mjs.map +1 -0
  250. package/resources/prompts/versions.d.ts +12 -0
  251. package/resources/prompts/versions.d.ts.map +1 -0
  252. package/resources/prompts/versions.js +23 -0
  253. package/resources/prompts/versions.js.map +1 -0
  254. package/resources/prompts/versions.mjs +19 -0
  255. package/resources/prompts/versions.mjs.map +1 -0
  256. package/resources/prompts.d.ts +2 -0
  257. package/resources/prompts.d.ts.map +1 -0
  258. package/resources/prompts.js +25 -0
  259. package/resources/prompts.js.map +1 -0
  260. package/resources/prompts.mjs +9 -0
  261. package/resources/prompts.mjs.map +1 -0
  262. package/resources/providers.d.ts +4 -6
  263. package/resources/providers.d.ts.map +1 -1
  264. package/resources/providers.js +6 -1
  265. package/resources/providers.js.map +1 -1
  266. package/resources/providers.mjs +6 -0
  267. package/resources/providers.mjs.map +1 -1
  268. package/resources/responses/index.js +2 -1
  269. package/resources/responses/index.js.map +1 -1
  270. package/resources/responses/index.mjs +2 -0
  271. package/resources/responses/index.mjs.map +1 -1
  272. package/resources/responses/input-items.d.ts +190 -151
  273. package/resources/responses/input-items.d.ts.map +1 -1
  274. package/resources/responses/input-items.js +3 -2
  275. package/resources/responses/input-items.js.map +1 -1
  276. package/resources/responses/input-items.mjs +3 -1
  277. package/resources/responses/input-items.mjs.map +1 -1
  278. package/resources/responses/responses.d.ts +1387 -1449
  279. package/resources/responses/responses.d.ts.map +1 -1
  280. package/resources/responses/responses.js +8 -11
  281. package/resources/responses/responses.js.map +1 -1
  282. package/resources/responses/responses.mjs +8 -10
  283. package/resources/responses/responses.mjs.map +1 -1
  284. package/resources/responses.js +2 -1
  285. package/resources/responses.js.map +1 -1
  286. package/resources/responses.mjs +2 -0
  287. package/resources/responses.mjs.map +1 -1
  288. package/resources/routes.d.ts +7 -7
  289. package/resources/routes.d.ts.map +1 -1
  290. package/resources/routes.js +8 -6
  291. package/resources/routes.js.map +1 -1
  292. package/resources/routes.mjs +8 -5
  293. package/resources/routes.mjs.map +1 -1
  294. package/resources/safety.d.ts +144 -10
  295. package/resources/safety.d.ts.map +1 -1
  296. package/resources/safety.js +4 -1
  297. package/resources/safety.js.map +1 -1
  298. package/resources/safety.mjs +4 -0
  299. package/resources/safety.mjs.map +1 -1
  300. package/resources/scoring-functions.d.ts +120 -50
  301. package/resources/scoring-functions.d.ts.map +1 -1
  302. package/resources/scoring-functions.js +15 -1
  303. package/resources/scoring-functions.js.map +1 -1
  304. package/resources/scoring-functions.mjs +15 -0
  305. package/resources/scoring-functions.mjs.map +1 -1
  306. package/resources/scoring.d.ts +85 -26
  307. package/resources/scoring.d.ts.map +1 -1
  308. package/resources/scoring.js +2 -1
  309. package/resources/scoring.js.map +1 -1
  310. package/resources/scoring.mjs +2 -0
  311. package/resources/scoring.mjs.map +1 -1
  312. package/resources/shared.d.ts +125 -629
  313. package/resources/shared.d.ts.map +1 -1
  314. package/resources/shared.js +2 -0
  315. package/resources/shared.js.map +1 -1
  316. package/resources/shared.mjs +2 -0
  317. package/resources/shared.mjs.map +1 -1
  318. package/resources/shields.d.ts +19 -24
  319. package/resources/shields.d.ts.map +1 -1
  320. package/resources/shields.js +6 -1
  321. package/resources/shields.js.map +1 -1
  322. package/resources/shields.mjs +6 -0
  323. package/resources/shields.mjs.map +1 -1
  324. package/resources/tool-runtime.d.ts +151 -1
  325. package/resources/tool-runtime.d.ts.map +1 -1
  326. package/resources/tool-runtime.js +22 -16
  327. package/resources/tool-runtime.js.map +1 -1
  328. package/resources/tool-runtime.mjs +20 -1
  329. package/resources/tool-runtime.mjs.map +1 -1
  330. package/resources/toolgroups.d.ts +27 -37
  331. package/resources/toolgroups.d.ts.map +1 -1
  332. package/resources/toolgroups.js +10 -1
  333. package/resources/toolgroups.js.map +1 -1
  334. package/resources/toolgroups.mjs +10 -0
  335. package/resources/toolgroups.mjs.map +1 -1
  336. package/resources/tools.d.ts +9 -76
  337. package/resources/tools.d.ts.map +1 -1
  338. package/resources/tools.js +4 -1
  339. package/resources/tools.js.map +1 -1
  340. package/resources/tools.mjs +4 -0
  341. package/resources/tools.mjs.map +1 -1
  342. package/resources/vector-io.d.ts +272 -148
  343. package/resources/vector-io.d.ts.map +1 -1
  344. package/resources/vector-io.js +2 -1
  345. package/resources/vector-io.js.map +1 -1
  346. package/resources/vector-io.mjs +2 -0
  347. package/resources/vector-io.mjs.map +1 -1
  348. package/resources/vector-stores/file-batches.d.ts +111 -0
  349. package/resources/vector-stores/file-batches.d.ts.map +1 -0
  350. package/resources/vector-stores/file-batches.js +45 -0
  351. package/resources/vector-stores/file-batches.js.map +1 -0
  352. package/resources/vector-stores/file-batches.mjs +41 -0
  353. package/resources/vector-stores/file-batches.mjs.map +1 -0
  354. package/resources/vector-stores/files.d.ts +83 -135
  355. package/resources/vector-stores/files.d.ts.map +1 -1
  356. package/resources/vector-stores/files.js +15 -14
  357. package/resources/vector-stores/files.js.map +1 -1
  358. package/resources/vector-stores/files.mjs +15 -13
  359. package/resources/vector-stores/files.mjs.map +1 -1
  360. package/resources/vector-stores/index.d.ts +2 -1
  361. package/resources/vector-stores/index.d.ts.map +1 -1
  362. package/resources/vector-stores/index.js +5 -2
  363. package/resources/vector-stores/index.js.map +1 -1
  364. package/resources/vector-stores/index.mjs +3 -0
  365. package/resources/vector-stores/index.mjs.map +1 -1
  366. package/resources/vector-stores/vector-stores.d.ts +118 -217
  367. package/resources/vector-stores/vector-stores.d.ts.map +1 -1
  368. package/resources/vector-stores/vector-stores.js +18 -12
  369. package/resources/vector-stores/vector-stores.js.map +1 -1
  370. package/resources/vector-stores/vector-stores.mjs +18 -11
  371. package/resources/vector-stores/vector-stores.mjs.map +1 -1
  372. package/resources/vector-stores.js +2 -1
  373. package/resources/vector-stores.js.map +1 -1
  374. package/resources/vector-stores.mjs +2 -0
  375. package/resources/vector-stores.mjs.map +1 -1
  376. package/src/error.ts +1 -0
  377. package/src/index.ts +82 -252
  378. package/src/lib/response-helpers.ts +60 -0
  379. package/src/pagination.ts +2 -5
  380. package/src/resource.ts +1 -0
  381. package/src/resources/alpha/alpha.ts +85 -0
  382. package/src/resources/{benchmarks.ts → alpha/benchmarks.ts} +36 -37
  383. package/src/resources/{eval → alpha/eval}/eval.ts +83 -65
  384. package/src/resources/{eval → alpha/eval}/index.ts +1 -2
  385. package/src/resources/{eval → alpha/eval}/jobs.ts +6 -6
  386. package/src/resources/{eval.ts → alpha/eval.ts} +1 -0
  387. package/src/resources/alpha/index.ts +34 -0
  388. package/src/resources/alpha/inference.ts +132 -0
  389. package/src/resources/{post-training → alpha/post-training}/index.ts +2 -2
  390. package/src/resources/alpha/post-training/job.ts +182 -0
  391. package/src/resources/alpha/post-training/post-training.ts +369 -0
  392. package/src/resources/{post-training.ts → alpha/post-training.ts} +1 -1
  393. package/src/resources/alpha.ts +9 -0
  394. package/src/resources/batches.ts +572 -0
  395. package/src/resources/beta/beta.ts +41 -0
  396. package/src/resources/beta/datasets.ts +350 -0
  397. package/src/resources/beta/index.ts +20 -0
  398. package/src/resources/{agents.ts → beta.ts} +2 -2
  399. package/src/resources/chat/chat.ts +82 -81
  400. package/src/resources/chat/completions.ts +874 -1484
  401. package/src/resources/chat/index.ts +1 -2
  402. package/src/resources/chat.ts +1 -1
  403. package/src/resources/completions.ts +57 -101
  404. package/src/resources/conversations/conversations.ts +455 -0
  405. package/src/resources/conversations/index.ts +25 -0
  406. package/src/resources/conversations/items.ts +1221 -0
  407. package/src/resources/conversations.ts +9 -0
  408. package/src/resources/embeddings.ts +14 -55
  409. package/src/resources/files.ts +54 -61
  410. package/src/resources/index.ts +33 -109
  411. package/src/resources/inspect.ts +7 -33
  412. package/src/resources/models/index.ts +4 -2
  413. package/src/resources/models/models.ts +79 -30
  414. package/src/resources/models/openai.ts +4 -24
  415. package/src/resources/models.ts +1 -1
  416. package/src/resources/moderations.ts +10 -36
  417. package/src/resources/prompts/index.ts +19 -0
  418. package/src/resources/prompts/prompts.ts +171 -0
  419. package/src/resources/prompts/versions.ts +26 -0
  420. package/src/resources/prompts.ts +9 -0
  421. package/src/resources/providers.ts +5 -7
  422. package/src/resources/responses/index.ts +1 -1
  423. package/src/resources/responses/input-items.ts +293 -161
  424. package/src/resources/responses/responses.ts +2112 -1632
  425. package/src/resources/responses.ts +1 -1
  426. package/src/resources/routes.ts +25 -10
  427. package/src/resources/safety.ts +199 -9
  428. package/src/resources/scoring-functions.ts +168 -52
  429. package/src/resources/scoring.ts +125 -22
  430. package/src/resources/shared.ts +141 -714
  431. package/src/resources/shields.ts +18 -23
  432. package/src/resources/tool-runtime.ts +210 -2
  433. package/src/resources/toolgroups.ts +26 -36
  434. package/src/resources/tools.ts +10 -94
  435. package/src/resources/vector-io.ts +323 -145
  436. package/src/resources/vector-stores/file-batches.ts +201 -0
  437. package/src/resources/vector-stores/files.ts +123 -143
  438. package/src/resources/vector-stores/index.ts +9 -1
  439. package/src/resources/vector-stores/vector-stores.ts +150 -216
  440. package/src/resources/vector-stores.ts +1 -1
  441. package/src/version.ts +1 -1
  442. package/version.d.ts +1 -1
  443. package/version.js +1 -1
  444. package/version.mjs +1 -1
  445. package/resources/agents/agents.d.ts +0 -246
  446. package/resources/agents/agents.d.ts.map +0 -1
  447. package/resources/agents/agents.js.map +0 -1
  448. package/resources/agents/agents.mjs +0 -52
  449. package/resources/agents/agents.mjs.map +0 -1
  450. package/resources/agents/index.d.ts +0 -5
  451. package/resources/agents/index.d.ts.map +0 -1
  452. package/resources/agents/index.js +0 -18
  453. package/resources/agents/index.js.map +0 -1
  454. package/resources/agents/index.mjs +0 -10
  455. package/resources/agents/index.mjs.map +0 -1
  456. package/resources/agents/session.d.ts +0 -98
  457. package/resources/agents/session.d.ts.map +0 -1
  458. package/resources/agents/session.js +0 -42
  459. package/resources/agents/session.js.map +0 -1
  460. package/resources/agents/session.mjs +0 -37
  461. package/resources/agents/session.mjs.map +0 -1
  462. package/resources/agents/steps.d.ts +0 -22
  463. package/resources/agents/steps.d.ts.map +0 -1
  464. package/resources/agents/steps.js.map +0 -1
  465. package/resources/agents/steps.mjs +0 -15
  466. package/resources/agents/steps.mjs.map +0 -1
  467. package/resources/agents/turn.d.ts +0 -461
  468. package/resources/agents/turn.d.ts.map +0 -1
  469. package/resources/agents/turn.js +0 -34
  470. package/resources/agents/turn.js.map +0 -1
  471. package/resources/agents/turn.mjs +0 -29
  472. package/resources/agents/turn.mjs.map +0 -1
  473. package/resources/agents.d.ts +0 -2
  474. package/resources/agents.d.ts.map +0 -1
  475. package/resources/agents.js.map +0 -1
  476. package/resources/agents.mjs +0 -7
  477. package/resources/agents.mjs.map +0 -1
  478. package/resources/benchmarks.d.ts.map +0 -1
  479. package/resources/benchmarks.js.map +0 -1
  480. package/resources/benchmarks.mjs +0 -31
  481. package/resources/benchmarks.mjs.map +0 -1
  482. package/resources/datasets.d.ts +0 -320
  483. package/resources/datasets.d.ts.map +0 -1
  484. package/resources/datasets.js.map +0 -1
  485. package/resources/datasets.mjs.map +0 -1
  486. package/resources/eval/eval.d.ts +0 -159
  487. package/resources/eval/eval.d.ts.map +0 -1
  488. package/resources/eval/eval.js.map +0 -1
  489. package/resources/eval/eval.mjs.map +0 -1
  490. package/resources/eval/index.d.ts +0 -3
  491. package/resources/eval/index.d.ts.map +0 -1
  492. package/resources/eval/index.js.map +0 -1
  493. package/resources/eval/index.mjs.map +0 -1
  494. package/resources/eval/jobs.d.ts.map +0 -1
  495. package/resources/eval/jobs.js.map +0 -1
  496. package/resources/eval/jobs.mjs.map +0 -1
  497. package/resources/eval.d.ts.map +0 -1
  498. package/resources/eval.js.map +0 -1
  499. package/resources/eval.mjs.map +0 -1
  500. package/resources/inference.d.ts +0 -580
  501. package/resources/inference.d.ts.map +0 -1
  502. package/resources/inference.js +0 -54
  503. package/resources/inference.js.map +0 -1
  504. package/resources/inference.mjs +0 -49
  505. package/resources/inference.mjs.map +0 -1
  506. package/resources/post-training/index.d.ts +0 -3
  507. package/resources/post-training/index.d.ts.map +0 -1
  508. package/resources/post-training/index.js.map +0 -1
  509. package/resources/post-training/index.mjs.map +0 -1
  510. package/resources/post-training/job.d.ts +0 -205
  511. package/resources/post-training/job.d.ts.map +0 -1
  512. package/resources/post-training/job.js.map +0 -1
  513. package/resources/post-training/job.mjs.map +0 -1
  514. package/resources/post-training/post-training.d.ts +0 -402
  515. package/resources/post-training/post-training.d.ts.map +0 -1
  516. package/resources/post-training/post-training.js.map +0 -1
  517. package/resources/post-training/post-training.mjs.map +0 -1
  518. package/resources/post-training.d.ts.map +0 -1
  519. package/resources/post-training.js.map +0 -1
  520. package/resources/post-training.mjs.map +0 -1
  521. package/resources/synthetic-data-generation.d.ts +0 -47
  522. package/resources/synthetic-data-generation.d.ts.map +0 -1
  523. package/resources/synthetic-data-generation.js +0 -20
  524. package/resources/synthetic-data-generation.js.map +0 -1
  525. package/resources/synthetic-data-generation.mjs +0 -15
  526. package/resources/synthetic-data-generation.mjs.map +0 -1
  527. package/resources/telemetry.d.ts +0 -519
  528. package/resources/telemetry.d.ts.map +0 -1
  529. package/resources/telemetry.js +0 -70
  530. package/resources/telemetry.js.map +0 -1
  531. package/resources/telemetry.mjs +0 -65
  532. package/resources/telemetry.mjs.map +0 -1
  533. package/resources/tool-runtime/index.d.ts +0 -3
  534. package/resources/tool-runtime/index.d.ts.map +0 -1
  535. package/resources/tool-runtime/index.js +0 -14
  536. package/resources/tool-runtime/index.js.map +0 -1
  537. package/resources/tool-runtime/index.mjs +0 -8
  538. package/resources/tool-runtime/index.mjs.map +0 -1
  539. package/resources/tool-runtime/rag-tool.d.ts +0 -45
  540. package/resources/tool-runtime/rag-tool.d.ts.map +0 -1
  541. package/resources/tool-runtime/rag-tool.js +0 -30
  542. package/resources/tool-runtime/rag-tool.js.map +0 -1
  543. package/resources/tool-runtime/rag-tool.mjs +0 -25
  544. package/resources/tool-runtime/rag-tool.mjs.map +0 -1
  545. package/resources/tool-runtime/tool-runtime.d.ts +0 -132
  546. package/resources/tool-runtime/tool-runtime.d.ts.map +0 -1
  547. package/resources/tool-runtime/tool-runtime.js.map +0 -1
  548. package/resources/tool-runtime/tool-runtime.mjs +0 -29
  549. package/resources/tool-runtime/tool-runtime.mjs.map +0 -1
  550. package/resources/vector-dbs.d.ts +0 -128
  551. package/resources/vector-dbs.d.ts.map +0 -1
  552. package/resources/vector-dbs.js +0 -41
  553. package/resources/vector-dbs.js.map +0 -1
  554. package/resources/vector-dbs.mjs +0 -36
  555. package/resources/vector-dbs.mjs.map +0 -1
  556. package/src/resources/agents/agents.ts +0 -372
  557. package/src/resources/agents/index.ts +0 -44
  558. package/src/resources/agents/session.ts +0 -169
  559. package/src/resources/agents/steps.ts +0 -47
  560. package/src/resources/agents/turn.ts +0 -638
  561. package/src/resources/datasets.ts +0 -413
  562. package/src/resources/inference.ts +0 -768
  563. package/src/resources/post-training/job.ts +0 -274
  564. package/src/resources/post-training/post-training.ts +0 -516
  565. package/src/resources/synthetic-data-generation.ts +0 -65
  566. package/src/resources/telemetry.ts +0 -692
  567. package/src/resources/tool-runtime/index.ts +0 -17
  568. package/src/resources/tool-runtime/rag-tool.ts +0 -69
  569. package/src/resources/tool-runtime/tool-runtime.ts +0 -191
  570. package/src/resources/vector-dbs.ts +0 -191
  571. /package/resources/{eval.d.ts → alpha/eval.d.ts} +0 -0
  572. /package/resources/{eval.mjs → alpha/eval.mjs} +0 -0
  573. /package/resources/{post-training.d.ts → alpha/post-training.d.ts} +0 -0
@@ -0,0 +1,60 @@
1
+ // Copyright (c) Meta Platforms, Inc. and affiliates.
2
+ // All rights reserved.
3
+ //
4
+ // This source code is licensed under the terms described in the LICENSE file in
5
+ // the root directory of this source tree.
6
+
7
+ /**
8
+ * Helper utilities for working with response objects.
9
+ */
10
+
11
+ import type { ResponseObject } from '../resources/responses/responses';
12
+
13
+ /**
14
+ * Extracts aggregated text output from a ResponseObject.
15
+ * This concatenates all `output_text` entries from the response's output array.
16
+ *
17
+ * Useful for streaming responses where you want to get the final text from chunk.response:
18
+ *
19
+ * @example
20
+ * ```ts
21
+ * const stream = await client.responses.create({ stream: true, ... });
22
+ * for await (const chunk of stream) {
23
+ * if (chunk.type === 'response.completed') {
24
+ * const text = getResponseOutputText(chunk.response);
25
+ * console.log(text);
26
+ * }
27
+ * }
28
+ * ```
29
+ */
30
+ export function getResponseOutputText(response: ResponseObject): string {
31
+ const pieces: string[] = [];
32
+
33
+ for (const output of response.output ?? []) {
34
+ if (!output || output.type !== 'message') {
35
+ continue;
36
+ }
37
+
38
+ const content = output.content;
39
+ if (typeof content === 'string') {
40
+ pieces.push(content);
41
+ continue;
42
+ }
43
+
44
+ if (!Array.isArray(content)) {
45
+ continue;
46
+ }
47
+
48
+ for (const item of content) {
49
+ if (typeof item === 'string') {
50
+ pieces.push(item);
51
+ continue;
52
+ }
53
+ if (item && item.type === 'output_text' && 'text' in item && typeof item.text === 'string') {
54
+ pieces.push(item.text);
55
+ }
56
+ }
57
+ }
58
+
59
+ return pieces.join('');
60
+ }
package/src/pagination.ts CHANGED
@@ -4,6 +4,7 @@
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
6
 
7
+ //
7
8
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
9
 
9
10
  import { AbstractPage, Response, APIClient, FinalRequestOptions, PageInfo } from './core';
@@ -54,11 +55,7 @@ export class DatasetsIterrows<Item> extends AbstractPage<Item> implements Datase
54
55
  }
55
56
 
56
57
  nextPageInfo(): PageInfo | null {
57
- const offset = this.next_index;
58
- if (!offset) {
59
- return null;
60
- }
61
-
58
+ const offset = this.next_index ?? 0;
62
59
  const length = this.getPaginatedItems().length;
63
60
  const currentCount = offset + length;
64
61
 
package/src/resource.ts CHANGED
@@ -4,6 +4,7 @@
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
6
 
7
+ //
7
8
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
9
 
9
10
  import type { LlamaStackClient } from './index';
@@ -0,0 +1,85 @@
1
+ // Copyright (c) Meta Platforms, Inc. and affiliates.
2
+ // All rights reserved.
3
+ //
4
+ // This source code is licensed under the terms described in the LICENSE file in
5
+ // the root directory of this source tree.
6
+ //
7
+ // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
+
9
+ import { APIResource } from '../../resource';
10
+ import * as BenchmarksAPI from './benchmarks';
11
+ import {
12
+ Benchmark,
13
+ BenchmarkListResponse,
14
+ BenchmarkRegisterParams,
15
+ Benchmarks,
16
+ ListBenchmarksResponse,
17
+ } from './benchmarks';
18
+ import * as InferenceAPI from './inference';
19
+ import { Inference, InferenceRerankParams, InferenceRerankResponse } from './inference';
20
+ import * as EvalAPI from './eval/eval';
21
+ import {
22
+ BenchmarkConfig,
23
+ Eval,
24
+ EvalEvaluateRowsAlphaParams,
25
+ EvalEvaluateRowsParams,
26
+ EvalRunEvalAlphaParams,
27
+ EvalRunEvalParams,
28
+ EvaluateResponse,
29
+ Job,
30
+ } from './eval/eval';
31
+ import * as PostTrainingAPI from './post-training/post-training';
32
+ import {
33
+ AlgorithmConfig,
34
+ PostTraining,
35
+ PostTrainingJob,
36
+ PostTrainingPreferenceOptimizeParams,
37
+ PostTrainingSupervisedFineTuneParams,
38
+ } from './post-training/post-training';
39
+
40
+ export class Alpha extends APIResource {
41
+ inference: InferenceAPI.Inference = new InferenceAPI.Inference(this._client);
42
+ postTraining: PostTrainingAPI.PostTraining = new PostTrainingAPI.PostTraining(this._client);
43
+ benchmarks: BenchmarksAPI.Benchmarks = new BenchmarksAPI.Benchmarks(this._client);
44
+ eval: EvalAPI.Eval = new EvalAPI.Eval(this._client);
45
+ }
46
+
47
+ Alpha.Inference = Inference;
48
+ Alpha.PostTraining = PostTraining;
49
+ Alpha.Benchmarks = Benchmarks;
50
+ Alpha.Eval = Eval;
51
+
52
+ export declare namespace Alpha {
53
+ export {
54
+ Inference as Inference,
55
+ type InferenceRerankResponse as InferenceRerankResponse,
56
+ type InferenceRerankParams as InferenceRerankParams,
57
+ };
58
+
59
+ export {
60
+ PostTraining as PostTraining,
61
+ type AlgorithmConfig as AlgorithmConfig,
62
+ type PostTrainingJob as PostTrainingJob,
63
+ type PostTrainingPreferenceOptimizeParams as PostTrainingPreferenceOptimizeParams,
64
+ type PostTrainingSupervisedFineTuneParams as PostTrainingSupervisedFineTuneParams,
65
+ };
66
+
67
+ export {
68
+ Benchmarks as Benchmarks,
69
+ type Benchmark as Benchmark,
70
+ type ListBenchmarksResponse as ListBenchmarksResponse,
71
+ type BenchmarkListResponse as BenchmarkListResponse,
72
+ type BenchmarkRegisterParams as BenchmarkRegisterParams,
73
+ };
74
+
75
+ export {
76
+ Eval as Eval,
77
+ type BenchmarkConfig as BenchmarkConfig,
78
+ type EvaluateResponse as EvaluateResponse,
79
+ type Job as Job,
80
+ type EvalEvaluateRowsParams as EvalEvaluateRowsParams,
81
+ type EvalEvaluateRowsAlphaParams as EvalEvaluateRowsAlphaParams,
82
+ type EvalRunEvalParams as EvalRunEvalParams,
83
+ type EvalRunEvalAlphaParams as EvalRunEvalAlphaParams,
84
+ };
85
+ }
@@ -4,17 +4,18 @@
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
6
 
7
+ //
7
8
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
9
 
9
- import { APIResource } from '../resource';
10
- import * as Core from '../core';
10
+ import { APIResource } from '../../resource';
11
+ import * as Core from '../../core';
11
12
 
12
13
  export class Benchmarks extends APIResource {
13
14
  /**
14
15
  * Get a benchmark by its ID.
15
16
  */
16
17
  retrieve(benchmarkId: string, options?: Core.RequestOptions): Core.APIPromise<Benchmark> {
17
- return this._client.get(`/v1/eval/benchmarks/${benchmarkId}`, options);
18
+ return this._client.get(`/v1alpha/eval/benchmarks/${benchmarkId}`, options);
18
19
  }
19
20
 
20
21
  /**
@@ -22,51 +23,67 @@ export class Benchmarks extends APIResource {
22
23
  */
23
24
  list(options?: Core.RequestOptions): Core.APIPromise<BenchmarkListResponse> {
24
25
  return (
25
- this._client.get('/v1/eval/benchmarks', options) as Core.APIPromise<{ data: BenchmarkListResponse }>
26
+ this._client.get('/v1alpha/eval/benchmarks', options) as Core.APIPromise<{
27
+ data: BenchmarkListResponse;
28
+ }>
26
29
  )._thenUnwrap((obj) => obj.data);
27
30
  }
28
31
 
29
32
  /**
30
33
  * Register a benchmark.
34
+ *
35
+ * @deprecated
31
36
  */
32
37
  register(body: BenchmarkRegisterParams, options?: Core.RequestOptions): Core.APIPromise<void> {
33
- return this._client.post('/v1/eval/benchmarks', {
38
+ return this._client.post('/v1alpha/eval/benchmarks', {
34
39
  body,
35
40
  ...options,
36
41
  headers: { Accept: '*/*', ...options?.headers },
37
42
  });
38
43
  }
44
+
45
+ /**
46
+ * Unregister a benchmark.
47
+ *
48
+ * @deprecated
49
+ */
50
+ unregister(benchmarkId: string, options?: Core.RequestOptions): Core.APIPromise<void> {
51
+ return this._client.delete(`/v1alpha/eval/benchmarks/${benchmarkId}`, {
52
+ ...options,
53
+ headers: { Accept: '*/*', ...options?.headers },
54
+ });
55
+ }
39
56
  }
40
57
 
41
58
  /**
42
59
  * A benchmark resource for evaluating model performance.
43
60
  */
44
61
  export interface Benchmark {
45
- /**
46
- * Identifier of the dataset to use for the benchmark evaluation
47
- */
48
62
  dataset_id: string;
49
63
 
64
+ /**
65
+ * Unique identifier for this resource in llama stack
66
+ */
50
67
  identifier: string;
51
68
 
52
69
  /**
53
- * Metadata for this evaluation task
70
+ * ID of the provider that owns this resource
54
71
  */
55
- metadata: { [key: string]: boolean | number | string | Array<unknown> | unknown | null };
56
-
57
72
  provider_id: string;
58
73
 
74
+ scoring_functions: Array<string>;
75
+
59
76
  /**
60
- * List of scoring function identifiers to apply during evaluation
77
+ * Metadata for this evaluation task
61
78
  */
62
- scoring_functions: Array<string>;
79
+ metadata?: { [key: string]: unknown };
63
80
 
64
81
  /**
65
- * The resource type, always benchmark
82
+ * Unique identifier for this resource in the provider
66
83
  */
67
- type: 'benchmark';
84
+ provider_resource_id?: string | null;
68
85
 
69
- provider_resource_id?: string;
86
+ type?: 'benchmark';
70
87
  }
71
88
 
72
89
  export interface ListBenchmarksResponse {
@@ -76,35 +93,17 @@ export interface ListBenchmarksResponse {
76
93
  export type BenchmarkListResponse = Array<Benchmark>;
77
94
 
78
95
  export interface BenchmarkRegisterParams {
79
- /**
80
- * The ID of the benchmark to register.
81
- */
82
96
  benchmark_id: string;
83
97
 
84
- /**
85
- * The ID of the dataset to use for the benchmark.
86
- */
87
98
  dataset_id: string;
88
99
 
89
- /**
90
- * The scoring functions to use for the benchmark.
91
- */
92
100
  scoring_functions: Array<string>;
93
101
 
94
- /**
95
- * The metadata to use for the benchmark.
96
- */
97
- metadata?: { [key: string]: boolean | number | string | Array<unknown> | unknown | null };
102
+ metadata?: { [key: string]: unknown } | null;
98
103
 
99
- /**
100
- * The ID of the provider benchmark to use for the benchmark.
101
- */
102
- provider_benchmark_id?: string;
104
+ provider_benchmark_id?: string | null;
103
105
 
104
- /**
105
- * The ID of the provider to use for the benchmark.
106
- */
107
- provider_id?: string;
106
+ provider_id?: string | null;
108
107
  }
109
108
 
110
109
  export declare namespace Benchmarks {
@@ -3,13 +3,12 @@
3
3
  //
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
-
6
+ //
7
7
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
8
 
9
- import { APIResource } from '../../resource';
10
- import * as Core from '../../core';
11
- import * as ScoringFunctionsAPI from '../scoring-functions';
12
- import * as Shared from '../shared';
9
+ import { APIResource } from '../../../resource';
10
+ import * as Core from '../../../core';
11
+ import * as Shared from '../../shared';
13
12
  import * as JobsAPI from './jobs';
14
13
  import { Jobs } from './jobs';
15
14
 
@@ -24,7 +23,7 @@ export class Eval extends APIResource {
24
23
  body: EvalEvaluateRowsParams,
25
24
  options?: Core.RequestOptions,
26
25
  ): Core.APIPromise<EvaluateResponse> {
27
- return this._client.post(`/v1/eval/benchmarks/${benchmarkId}/evaluations`, { body, ...options });
26
+ return this._client.post(`/v1alpha/eval/benchmarks/${benchmarkId}/evaluations`, { body, ...options });
28
27
  }
29
28
 
30
29
  /**
@@ -35,14 +34,14 @@ export class Eval extends APIResource {
35
34
  body: EvalEvaluateRowsAlphaParams,
36
35
  options?: Core.RequestOptions,
37
36
  ): Core.APIPromise<EvaluateResponse> {
38
- return this._client.post(`/v1/eval/benchmarks/${benchmarkId}/evaluations`, { body, ...options });
37
+ return this._client.post(`/v1alpha/eval/benchmarks/${benchmarkId}/evaluations`, { body, ...options });
39
38
  }
40
39
 
41
40
  /**
42
41
  * Run an evaluation on a benchmark.
43
42
  */
44
43
  runEval(benchmarkId: string, body: EvalRunEvalParams, options?: Core.RequestOptions): Core.APIPromise<Job> {
45
- return this._client.post(`/v1/eval/benchmarks/${benchmarkId}/jobs`, { body, ...options });
44
+ return this._client.post(`/v1alpha/eval/benchmarks/${benchmarkId}/jobs`, { body, ...options });
46
45
  }
47
46
 
48
47
  /**
@@ -53,7 +52,7 @@ export class Eval extends APIResource {
53
52
  body: EvalRunEvalAlphaParams,
54
53
  options?: Core.RequestOptions,
55
54
  ): Core.APIPromise<Job> {
56
- return this._client.post(`/v1/eval/benchmarks/${benchmarkId}/jobs`, { body, ...options });
55
+ return this._client.post(`/v1alpha/eval/benchmarks/${benchmarkId}/jobs`, { body, ...options });
57
56
  }
58
57
  }
59
58
 
@@ -62,61 +61,102 @@ export class Eval extends APIResource {
62
61
  */
63
62
  export interface BenchmarkConfig {
64
63
  /**
65
- * The candidate to evaluate.
64
+ * A model candidate for evaluation.
65
+ */
66
+ eval_candidate: BenchmarkConfig.EvalCandidate;
67
+
68
+ /**
69
+ * Number of examples to evaluate (useful for testing), if not provided, all
70
+ * examples in the dataset will be evaluated
66
71
  */
67
- eval_candidate: EvalCandidate;
72
+ num_examples?: number | null;
68
73
 
69
74
  /**
70
75
  * Map between scoring function id and parameters for each scoring function you
71
76
  * want to run
72
77
  */
73
- scoring_params: { [key: string]: ScoringFunctionsAPI.ScoringFnParams };
78
+ scoring_params?: {
79
+ [key: string]:
80
+ | BenchmarkConfig.LlmAsJudgeScoringFnParams
81
+ | BenchmarkConfig.RegexParserScoringFnParams
82
+ | BenchmarkConfig.BasicScoringFnParams;
83
+ };
84
+ }
74
85
 
86
+ export namespace BenchmarkConfig {
75
87
  /**
76
- * (Optional) The number of examples to evaluate. If not provided, all examples in
77
- * the dataset will be evaluated
88
+ * A model candidate for evaluation.
78
89
  */
79
- num_examples?: number;
80
- }
90
+ export interface EvalCandidate {
91
+ model: string;
81
92
 
82
- /**
83
- * A model candidate for evaluation.
84
- */
85
- export type EvalCandidate = EvalCandidate.ModelCandidate | EvalCandidate.AgentCandidate;
93
+ /**
94
+ * Sampling parameters.
95
+ */
96
+ sampling_params: Shared.SamplingParams;
97
+
98
+ /**
99
+ * A system message providing instructions or context to the model.
100
+ */
101
+ system_message?: Shared.SystemMessage | null;
102
+
103
+ type?: 'model';
104
+ }
86
105
 
87
- export namespace EvalCandidate {
88
106
  /**
89
- * A model candidate for evaluation.
107
+ * Parameters for LLM-as-judge scoring function configuration.
90
108
  */
91
- export interface ModelCandidate {
109
+ export interface LlmAsJudgeScoringFnParams {
110
+ judge_model: string;
111
+
92
112
  /**
93
- * The model ID to evaluate.
113
+ * Aggregation functions to apply to the scores of each row
94
114
  */
95
- model: string;
115
+ aggregation_functions?: Array<
116
+ 'average' | 'weighted_average' | 'median' | 'categorical_count' | 'accuracy'
117
+ >;
96
118
 
97
119
  /**
98
- * The sampling parameters for the model.
120
+ * Regexes to extract the answer from generated response
99
121
  */
100
- sampling_params: Shared.SamplingParams;
122
+ judge_score_regexes?: Array<string>;
123
+
124
+ prompt_template?: string | null;
125
+
126
+ type?: 'llm_as_judge';
127
+ }
101
128
 
102
- type: 'model';
129
+ /**
130
+ * Parameters for regex parser scoring function configuration.
131
+ */
132
+ export interface RegexParserScoringFnParams {
133
+ /**
134
+ * Aggregation functions to apply to the scores of each row
135
+ */
136
+ aggregation_functions?: Array<
137
+ 'average' | 'weighted_average' | 'median' | 'categorical_count' | 'accuracy'
138
+ >;
103
139
 
104
140
  /**
105
- * (Optional) The system message providing instructions or context to the model.
141
+ * Regex to extract the answer from generated response
106
142
  */
107
- system_message?: Shared.SystemMessage;
143
+ parsing_regexes?: Array<string>;
144
+
145
+ type?: 'regex_parser';
108
146
  }
109
147
 
110
148
  /**
111
- * An agent candidate for evaluation.
149
+ * Parameters for basic scoring function configuration.
112
150
  */
113
- export interface AgentCandidate {
151
+ export interface BasicScoringFnParams {
114
152
  /**
115
- * The configuration for the agent candidate.
153
+ * Aggregation functions to apply to the scores of each row
116
154
  */
117
- config: Shared.AgentConfig;
155
+ aggregation_functions?: Array<
156
+ 'average' | 'weighted_average' | 'median' | 'categorical_count' | 'accuracy'
157
+ >;
118
158
 
119
- type: 'agent';
159
+ type?: 'basic';
120
160
  }
121
161
  }
122
162
 
@@ -124,14 +164,8 @@ export namespace EvalCandidate {
124
164
  * The response from an evaluation.
125
165
  */
126
166
  export interface EvaluateResponse {
127
- /**
128
- * The generations from the evaluation.
129
- */
130
- generations: Array<{ [key: string]: boolean | number | string | Array<unknown> | unknown | null }>;
167
+ generations: Array<{ [key: string]: unknown }>;
131
168
 
132
- /**
133
- * The scores from the evaluation.
134
- */
135
169
  scores: { [key: string]: Shared.ScoringResult };
136
170
  }
137
171
 
@@ -139,61 +173,46 @@ export interface EvaluateResponse {
139
173
  * A job execution instance with status tracking.
140
174
  */
141
175
  export interface Job {
142
- /**
143
- * Unique identifier for the job
144
- */
145
176
  job_id: string;
146
177
 
147
178
  /**
148
- * Current execution status of the job
179
+ * Status of a job execution.
149
180
  */
150
181
  status: 'completed' | 'in_progress' | 'failed' | 'scheduled' | 'cancelled';
151
182
  }
152
183
 
153
184
  export interface EvalEvaluateRowsParams {
154
185
  /**
155
- * The configuration for the benchmark.
186
+ * A benchmark configuration for evaluation.
156
187
  */
157
188
  benchmark_config: BenchmarkConfig;
158
189
 
159
- /**
160
- * The rows to evaluate.
161
- */
162
- input_rows: Array<{ [key: string]: boolean | number | string | Array<unknown> | unknown | null }>;
190
+ input_rows: Array<{ [key: string]: unknown }>;
163
191
 
164
- /**
165
- * The scoring functions to use for the evaluation.
166
- */
167
192
  scoring_functions: Array<string>;
168
193
  }
169
194
 
170
195
  export interface EvalEvaluateRowsAlphaParams {
171
196
  /**
172
- * The configuration for the benchmark.
197
+ * A benchmark configuration for evaluation.
173
198
  */
174
199
  benchmark_config: BenchmarkConfig;
175
200
 
176
- /**
177
- * The rows to evaluate.
178
- */
179
- input_rows: Array<{ [key: string]: boolean | number | string | Array<unknown> | unknown | null }>;
201
+ input_rows: Array<{ [key: string]: unknown }>;
180
202
 
181
- /**
182
- * The scoring functions to use for the evaluation.
183
- */
184
203
  scoring_functions: Array<string>;
185
204
  }
186
205
 
187
206
  export interface EvalRunEvalParams {
188
207
  /**
189
- * The configuration for the benchmark.
208
+ * A benchmark configuration for evaluation.
190
209
  */
191
210
  benchmark_config: BenchmarkConfig;
192
211
  }
193
212
 
194
213
  export interface EvalRunEvalAlphaParams {
195
214
  /**
196
- * The configuration for the benchmark.
215
+ * A benchmark configuration for evaluation.
197
216
  */
198
217
  benchmark_config: BenchmarkConfig;
199
218
  }
@@ -203,7 +222,6 @@ Eval.Jobs = Jobs;
203
222
  export declare namespace Eval {
204
223
  export {
205
224
  type BenchmarkConfig as BenchmarkConfig,
206
- type EvalCandidate as EvalCandidate,
207
225
  type EvaluateResponse as EvaluateResponse,
208
226
  type Job as Job,
209
227
  type EvalEvaluateRowsParams as EvalEvaluateRowsParams,
@@ -3,13 +3,12 @@
3
3
  //
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
-
6
+ //
7
7
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
8
 
9
9
  export {
10
10
  Eval,
11
11
  type BenchmarkConfig,
12
- type EvalCandidate,
13
12
  type EvaluateResponse,
14
13
  type Job,
15
14
  type EvalEvaluateRowsParams,
@@ -3,11 +3,11 @@
3
3
  //
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
-
6
+ //
7
7
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
8
 
9
- import { APIResource } from '../../resource';
10
- import * as Core from '../../core';
9
+ import { APIResource } from '../../../resource';
10
+ import * as Core from '../../../core';
11
11
  import * as EvalAPI from './eval';
12
12
 
13
13
  export class Jobs extends APIResource {
@@ -19,14 +19,14 @@ export class Jobs extends APIResource {
19
19
  jobId: string,
20
20
  options?: Core.RequestOptions,
21
21
  ): Core.APIPromise<EvalAPI.EvaluateResponse> {
22
- return this._client.get(`/v1/eval/benchmarks/${benchmarkId}/jobs/${jobId}/result`, options);
22
+ return this._client.get(`/v1alpha/eval/benchmarks/${benchmarkId}/jobs/${jobId}/result`, options);
23
23
  }
24
24
 
25
25
  /**
26
26
  * Cancel a job.
27
27
  */
28
28
  cancel(benchmarkId: string, jobId: string, options?: Core.RequestOptions): Core.APIPromise<void> {
29
- return this._client.delete(`/v1/eval/benchmarks/${benchmarkId}/jobs/${jobId}`, {
29
+ return this._client.delete(`/v1alpha/eval/benchmarks/${benchmarkId}/jobs/${jobId}`, {
30
30
  ...options,
31
31
  headers: { Accept: '*/*', ...options?.headers },
32
32
  });
@@ -36,6 +36,6 @@ export class Jobs extends APIResource {
36
36
  * Get the status of a job.
37
37
  */
38
38
  status(benchmarkId: string, jobId: string, options?: Core.RequestOptions): Core.APIPromise<EvalAPI.Job> {
39
- return this._client.get(`/v1/eval/benchmarks/${benchmarkId}/jobs/${jobId}`, options);
39
+ return this._client.get(`/v1alpha/eval/benchmarks/${benchmarkId}/jobs/${jobId}`, options);
40
40
  }
41
41
  }
@@ -4,6 +4,7 @@
4
4
  // This source code is licensed under the terms described in the LICENSE file in
5
5
  // the root directory of this source tree.
6
6
 
7
+ //
7
8
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
8
9
 
9
10
  export * from './eval/index';