openai 4.97.0 → 4.99.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (242)
  1. package/CHANGELOG.md +29 -0
  2. package/index.d.mts +5 -2
  3. package/index.d.ts +5 -2
  4. package/index.d.ts.map +1 -1
  5. package/index.js +3 -0
  6. package/index.js.map +1 -1
  7. package/index.mjs +3 -0
  8. package/index.mjs.map +1 -1
  9. package/package.json +1 -1
  10. package/resources/audio/speech.d.ts +12 -0
  11. package/resources/audio/speech.d.ts.map +1 -1
  12. package/resources/audio/speech.js +12 -0
  13. package/resources/audio/speech.js.map +1 -1
  14. package/resources/audio/speech.mjs +12 -0
  15. package/resources/audio/speech.mjs.map +1 -1
  16. package/resources/audio/transcriptions.d.ts +38 -0
  17. package/resources/audio/transcriptions.d.ts.map +1 -1
  18. package/resources/audio/transcriptions.js.map +1 -1
  19. package/resources/audio/transcriptions.mjs.map +1 -1
  20. package/resources/audio/translations.d.ts +8 -0
  21. package/resources/audio/translations.d.ts.map +1 -1
  22. package/resources/audio/translations.js.map +1 -1
  23. package/resources/audio/translations.mjs.map +1 -1
  24. package/resources/beta/assistants.d.ts +36 -0
  25. package/resources/beta/assistants.d.ts.map +1 -1
  26. package/resources/beta/assistants.js +28 -0
  27. package/resources/beta/assistants.js.map +1 -1
  28. package/resources/beta/assistants.mjs +28 -0
  29. package/resources/beta/assistants.mjs.map +1 -1
  30. package/resources/beta/realtime/sessions.d.ts +6 -0
  31. package/resources/beta/realtime/sessions.d.ts.map +1 -1
  32. package/resources/beta/realtime/sessions.js +6 -0
  33. package/resources/beta/realtime/sessions.js.map +1 -1
  34. package/resources/beta/realtime/sessions.mjs +6 -0
  35. package/resources/beta/realtime/sessions.mjs.map +1 -1
  36. package/resources/beta/realtime/transcription-sessions.d.ts +6 -0
  37. package/resources/beta/realtime/transcription-sessions.d.ts.map +1 -1
  38. package/resources/beta/realtime/transcription-sessions.js +6 -0
  39. package/resources/beta/realtime/transcription-sessions.js.map +1 -1
  40. package/resources/beta/realtime/transcription-sessions.mjs +6 -0
  41. package/resources/beta/realtime/transcription-sessions.mjs.map +1 -1
  42. package/resources/beta/threads/messages.d.ts +43 -0
  43. package/resources/beta/threads/messages.d.ts.map +1 -1
  44. package/resources/beta/threads/messages.js +33 -0
  45. package/resources/beta/threads/messages.js.map +1 -1
  46. package/resources/beta/threads/messages.mjs +33 -0
  47. package/resources/beta/threads/messages.mjs.map +1 -1
  48. package/resources/beta/threads/runs/runs.d.ts +52 -0
  49. package/resources/beta/threads/runs/runs.d.ts.map +1 -1
  50. package/resources/beta/threads/runs/runs.js +24 -0
  51. package/resources/beta/threads/runs/runs.js.map +1 -1
  52. package/resources/beta/threads/runs/runs.mjs +24 -0
  53. package/resources/beta/threads/runs/runs.mjs.map +1 -1
  54. package/resources/beta/threads/runs/steps.d.ts +21 -0
  55. package/resources/beta/threads/runs/steps.d.ts.map +1 -1
  56. package/resources/beta/threads/runs/steps.js.map +1 -1
  57. package/resources/beta/threads/runs/steps.mjs.map +1 -1
  58. package/resources/beta/threads/threads.d.ts +33 -0
  59. package/resources/beta/threads/threads.d.ts.map +1 -1
  60. package/resources/beta/threads/threads.js +21 -0
  61. package/resources/beta/threads/threads.js.map +1 -1
  62. package/resources/beta/threads/threads.mjs +21 -0
  63. package/resources/beta/threads/threads.mjs.map +1 -1
  64. package/resources/chat/completions/completions.d.ts +38 -0
  65. package/resources/chat/completions/completions.d.ts.map +1 -1
  66. package/resources/chat/completions/completions.js +20 -0
  67. package/resources/chat/completions/completions.js.map +1 -1
  68. package/resources/chat/completions/completions.mjs +20 -0
  69. package/resources/chat/completions/completions.mjs.map +1 -1
  70. package/resources/chat/completions/messages.d.ts +10 -0
  71. package/resources/chat/completions/messages.d.ts.map +1 -1
  72. package/resources/chat/completions/messages.js.map +1 -1
  73. package/resources/chat/completions/messages.mjs.map +1 -1
  74. package/resources/completions.d.ts +8 -0
  75. package/resources/completions.d.ts.map +1 -1
  76. package/resources/completions.js.map +1 -1
  77. package/resources/completions.mjs.map +1 -1
  78. package/resources/embeddings.d.ts +13 -3
  79. package/resources/embeddings.d.ts.map +1 -1
  80. package/resources/embeddings.js +9 -0
  81. package/resources/embeddings.js.map +1 -1
  82. package/resources/embeddings.mjs +9 -0
  83. package/resources/embeddings.mjs.map +1 -1
  84. package/resources/evals/evals.d.ts +164 -519
  85. package/resources/evals/evals.d.ts.map +1 -1
  86. package/resources/evals/evals.js.map +1 -1
  87. package/resources/evals/evals.mjs.map +1 -1
  88. package/resources/evals/index.d.ts +1 -1
  89. package/resources/evals/index.d.ts.map +1 -1
  90. package/resources/evals/index.js.map +1 -1
  91. package/resources/evals/index.mjs.map +1 -1
  92. package/resources/evals/runs/runs.d.ts +64 -69
  93. package/resources/evals/runs/runs.d.ts.map +1 -1
  94. package/resources/evals/runs/runs.js.map +1 -1
  95. package/resources/evals/runs/runs.mjs.map +1 -1
  96. package/resources/fine-tuning/alpha/alpha.d.ts +10 -0
  97. package/resources/fine-tuning/alpha/alpha.d.ts.map +1 -0
  98. package/resources/fine-tuning/alpha/alpha.js +39 -0
  99. package/resources/fine-tuning/alpha/alpha.js.map +1 -0
  100. package/resources/fine-tuning/alpha/alpha.mjs +12 -0
  101. package/resources/fine-tuning/alpha/alpha.mjs.map +1 -0
  102. package/resources/fine-tuning/alpha/graders.d.ts +107 -0
  103. package/resources/fine-tuning/alpha/graders.d.ts.map +1 -0
  104. package/resources/fine-tuning/alpha/graders.js +50 -0
  105. package/resources/fine-tuning/alpha/graders.js.map +1 -0
  106. package/resources/fine-tuning/alpha/graders.mjs +46 -0
  107. package/resources/fine-tuning/alpha/graders.mjs.map +1 -0
  108. package/resources/fine-tuning/alpha/index.d.ts +3 -0
  109. package/resources/fine-tuning/alpha/index.d.ts.map +1 -0
  110. package/resources/fine-tuning/alpha/index.js +9 -0
  111. package/resources/fine-tuning/alpha/index.js.map +1 -0
  112. package/resources/fine-tuning/alpha/index.mjs +4 -0
  113. package/resources/fine-tuning/alpha/index.mjs.map +1 -0
  114. package/resources/fine-tuning/alpha.d.ts +2 -0
  115. package/resources/fine-tuning/alpha.d.ts.map +1 -0
  116. package/resources/fine-tuning/alpha.js +19 -0
  117. package/resources/fine-tuning/alpha.js.map +1 -0
  118. package/resources/fine-tuning/alpha.mjs +3 -0
  119. package/resources/fine-tuning/alpha.mjs.map +1 -0
  120. package/resources/fine-tuning/checkpoints/permissions.d.ts +28 -0
  121. package/resources/fine-tuning/checkpoints/permissions.d.ts.map +1 -1
  122. package/resources/fine-tuning/checkpoints/permissions.js +20 -0
  123. package/resources/fine-tuning/checkpoints/permissions.js.map +1 -1
  124. package/resources/fine-tuning/checkpoints/permissions.mjs +20 -0
  125. package/resources/fine-tuning/checkpoints/permissions.mjs.map +1 -1
  126. package/resources/fine-tuning/fine-tuning.d.ts +8 -0
  127. package/resources/fine-tuning/fine-tuning.d.ts.map +1 -1
  128. package/resources/fine-tuning/fine-tuning.js +8 -0
  129. package/resources/fine-tuning/fine-tuning.js.map +1 -1
  130. package/resources/fine-tuning/fine-tuning.mjs +8 -0
  131. package/resources/fine-tuning/fine-tuning.mjs.map +1 -1
  132. package/resources/fine-tuning/index.d.ts +2 -0
  133. package/resources/fine-tuning/index.d.ts.map +1 -1
  134. package/resources/fine-tuning/index.js +11 -7
  135. package/resources/fine-tuning/index.js.map +1 -1
  136. package/resources/fine-tuning/index.mjs +2 -0
  137. package/resources/fine-tuning/index.mjs.map +1 -1
  138. package/resources/fine-tuning/jobs/checkpoints.d.ts +10 -0
  139. package/resources/fine-tuning/jobs/checkpoints.d.ts.map +1 -1
  140. package/resources/fine-tuning/jobs/checkpoints.js.map +1 -1
  141. package/resources/fine-tuning/jobs/checkpoints.mjs.map +1 -1
  142. package/resources/fine-tuning/jobs/jobs.d.ts +78 -145
  143. package/resources/fine-tuning/jobs/jobs.d.ts.map +1 -1
  144. package/resources/fine-tuning/jobs/jobs.js +48 -0
  145. package/resources/fine-tuning/jobs/jobs.js.map +1 -1
  146. package/resources/fine-tuning/jobs/jobs.mjs +48 -0
  147. package/resources/fine-tuning/jobs/jobs.mjs.map +1 -1
  148. package/resources/fine-tuning/methods.d.ts +120 -0
  149. package/resources/fine-tuning/methods.d.ts.map +1 -0
  150. package/resources/fine-tuning/methods.js +9 -0
  151. package/resources/fine-tuning/methods.js.map +1 -0
  152. package/resources/fine-tuning/methods.mjs +5 -0
  153. package/resources/fine-tuning/methods.mjs.map +1 -0
  154. package/resources/graders/grader-models.d.ts +234 -0
  155. package/resources/graders/grader-models.d.ts.map +1 -0
  156. package/resources/graders/grader-models.js +9 -0
  157. package/resources/graders/grader-models.js.map +1 -0
  158. package/resources/graders/grader-models.mjs +5 -0
  159. package/resources/graders/grader-models.mjs.map +1 -0
  160. package/resources/graders/graders.d.ts +10 -0
  161. package/resources/graders/graders.d.ts.map +1 -0
  162. package/resources/graders/graders.js +39 -0
  163. package/resources/graders/graders.js.map +1 -0
  164. package/resources/graders/graders.mjs +12 -0
  165. package/resources/graders/graders.mjs.map +1 -0
  166. package/resources/graders/index.d.ts +3 -0
  167. package/resources/graders/index.d.ts.map +1 -0
  168. package/resources/graders/index.js +9 -0
  169. package/resources/graders/index.js.map +1 -0
  170. package/resources/graders/index.mjs +4 -0
  171. package/resources/graders/index.mjs.map +1 -0
  172. package/resources/graders.d.ts +2 -0
  173. package/resources/graders.d.ts.map +1 -0
  174. package/resources/graders.js +19 -0
  175. package/resources/graders.js.map +1 -0
  176. package/resources/graders.mjs +3 -0
  177. package/resources/graders.mjs.map +1 -0
  178. package/resources/images.d.ts +22 -0
  179. package/resources/images.d.ts.map +1 -1
  180. package/resources/images.js +22 -0
  181. package/resources/images.js.map +1 -1
  182. package/resources/images.mjs +22 -0
  183. package/resources/images.mjs.map +1 -1
  184. package/resources/index.d.ts +2 -1
  185. package/resources/index.d.ts.map +1 -1
  186. package/resources/index.js +3 -1
  187. package/resources/index.js.map +1 -1
  188. package/resources/index.mjs +1 -0
  189. package/resources/index.mjs.map +1 -1
  190. package/resources/responses/input-items.d.ts +10 -0
  191. package/resources/responses/input-items.d.ts.map +1 -1
  192. package/resources/responses/input-items.js.map +1 -1
  193. package/resources/responses/input-items.mjs.map +1 -1
  194. package/resources/responses/responses.d.ts +22 -0
  195. package/resources/responses/responses.d.ts.map +1 -1
  196. package/resources/responses/responses.js +7 -0
  197. package/resources/responses/responses.js.map +1 -1
  198. package/resources/responses/responses.mjs +7 -0
  199. package/resources/responses/responses.mjs.map +1 -1
  200. package/resources/shared.d.ts +1 -1
  201. package/resources/shared.d.ts.map +1 -1
  202. package/src/index.ts +5 -6
  203. package/src/resources/audio/speech.ts +12 -0
  204. package/src/resources/audio/transcriptions.ts +43 -0
  205. package/src/resources/audio/translations.ts +8 -0
  206. package/src/resources/beta/assistants.ts +36 -0
  207. package/src/resources/beta/realtime/sessions.ts +6 -0
  208. package/src/resources/beta/realtime/transcription-sessions.ts +6 -0
  209. package/src/resources/beta/threads/messages.ts +43 -0
  210. package/src/resources/beta/threads/runs/runs.ts +52 -0
  211. package/src/resources/beta/threads/runs/steps.ts +21 -0
  212. package/src/resources/beta/threads/threads.ts +33 -0
  213. package/src/resources/chat/completions/completions.ts +38 -0
  214. package/src/resources/chat/completions/messages.ts +10 -0
  215. package/src/resources/completions.ts +8 -0
  216. package/src/resources/embeddings.ts +13 -3
  217. package/src/resources/evals/evals.ts +194 -628
  218. package/src/resources/evals/index.ts +0 -3
  219. package/src/resources/evals/runs/runs.ts +69 -77
  220. package/src/resources/fine-tuning/alpha/alpha.ts +27 -0
  221. package/src/resources/fine-tuning/alpha/graders.ts +168 -0
  222. package/src/resources/fine-tuning/alpha/index.ts +10 -0
  223. package/src/resources/fine-tuning/alpha.ts +3 -0
  224. package/src/resources/fine-tuning/checkpoints/permissions.ts +28 -0
  225. package/src/resources/fine-tuning/fine-tuning.ts +28 -0
  226. package/src/resources/fine-tuning/index.ts +10 -0
  227. package/src/resources/fine-tuning/jobs/checkpoints.ts +10 -0
  228. package/src/resources/fine-tuning/jobs/jobs.ts +84 -161
  229. package/src/resources/fine-tuning/methods.ts +152 -0
  230. package/src/resources/graders/grader-models.ts +296 -0
  231. package/src/resources/graders/graders.ts +31 -0
  232. package/src/resources/graders/index.ts +12 -0
  233. package/src/resources/graders.ts +3 -0
  234. package/src/resources/images.ts +22 -0
  235. package/src/resources/index.ts +1 -3
  236. package/src/resources/responses/input-items.ts +10 -0
  237. package/src/resources/responses/responses.ts +22 -0
  238. package/src/resources/shared.ts +1 -0
  239. package/src/version.ts +1 -1
  240. package/version.d.ts +1 -1
  241. package/version.js +1 -1
  242. package/version.mjs +1 -1
@@ -1,5 +1,6 @@
1
1
  // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
2
2
 
3
+ export { Alpha } from './alpha/index';
3
4
  export { Checkpoints } from './checkpoints/index';
4
5
  export { FineTuning } from './fine-tuning';
5
6
  export {
@@ -15,3 +16,12 @@ export {
15
16
  type JobListParams,
16
17
  type JobListEventsParams,
17
18
  } from './jobs/index';
19
+ export {
20
+ Methods,
21
+ type DpoHyperparameters,
22
+ type DpoMethod,
23
+ type ReinforcementHyperparameters,
24
+ type ReinforcementMethod,
25
+ type SupervisedHyperparameters,
26
+ type SupervisedMethod,
27
+ } from './methods';
@@ -8,6 +8,16 @@ import { CursorPage, type CursorPageParams } from '../../../pagination';
8
8
  export class Checkpoints extends APIResource {
9
9
  /**
10
10
  * List checkpoints for a fine-tuning job.
11
+ *
12
+ * @example
13
+ * ```ts
14
+ * // Automatically fetches more pages as needed.
15
+ * for await (const fineTuningJobCheckpoint of client.fineTuning.jobs.checkpoints.list(
16
+ * 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
17
+ * )) {
18
+ * // ...
19
+ * }
20
+ * ```
11
21
  */
12
22
  list(
13
23
  fineTuningJobId: string,
@@ -3,6 +3,7 @@
3
3
  import { APIResource } from '../../../resource';
4
4
  import { isRequestOptions } from '../../../core';
5
5
  import * as Core from '../../../core';
6
+ import * as MethodsAPI from '../methods';
6
7
  import * as CheckpointsAPI from './checkpoints';
7
8
  import {
8
9
  CheckpointListParams,
@@ -23,6 +24,14 @@ export class Jobs extends APIResource {
23
24
  * of the fine-tuned models once complete.
24
25
  *
25
26
  * [Learn more about fine-tuning](https://platform.openai.com/docs/guides/fine-tuning)
27
+ *
28
+ * @example
29
+ * ```ts
30
+ * const fineTuningJob = await client.fineTuning.jobs.create({
31
+ * model: 'gpt-4o-mini',
32
+ * training_file: 'file-abc123',
33
+ * });
34
+ * ```
26
35
  */
27
36
  create(body: JobCreateParams, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
28
37
  return this._client.post('/fine_tuning/jobs', { body, ...options });
@@ -32,6 +41,13 @@ export class Jobs extends APIResource {
32
41
  * Get info about a fine-tuning job.
33
42
  *
34
43
  * [Learn more about fine-tuning](https://platform.openai.com/docs/guides/fine-tuning)
44
+ *
45
+ * @example
46
+ * ```ts
47
+ * const fineTuningJob = await client.fineTuning.jobs.retrieve(
48
+ * 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
49
+ * );
50
+ * ```
35
51
  */
36
52
  retrieve(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
37
53
  return this._client.get(`/fine_tuning/jobs/${fineTuningJobId}`, options);
@@ -39,6 +55,14 @@ export class Jobs extends APIResource {
39
55
 
40
56
  /**
41
57
  * List your organization's fine-tuning jobs
58
+ *
59
+ * @example
60
+ * ```ts
61
+ * // Automatically fetches more pages as needed.
62
+ * for await (const fineTuningJob of client.fineTuning.jobs.list()) {
63
+ * // ...
64
+ * }
65
+ * ```
42
66
  */
43
67
  list(
44
68
  query?: JobListParams,
@@ -57,6 +81,13 @@ export class Jobs extends APIResource {
57
81
 
58
82
  /**
59
83
  * Immediately cancel a fine-tune job.
84
+ *
85
+ * @example
86
+ * ```ts
87
+ * const fineTuningJob = await client.fineTuning.jobs.cancel(
88
+ * 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
89
+ * );
90
+ * ```
60
91
  */
61
92
  cancel(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
62
93
  return this._client.post(`/fine_tuning/jobs/${fineTuningJobId}/cancel`, options);
@@ -64,6 +95,16 @@ export class Jobs extends APIResource {
64
95
 
65
96
  /**
66
97
  * Get status updates for a fine-tuning job.
98
+ *
99
+ * @example
100
+ * ```ts
101
+ * // Automatically fetches more pages as needed.
102
+ * for await (const fineTuningJobEvent of client.fineTuning.jobs.listEvents(
103
+ * 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
104
+ * )) {
105
+ * // ...
106
+ * }
107
+ * ```
67
108
  */
68
109
  listEvents(
69
110
  fineTuningJobId: string,
@@ -87,6 +128,34 @@ export class Jobs extends APIResource {
87
128
  ...options,
88
129
  });
89
130
  }
131
+
132
+ /**
133
+ * Pause a fine-tune job.
134
+ *
135
+ * @example
136
+ * ```ts
137
+ * const fineTuningJob = await client.fineTuning.jobs.pause(
138
+ * 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
139
+ * );
140
+ * ```
141
+ */
142
+ pause(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
143
+ return this._client.post(`/fine_tuning/jobs/${fineTuningJobId}/pause`, options);
144
+ }
145
+
146
+ /**
147
+ * Resume a fine-tune job.
148
+ *
149
+ * @example
150
+ * ```ts
151
+ * const fineTuningJob = await client.fineTuning.jobs.resume(
152
+ * 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
153
+ * );
154
+ * ```
155
+ */
156
+ resume(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
157
+ return this._client.post(`/fine_tuning/jobs/${fineTuningJobId}/resume`, options);
158
+ }
90
159
  }
91
160
 
92
161
  export class FineTuningJobsPage extends CursorPage<FineTuningJob> {}
@@ -233,7 +302,7 @@ export namespace FineTuningJob {
233
302
  * Number of examples in each batch. A larger batch size means that model
234
303
  * parameters are updated less frequently, but with lower variance.
235
304
  */
236
- batch_size?: 'auto' | number;
305
+ batch_size?: unknown | 'auto' | number | null;
237
306
 
238
307
  /**
239
308
  * Scaling factor for the learning rate. A smaller learning rate may be useful to
@@ -253,97 +322,24 @@ export namespace FineTuningJob {
253
322
  */
254
323
  export interface Method {
255
324
  /**
256
- * Configuration for the DPO fine-tuning method.
325
+ * The type of method. Is either `supervised`, `dpo`, or `reinforcement`.
257
326
  */
258
- dpo?: Method.Dpo;
327
+ type: 'supervised' | 'dpo' | 'reinforcement';
259
328
 
260
329
  /**
261
- * Configuration for the supervised fine-tuning method.
262
- */
263
- supervised?: Method.Supervised;
264
-
265
- /**
266
- * The type of method. Is either `supervised` or `dpo`.
330
+ * Configuration for the DPO fine-tuning method.
267
331
  */
268
- type?: 'supervised' | 'dpo';
269
- }
332
+ dpo?: MethodsAPI.DpoMethod;
270
333
 
271
- export namespace Method {
272
334
  /**
273
- * Configuration for the DPO fine-tuning method.
335
+ * Configuration for the reinforcement fine-tuning method.
274
336
  */
275
- export interface Dpo {
276
- /**
277
- * The hyperparameters used for the fine-tuning job.
278
- */
279
- hyperparameters?: Dpo.Hyperparameters;
280
- }
281
-
282
- export namespace Dpo {
283
- /**
284
- * The hyperparameters used for the fine-tuning job.
285
- */
286
- export interface Hyperparameters {
287
- /**
288
- * Number of examples in each batch. A larger batch size means that model
289
- * parameters are updated less frequently, but with lower variance.
290
- */
291
- batch_size?: 'auto' | number;
292
-
293
- /**
294
- * The beta value for the DPO method. A higher beta value will increase the weight
295
- * of the penalty between the policy and reference model.
296
- */
297
- beta?: 'auto' | number;
298
-
299
- /**
300
- * Scaling factor for the learning rate. A smaller learning rate may be useful to
301
- * avoid overfitting.
302
- */
303
- learning_rate_multiplier?: 'auto' | number;
304
-
305
- /**
306
- * The number of epochs to train the model for. An epoch refers to one full cycle
307
- * through the training dataset.
308
- */
309
- n_epochs?: 'auto' | number;
310
- }
311
- }
337
+ reinforcement?: MethodsAPI.ReinforcementMethod;
312
338
 
313
339
  /**
314
340
  * Configuration for the supervised fine-tuning method.
315
341
  */
316
- export interface Supervised {
317
- /**
318
- * The hyperparameters used for the fine-tuning job.
319
- */
320
- hyperparameters?: Supervised.Hyperparameters;
321
- }
322
-
323
- export namespace Supervised {
324
- /**
325
- * The hyperparameters used for the fine-tuning job.
326
- */
327
- export interface Hyperparameters {
328
- /**
329
- * Number of examples in each batch. A larger batch size means that model
330
- * parameters are updated less frequently, but with lower variance.
331
- */
332
- batch_size?: 'auto' | number;
333
-
334
- /**
335
- * Scaling factor for the learning rate. A smaller learning rate may be useful to
336
- * avoid overfitting.
337
- */
338
- learning_rate_multiplier?: 'auto' | number;
339
-
340
- /**
341
- * The number of epochs to train the model for. An epoch refers to one full cycle
342
- * through the training dataset.
343
- */
344
- n_epochs?: 'auto' | number;
345
- }
346
- }
342
+ supervised?: MethodsAPI.SupervisedMethod;
347
343
  }
348
344
  }
349
345
 
@@ -597,97 +593,24 @@ export namespace JobCreateParams {
597
593
  */
598
594
  export interface Method {
599
595
  /**
600
- * Configuration for the DPO fine-tuning method.
596
+ * The type of method. Is either `supervised`, `dpo`, or `reinforcement`.
601
597
  */
602
- dpo?: Method.Dpo;
598
+ type: 'supervised' | 'dpo' | 'reinforcement';
603
599
 
604
600
  /**
605
- * Configuration for the supervised fine-tuning method.
601
+ * Configuration for the DPO fine-tuning method.
606
602
  */
607
- supervised?: Method.Supervised;
603
+ dpo?: MethodsAPI.DpoMethod;
608
604
 
609
605
  /**
610
- * The type of method. Is either `supervised` or `dpo`.
606
+ * Configuration for the reinforcement fine-tuning method.
611
607
  */
612
- type?: 'supervised' | 'dpo';
613
- }
614
-
615
- export namespace Method {
616
- /**
617
- * Configuration for the DPO fine-tuning method.
618
- */
619
- export interface Dpo {
620
- /**
621
- * The hyperparameters used for the fine-tuning job.
622
- */
623
- hyperparameters?: Dpo.Hyperparameters;
624
- }
625
-
626
- export namespace Dpo {
627
- /**
628
- * The hyperparameters used for the fine-tuning job.
629
- */
630
- export interface Hyperparameters {
631
- /**
632
- * Number of examples in each batch. A larger batch size means that model
633
- * parameters are updated less frequently, but with lower variance.
634
- */
635
- batch_size?: 'auto' | number;
636
-
637
- /**
638
- * The beta value for the DPO method. A higher beta value will increase the weight
639
- * of the penalty between the policy and reference model.
640
- */
641
- beta?: 'auto' | number;
642
-
643
- /**
644
- * Scaling factor for the learning rate. A smaller learning rate may be useful to
645
- * avoid overfitting.
646
- */
647
- learning_rate_multiplier?: 'auto' | number;
648
-
649
- /**
650
- * The number of epochs to train the model for. An epoch refers to one full cycle
651
- * through the training dataset.
652
- */
653
- n_epochs?: 'auto' | number;
654
- }
655
- }
608
+ reinforcement?: MethodsAPI.ReinforcementMethod;
656
609
 
657
610
  /**
658
611
  * Configuration for the supervised fine-tuning method.
659
612
  */
660
- export interface Supervised {
661
- /**
662
- * The hyperparameters used for the fine-tuning job.
663
- */
664
- hyperparameters?: Supervised.Hyperparameters;
665
- }
666
-
667
- export namespace Supervised {
668
- /**
669
- * The hyperparameters used for the fine-tuning job.
670
- */
671
- export interface Hyperparameters {
672
- /**
673
- * Number of examples in each batch. A larger batch size means that model
674
- * parameters are updated less frequently, but with lower variance.
675
- */
676
- batch_size?: 'auto' | number;
677
-
678
- /**
679
- * Scaling factor for the learning rate. A smaller learning rate may be useful to
680
- * avoid overfitting.
681
- */
682
- learning_rate_multiplier?: 'auto' | number;
683
-
684
- /**
685
- * The number of epochs to train the model for. An epoch refers to one full cycle
686
- * through the training dataset.
687
- */
688
- n_epochs?: 'auto' | number;
689
- }
690
- }
613
+ supervised?: MethodsAPI.SupervisedMethod;
691
614
  }
692
615
  }
693
616
 
@@ -0,0 +1,152 @@
1
+ // File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
2
+
3
+ import { APIResource } from '../../resource';
4
+ import * as GraderModelsAPI from '../graders/grader-models';
5
+
6
+ export class Methods extends APIResource {}
7
+
8
+ /**
9
+ * The hyperparameters used for the DPO fine-tuning job.
10
+ */
11
+ export interface DpoHyperparameters {
12
+ /**
13
+ * Number of examples in each batch. A larger batch size means that model
14
+ * parameters are updated less frequently, but with lower variance.
15
+ */
16
+ batch_size?: 'auto' | number;
17
+
18
+ /**
19
+ * The beta value for the DPO method. A higher beta value will increase the weight
20
+ * of the penalty between the policy and reference model.
21
+ */
22
+ beta?: 'auto' | number;
23
+
24
+ /**
25
+ * Scaling factor for the learning rate. A smaller learning rate may be useful to
26
+ * avoid overfitting.
27
+ */
28
+ learning_rate_multiplier?: 'auto' | number;
29
+
30
+ /**
31
+ * The number of epochs to train the model for. An epoch refers to one full cycle
32
+ * through the training dataset.
33
+ */
34
+ n_epochs?: 'auto' | number;
35
+ }
36
+
37
+ /**
38
+ * Configuration for the DPO fine-tuning method.
39
+ */
40
+ export interface DpoMethod {
41
+ /**
42
+ * The hyperparameters used for the DPO fine-tuning job.
43
+ */
44
+ hyperparameters?: DpoHyperparameters;
45
+ }
46
+
47
+ /**
48
+ * The hyperparameters used for the reinforcement fine-tuning job.
49
+ */
50
+ export interface ReinforcementHyperparameters {
51
+ /**
52
+ * Number of examples in each batch. A larger batch size means that model
53
+ * parameters are updated less frequently, but with lower variance.
54
+ */
55
+ batch_size?: 'auto' | number;
56
+
57
+ /**
58
+ * Multiplier on amount of compute used for exploring search space during training.
59
+ */
60
+ compute_multiplier?: 'auto' | number;
61
+
62
+ /**
63
+ * The number of training steps between evaluation runs.
64
+ */
65
+ eval_interval?: 'auto' | number;
66
+
67
+ /**
68
+ * Number of evaluation samples to generate per training step.
69
+ */
70
+ eval_samples?: 'auto' | number;
71
+
72
+ /**
73
+ * Scaling factor for the learning rate. A smaller learning rate may be useful to
74
+ * avoid overfitting.
75
+ */
76
+ learning_rate_multiplier?: 'auto' | number;
77
+
78
+ /**
79
+ * The number of epochs to train the model for. An epoch refers to one full cycle
80
+ * through the training dataset.
81
+ */
82
+ n_epochs?: 'auto' | number;
83
+
84
+ /**
85
+ * Level of reasoning effort.
86
+ */
87
+ reasoning_effort?: 'default' | 'low' | 'medium' | 'high';
88
+ }
89
+
90
+ /**
91
+ * Configuration for the reinforcement fine-tuning method.
92
+ */
93
+ export interface ReinforcementMethod {
94
+ /**
95
+ * The grader used for the fine-tuning job.
96
+ */
97
+ grader:
98
+ | GraderModelsAPI.StringCheckGrader
99
+ | GraderModelsAPI.TextSimilarityGrader
100
+ | GraderModelsAPI.PythonGrader
101
+ | GraderModelsAPI.ScoreModelGrader
102
+ | GraderModelsAPI.MultiGrader;
103
+
104
+ /**
105
+ * The hyperparameters used for the reinforcement fine-tuning job.
106
+ */
107
+ hyperparameters?: ReinforcementHyperparameters;
108
+ }
109
+
110
+ /**
111
+ * The hyperparameters used for the fine-tuning job.
112
+ */
113
+ export interface SupervisedHyperparameters {
114
+ /**
115
+ * Number of examples in each batch. A larger batch size means that model
116
+ * parameters are updated less frequently, but with lower variance.
117
+ */
118
+ batch_size?: 'auto' | number;
119
+
120
+ /**
121
+ * Scaling factor for the learning rate. A smaller learning rate may be useful to
122
+ * avoid overfitting.
123
+ */
124
+ learning_rate_multiplier?: 'auto' | number;
125
+
126
+ /**
127
+ * The number of epochs to train the model for. An epoch refers to one full cycle
128
+ * through the training dataset.
129
+ */
130
+ n_epochs?: 'auto' | number;
131
+ }
132
+
133
+ /**
134
+ * Configuration for the supervised fine-tuning method.
135
+ */
136
+ export interface SupervisedMethod {
137
+ /**
138
+ * The hyperparameters used for the fine-tuning job.
139
+ */
140
+ hyperparameters?: SupervisedHyperparameters;
141
+ }
142
+
143
+ export declare namespace Methods {
144
+ export {
145
+ type DpoHyperparameters as DpoHyperparameters,
146
+ type DpoMethod as DpoMethod,
147
+ type ReinforcementHyperparameters as ReinforcementHyperparameters,
148
+ type ReinforcementMethod as ReinforcementMethod,
149
+ type SupervisedHyperparameters as SupervisedHyperparameters,
150
+ type SupervisedMethod as SupervisedMethod,
151
+ };
152
+ }