openai 4.97.0 → 4.99.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +29 -0
- package/index.d.mts +5 -2
- package/index.d.ts +5 -2
- package/index.d.ts.map +1 -1
- package/index.js +3 -0
- package/index.js.map +1 -1
- package/index.mjs +3 -0
- package/index.mjs.map +1 -1
- package/package.json +1 -1
- package/resources/audio/speech.d.ts +12 -0
- package/resources/audio/speech.d.ts.map +1 -1
- package/resources/audio/speech.js +12 -0
- package/resources/audio/speech.js.map +1 -1
- package/resources/audio/speech.mjs +12 -0
- package/resources/audio/speech.mjs.map +1 -1
- package/resources/audio/transcriptions.d.ts +38 -0
- package/resources/audio/transcriptions.d.ts.map +1 -1
- package/resources/audio/transcriptions.js.map +1 -1
- package/resources/audio/transcriptions.mjs.map +1 -1
- package/resources/audio/translations.d.ts +8 -0
- package/resources/audio/translations.d.ts.map +1 -1
- package/resources/audio/translations.js.map +1 -1
- package/resources/audio/translations.mjs.map +1 -1
- package/resources/beta/assistants.d.ts +36 -0
- package/resources/beta/assistants.d.ts.map +1 -1
- package/resources/beta/assistants.js +28 -0
- package/resources/beta/assistants.js.map +1 -1
- package/resources/beta/assistants.mjs +28 -0
- package/resources/beta/assistants.mjs.map +1 -1
- package/resources/beta/realtime/sessions.d.ts +6 -0
- package/resources/beta/realtime/sessions.d.ts.map +1 -1
- package/resources/beta/realtime/sessions.js +6 -0
- package/resources/beta/realtime/sessions.js.map +1 -1
- package/resources/beta/realtime/sessions.mjs +6 -0
- package/resources/beta/realtime/sessions.mjs.map +1 -1
- package/resources/beta/realtime/transcription-sessions.d.ts +6 -0
- package/resources/beta/realtime/transcription-sessions.d.ts.map +1 -1
- package/resources/beta/realtime/transcription-sessions.js +6 -0
- package/resources/beta/realtime/transcription-sessions.js.map +1 -1
- package/resources/beta/realtime/transcription-sessions.mjs +6 -0
- package/resources/beta/realtime/transcription-sessions.mjs.map +1 -1
- package/resources/beta/threads/messages.d.ts +43 -0
- package/resources/beta/threads/messages.d.ts.map +1 -1
- package/resources/beta/threads/messages.js +33 -0
- package/resources/beta/threads/messages.js.map +1 -1
- package/resources/beta/threads/messages.mjs +33 -0
- package/resources/beta/threads/messages.mjs.map +1 -1
- package/resources/beta/threads/runs/runs.d.ts +52 -0
- package/resources/beta/threads/runs/runs.d.ts.map +1 -1
- package/resources/beta/threads/runs/runs.js +24 -0
- package/resources/beta/threads/runs/runs.js.map +1 -1
- package/resources/beta/threads/runs/runs.mjs +24 -0
- package/resources/beta/threads/runs/runs.mjs.map +1 -1
- package/resources/beta/threads/runs/steps.d.ts +21 -0
- package/resources/beta/threads/runs/steps.d.ts.map +1 -1
- package/resources/beta/threads/runs/steps.js.map +1 -1
- package/resources/beta/threads/runs/steps.mjs.map +1 -1
- package/resources/beta/threads/threads.d.ts +33 -0
- package/resources/beta/threads/threads.d.ts.map +1 -1
- package/resources/beta/threads/threads.js +21 -0
- package/resources/beta/threads/threads.js.map +1 -1
- package/resources/beta/threads/threads.mjs +21 -0
- package/resources/beta/threads/threads.mjs.map +1 -1
- package/resources/chat/completions/completions.d.ts +38 -0
- package/resources/chat/completions/completions.d.ts.map +1 -1
- package/resources/chat/completions/completions.js +20 -0
- package/resources/chat/completions/completions.js.map +1 -1
- package/resources/chat/completions/completions.mjs +20 -0
- package/resources/chat/completions/completions.mjs.map +1 -1
- package/resources/chat/completions/messages.d.ts +10 -0
- package/resources/chat/completions/messages.d.ts.map +1 -1
- package/resources/chat/completions/messages.js.map +1 -1
- package/resources/chat/completions/messages.mjs.map +1 -1
- package/resources/completions.d.ts +8 -0
- package/resources/completions.d.ts.map +1 -1
- package/resources/completions.js.map +1 -1
- package/resources/completions.mjs.map +1 -1
- package/resources/embeddings.d.ts +13 -3
- package/resources/embeddings.d.ts.map +1 -1
- package/resources/embeddings.js +9 -0
- package/resources/embeddings.js.map +1 -1
- package/resources/embeddings.mjs +9 -0
- package/resources/embeddings.mjs.map +1 -1
- package/resources/evals/evals.d.ts +164 -519
- package/resources/evals/evals.d.ts.map +1 -1
- package/resources/evals/evals.js.map +1 -1
- package/resources/evals/evals.mjs.map +1 -1
- package/resources/evals/index.d.ts +1 -1
- package/resources/evals/index.d.ts.map +1 -1
- package/resources/evals/index.js.map +1 -1
- package/resources/evals/index.mjs.map +1 -1
- package/resources/evals/runs/runs.d.ts +64 -69
- package/resources/evals/runs/runs.d.ts.map +1 -1
- package/resources/evals/runs/runs.js.map +1 -1
- package/resources/evals/runs/runs.mjs.map +1 -1
- package/resources/fine-tuning/alpha/alpha.d.ts +10 -0
- package/resources/fine-tuning/alpha/alpha.d.ts.map +1 -0
- package/resources/fine-tuning/alpha/alpha.js +39 -0
- package/resources/fine-tuning/alpha/alpha.js.map +1 -0
- package/resources/fine-tuning/alpha/alpha.mjs +12 -0
- package/resources/fine-tuning/alpha/alpha.mjs.map +1 -0
- package/resources/fine-tuning/alpha/graders.d.ts +107 -0
- package/resources/fine-tuning/alpha/graders.d.ts.map +1 -0
- package/resources/fine-tuning/alpha/graders.js +50 -0
- package/resources/fine-tuning/alpha/graders.js.map +1 -0
- package/resources/fine-tuning/alpha/graders.mjs +46 -0
- package/resources/fine-tuning/alpha/graders.mjs.map +1 -0
- package/resources/fine-tuning/alpha/index.d.ts +3 -0
- package/resources/fine-tuning/alpha/index.d.ts.map +1 -0
- package/resources/fine-tuning/alpha/index.js +9 -0
- package/resources/fine-tuning/alpha/index.js.map +1 -0
- package/resources/fine-tuning/alpha/index.mjs +4 -0
- package/resources/fine-tuning/alpha/index.mjs.map +1 -0
- package/resources/fine-tuning/alpha.d.ts +2 -0
- package/resources/fine-tuning/alpha.d.ts.map +1 -0
- package/resources/fine-tuning/alpha.js +19 -0
- package/resources/fine-tuning/alpha.js.map +1 -0
- package/resources/fine-tuning/alpha.mjs +3 -0
- package/resources/fine-tuning/alpha.mjs.map +1 -0
- package/resources/fine-tuning/checkpoints/permissions.d.ts +28 -0
- package/resources/fine-tuning/checkpoints/permissions.d.ts.map +1 -1
- package/resources/fine-tuning/checkpoints/permissions.js +20 -0
- package/resources/fine-tuning/checkpoints/permissions.js.map +1 -1
- package/resources/fine-tuning/checkpoints/permissions.mjs +20 -0
- package/resources/fine-tuning/checkpoints/permissions.mjs.map +1 -1
- package/resources/fine-tuning/fine-tuning.d.ts +8 -0
- package/resources/fine-tuning/fine-tuning.d.ts.map +1 -1
- package/resources/fine-tuning/fine-tuning.js +8 -0
- package/resources/fine-tuning/fine-tuning.js.map +1 -1
- package/resources/fine-tuning/fine-tuning.mjs +8 -0
- package/resources/fine-tuning/fine-tuning.mjs.map +1 -1
- package/resources/fine-tuning/index.d.ts +2 -0
- package/resources/fine-tuning/index.d.ts.map +1 -1
- package/resources/fine-tuning/index.js +11 -7
- package/resources/fine-tuning/index.js.map +1 -1
- package/resources/fine-tuning/index.mjs +2 -0
- package/resources/fine-tuning/index.mjs.map +1 -1
- package/resources/fine-tuning/jobs/checkpoints.d.ts +10 -0
- package/resources/fine-tuning/jobs/checkpoints.d.ts.map +1 -1
- package/resources/fine-tuning/jobs/checkpoints.js.map +1 -1
- package/resources/fine-tuning/jobs/checkpoints.mjs.map +1 -1
- package/resources/fine-tuning/jobs/jobs.d.ts +78 -145
- package/resources/fine-tuning/jobs/jobs.d.ts.map +1 -1
- package/resources/fine-tuning/jobs/jobs.js +48 -0
- package/resources/fine-tuning/jobs/jobs.js.map +1 -1
- package/resources/fine-tuning/jobs/jobs.mjs +48 -0
- package/resources/fine-tuning/jobs/jobs.mjs.map +1 -1
- package/resources/fine-tuning/methods.d.ts +120 -0
- package/resources/fine-tuning/methods.d.ts.map +1 -0
- package/resources/fine-tuning/methods.js +9 -0
- package/resources/fine-tuning/methods.js.map +1 -0
- package/resources/fine-tuning/methods.mjs +5 -0
- package/resources/fine-tuning/methods.mjs.map +1 -0
- package/resources/graders/grader-models.d.ts +234 -0
- package/resources/graders/grader-models.d.ts.map +1 -0
- package/resources/graders/grader-models.js +9 -0
- package/resources/graders/grader-models.js.map +1 -0
- package/resources/graders/grader-models.mjs +5 -0
- package/resources/graders/grader-models.mjs.map +1 -0
- package/resources/graders/graders.d.ts +10 -0
- package/resources/graders/graders.d.ts.map +1 -0
- package/resources/graders/graders.js +39 -0
- package/resources/graders/graders.js.map +1 -0
- package/resources/graders/graders.mjs +12 -0
- package/resources/graders/graders.mjs.map +1 -0
- package/resources/graders/index.d.ts +3 -0
- package/resources/graders/index.d.ts.map +1 -0
- package/resources/graders/index.js +9 -0
- package/resources/graders/index.js.map +1 -0
- package/resources/graders/index.mjs +4 -0
- package/resources/graders/index.mjs.map +1 -0
- package/resources/graders.d.ts +2 -0
- package/resources/graders.d.ts.map +1 -0
- package/resources/graders.js +19 -0
- package/resources/graders.js.map +1 -0
- package/resources/graders.mjs +3 -0
- package/resources/graders.mjs.map +1 -0
- package/resources/images.d.ts +22 -0
- package/resources/images.d.ts.map +1 -1
- package/resources/images.js +22 -0
- package/resources/images.js.map +1 -1
- package/resources/images.mjs +22 -0
- package/resources/images.mjs.map +1 -1
- package/resources/index.d.ts +2 -1
- package/resources/index.d.ts.map +1 -1
- package/resources/index.js +3 -1
- package/resources/index.js.map +1 -1
- package/resources/index.mjs +1 -0
- package/resources/index.mjs.map +1 -1
- package/resources/responses/input-items.d.ts +10 -0
- package/resources/responses/input-items.d.ts.map +1 -1
- package/resources/responses/input-items.js.map +1 -1
- package/resources/responses/input-items.mjs.map +1 -1
- package/resources/responses/responses.d.ts +22 -0
- package/resources/responses/responses.d.ts.map +1 -1
- package/resources/responses/responses.js +7 -0
- package/resources/responses/responses.js.map +1 -1
- package/resources/responses/responses.mjs +7 -0
- package/resources/responses/responses.mjs.map +1 -1
- package/resources/shared.d.ts +1 -1
- package/resources/shared.d.ts.map +1 -1
- package/src/index.ts +5 -6
- package/src/resources/audio/speech.ts +12 -0
- package/src/resources/audio/transcriptions.ts +43 -0
- package/src/resources/audio/translations.ts +8 -0
- package/src/resources/beta/assistants.ts +36 -0
- package/src/resources/beta/realtime/sessions.ts +6 -0
- package/src/resources/beta/realtime/transcription-sessions.ts +6 -0
- package/src/resources/beta/threads/messages.ts +43 -0
- package/src/resources/beta/threads/runs/runs.ts +52 -0
- package/src/resources/beta/threads/runs/steps.ts +21 -0
- package/src/resources/beta/threads/threads.ts +33 -0
- package/src/resources/chat/completions/completions.ts +38 -0
- package/src/resources/chat/completions/messages.ts +10 -0
- package/src/resources/completions.ts +8 -0
- package/src/resources/embeddings.ts +13 -3
- package/src/resources/evals/evals.ts +194 -628
- package/src/resources/evals/index.ts +0 -3
- package/src/resources/evals/runs/runs.ts +69 -77
- package/src/resources/fine-tuning/alpha/alpha.ts +27 -0
- package/src/resources/fine-tuning/alpha/graders.ts +168 -0
- package/src/resources/fine-tuning/alpha/index.ts +10 -0
- package/src/resources/fine-tuning/alpha.ts +3 -0
- package/src/resources/fine-tuning/checkpoints/permissions.ts +28 -0
- package/src/resources/fine-tuning/fine-tuning.ts +28 -0
- package/src/resources/fine-tuning/index.ts +10 -0
- package/src/resources/fine-tuning/jobs/checkpoints.ts +10 -0
- package/src/resources/fine-tuning/jobs/jobs.ts +84 -161
- package/src/resources/fine-tuning/methods.ts +152 -0
- package/src/resources/graders/grader-models.ts +296 -0
- package/src/resources/graders/graders.ts +31 -0
- package/src/resources/graders/index.ts +12 -0
- package/src/resources/graders.ts +3 -0
- package/src/resources/images.ts +22 -0
- package/src/resources/index.ts +1 -3
- package/src/resources/responses/input-items.ts +10 -0
- package/src/resources/responses/responses.ts +22 -0
- package/src/resources/shared.ts +1 -0
- package/src/version.ts +1 -1
- package/version.d.ts +1 -1
- package/version.js +1 -1
- package/version.mjs +1 -1
|
@@ -1,5 +1,6 @@
|
|
|
1
1
|
// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
|
|
2
2
|
|
|
3
|
+
export { Alpha } from './alpha/index';
|
|
3
4
|
export { Checkpoints } from './checkpoints/index';
|
|
4
5
|
export { FineTuning } from './fine-tuning';
|
|
5
6
|
export {
|
|
@@ -15,3 +16,12 @@ export {
|
|
|
15
16
|
type JobListParams,
|
|
16
17
|
type JobListEventsParams,
|
|
17
18
|
} from './jobs/index';
|
|
19
|
+
export {
|
|
20
|
+
Methods,
|
|
21
|
+
type DpoHyperparameters,
|
|
22
|
+
type DpoMethod,
|
|
23
|
+
type ReinforcementHyperparameters,
|
|
24
|
+
type ReinforcementMethod,
|
|
25
|
+
type SupervisedHyperparameters,
|
|
26
|
+
type SupervisedMethod,
|
|
27
|
+
} from './methods';
|
|
@@ -8,6 +8,16 @@ import { CursorPage, type CursorPageParams } from '../../../pagination';
|
|
|
8
8
|
export class Checkpoints extends APIResource {
|
|
9
9
|
/**
|
|
10
10
|
* List checkpoints for a fine-tuning job.
|
|
11
|
+
*
|
|
12
|
+
* @example
|
|
13
|
+
* ```ts
|
|
14
|
+
* // Automatically fetches more pages as needed.
|
|
15
|
+
* for await (const fineTuningJobCheckpoint of client.fineTuning.jobs.checkpoints.list(
|
|
16
|
+
* 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
|
|
17
|
+
* )) {
|
|
18
|
+
* // ...
|
|
19
|
+
* }
|
|
20
|
+
* ```
|
|
11
21
|
*/
|
|
12
22
|
list(
|
|
13
23
|
fineTuningJobId: string,
|
|
@@ -3,6 +3,7 @@
|
|
|
3
3
|
import { APIResource } from '../../../resource';
|
|
4
4
|
import { isRequestOptions } from '../../../core';
|
|
5
5
|
import * as Core from '../../../core';
|
|
6
|
+
import * as MethodsAPI from '../methods';
|
|
6
7
|
import * as CheckpointsAPI from './checkpoints';
|
|
7
8
|
import {
|
|
8
9
|
CheckpointListParams,
|
|
@@ -23,6 +24,14 @@ export class Jobs extends APIResource {
|
|
|
23
24
|
* of the fine-tuned models once complete.
|
|
24
25
|
*
|
|
25
26
|
* [Learn more about fine-tuning](https://platform.openai.com/docs/guides/fine-tuning)
|
|
27
|
+
*
|
|
28
|
+
* @example
|
|
29
|
+
* ```ts
|
|
30
|
+
* const fineTuningJob = await client.fineTuning.jobs.create({
|
|
31
|
+
* model: 'gpt-4o-mini',
|
|
32
|
+
* training_file: 'file-abc123',
|
|
33
|
+
* });
|
|
34
|
+
* ```
|
|
26
35
|
*/
|
|
27
36
|
create(body: JobCreateParams, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
|
|
28
37
|
return this._client.post('/fine_tuning/jobs', { body, ...options });
|
|
@@ -32,6 +41,13 @@ export class Jobs extends APIResource {
|
|
|
32
41
|
* Get info about a fine-tuning job.
|
|
33
42
|
*
|
|
34
43
|
* [Learn more about fine-tuning](https://platform.openai.com/docs/guides/fine-tuning)
|
|
44
|
+
*
|
|
45
|
+
* @example
|
|
46
|
+
* ```ts
|
|
47
|
+
* const fineTuningJob = await client.fineTuning.jobs.retrieve(
|
|
48
|
+
* 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
|
|
49
|
+
* );
|
|
50
|
+
* ```
|
|
35
51
|
*/
|
|
36
52
|
retrieve(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
|
|
37
53
|
return this._client.get(`/fine_tuning/jobs/${fineTuningJobId}`, options);
|
|
@@ -39,6 +55,14 @@ export class Jobs extends APIResource {
|
|
|
39
55
|
|
|
40
56
|
/**
|
|
41
57
|
* List your organization's fine-tuning jobs
|
|
58
|
+
*
|
|
59
|
+
* @example
|
|
60
|
+
* ```ts
|
|
61
|
+
* // Automatically fetches more pages as needed.
|
|
62
|
+
* for await (const fineTuningJob of client.fineTuning.jobs.list()) {
|
|
63
|
+
* // ...
|
|
64
|
+
* }
|
|
65
|
+
* ```
|
|
42
66
|
*/
|
|
43
67
|
list(
|
|
44
68
|
query?: JobListParams,
|
|
@@ -57,6 +81,13 @@ export class Jobs extends APIResource {
|
|
|
57
81
|
|
|
58
82
|
/**
|
|
59
83
|
* Immediately cancel a fine-tune job.
|
|
84
|
+
*
|
|
85
|
+
* @example
|
|
86
|
+
* ```ts
|
|
87
|
+
* const fineTuningJob = await client.fineTuning.jobs.cancel(
|
|
88
|
+
* 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
|
|
89
|
+
* );
|
|
90
|
+
* ```
|
|
60
91
|
*/
|
|
61
92
|
cancel(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
|
|
62
93
|
return this._client.post(`/fine_tuning/jobs/${fineTuningJobId}/cancel`, options);
|
|
@@ -64,6 +95,16 @@ export class Jobs extends APIResource {
|
|
|
64
95
|
|
|
65
96
|
/**
|
|
66
97
|
* Get status updates for a fine-tuning job.
|
|
98
|
+
*
|
|
99
|
+
* @example
|
|
100
|
+
* ```ts
|
|
101
|
+
* // Automatically fetches more pages as needed.
|
|
102
|
+
* for await (const fineTuningJobEvent of client.fineTuning.jobs.listEvents(
|
|
103
|
+
* 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
|
|
104
|
+
* )) {
|
|
105
|
+
* // ...
|
|
106
|
+
* }
|
|
107
|
+
* ```
|
|
67
108
|
*/
|
|
68
109
|
listEvents(
|
|
69
110
|
fineTuningJobId: string,
|
|
@@ -87,6 +128,34 @@ export class Jobs extends APIResource {
|
|
|
87
128
|
...options,
|
|
88
129
|
});
|
|
89
130
|
}
|
|
131
|
+
|
|
132
|
+
/**
|
|
133
|
+
* Pause a fine-tune job.
|
|
134
|
+
*
|
|
135
|
+
* @example
|
|
136
|
+
* ```ts
|
|
137
|
+
* const fineTuningJob = await client.fineTuning.jobs.pause(
|
|
138
|
+
* 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
|
|
139
|
+
* );
|
|
140
|
+
* ```
|
|
141
|
+
*/
|
|
142
|
+
pause(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
|
|
143
|
+
return this._client.post(`/fine_tuning/jobs/${fineTuningJobId}/pause`, options);
|
|
144
|
+
}
|
|
145
|
+
|
|
146
|
+
/**
|
|
147
|
+
* Resume a fine-tune job.
|
|
148
|
+
*
|
|
149
|
+
* @example
|
|
150
|
+
* ```ts
|
|
151
|
+
* const fineTuningJob = await client.fineTuning.jobs.resume(
|
|
152
|
+
* 'ft-AF1WoRqd3aJAHsqc9NY7iL8F',
|
|
153
|
+
* );
|
|
154
|
+
* ```
|
|
155
|
+
*/
|
|
156
|
+
resume(fineTuningJobId: string, options?: Core.RequestOptions): Core.APIPromise<FineTuningJob> {
|
|
157
|
+
return this._client.post(`/fine_tuning/jobs/${fineTuningJobId}/resume`, options);
|
|
158
|
+
}
|
|
90
159
|
}
|
|
91
160
|
|
|
92
161
|
export class FineTuningJobsPage extends CursorPage<FineTuningJob> {}
|
|
@@ -233,7 +302,7 @@ export namespace FineTuningJob {
|
|
|
233
302
|
* Number of examples in each batch. A larger batch size means that model
|
|
234
303
|
* parameters are updated less frequently, but with lower variance.
|
|
235
304
|
*/
|
|
236
|
-
batch_size?: 'auto' | number;
|
|
305
|
+
batch_size?: unknown | 'auto' | number | null;
|
|
237
306
|
|
|
238
307
|
/**
|
|
239
308
|
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
@@ -253,97 +322,24 @@ export namespace FineTuningJob {
|
|
|
253
322
|
*/
|
|
254
323
|
export interface Method {
|
|
255
324
|
/**
|
|
256
|
-
* Configuration for the DPO fine-tuning method.
|
|
325
|
+
* The type of method. Is either `supervised`, `dpo`, or `reinforcement`.
|
|
257
326
|
*/
|
|
258
|
-
dpo?: Method.Dpo;
|
|
327
|
+
type: 'supervised' | 'dpo' | 'reinforcement';
|
|
259
328
|
|
|
260
329
|
/**
|
|
261
|
-
* Configuration for the supervised fine-tuning method.
|
|
262
|
-
*/
|
|
263
|
-
supervised?: Method.Supervised;
|
|
264
|
-
|
|
265
|
-
/**
|
|
266
|
-
* The type of method. Is either `supervised` or `dpo`.
|
|
330
|
+
* Configuration for the DPO fine-tuning method.
|
|
267
331
|
*/
|
|
268
|
-
type?: 'supervised' | 'dpo';
|
269
|
-
}
|
|
332
|
+
dpo?: MethodsAPI.DpoMethod;
|
|
270
333
|
|
|
271
|
-
export namespace Method {
|
|
272
334
|
/**
|
|
273
|
-
* Configuration for the DPO fine-tuning method.
|
|
335
|
+
* Configuration for the reinforcement fine-tuning method.
|
|
274
336
|
*/
|
|
275
|
-
export interface Dpo {
|
276
|
-
/**
|
|
277
|
-
* The hyperparameters used for the fine-tuning job.
|
|
278
|
-
*/
|
|
279
|
-
hyperparameters?: Dpo.Hyperparameters;
|
|
280
|
-
}
|
|
281
|
-
|
|
282
|
-
export namespace Dpo {
|
|
283
|
-
/**
|
|
284
|
-
* The hyperparameters used for the fine-tuning job.
|
|
285
|
-
*/
|
|
286
|
-
export interface Hyperparameters {
|
|
287
|
-
/**
|
|
288
|
-
* Number of examples in each batch. A larger batch size means that model
|
|
289
|
-
* parameters are updated less frequently, but with lower variance.
|
|
290
|
-
*/
|
|
291
|
-
batch_size?: 'auto' | number;
|
|
292
|
-
|
|
293
|
-
/**
|
|
294
|
-
* The beta value for the DPO method. A higher beta value will increase the weight
|
|
295
|
-
* of the penalty between the policy and reference model.
|
|
296
|
-
*/
|
|
297
|
-
beta?: 'auto' | number;
|
|
298
|
-
|
|
299
|
-
/**
|
|
300
|
-
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
301
|
-
* avoid overfitting.
|
|
302
|
-
*/
|
|
303
|
-
learning_rate_multiplier?: 'auto' | number;
|
|
304
|
-
|
|
305
|
-
/**
|
|
306
|
-
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
307
|
-
* through the training dataset.
|
|
308
|
-
*/
|
|
309
|
-
n_epochs?: 'auto' | number;
|
|
310
|
-
}
|
|
311
|
-
}
|
|
337
|
+
reinforcement?: MethodsAPI.ReinforcementMethod;
|
|
312
338
|
|
|
313
339
|
/**
|
|
314
340
|
* Configuration for the supervised fine-tuning method.
|
|
315
341
|
*/
|
|
316
|
-
export interface Supervised {
|
317
|
-
/**
|
|
318
|
-
* The hyperparameters used for the fine-tuning job.
|
|
319
|
-
*/
|
|
320
|
-
hyperparameters?: Supervised.Hyperparameters;
|
|
321
|
-
}
|
|
322
|
-
|
|
323
|
-
export namespace Supervised {
|
|
324
|
-
/**
|
|
325
|
-
* The hyperparameters used for the fine-tuning job.
|
|
326
|
-
*/
|
|
327
|
-
export interface Hyperparameters {
|
|
328
|
-
/**
|
|
329
|
-
* Number of examples in each batch. A larger batch size means that model
|
|
330
|
-
* parameters are updated less frequently, but with lower variance.
|
|
331
|
-
*/
|
|
332
|
-
batch_size?: 'auto' | number;
|
|
333
|
-
|
|
334
|
-
/**
|
|
335
|
-
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
336
|
-
* avoid overfitting.
|
|
337
|
-
*/
|
|
338
|
-
learning_rate_multiplier?: 'auto' | number;
|
|
339
|
-
|
|
340
|
-
/**
|
|
341
|
-
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
342
|
-
* through the training dataset.
|
|
343
|
-
*/
|
|
344
|
-
n_epochs?: 'auto' | number;
|
|
345
|
-
}
|
|
346
|
-
}
|
|
342
|
+
supervised?: MethodsAPI.SupervisedMethod;
|
|
347
343
|
}
|
|
348
344
|
}
|
|
349
345
|
|
|
@@ -597,97 +593,24 @@ export namespace JobCreateParams {
|
|
|
597
593
|
*/
|
|
598
594
|
export interface Method {
|
|
599
595
|
/**
|
|
600
|
-
* Configuration for the DPO fine-tuning method.
|
|
596
|
+
* The type of method. Is either `supervised`, `dpo`, or `reinforcement`.
|
|
601
597
|
*/
|
|
602
|
-
dpo?: Method.Dpo;
|
|
598
|
+
type: 'supervised' | 'dpo' | 'reinforcement';
|
|
603
599
|
|
|
604
600
|
/**
|
|
605
|
-
* Configuration for the supervised fine-tuning method.
|
|
601
|
+
* Configuration for the DPO fine-tuning method.
|
|
606
602
|
*/
|
|
607
|
-
supervised?: Method.Supervised;
|
603
|
+
dpo?: MethodsAPI.DpoMethod;
|
|
608
604
|
|
|
609
605
|
/**
|
|
610
|
-
* The type of method. Is either `supervised` or `dpo`.
|
|
606
|
+
* Configuration for the reinforcement fine-tuning method.
|
|
611
607
|
*/
|
|
612
|
-
type?: 'supervised' | 'dpo';
|
613
|
-
}
|
|
614
|
-
|
|
615
|
-
export namespace Method {
|
|
616
|
-
/**
|
|
617
|
-
* Configuration for the DPO fine-tuning method.
|
|
618
|
-
*/
|
|
619
|
-
export interface Dpo {
|
|
620
|
-
/**
|
|
621
|
-
* The hyperparameters used for the fine-tuning job.
|
|
622
|
-
*/
|
|
623
|
-
hyperparameters?: Dpo.Hyperparameters;
|
|
624
|
-
}
|
|
625
|
-
|
|
626
|
-
export namespace Dpo {
|
|
627
|
-
/**
|
|
628
|
-
* The hyperparameters used for the fine-tuning job.
|
|
629
|
-
*/
|
|
630
|
-
export interface Hyperparameters {
|
|
631
|
-
/**
|
|
632
|
-
* Number of examples in each batch. A larger batch size means that model
|
|
633
|
-
* parameters are updated less frequently, but with lower variance.
|
|
634
|
-
*/
|
|
635
|
-
batch_size?: 'auto' | number;
|
|
636
|
-
|
|
637
|
-
/**
|
|
638
|
-
* The beta value for the DPO method. A higher beta value will increase the weight
|
|
639
|
-
* of the penalty between the policy and reference model.
|
|
640
|
-
*/
|
|
641
|
-
beta?: 'auto' | number;
|
|
642
|
-
|
|
643
|
-
/**
|
|
644
|
-
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
645
|
-
* avoid overfitting.
|
|
646
|
-
*/
|
|
647
|
-
learning_rate_multiplier?: 'auto' | number;
|
|
648
|
-
|
|
649
|
-
/**
|
|
650
|
-
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
651
|
-
* through the training dataset.
|
|
652
|
-
*/
|
|
653
|
-
n_epochs?: 'auto' | number;
|
|
654
|
-
}
|
|
655
|
-
}
|
|
608
|
+
reinforcement?: MethodsAPI.ReinforcementMethod;
|
|
656
609
|
|
|
657
610
|
/**
|
|
658
611
|
* Configuration for the supervised fine-tuning method.
|
|
659
612
|
*/
|
|
660
|
-
export interface Supervised {
|
661
|
-
/**
|
|
662
|
-
* The hyperparameters used for the fine-tuning job.
|
|
663
|
-
*/
|
|
664
|
-
hyperparameters?: Supervised.Hyperparameters;
|
|
665
|
-
}
|
|
666
|
-
|
|
667
|
-
export namespace Supervised {
|
|
668
|
-
/**
|
|
669
|
-
* The hyperparameters used for the fine-tuning job.
|
|
670
|
-
*/
|
|
671
|
-
export interface Hyperparameters {
|
|
672
|
-
/**
|
|
673
|
-
* Number of examples in each batch. A larger batch size means that model
|
|
674
|
-
* parameters are updated less frequently, but with lower variance.
|
|
675
|
-
*/
|
|
676
|
-
batch_size?: 'auto' | number;
|
|
677
|
-
|
|
678
|
-
/**
|
|
679
|
-
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
680
|
-
* avoid overfitting.
|
|
681
|
-
*/
|
|
682
|
-
learning_rate_multiplier?: 'auto' | number;
|
|
683
|
-
|
|
684
|
-
/**
|
|
685
|
-
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
686
|
-
* through the training dataset.
|
|
687
|
-
*/
|
|
688
|
-
n_epochs?: 'auto' | number;
|
|
689
|
-
}
|
|
690
|
-
}
|
|
613
|
+
supervised?: MethodsAPI.SupervisedMethod;
|
|
691
614
|
}
|
|
692
615
|
}
|
|
693
616
|
|
|
@@ -0,0 +1,152 @@
|
|
|
1
|
+
// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
|
|
2
|
+
|
|
3
|
+
import { APIResource } from '../../resource';
|
|
4
|
+
import * as GraderModelsAPI from '../graders/grader-models';
|
|
5
|
+
|
|
6
|
+
export class Methods extends APIResource {}
|
|
7
|
+
|
|
8
|
+
/**
|
|
9
|
+
* The hyperparameters used for the DPO fine-tuning job.
|
|
10
|
+
*/
|
|
11
|
+
export interface DpoHyperparameters {
|
|
12
|
+
/**
|
|
13
|
+
* Number of examples in each batch. A larger batch size means that model
|
|
14
|
+
* parameters are updated less frequently, but with lower variance.
|
|
15
|
+
*/
|
|
16
|
+
batch_size?: 'auto' | number;
|
|
17
|
+
|
|
18
|
+
/**
|
|
19
|
+
* The beta value for the DPO method. A higher beta value will increase the weight
|
|
20
|
+
* of the penalty between the policy and reference model.
|
|
21
|
+
*/
|
|
22
|
+
beta?: 'auto' | number;
|
|
23
|
+
|
|
24
|
+
/**
|
|
25
|
+
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
26
|
+
* avoid overfitting.
|
|
27
|
+
*/
|
|
28
|
+
learning_rate_multiplier?: 'auto' | number;
|
|
29
|
+
|
|
30
|
+
/**
|
|
31
|
+
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
32
|
+
* through the training dataset.
|
|
33
|
+
*/
|
|
34
|
+
n_epochs?: 'auto' | number;
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
/**
|
|
38
|
+
* Configuration for the DPO fine-tuning method.
|
|
39
|
+
*/
|
|
40
|
+
export interface DpoMethod {
|
|
41
|
+
/**
|
|
42
|
+
* The hyperparameters used for the DPO fine-tuning job.
|
|
43
|
+
*/
|
|
44
|
+
hyperparameters?: DpoHyperparameters;
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
/**
|
|
48
|
+
* The hyperparameters used for the reinforcement fine-tuning job.
|
|
49
|
+
*/
|
|
50
|
+
export interface ReinforcementHyperparameters {
|
|
51
|
+
/**
|
|
52
|
+
* Number of examples in each batch. A larger batch size means that model
|
|
53
|
+
* parameters are updated less frequently, but with lower variance.
|
|
54
|
+
*/
|
|
55
|
+
batch_size?: 'auto' | number;
|
|
56
|
+
|
|
57
|
+
/**
|
|
58
|
+
* Multiplier on amount of compute used for exploring search space during training.
|
|
59
|
+
*/
|
|
60
|
+
compute_multiplier?: 'auto' | number;
|
|
61
|
+
|
|
62
|
+
/**
|
|
63
|
+
* The number of training steps between evaluation runs.
|
|
64
|
+
*/
|
|
65
|
+
eval_interval?: 'auto' | number;
|
|
66
|
+
|
|
67
|
+
/**
|
|
68
|
+
* Number of evaluation samples to generate per training step.
|
|
69
|
+
*/
|
|
70
|
+
eval_samples?: 'auto' | number;
|
|
71
|
+
|
|
72
|
+
/**
|
|
73
|
+
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
74
|
+
* avoid overfitting.
|
|
75
|
+
*/
|
|
76
|
+
learning_rate_multiplier?: 'auto' | number;
|
|
77
|
+
|
|
78
|
+
/**
|
|
79
|
+
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
80
|
+
* through the training dataset.
|
|
81
|
+
*/
|
|
82
|
+
n_epochs?: 'auto' | number;
|
|
83
|
+
|
|
84
|
+
/**
|
|
85
|
+
* Level of reasoning effort.
|
|
86
|
+
*/
|
|
87
|
+
reasoning_effort?: 'default' | 'low' | 'medium' | 'high';
|
|
88
|
+
}
|
|
89
|
+
|
|
90
|
+
/**
|
|
91
|
+
* Configuration for the reinforcement fine-tuning method.
|
|
92
|
+
*/
|
|
93
|
+
export interface ReinforcementMethod {
|
|
94
|
+
/**
|
|
95
|
+
* The grader used for the fine-tuning job.
|
|
96
|
+
*/
|
|
97
|
+
grader:
|
|
98
|
+
| GraderModelsAPI.StringCheckGrader
|
|
99
|
+
| GraderModelsAPI.TextSimilarityGrader
|
|
100
|
+
| GraderModelsAPI.PythonGrader
|
|
101
|
+
| GraderModelsAPI.ScoreModelGrader
|
|
102
|
+
| GraderModelsAPI.MultiGrader;
|
|
103
|
+
|
|
104
|
+
/**
|
|
105
|
+
* The hyperparameters used for the reinforcement fine-tuning job.
|
|
106
|
+
*/
|
|
107
|
+
hyperparameters?: ReinforcementHyperparameters;
|
|
108
|
+
}
|
|
109
|
+
|
|
110
|
+
/**
|
|
111
|
+
* The hyperparameters used for the fine-tuning job.
|
|
112
|
+
*/
|
|
113
|
+
export interface SupervisedHyperparameters {
|
|
114
|
+
/**
|
|
115
|
+
* Number of examples in each batch. A larger batch size means that model
|
|
116
|
+
* parameters are updated less frequently, but with lower variance.
|
|
117
|
+
*/
|
|
118
|
+
batch_size?: 'auto' | number;
|
|
119
|
+
|
|
120
|
+
/**
|
|
121
|
+
* Scaling factor for the learning rate. A smaller learning rate may be useful to
|
|
122
|
+
* avoid overfitting.
|
|
123
|
+
*/
|
|
124
|
+
learning_rate_multiplier?: 'auto' | number;
|
|
125
|
+
|
|
126
|
+
/**
|
|
127
|
+
* The number of epochs to train the model for. An epoch refers to one full cycle
|
|
128
|
+
* through the training dataset.
|
|
129
|
+
*/
|
|
130
|
+
n_epochs?: 'auto' | number;
|
|
131
|
+
}
|
|
132
|
+
|
|
133
|
+
/**
|
|
134
|
+
* Configuration for the supervised fine-tuning method.
|
|
135
|
+
*/
|
|
136
|
+
export interface SupervisedMethod {
|
|
137
|
+
/**
|
|
138
|
+
* The hyperparameters used for the fine-tuning job.
|
|
139
|
+
*/
|
|
140
|
+
hyperparameters?: SupervisedHyperparameters;
|
|
141
|
+
}
|
|
142
|
+
|
|
143
|
+
export declare namespace Methods {
|
|
144
|
+
export {
|
|
145
|
+
type DpoHyperparameters as DpoHyperparameters,
|
|
146
|
+
type DpoMethod as DpoMethod,
|
|
147
|
+
type ReinforcementHyperparameters as ReinforcementHyperparameters,
|
|
148
|
+
type ReinforcementMethod as ReinforcementMethod,
|
|
149
|
+
type SupervisedHyperparameters as SupervisedHyperparameters,
|
|
150
|
+
type SupervisedMethod as SupervisedMethod,
|
|
151
|
+
};
|
|
152
|
+
}
|