npm - openai - Versions diffs - 4.97.0 → 4.99.0 - Mend

openai 4.97.0 → 4.99.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (242)

package/CHANGELOG.md +29 -0
package/index.d.mts +5 -2
package/index.d.ts +5 -2
package/index.d.ts.map +1 -1
package/index.js +3 -0
package/index.js.map +1 -1
package/index.mjs +3 -0
package/index.mjs.map +1 -1
package/package.json +1 -1
package/resources/audio/speech.d.ts +12 -0
package/resources/audio/speech.d.ts.map +1 -1
package/resources/audio/speech.js +12 -0
package/resources/audio/speech.js.map +1 -1
package/resources/audio/speech.mjs +12 -0
package/resources/audio/speech.mjs.map +1 -1
package/resources/audio/transcriptions.d.ts +38 -0
package/resources/audio/transcriptions.d.ts.map +1 -1
package/resources/audio/transcriptions.js.map +1 -1
package/resources/audio/transcriptions.mjs.map +1 -1
package/resources/audio/translations.d.ts +8 -0
package/resources/audio/translations.d.ts.map +1 -1
package/resources/audio/translations.js.map +1 -1
package/resources/audio/translations.mjs.map +1 -1
package/resources/beta/assistants.d.ts +36 -0
package/resources/beta/assistants.d.ts.map +1 -1
package/resources/beta/assistants.js +28 -0
package/resources/beta/assistants.js.map +1 -1
package/resources/beta/assistants.mjs +28 -0
package/resources/beta/assistants.mjs.map +1 -1
package/resources/beta/realtime/sessions.d.ts +6 -0
package/resources/beta/realtime/sessions.d.ts.map +1 -1
package/resources/beta/realtime/sessions.js +6 -0
package/resources/beta/realtime/sessions.js.map +1 -1
package/resources/beta/realtime/sessions.mjs +6 -0
package/resources/beta/realtime/sessions.mjs.map +1 -1
package/resources/beta/realtime/transcription-sessions.d.ts +6 -0
package/resources/beta/realtime/transcription-sessions.d.ts.map +1 -1
package/resources/beta/realtime/transcription-sessions.js +6 -0
package/resources/beta/realtime/transcription-sessions.js.map +1 -1
package/resources/beta/realtime/transcription-sessions.mjs +6 -0
package/resources/beta/realtime/transcription-sessions.mjs.map +1 -1
package/resources/beta/threads/messages.d.ts +43 -0
package/resources/beta/threads/messages.d.ts.map +1 -1
package/resources/beta/threads/messages.js +33 -0
package/resources/beta/threads/messages.js.map +1 -1
package/resources/beta/threads/messages.mjs +33 -0
package/resources/beta/threads/messages.mjs.map +1 -1
package/resources/beta/threads/runs/runs.d.ts +52 -0
package/resources/beta/threads/runs/runs.d.ts.map +1 -1
package/resources/beta/threads/runs/runs.js +24 -0
package/resources/beta/threads/runs/runs.js.map +1 -1
package/resources/beta/threads/runs/runs.mjs +24 -0
package/resources/beta/threads/runs/runs.mjs.map +1 -1
package/resources/beta/threads/runs/steps.d.ts +21 -0
package/resources/beta/threads/runs/steps.d.ts.map +1 -1
package/resources/beta/threads/runs/steps.js.map +1 -1
package/resources/beta/threads/runs/steps.mjs.map +1 -1
package/resources/beta/threads/threads.d.ts +33 -0
package/resources/beta/threads/threads.d.ts.map +1 -1
package/resources/beta/threads/threads.js +21 -0
package/resources/beta/threads/threads.js.map +1 -1
package/resources/beta/threads/threads.mjs +21 -0
package/resources/beta/threads/threads.mjs.map +1 -1
package/resources/chat/completions/completions.d.ts +38 -0
package/resources/chat/completions/completions.d.ts.map +1 -1
package/resources/chat/completions/completions.js +20 -0
package/resources/chat/completions/completions.js.map +1 -1
package/resources/chat/completions/completions.mjs +20 -0
package/resources/chat/completions/completions.mjs.map +1 -1
package/resources/chat/completions/messages.d.ts +10 -0
package/resources/chat/completions/messages.d.ts.map +1 -1
package/resources/chat/completions/messages.js.map +1 -1
package/resources/chat/completions/messages.mjs.map +1 -1
package/resources/completions.d.ts +8 -0
package/resources/completions.d.ts.map +1 -1
package/resources/completions.js.map +1 -1
package/resources/completions.mjs.map +1 -1
package/resources/embeddings.d.ts +13 -3
package/resources/embeddings.d.ts.map +1 -1
package/resources/embeddings.js +9 -0
package/resources/embeddings.js.map +1 -1
package/resources/embeddings.mjs +9 -0
package/resources/embeddings.mjs.map +1 -1
package/resources/evals/evals.d.ts +164 -519
package/resources/evals/evals.d.ts.map +1 -1
package/resources/evals/evals.js.map +1 -1
package/resources/evals/evals.mjs.map +1 -1
package/resources/evals/index.d.ts +1 -1
package/resources/evals/index.d.ts.map +1 -1
package/resources/evals/index.js.map +1 -1
package/resources/evals/index.mjs.map +1 -1
package/resources/evals/runs/runs.d.ts +64 -69
package/resources/evals/runs/runs.d.ts.map +1 -1
package/resources/evals/runs/runs.js.map +1 -1
package/resources/evals/runs/runs.mjs.map +1 -1
package/resources/fine-tuning/alpha/alpha.d.ts +10 -0
package/resources/fine-tuning/alpha/alpha.d.ts.map +1 -0
package/resources/fine-tuning/alpha/alpha.js +39 -0
package/resources/fine-tuning/alpha/alpha.js.map +1 -0
package/resources/fine-tuning/alpha/alpha.mjs +12 -0
package/resources/fine-tuning/alpha/alpha.mjs.map +1 -0
package/resources/fine-tuning/alpha/graders.d.ts +107 -0
package/resources/fine-tuning/alpha/graders.d.ts.map +1 -0
package/resources/fine-tuning/alpha/graders.js +50 -0
package/resources/fine-tuning/alpha/graders.js.map +1 -0
package/resources/fine-tuning/alpha/graders.mjs +46 -0
package/resources/fine-tuning/alpha/graders.mjs.map +1 -0
package/resources/fine-tuning/alpha/index.d.ts +3 -0
package/resources/fine-tuning/alpha/index.d.ts.map +1 -0
package/resources/fine-tuning/alpha/index.js +9 -0
package/resources/fine-tuning/alpha/index.js.map +1 -0
package/resources/fine-tuning/alpha/index.mjs +4 -0
package/resources/fine-tuning/alpha/index.mjs.map +1 -0
package/resources/fine-tuning/alpha.d.ts +2 -0
package/resources/fine-tuning/alpha.d.ts.map +1 -0
package/resources/fine-tuning/alpha.js +19 -0
package/resources/fine-tuning/alpha.js.map +1 -0
package/resources/fine-tuning/alpha.mjs +3 -0
package/resources/fine-tuning/alpha.mjs.map +1 -0
package/resources/fine-tuning/checkpoints/permissions.d.ts +28 -0
package/resources/fine-tuning/checkpoints/permissions.d.ts.map +1 -1
package/resources/fine-tuning/checkpoints/permissions.js +20 -0
package/resources/fine-tuning/checkpoints/permissions.js.map +1 -1
package/resources/fine-tuning/checkpoints/permissions.mjs +20 -0
package/resources/fine-tuning/checkpoints/permissions.mjs.map +1 -1
package/resources/fine-tuning/fine-tuning.d.ts +8 -0
package/resources/fine-tuning/fine-tuning.d.ts.map +1 -1
package/resources/fine-tuning/fine-tuning.js +8 -0
package/resources/fine-tuning/fine-tuning.js.map +1 -1
package/resources/fine-tuning/fine-tuning.mjs +8 -0
package/resources/fine-tuning/fine-tuning.mjs.map +1 -1
package/resources/fine-tuning/index.d.ts +2 -0
package/resources/fine-tuning/index.d.ts.map +1 -1
package/resources/fine-tuning/index.js +11 -7
package/resources/fine-tuning/index.js.map +1 -1
package/resources/fine-tuning/index.mjs +2 -0
package/resources/fine-tuning/index.mjs.map +1 -1
package/resources/fine-tuning/jobs/checkpoints.d.ts +10 -0
package/resources/fine-tuning/jobs/checkpoints.d.ts.map +1 -1
package/resources/fine-tuning/jobs/checkpoints.js.map +1 -1
package/resources/fine-tuning/jobs/checkpoints.mjs.map +1 -1
package/resources/fine-tuning/jobs/jobs.d.ts +78 -145
package/resources/fine-tuning/jobs/jobs.d.ts.map +1 -1
package/resources/fine-tuning/jobs/jobs.js +48 -0
package/resources/fine-tuning/jobs/jobs.js.map +1 -1
package/resources/fine-tuning/jobs/jobs.mjs +48 -0
package/resources/fine-tuning/jobs/jobs.mjs.map +1 -1
package/resources/fine-tuning/methods.d.ts +120 -0
package/resources/fine-tuning/methods.d.ts.map +1 -0
package/resources/fine-tuning/methods.js +9 -0
package/resources/fine-tuning/methods.js.map +1 -0
package/resources/fine-tuning/methods.mjs +5 -0
package/resources/fine-tuning/methods.mjs.map +1 -0
package/resources/graders/grader-models.d.ts +234 -0
package/resources/graders/grader-models.d.ts.map +1 -0
package/resources/graders/grader-models.js +9 -0
package/resources/graders/grader-models.js.map +1 -0
package/resources/graders/grader-models.mjs +5 -0
package/resources/graders/grader-models.mjs.map +1 -0
package/resources/graders/graders.d.ts +10 -0
package/resources/graders/graders.d.ts.map +1 -0
package/resources/graders/graders.js +39 -0
package/resources/graders/graders.js.map +1 -0
package/resources/graders/graders.mjs +12 -0
package/resources/graders/graders.mjs.map +1 -0
package/resources/graders/index.d.ts +3 -0
package/resources/graders/index.d.ts.map +1 -0
package/resources/graders/index.js +9 -0
package/resources/graders/index.js.map +1 -0
package/resources/graders/index.mjs +4 -0
package/resources/graders/index.mjs.map +1 -0
package/resources/graders.d.ts +2 -0
package/resources/graders.d.ts.map +1 -0
package/resources/graders.js +19 -0
package/resources/graders.js.map +1 -0
package/resources/graders.mjs +3 -0
package/resources/graders.mjs.map +1 -0
package/resources/images.d.ts +22 -0
package/resources/images.d.ts.map +1 -1
package/resources/images.js +22 -0
package/resources/images.js.map +1 -1
package/resources/images.mjs +22 -0
package/resources/images.mjs.map +1 -1
package/resources/index.d.ts +2 -1
package/resources/index.d.ts.map +1 -1
package/resources/index.js +3 -1
package/resources/index.js.map +1 -1
package/resources/index.mjs +1 -0
package/resources/index.mjs.map +1 -1
package/resources/responses/input-items.d.ts +10 -0
package/resources/responses/input-items.d.ts.map +1 -1
package/resources/responses/input-items.js.map +1 -1
package/resources/responses/input-items.mjs.map +1 -1
package/resources/responses/responses.d.ts +22 -0
package/resources/responses/responses.d.ts.map +1 -1
package/resources/responses/responses.js +7 -0
package/resources/responses/responses.js.map +1 -1
package/resources/responses/responses.mjs +7 -0
package/resources/responses/responses.mjs.map +1 -1
package/resources/shared.d.ts +1 -1
package/resources/shared.d.ts.map +1 -1
package/src/index.ts +5 -6
package/src/resources/audio/speech.ts +12 -0
package/src/resources/audio/transcriptions.ts +43 -0
package/src/resources/audio/translations.ts +8 -0
package/src/resources/beta/assistants.ts +36 -0
package/src/resources/beta/realtime/sessions.ts +6 -0
package/src/resources/beta/realtime/transcription-sessions.ts +6 -0
package/src/resources/beta/threads/messages.ts +43 -0
package/src/resources/beta/threads/runs/runs.ts +52 -0
package/src/resources/beta/threads/runs/steps.ts +21 -0
package/src/resources/beta/threads/threads.ts +33 -0
package/src/resources/chat/completions/completions.ts +38 -0
package/src/resources/chat/completions/messages.ts +10 -0
package/src/resources/completions.ts +8 -0
package/src/resources/embeddings.ts +13 -3
package/src/resources/evals/evals.ts +194 -628
package/src/resources/evals/index.ts +0 -3
package/src/resources/evals/runs/runs.ts +69 -77
package/src/resources/fine-tuning/alpha/alpha.ts +27 -0
package/src/resources/fine-tuning/alpha/graders.ts +168 -0
package/src/resources/fine-tuning/alpha/index.ts +10 -0
package/src/resources/fine-tuning/alpha.ts +3 -0
package/src/resources/fine-tuning/checkpoints/permissions.ts +28 -0
package/src/resources/fine-tuning/fine-tuning.ts +28 -0
package/src/resources/fine-tuning/index.ts +10 -0
package/src/resources/fine-tuning/jobs/checkpoints.ts +10 -0
package/src/resources/fine-tuning/jobs/jobs.ts +84 -161
package/src/resources/fine-tuning/methods.ts +152 -0
package/src/resources/graders/grader-models.ts +296 -0
package/src/resources/graders/graders.ts +31 -0
package/src/resources/graders/index.ts +12 -0
package/src/resources/graders.ts +3 -0
package/src/resources/images.ts +22 -0
package/src/resources/index.ts +1 -3
package/src/resources/responses/input-items.ts +10 -0
package/src/resources/responses/responses.ts +22 -0
package/src/resources/shared.ts +1 -0
package/src/version.ts +1 -1
package/version.d.ts +1 -1
package/version.js +1 -1
package/version.mjs +1 -1

package/src/resources/evals/evals.ts (changed)

@@ -4,6 +4,7 @@ import { APIResource } from '../../resource';
 import { isRequestOptions } from '../../core';
 import * as Core from '../../core';
 import * as Shared from '../shared';
+import * as GraderModelsAPI from '../graders/grader-models';
 import * as ResponsesAPI from '../responses/responses';
 import * as RunsAPI from './runs/runs';
 import {
@@ -104,88 +105,7 @@ export interface EvalCustomDataSourceConfig {
 }
 /**
- * A LabelModelGrader object which uses a model to assign labels to each item in
- * the evaluation.
- */
-export interface EvalLabelModelGrader {
-  input: Array<EvalLabelModelGrader.Input>;
-  /**
-   * The labels to assign to each item in the evaluation.
-   */
-  labels: Array<string>;
-  /**
-   * The model to use for the evaluation. Must support structured outputs.
-   */
-  model: string;
-  /**
-   * The name of the grader.
-   */
-  name: string;
-  /**
-   * The labels that indicate a passing result. Must be a subset of labels.
-   */
-  passing_labels: Array<string>;
-  /**
-   * The object type, which is always `label_model`.
-   */
-  type: 'label_model';
-}
-export namespace EvalLabelModelGrader {
-  /**
-   * A message input to the model with a role indicating instruction following
-   * hierarchy. Instructions given with the `developer` or `system` role take
-   * precedence over instructions given with the `user` role. Messages with the
-   * `assistant` role are presumed to have been generated by the model in previous
-   * interactions.
-   */
-  export interface Input {
-    /**
-     * Text inputs to the model - can contain template strings.
-     */
-    content: string | ResponsesAPI.ResponseInputText | Input.OutputText;
-    /**
-     * The role of the message input. One of `user`, `assistant`, `system`, or
-     * `developer`.
-     */
-    role: 'user' | 'assistant' | 'system' | 'developer';
-    /**
-     * The type of the message input. Always `message`.
-     */
-    type?: 'message';
-  }
-  export namespace Input {
-    /**
-     * A text output from the model.
-     */
-    export interface OutputText {
-      /**
-       * The text output from the model.
-       */
-      text: string;
-      /**
-       * The type of the output text. Always `output_text`.
-       */
-      type: 'output_text';
-    }
-  }
-}
-/**
- * A StoredCompletionsDataSourceConfig which specifies the metadata property of
- * your stored completions query. This is usually metadata like `usecase=chatbot`
- * or `prompt-version=v2`, etc. The schema returned by this data source config is
- * used to defined what variables are available in your evals. `item` and `sample`
- * are both defined when using this data source config.
+ * @deprecated Deprecated in favor of LogsDataSourceConfig.
  */
 export interface EvalStoredCompletionsDataSourceConfig {
   /**
@@ -195,9 +115,9 @@ export interface EvalStoredCompletionsDataSourceConfig {
   schema: Record<string, unknown>;
   /**
-   * The type of data source. Always `stored_completions`.
+   * The type of data source. Always `stored-completions`.
    */
-  type: 'stored_completions';
+  type: 'stored-completions';
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -210,83 +130,6 @@ export interface EvalStoredCompletionsDataSourceConfig {
   metadata?: Shared.Metadata | null;
 }
-/**
- * A StringCheckGrader object that performs a string comparison between input and
- * reference using a specified operation.
- */
-export interface EvalStringCheckGrader {
-  /**
-   * The input text. This may include template strings.
-   */
-  input: string;
-  /**
-   * The name of the grader.
-   */
-  name: string;
-  /**
-   * The string check operation to perform. One of `eq`, `ne`, `like`, or `ilike`.
-   */
-  operation: 'eq' | 'ne' | 'like' | 'ilike';
-  /**
-   * The reference text. This may include template strings.
-   */
-  reference: string;
-  /**
-   * The object type, which is always `string_check`.
-   */
-  type: 'string_check';
-}
-/**
- * A TextSimilarityGrader object which grades text based on similarity metrics.
- */
-export interface EvalTextSimilarityGrader {
-  /**
-   * The evaluation metric to use. One of `fuzzy_match`, `bleu`, `gleu`, `meteor`,
-   * `rouge_1`, `rouge_2`, `rouge_3`, `rouge_4`, `rouge_5`, or `rouge_l`.
-   */
-  evaluation_metric:
-    | 'fuzzy_match'
-    | 'bleu'
-    | 'gleu'
-    | 'meteor'
-    | 'rouge_1'
-    | 'rouge_2'
-    | 'rouge_3'
-    | 'rouge_4'
-    | 'rouge_5'
-    | 'rouge_l';
-  /**
-   * The text being graded.
-   */
-  input: string;
-  /**
-   * A float score where a value greater than or equal indicates a passing grade.
-   */
-  pass_threshold: number;
-  /**
-   * The text being graded against.
-   */
-  reference: string;
-  /**
-   * The type of grader.
-   */
-  type: 'text_similarity';
-  /**
-   * The name of the grader.
-   */
-  name?: string;
-}
 /**
  * An Eval object with a data source config and testing criteria. An Eval
  * represents a task to be done for your LLM integration. Like:
@@ -309,7 +152,10 @@ export interface EvalCreateResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalCreateResponse.Logs
+    | EvalStoredCompletionsDataSourceConfig;
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -335,39 +181,59 @@ export interface EvalCreateResponse {
    * A list of testing criteria.
    */
   testing_criteria: Array<
-    | EvalLabelModelGrader
-    | EvalStringCheckGrader
-    | EvalTextSimilarityGrader
-    | EvalCreateResponse.Python
-    | EvalCreateResponse.ScoreModel
+    | GraderModelsAPI.LabelModelGrader
+    | GraderModelsAPI.StringCheckGrader
+    | EvalCreateResponse.EvalGraderTextSimilarity
+    | EvalCreateResponse.EvalGraderPython
+    | EvalCreateResponse.EvalGraderScoreModel
   >;
 }
 export namespace EvalCreateResponse {
   /**
-   * A PythonGrader object that runs a python script on the input.
+   * A LogsDataSourceConfig which specifies the metadata property of your logs query.
+   * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc. The
+   * schema returned by this data source config is used to defined what variables are
+   * available in your evals. `item` and `sample` are both defined when using this
+   * data source config.
    */
-  export interface Python {
+  export interface Logs {
     /**
-     * The name of the grader.
+     * The json schema for the run data source items. Learn how to build JSON schemas
+     * [here](https://json-schema.org/).
      */
-    name: string;
+    schema: Record<string, unknown>;
     /**
-     * The source code of the python script.
+     * The type of data source. Always `logs`.
      */
-    source: string;
+    type: 'logs';
     /**
-     * The object type, which is always `python`.
+     * Set of 16 key-value pairs that can be attached to an object. This can be useful
+     * for storing additional information about the object in a structured format, and
+     * querying for objects via API or the dashboard.
+     *
+     * Keys are strings with a maximum length of 64 characters. Values are strings with
+     * a maximum length of 512 characters.
      */
-    type: 'python';
+    metadata?: Shared.Metadata | null;
+  }
+  /**
+   * A TextSimilarityGrader object which grades text based on similarity metrics.
+   */
+  export interface EvalGraderTextSimilarity extends GraderModelsAPI.TextSimilarityGrader {
     /**
-     * The image tag to use for the python script.
+     * The threshold for the score.
      */
-    image_tag?: string;
+    pass_threshold: number;
+  }
+  /**
+   * A PythonGrader object that runs a python script on the input.
+   */
+  export interface EvalGraderPython extends GraderModelsAPI.PythonGrader {
     /**
      * The threshold for the score.
      */
@@ -377,85 +243,11 @@ export namespace EvalCreateResponse {
   /**
    * A ScoreModelGrader object that uses a model to assign a score to the input.
    */
-  export interface ScoreModel {
-    /**
-     * The input text. This may include template strings.
-     */
-    input: Array<ScoreModel.Input>;
-    /**
-     * The model to use for the evaluation.
-     */
-    model: string;
-    /**
-     * The name of the grader.
-     */
-    name: string;
-    /**
-     * The object type, which is always `score_model`.
-     */
-    type: 'score_model';
+  export interface EvalGraderScoreModel extends GraderModelsAPI.ScoreModelGrader {
     /**
      * The threshold for the score.
      */
     pass_threshold?: number;
-    /**
-     * The range of the score. Defaults to `[0, 1]`.
-     */
-    range?: Array<number>;
-    /**
-     * The sampling parameters for the model.
-     */
-    sampling_params?: unknown;
-  }
-  export namespace ScoreModel {
-    /**
-     * A message input to the model with a role indicating instruction following
-     * hierarchy. Instructions given with the `developer` or `system` role take
-     * precedence over instructions given with the `user` role. Messages with the
-     * `assistant` role are presumed to have been generated by the model in previous
-     * interactions.
-     */
-    export interface Input {
-      /**
-       * Text inputs to the model - can contain template strings.
-       */
-      content: string | ResponsesAPI.ResponseInputText | Input.OutputText;
-      /**
-       * The role of the message input. One of `user`, `assistant`, `system`, or
-       * `developer`.
-       */
-      role: 'user' | 'assistant' | 'system' | 'developer';
-      /**
-       * The type of the message input. Always `message`.
-       */
-      type?: 'message';
-    }
-    export namespace Input {
-      /**
-       * A text output from the model.
-       */
-      export interface OutputText {
-        /**
-         * The text output from the model.
-         */
-        text: string;
-        /**
-         * The type of the output text. Always `output_text`.
-         */
-        type: 'output_text';
-      }
-    }
   }
 }
@@ -481,7 +273,10 @@ export interface EvalRetrieveResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalRetrieveResponse.Logs
+    | EvalStoredCompletionsDataSourceConfig;
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -507,39 +302,59 @@ export interface EvalRetrieveResponse {
    * A list of testing criteria.
    */
   testing_criteria: Array<
-    | EvalLabelModelGrader
-    | EvalStringCheckGrader
-    | EvalTextSimilarityGrader
-    | EvalRetrieveResponse.Python
-    | EvalRetrieveResponse.ScoreModel
+    | GraderModelsAPI.LabelModelGrader
+    | GraderModelsAPI.StringCheckGrader
+    | EvalRetrieveResponse.EvalGraderTextSimilarity
+    | EvalRetrieveResponse.EvalGraderPython
+    | EvalRetrieveResponse.EvalGraderScoreModel
   >;
 }
 export namespace EvalRetrieveResponse {
   /**
-   * A PythonGrader object that runs a python script on the input.
+   * A LogsDataSourceConfig which specifies the metadata property of your logs query.
+   * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc. The
+   * schema returned by this data source config is used to defined what variables are
+   * available in your evals. `item` and `sample` are both defined when using this
+   * data source config.
    */
-  export interface Python {
+  export interface Logs {
     /**
-     * The name of the grader.
+     * The json schema for the run data source items. Learn how to build JSON schemas
+     * [here](https://json-schema.org/).
      */
-    name: string;
+    schema: Record<string, unknown>;
     /**
-     * The source code of the python script.
+     * The type of data source. Always `logs`.
      */
-    source: string;
+    type: 'logs';
     /**
-     * The object type, which is always `python`.
+     * Set of 16 key-value pairs that can be attached to an object. This can be useful
+     * for storing additional information about the object in a structured format, and
+     * querying for objects via API or the dashboard.
+     *
+     * Keys are strings with a maximum length of 64 characters. Values are strings with
+     * a maximum length of 512 characters.
      */
-    type: 'python';
+    metadata?: Shared.Metadata | null;
+  }
+  /**
+   * A TextSimilarityGrader object which grades text based on similarity metrics.
+   */
+  export interface EvalGraderTextSimilarity extends GraderModelsAPI.TextSimilarityGrader {
     /**
-     * The image tag to use for the python script.
+     * The threshold for the score.
      */
-    image_tag?: string;
+    pass_threshold: number;
+  }
+  /**
+   * A PythonGrader object that runs a python script on the input.
+   */
+  export interface EvalGraderPython extends GraderModelsAPI.PythonGrader {
     /**
      * The threshold for the score.
      */
@@ -549,85 +364,11 @@ export namespace EvalRetrieveResponse {
   /**
    * A ScoreModelGrader object that uses a model to assign a score to the input.
    */
-  export interface ScoreModel {
-    /**
-     * The input text. This may include template strings.
-     */
-    input: Array<ScoreModel.Input>;
-    /**
-     * The model to use for the evaluation.
-     */
-    model: string;
-    /**
-     * The name of the grader.
-     */
-    name: string;
-    /**
-     * The object type, which is always `score_model`.
-     */
-    type: 'score_model';
+  export interface EvalGraderScoreModel extends GraderModelsAPI.ScoreModelGrader {
     /**
      * The threshold for the score.
      */
     pass_threshold?: number;
-    /**
-     * The range of the score. Defaults to `[0, 1]`.
-     */
-    range?: Array<number>;
-    /**
-     * The sampling parameters for the model.
-     */
-    sampling_params?: unknown;
-  }
-  export namespace ScoreModel {
-    /**
-     * A message input to the model with a role indicating instruction following
-     * hierarchy. Instructions given with the `developer` or `system` role take
-     * precedence over instructions given with the `user` role. Messages with the
-     * `assistant` role are presumed to have been generated by the model in previous
-     * interactions.
-     */
-    export interface Input {
-      /**
-       * Text inputs to the model - can contain template strings.
-       */
-      content: string | ResponsesAPI.ResponseInputText | Input.OutputText;
-      /**
-       * The role of the message input. One of `user`, `assistant`, `system`, or
-       * `developer`.
-       */
-      role: 'user' | 'assistant' | 'system' | 'developer';
-      /**
-       * The type of the message input. Always `message`.
-       */
-      type?: 'message';
-    }
-    export namespace Input {
-      /**
-       * A text output from the model.
-       */
-      export interface OutputText {
-        /**
-         * The text output from the model.
-         */
-        text: string;
-        /**
-         * The type of the output text. Always `output_text`.
-         */
-        type: 'output_text';
-      }
-    }
   }
 }
@@ -653,7 +394,10 @@ export interface EvalUpdateResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalUpdateResponse.Logs
+    | EvalStoredCompletionsDataSourceConfig;
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -679,39 +423,59 @@ export interface EvalUpdateResponse {
    * A list of testing criteria.
    */
   testing_criteria: Array<
-    | EvalLabelModelGrader
-    | EvalStringCheckGrader
-    | EvalTextSimilarityGrader
-    | EvalUpdateResponse.Python
-    | EvalUpdateResponse.ScoreModel
+    | GraderModelsAPI.LabelModelGrader
+    | GraderModelsAPI.StringCheckGrader
+    | EvalUpdateResponse.EvalGraderTextSimilarity
+    | EvalUpdateResponse.EvalGraderPython
+    | EvalUpdateResponse.EvalGraderScoreModel
   >;
 }
 export namespace EvalUpdateResponse {
   /**
-   * A PythonGrader object that runs a python script on the input.
+   * A LogsDataSourceConfig which specifies the metadata property of your logs query.
+   * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc. The
+   * schema returned by this data source config is used to defined what variables are
+   * available in your evals. `item` and `sample` are both defined when using this
+   * data source config.
    */
-  export interface Python {
+  export interface Logs {
     /**
-     * The name of the grader.
+     * The json schema for the run data source items. Learn how to build JSON schemas
+     * [here](https://json-schema.org/).
      */
-    name: string;
+    schema: Record<string, unknown>;
     /**
-     * The source code of the python script.
+     * The type of data source. Always `logs`.
      */
-    source: string;
+    type: 'logs';
     /**
-     * The object type, which is always `python`.
+     * Set of 16 key-value pairs that can be attached to an object. This can be useful
+     * for storing additional information about the object in a structured format, and
+     * querying for objects via API or the dashboard.
+     *
+     * Keys are strings with a maximum length of 64 characters. Values are strings with
+     * a maximum length of 512 characters.
      */
-    type: 'python';
+    metadata?: Shared.Metadata | null;
+  }
+  /**
+   * A TextSimilarityGrader object which grades text based on similarity metrics.
+   */
+  export interface EvalGraderTextSimilarity extends GraderModelsAPI.TextSimilarityGrader {
     /**
-     * The image tag to use for the python script.
+     * The threshold for the score.
      */
-    image_tag?: string;
+    pass_threshold: number;
+  }
+  /**
+   * A PythonGrader object that runs a python script on the input.
+   */
+  export interface EvalGraderPython extends GraderModelsAPI.PythonGrader {
     /**
      * The threshold for the score.
      */
@@ -721,85 +485,11 @@ export namespace EvalUpdateResponse {
   /**
    * A ScoreModelGrader object that uses a model to assign a score to the input.
    */
-  export interface ScoreModel {
-    /**
-     * The input text. This may include template strings.
-     */
-    input: Array<ScoreModel.Input>;
-    /**
-     * The model to use for the evaluation.
-     */
-    model: string;
-    /**
-     * The name of the grader.
-     */
-    name: string;
-    /**
-     * The object type, which is always `score_model`.
-     */
-    type: 'score_model';
+  export interface EvalGraderScoreModel extends GraderModelsAPI.ScoreModelGrader {
     /**
      * The threshold for the score.
      */
     pass_threshold?: number;
-    /**
-     * The range of the score. Defaults to `[0, 1]`.
-     */
-    range?: Array<number>;
-    /**
-     * The sampling parameters for the model.
-     */
-    sampling_params?: unknown;
-  }
-  export namespace ScoreModel {
-    /**
-     * A message input to the model with a role indicating instruction following
-     * hierarchy. Instructions given with the `developer` or `system` role take
-     * precedence over instructions given with the `user` role. Messages with the
-     * `assistant` role are presumed to have been generated by the model in previous
-     * interactions.
-     */
-    export interface Input {
-      /**
-       * Text inputs to the model - can contain template strings.
-       */
-      content: string | ResponsesAPI.ResponseInputText | Input.OutputText;
-      /**
-       * The role of the message input. One of `user`, `assistant`, `system`, or
-       * `developer`.
-       */
-      role: 'user' | 'assistant' | 'system' | 'developer';
-      /**
-       * The type of the message input. Always `message`.
-       */
-      type?: 'message';
-    }
-    export namespace Input {
-      /**
-       * A text output from the model.
-       */
-      export interface OutputText {
-        /**
-         * The text output from the model.
-         */
-        text: string;
-        /**
-         * The type of the output text. Always `output_text`.
-         */
-        type: 'output_text';
-      }
-    }
   }
 }
@@ -825,7 +515,10 @@ export interface EvalListResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalListResponse.Logs
+    | EvalStoredCompletionsDataSourceConfig;
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -851,39 +544,59 @@ export interface EvalListResponse {
    * A list of testing criteria.
    */
   testing_criteria: Array<
-    | EvalLabelModelGrader
-    | EvalStringCheckGrader
-    | EvalTextSimilarityGrader
-    | EvalListResponse.Python
-    | EvalListResponse.ScoreModel
+    | GraderModelsAPI.LabelModelGrader
+    | GraderModelsAPI.StringCheckGrader
+    | EvalListResponse.EvalGraderTextSimilarity
+    | EvalListResponse.EvalGraderPython
+    | EvalListResponse.EvalGraderScoreModel
   >;
 }
 export namespace EvalListResponse {
   /**
-   * A PythonGrader object that runs a python script on the input.
+   * A LogsDataSourceConfig which specifies the metadata property of your logs query.
+   * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc. The
+   * schema returned by this data source config is used to define what variables are
+   * available in your evals. `item` and `sample` are both defined when using this
+   * data source config.
    */
-  export interface Python {
+  export interface Logs {
     /**
-     * The name of the grader.
+     * The json schema for the run data source items. Learn how to build JSON schemas
+     * [here](https://json-schema.org/).
      */
-    name: string;
+    schema: Record<string, unknown>;
     /**
-     * The source code of the python script.
+     * The type of data source. Always `logs`.
      */
-    source: string;
+    type: 'logs';
     /**
-     * The object type, which is always `python`.
+     * Set of 16 key-value pairs that can be attached to an object. This can be useful
+     * for storing additional information about the object in a structured format, and
+     * querying for objects via API or the dashboard.
+     *
+     * Keys are strings with a maximum length of 64 characters. Values are strings with
+     * a maximum length of 512 characters.
      */
-    type: 'python';
+    metadata?: Shared.Metadata | null;
+  }
+  /**
+   * A TextSimilarityGrader object which grades text based on similarity metrics.
+   */
+  export interface EvalGraderTextSimilarity extends GraderModelsAPI.TextSimilarityGrader {
     /**
-     * The image tag to use for the python script.
+     * The threshold for the score.
      */
-    image_tag?: string;
+    pass_threshold: number;
+  }
+  /**
+   * A PythonGrader object that runs a python script on the input.
+   */
+  export interface EvalGraderPython extends GraderModelsAPI.PythonGrader {
     /**
      * The threshold for the score.
      */
@@ -893,85 +606,11 @@ export namespace EvalListResponse {
   /**
    * A ScoreModelGrader object that uses a model to assign a score to the input.
    */
-  export interface ScoreModel {
-    /**
-     * The input text. This may include template strings.
-     */
-    input: Array<ScoreModel.Input>;
-    /**
-     * The model to use for the evaluation.
-     */
-    model: string;
-    /**
-     * The name of the grader.
-     */
-    name: string;
-    /**
-     * The object type, which is always `score_model`.
-     */
-    type: 'score_model';
+  export interface EvalGraderScoreModel extends GraderModelsAPI.ScoreModelGrader {
     /**
      * The threshold for the score.
      */
     pass_threshold?: number;
-    /**
-     * The range of the score. Defaults to `[0, 1]`.
-     */
-    range?: Array<number>;
-    /**
-     * The sampling parameters for the model.
-     */
-    sampling_params?: unknown;
-  }
-  export namespace ScoreModel {
-    /**
-     * A message input to the model with a role indicating instruction following
-     * hierarchy. Instructions given with the `developer` or `system` role take
-     * precedence over instructions given with the `user` role. Messages with the
-     * `assistant` role are presumed to have been generated by the model in previous
-     * interactions.
-     */
-    export interface Input {
-      /**
-       * Text inputs to the model - can contain template strings.
-       */
-      content: string | ResponsesAPI.ResponseInputText | Input.OutputText;
-      /**
-       * The role of the message input. One of `user`, `assistant`, `system`, or
-       * `developer`.
-       */
-      role: 'user' | 'assistant' | 'system' | 'developer';
-      /**
-       * The type of the message input. Always `message`.
-       */
-      type?: 'message';
-    }
-    export namespace Input {
-      /**
-       * A text output from the model.
-       */
-      export interface OutputText {
-        /**
-         * The text output from the model.
-         */
-        text: string;
-        /**
-         * The type of the output text. Always `output_text`.
-         */
-        type: 'output_text';
-      }
-    }
   }
 }
@@ -987,15 +626,15 @@ export interface EvalCreateParams {
   /**
    * The configuration for the data source used for the evaluation runs.
    */
-  data_source_config: EvalCreateParams.Custom | EvalCreateParams.Logs;
+  data_source_config: EvalCreateParams.Custom | EvalCreateParams.Logs | EvalCreateParams.StoredCompletions;
   /**
    * A list of graders for all eval runs in this group.
    */
   testing_criteria: Array<
     | EvalCreateParams.LabelModel
-    | EvalStringCheckGrader
-    | EvalTextSimilarityGrader
+    | GraderModelsAPI.StringCheckGrader
+    | EvalCreateParams.TextSimilarity
     | EvalCreateParams.Python
     | EvalCreateParams.ScoreModel
   >;
@@ -1044,9 +683,8 @@ export namespace EvalCreateParams {
   }
   /**
-   * A data source config which specifies the metadata property of your stored
-   * completions query. This is usually metadata like `usecase=chatbot` or
-   * `prompt-version=v2`, etc.
+   * A data source config which specifies the metadata property of your logs query.
+   * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc.
    */
   export interface Logs {
     /**
@@ -1060,6 +698,21 @@ export namespace EvalCreateParams {
     metadata?: Record<string, unknown>;
   }
+  /**
+   * Deprecated in favor of LogsDataSourceConfig.
+   */
+  export interface StoredCompletions {
+    /**
+     * The type of data source. Always `stored-completions`.
+     */
+    type: 'stored-completions';
+    /**
+     * Metadata filters for the stored completions data source.
+     */
+    metadata?: Record<string, unknown>;
+  }
   /**
    * A LabelModelGrader object which uses a model to assign labels to each item in
    * the evaluation.
@@ -1154,29 +807,19 @@ export namespace EvalCreateParams {
   }
   /**
-   * A PythonGrader object that runs a python script on the input.
+   * A TextSimilarityGrader object which grades text based on similarity metrics.
    */
-  export interface Python {
+  export interface TextSimilarity extends GraderModelsAPI.TextSimilarityGrader {
     /**
-     * The name of the grader.
-     */
-    name: string;
-    /**
-     * The source code of the python script.
-     */
-    source: string;
-    /**
-     * The object type, which is always `python`.
-     */
-    type: 'python';
-    /**
-     * The image tag to use for the python script.
+     * The threshold for the score.
      */
-    image_tag?: string;
+    pass_threshold: number;
+  }
+  /**
+   * A PythonGrader object that runs a python script on the input.
+   */
+  export interface Python extends GraderModelsAPI.PythonGrader {
     /**
      * The threshold for the score.
      */
@@ -1186,85 +829,11 @@ export namespace EvalCreateParams {
   /**
    * A ScoreModelGrader object that uses a model to assign a score to the input.
    */
-  export interface ScoreModel {
-    /**
-     * The input text. This may include template strings.
-     */
-    input: Array<ScoreModel.Input>;
-    /**
-     * The model to use for the evaluation.
-     */
-    model: string;
-    /**
-     * The name of the grader.
-     */
-    name: string;
-    /**
-     * The object type, which is always `score_model`.
-     */
-    type: 'score_model';
+  export interface ScoreModel extends GraderModelsAPI.ScoreModelGrader {
     /**
      * The threshold for the score.
      */
     pass_threshold?: number;
-    /**
-     * The range of the score. Defaults to `[0, 1]`.
-     */
-    range?: Array<number>;
-    /**
-     * The sampling parameters for the model.
-     */
-    sampling_params?: unknown;
-  }
-  export namespace ScoreModel {
-    /**
-     * A message input to the model with a role indicating instruction following
-     * hierarchy. Instructions given with the `developer` or `system` role take
-     * precedence over instructions given with the `user` role. Messages with the
-     * `assistant` role are presumed to have been generated by the model in previous
-     * interactions.
-     */
-    export interface Input {
-      /**
-       * Text inputs to the model - can contain template strings.
-       */
-      content: string | ResponsesAPI.ResponseInputText | Input.OutputText;
-      /**
-       * The role of the message input. One of `user`, `assistant`, `system`, or
-       * `developer`.
-       */
-      role: 'user' | 'assistant' | 'system' | 'developer';
-      /**
-       * The type of the message input. Always `message`.
-       */
-      type?: 'message';
-    }
-    export namespace Input {
-      /**
-       * A text output from the model.
-       */
-      export interface OutputText {
-        /**
-         * The text output from the model.
-         */
-        text: string;
-        /**
-         * The type of the output text. Always `output_text`.
-         */
-        type: 'output_text';
-      }
-    }
   }
 }
@@ -1306,10 +875,7 @@ Evals.RunListResponsesPage = RunListResponsesPage;
 export declare namespace Evals {
   export {
     type EvalCustomDataSourceConfig as EvalCustomDataSourceConfig,
-    type EvalLabelModelGrader as EvalLabelModelGrader,
     type EvalStoredCompletionsDataSourceConfig as EvalStoredCompletionsDataSourceConfig,
-    type EvalStringCheckGrader as EvalStringCheckGrader,
-    type EvalTextSimilarityGrader as EvalTextSimilarityGrader,
     type EvalCreateResponse as EvalCreateResponse,
     type EvalRetrieveResponse as EvalRetrieveResponse,
     type EvalUpdateResponse as EvalUpdateResponse,