npm - notdiamond - Versions diffs - 2.0.0-rc2 → 2.0.0-rc5 - Mend

notdiamond 2.0.0-rc2 → 2.0.0-rc5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (167) hide show

package/CHANGELOG.md +45 -0
package/README.md +14 -16
package/client.d.mts +20 -34
package/client.d.mts.map +1 -1
package/client.d.ts +20 -34
package/client.d.ts.map +1 -1
package/client.js +22 -38
package/client.js.map +1 -1
package/client.mjs +22 -38
package/client.mjs.map +1 -1
package/internal/tslib.js +17 -17
package/internal/utils/env.d.mts.map +1 -1
package/internal/utils/env.d.ts.map +1 -1
package/internal/utils/env.js +4 -2
package/internal/utils/env.js.map +1 -1
package/internal/utils/env.mjs +4 -2
package/internal/utils/env.mjs.map +1 -1
package/package.json +10 -11
package/resources/index.d.mts +6 -6
package/resources/index.d.mts.map +1 -1
package/resources/index.d.ts +6 -6
package/resources/index.d.ts.map +1 -1
package/resources/index.js +8 -8
package/resources/index.js.map +1 -1
package/resources/index.mjs +4 -4
package/resources/index.mjs.map +1 -1
package/resources/model-router.d.mts +311 -0
package/resources/model-router.d.mts.map +1 -0
package/resources/model-router.d.ts +311 -0
package/resources/model-router.d.ts.map +1 -0
package/resources/model-router.js +97 -0
package/resources/model-router.js.map +1 -0
package/resources/model-router.mjs +93 -0
package/resources/model-router.mjs.map +1 -0
package/resources/models.d.mts +50 -25
package/resources/models.d.mts.map +1 -1
package/resources/models.d.ts +50 -25
package/resources/models.d.ts.map +1 -1
package/resources/models.js +5 -0
package/resources/models.js.map +1 -1
package/resources/models.mjs +5 -0
package/resources/models.mjs.map +1 -1
package/resources/preferences.d.mts +49 -47
package/resources/preferences.d.mts.map +1 -1
package/resources/preferences.d.ts +49 -47
package/resources/preferences.d.ts.map +1 -1
package/resources/preferences.js +30 -33
package/resources/preferences.js.map +1 -1
package/resources/preferences.mjs +30 -33
package/resources/preferences.mjs.map +1 -1
package/resources/prompt/adapt.d.mts +352 -0
package/resources/prompt/adapt.d.mts.map +1 -0
package/resources/prompt/adapt.d.ts +352 -0
package/resources/prompt/adapt.d.ts.map +1 -0
package/resources/prompt/adapt.js +154 -0
package/resources/prompt/adapt.js.map +1 -0
package/resources/prompt/adapt.mjs +150 -0
package/resources/prompt/adapt.mjs.map +1 -0
package/resources/prompt/index.d.mts +3 -0
package/resources/prompt/index.d.mts.map +1 -0
package/resources/prompt/index.d.ts +3 -0
package/resources/prompt/index.d.ts.map +1 -0
package/resources/prompt/index.js +9 -0
package/resources/prompt/index.js.map +1 -0
package/resources/prompt/index.mjs +4 -0
package/resources/prompt/index.mjs.map +1 -0
package/resources/prompt/prompt.d.mts +338 -0
package/resources/prompt/prompt.d.mts.map +1 -0
package/resources/prompt/prompt.d.ts +338 -0
package/resources/prompt/prompt.d.ts.map +1 -0
package/resources/prompt/prompt.js +128 -0
package/resources/prompt/prompt.js.map +1 -0
package/resources/prompt/prompt.mjs +123 -0
package/resources/prompt/prompt.mjs.map +1 -0
package/resources/prompt.d.mts +2 -0
package/resources/prompt.d.mts.map +1 -0
package/resources/prompt.d.ts +2 -0
package/resources/prompt.d.ts.map +1 -0
package/resources/prompt.js +6 -0
package/resources/prompt.js.map +1 -0
package/resources/prompt.mjs +3 -0
package/resources/prompt.mjs.map +1 -0
package/resources/pzn.d.mts +225 -0
package/resources/pzn.d.mts.map +1 -0
package/resources/pzn.d.ts +225 -0
package/resources/pzn.d.ts.map +1 -0
package/resources/{routing.js → pzn.js} +26 -69
package/resources/pzn.js.map +1 -0
package/resources/{routing.mjs → pzn.mjs} +24 -67
package/resources/pzn.mjs.map +1 -0
package/resources/report/index.d.mts +3 -0
package/resources/report/index.d.mts.map +1 -0
package/resources/report/index.d.ts +3 -0
package/resources/report/index.d.ts.map +1 -0
package/resources/report/index.js +9 -0
package/resources/report/index.js.map +1 -0
package/resources/report/index.mjs +4 -0
package/resources/report/index.mjs.map +1 -0
package/resources/report/metrics.d.mts +87 -0
package/resources/report/metrics.d.mts.map +1 -0
package/resources/report/metrics.d.ts +87 -0
package/resources/report/metrics.d.ts.map +1 -0
package/resources/report/metrics.js +57 -0
package/resources/report/metrics.js.map +1 -0
package/resources/report/metrics.mjs +53 -0
package/resources/report/metrics.mjs.map +1 -0
package/resources/report/report.d.mts +10 -0
package/resources/report/report.d.mts.map +1 -0
package/resources/report/report.d.ts +10 -0
package/resources/report/report.d.ts.map +1 -0
package/resources/report/report.js +17 -0
package/resources/report/report.js.map +1 -0
package/resources/report/report.mjs +12 -0
package/resources/report/report.mjs.map +1 -0
package/resources/report.d.mts +1 -244
package/resources/report.d.mts.map +1 -1
package/resources/report.d.ts +1 -244
package/resources/report.d.ts.map +1 -1
package/resources/report.js +2 -82
package/resources/report.js.map +1 -1
package/resources/report.mjs +1 -80
package/resources/report.mjs.map +1 -1
package/src/client.ts +70 -119
package/src/internal/utils/env.ts +4 -2
package/src/resources/index.ts +24 -34
package/src/resources/model-router.ts +356 -0
package/src/resources/models.ts +55 -32
package/src/resources/preferences.ts +61 -70
package/src/resources/prompt/adapt.ts +402 -0
package/src/resources/prompt/index.ts +16 -0
package/src/resources/prompt/prompt.ts +398 -0
package/src/resources/prompt.ts +3 -0
package/src/resources/pzn.ts +273 -0
package/src/resources/report/index.ts +4 -0
package/src/resources/report/metrics.ts +99 -0
package/src/resources/report/report.ts +19 -0
package/src/resources/report.ts +1 -298
package/src/version.ts +1 -1
package/version.d.mts +1 -1
package/version.d.ts +1 -1
package/version.js +1 -1
package/version.mjs +1 -1
package/resources/admin.d.mts +0 -4
package/resources/admin.d.mts.map +0 -1
package/resources/admin.d.ts +0 -4
package/resources/admin.d.ts.map +0 -1
package/resources/admin.js +0 -9
package/resources/admin.js.map +0 -1
package/resources/admin.mjs +0 -5
package/resources/admin.mjs.map +0 -1
package/resources/prompt-adaptation.d.mts +0 -581
package/resources/prompt-adaptation.d.mts.map +0 -1
package/resources/prompt-adaptation.d.ts +0 -581
package/resources/prompt-adaptation.d.ts.map +0 -1
package/resources/prompt-adaptation.js +0 -289
package/resources/prompt-adaptation.js.map +0 -1
package/resources/prompt-adaptation.mjs +0 -285
package/resources/prompt-adaptation.mjs.map +0 -1
package/resources/routing.d.mts +0 -391
package/resources/routing.d.mts.map +0 -1
package/resources/routing.d.ts +0 -391
package/resources/routing.d.ts.map +0 -1
package/resources/routing.js.map +0 -1
package/resources/routing.mjs.map +0 -1
package/src/resources/admin.ts +0 -5
package/src/resources/prompt-adaptation.ts +0 -707
package/src/resources/routing.ts +0 -476

package/src/resources/prompt/adapt.ts ADDED Viewed

@@ -0,0 +1,402 @@
+// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+import { APIResource } from '../../core/resource';
+import { APIPromise } from '../../core/api-promise';
+import { RequestOptions } from '../../internal/request-options';
+import { path } from '../../internal/utils/path';
+export class Adapt extends APIResource {
+  /**
+   * Adapt your prompt from one LLM to work optimally across different target LLMs.
+   *
+   * This endpoint automatically optimizes your prompt (system prompt + user message
+   * template) to achieve better performance when switching between different
+   * language models. Each model has unique characteristics, and what works well for
+   * GPT-4 might not work as well for Claude or Gemini.
+   *
+   * **How Prompt Adaptation Works:**
+   *
+   * 1. You provide your current prompt optimized for an origin model
+   * 2. You specify target models you want to adapt to
+   * 3. You provide evaluation examples (golden records) with expected answers
+   * 4. The system runs optimization to find the best prompt for each target model
+   * 5. You receive adapted prompts that perform well on your target models
+   *
+   * **Evaluation Metrics:** Choose either a standard metric or provide custom
+   * evaluation:
+   *
+   * - **Standard metrics**: LLMaaJ:SQL, LLMaaJ:Sem_Sim_1/3/10 (semantic similarity),
+   *   JSON_Match
+   * - **Custom evaluation**: Provide evaluation_config with your own LLM judge,
+   *   prompt, and cutoff
+   *
+   * **Dataset Requirements:**
+   *
+   * - Minimum 25 examples in train_goldens (more examples = better adaptation)
+   * - Each example must have fields matching your template placeholders
+   * - Supervised evaluation requires 'answer' field in each golden record
+   * - Unsupervised evaluation can work without answers
+   *
+   * **Training Time:**
+   *
+   * - Processing is asynchronous and typically takes 10-30 minutes
+   * - Time depends on: number of target models, dataset size, model availability
+   * - Use the returned adaptation_run_id to check status and retrieve results
+   *
+   * **Subscription Tiers:**
+   *
+   * - Free: 1 target model
+   * - Starter: 3 target models
+   * - Startup: 5 target models
+   * - Enterprise: 10 target models
+   *
+   * **Best Practices:**
+   *
+   * 1. Use diverse, representative examples from your production workload
+   * 2. Include as many examples as practical (25 minimum; more examples = better
+   *    adaptation)
+   * 3. Ensure consistent evaluation across all examples
+   * 4. Provide both a train_goldens and a test_goldens split so that final
+   *    performance is validated on held-out data
+   * 5. Use the same model versions you'll use in production
+   *
+   * **Example Workflow:**
+   *
+   * ```
+   * 1. POST /v2/prompt/adapt - Submit adaptation request
+   * 2. GET /v2/prompt/adaptStatus/{id} - Poll status until completed
+   * 3. GET /v2/prompt/adaptResults/{id} - Retrieve optimized prompts
+   * 4. Use optimized prompts in production with target models
+   * ```
+   *
+   * **Related Documentation:** See
+   * https://docs.notdiamond.ai/docs/adapting-prompts-to-new-models for a detailed
+   * guide.
+   *
+   * @param body - Adaptation request; passed as the `body` of the
+   *   `POST /v2/prompt/adapt` request.
+   * @param options - Optional per-request options, spread into the request
+   *   after `body`.
+   * @returns An `APIPromise` resolving to an {@link AdaptCreateResponse} that
+   *   carries the `adaptation_run_id` for this run.
+   *
+   * @example
+   * ```ts
+   * // NOTE: abbreviated for readability. `{ ... }` stands for the per-example
+   * // field values, and a real request needs at least 25 train_goldens.
+   * const adapt = await client.prompt.adapt.create({
+   *   fields: ['question'],
+   *   system_prompt: 'You are a helpful assistant that answers questions accurately.',
+   *   target_models: [
+   *     { provider: 'anthropic', model: 'claude-sonnet-4-5-20250929' },
+   *     { provider: 'google', model: 'gemini-1.5-pro' },
+   *   ],
+   *   template: 'Question: {question}\nAnswer:',
+   *   evaluation_metric: 'LLMaaJ:Sem_Sim_3',
+   *   origin_model: { provider: 'openai', model: 'gpt-4o' },
+   *   test_goldens: [
+   *     {
+   *       fields: { ... },
+   *       answer: '9',
+   *     },
+   *     {
+   *       fields: { ... },
+   *       answer: 'Pacific Ocean',
+   *     },
+   *   ],
+   *   train_goldens: [
+   *     {
+   *       fields: { ... },
+   *       answer: '4',
+   *     },
+   *     {
+   *       fields: { ... },
+   *       answer: 'Paris',
+   *     },
+   *     {
+   *       fields: { ... },
+   *       answer: 'William Shakespeare',
+   *     },
+   *     {
+   *       fields: { ... },
+   *       answer: 'Water',
+   *     },
+   *     {
+   *       fields: { ... },
+   *       answer: '7',
+   *     },
+   *   ],
+   * });
+   * ```
+   */
+  create(body: AdaptCreateParams, options?: RequestOptions): APIPromise<AdaptCreateResponse> {
+    return this._client.post('/v2/prompt/adapt', { body, ...options });
+  }
+  /**
+   * Get LLM usage costs for a specific prompt adaptation run.
+   *
+   * This endpoint returns the total cost and detailed usage records for all LLM
+   * requests made during a prompt adaptation run. Use this to track costs associated
+   * with optimizing prompts for different target models.
+   *
+   * **Cost Breakdown:**
+   *
+   * - Total cost across all models used in the adaptation
+   * - Individual usage records with provider, model, tokens, and costs
+   * - Timestamps for each LLM request
+   * - Task type (e.g., optimization, evaluation)
+   *
+   * **Access Control:**
+   *
+   * - Only accessible by the user who created the adaptation run
+   * - Requires prompt adaptation access
+   *
+   * @param adaptationRunID - ID of the adaptation run; interpolated into the
+   *   `/v2/prompt/adapt/{id}/costs` path through the `path` template tag.
+   * @param options - Optional per-request options, forwarded to the GET request.
+   * @returns An `APIPromise` resolving to an {@link AdaptGetCostsResponse}.
+   *
+   * @example
+   * ```ts
+   * const response = await client.prompt.adapt.getCosts(
+   *   'adaptation_run_id',
+   * );
+   * ```
+   */
+  getCosts(adaptationRunID: string, options?: RequestOptions): APIPromise<AdaptGetCostsResponse> {
+    return this._client.get(path`/v2/prompt/adapt/${adaptationRunID}/costs`, options);
+  }
+}
+/**
+ * A training or test example for prompt adaptation.
+ *
+ * Element type of the `goldens`, `train_goldens`, and `test_goldens` arrays in
+ * `AdaptCreateParams`.
+ */
+export interface GoldenRecord {
+  /**
+   * Dictionary mapping field names to their values. Keys must match the fields
+   * specified in the template
+   */
+  fields: { [key: string]: string };
+  /**
+   * Expected answer for supervised evaluation. Required for supervised metrics,
+   * optional for unsupervised
+   */
+  answer?: string | null;
+}
+/**
+ * Model for specifying an LLM provider in API requests.
+ *
+ * Used for the `target_models` entries and for `origin_model` in
+ * `AdaptCreateParams`. Only `model` and `provider` are mandatory in the type; the
+ * remaining fields are documented as required for custom models.
+ */
+export interface RequestProvider {
+  /**
+   * Model name (e.g., 'gpt-4o', 'claude-sonnet-4-5-20250929')
+   */
+  model: string;
+  /**
+   * Provider name (e.g., 'openai', 'anthropic', 'google')
+   */
+  provider: string;
+  /**
+   * Maximum context length for the model (required for custom models)
+   */
+  context_length?: number | null;
+  /**
+   * Input token price per million tokens in USD (required for custom models)
+   */
+  input_price?: number | null;
+  /**
+   * Whether this is a custom model not in Not Diamond's supported model list
+   */
+  is_custom?: boolean;
+  /**
+   * Average latency in seconds (required for custom models)
+   */
+  latency?: number | null;
+  /**
+   * Output token price per million tokens in USD (required for custom models)
+   */
+  output_price?: number | null;
+}
+/**
+ * Response model for POST /v2/prompt/adapt endpoint (the resolved value of
+ * `Adapt.create`).
+ *
+ * Returned immediately after submitting a prompt adaptation request. The
+ * adaptation process runs asynchronously, so use the returned adaptation_run_id to
+ * track progress and retrieve results when complete.
+ *
+ * **Next steps:**
+ *
+ * 1. Store the adaptation_run_id
+ * 2. Poll GET /v2/prompt/adaptStatus/{adaptation_run_id} to check progress
+ * 3. When status is 'completed', retrieve optimized prompts from GET
+ *    /v2/prompt/adaptResults/{adaptation_run_id}
+ * 4. Use the optimized prompts with your target models
+ */
+export interface AdaptCreateResponse {
+  /**
+   * Unique identifier for this adaptation run. Use this to poll status and retrieve
+   * optimized prompts when complete
+   */
+  adaptation_run_id: string;
+}
+/**
+ * Response model for GET /v2/prompt/adapt/{adaptation_run_id}/costs endpoint (the
+ * resolved value of `Adapt.getCosts`).
+ *
+ * Contains the total LLM costs and detailed usage records for a prompt adaptation
+ * run. Use this to track costs associated with optimizing prompts for different
+ * target models.
+ */
+export interface AdaptGetCostsResponse {
+  /**
+   * Unique identifier for the adaptation run
+   */
+  adaptation_run_id: string;
+  /**
+   * Total cost in USD across all LLM requests in this adaptation run
+   */
+  total_cost: number;
+  /**
+   * Detailed usage records for each LLM request made during the adaptation
+   */
+  usage_records: Array<AdaptGetCostsResponse.UsageRecord>;
+}
+export namespace AdaptGetCostsResponse {
+  /**
+   * Individual LLM usage record with token counts and cost breakdown.
+   *
+   * Returned by GET /llm-usage endpoint and included in AdaptationRunCostResponse
+   * (presumably the API schema name for what this SDK exposes as
+   * `AdaptGetCostsResponse`, whose `usage_records` array holds these records).
+   * Each record represents a single LLM API call with detailed usage metrics.
+   */
+  export interface UsageRecord {
+    /**
+     * Unique identifier for this usage record
+     */
+    id: string;
+    /**
+     * Adaptation run ID this usage is associated with
+     */
+    adaptation_run_id: string;
+    /**
+     * Cost of input tokens in USD
+     */
+    input_cost: number;
+    /**
+     * Number of input tokens consumed
+     */
+    input_tokens: number;
+    /**
+     * Model name (e.g., 'gpt-4', 'claude-3-opus-20240229')
+     */
+    model: string;
+    /**
+     * Organization ID associated with the request
+     */
+    organization_id: string;
+    /**
+     * Cost of output tokens in USD
+     */
+    output_cost: number;
+    /**
+     * Number of output tokens generated
+     */
+    output_tokens: number;
+    /**
+     * LLM provider (e.g., 'openai', 'anthropic', 'google')
+     */
+    provider: string;
+    /**
+     * Type of task (e.g., 'optimization', 'evaluation')
+     */
+    task_type: string;
+    /**
+     * Unix timestamp when the request was made.
+     * NOTE(review): the unit (seconds vs. milliseconds) is not stated here — confirm
+     * against the API before converting to a Date.
+     */
+    timestamp: number;
+    /**
+     * Total cost (input + output) in USD
+     */
+    total_cost: number;
+    /**
+     * User ID who made the request
+     */
+    user_id: string;
+  }
+}
+export interface AdaptCreateParams { // Request body accepted by Adapt.create (POST /v2/prompt/adapt).
+  /**
+   * List of field names that will be substituted into the template. Must match keys
+   * in golden records
+   */
+  fields: Array<string>;
+  /**
+   * System prompt to use with the origin model. This sets the context and role for
+   * the LLM
+   */
+  system_prompt: string;
+  /**
+   * List of models to adapt the prompt for. Maximum count depends on your
+   * subscription tier (Free: 1, Starter: 3, Startup: 5, Enterprise: 10)
+   */
+  target_models: Array<RequestProvider>;
+  /**
+   * User message template with placeholders for fields. Use curly braces for field
+   * substitution (e.g. 'Question: {question}\nAnswer:')
+   */
+  template: string;
+  evaluation_config?: string | null; // Custom evaluation (own LLM judge, prompt, and cutoff) as the alternative to a standard metric; presumably a serialized config — confirm the expected format.
+  evaluation_metric?: string | null; // Standard metric name, e.g. 'LLMaaJ:SQL', 'LLMaaJ:Sem_Sim_3', or 'JSON_Match'.
+  /**
+   * Training examples (legacy parameter). Use train_goldens and test_goldens for
+   * better control. Minimum 25 examples
+   */
+  goldens?: Array<GoldenRecord> | null;
+  /**
+   * Model for specifying an LLM provider in API requests. Here: the origin model
+   * that the current prompt was written for.
+   */
+  origin_model?: RequestProvider | null;
+  /**
+   * Optional baseline score for the origin model. If provided, can skip origin model
+   * evaluation
+   */
+  origin_model_evaluation_score?: number | null;
+  /**
+   * Test examples for evaluation. Required if train_goldens is provided. Used to
+   * measure final performance on held-out data
+   */
+  test_goldens?: Array<GoldenRecord> | null;
+  /**
+   * Training examples for prompt optimization. Minimum 25 examples required. Cannot
+   * be used with 'goldens' parameter
+   */
+  train_goldens?: Array<GoldenRecord> | null;
+}
+export declare namespace Adapt { // Merges with the Adapt class so the types below are also reachable as Adapt.<TypeName>.
+  export {
+    type GoldenRecord as GoldenRecord, // type-only re-exports: no runtime values are emitted
+    type RequestProvider as RequestProvider,
+    type AdaptCreateResponse as AdaptCreateResponse,
+    type AdaptGetCostsResponse as AdaptGetCostsResponse,
+    type AdaptCreateParams as AdaptCreateParams,
+  };
+}

package/src/resources/prompt/index.ts ADDED Viewed

@@ -0,0 +1,16 @@
+// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+export {
+  Adapt,
+  type GoldenRecord,
+  type RequestProvider,
+  type AdaptCreateResponse,
+  type AdaptGetCostsResponse,
+  type AdaptCreateParams,
+} from './adapt';
+export {
+  Prompt,
+  type JobStatus,
+  type PromptGetAdaptResultsResponse,
+  type PromptGetAdaptStatusResponse,
+} from './prompt';