llama-stack-client 0.2.0 → 0.2.3-rc5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (124)
  1. package/_shims/index.d.ts +2 -0
  2. package/_shims/index.js +5 -1
  3. package/_shims/index.mjs +5 -1
  4. package/core.d.ts +12 -1
  5. package/core.d.ts.map +1 -1
  6. package/core.js +8 -6
  7. package/core.js.map +1 -1
  8. package/core.mjs +9 -7
  9. package/core.mjs.map +1 -1
  10. package/index.d.mts +10 -7
  11. package/index.d.ts +10 -7
  12. package/index.d.ts.map +1 -1
  13. package/index.js +6 -3
  14. package/index.js.map +1 -1
  15. package/index.mjs +6 -3
  16. package/index.mjs.map +1 -1
  17. package/package.json +1 -1
  18. package/resources/chat/chat.d.ts +153 -0
  19. package/resources/chat/chat.d.ts.map +1 -0
  20. package/resources/chat/chat.js +39 -0
  21. package/resources/chat/chat.js.map +1 -0
  22. package/resources/chat/chat.mjs +12 -0
  23. package/resources/chat/chat.mjs.map +1 -0
  24. package/resources/chat/completions.d.ts +632 -0
  25. package/resources/chat/completions.d.ts.map +1 -0
  26. package/resources/chat/completions.js +16 -0
  27. package/resources/chat/completions.js.map +1 -0
  28. package/resources/chat/completions.mjs +12 -0
  29. package/resources/chat/completions.mjs.map +1 -0
  30. package/resources/chat/index.d.ts +3 -0
  31. package/resources/chat/index.d.ts.map +1 -0
  32. package/resources/chat/index.js +9 -0
  33. package/resources/chat/index.js.map +1 -0
  34. package/resources/chat/index.mjs +4 -0
  35. package/resources/chat/index.mjs.map +1 -0
  36. package/resources/chat.d.ts +2 -0
  37. package/resources/chat.d.ts.map +1 -0
  38. package/resources/chat.js +19 -0
  39. package/resources/chat.js.map +1 -0
  40. package/resources/chat.mjs +3 -0
  41. package/resources/chat.mjs.map +1 -0
  42. package/resources/completions.d.ts +193 -0
  43. package/resources/completions.d.ts.map +1 -0
  44. package/resources/completions.js +16 -0
  45. package/resources/completions.js.map +1 -0
  46. package/resources/completions.mjs +12 -0
  47. package/resources/completions.mjs.map +1 -0
  48. package/resources/datasets.d.ts +13 -6
  49. package/resources/datasets.d.ts.map +1 -1
  50. package/resources/datasets.js.map +1 -1
  51. package/resources/datasets.mjs.map +1 -1
  52. package/resources/eval/eval.d.ts +1 -1
  53. package/resources/eval/eval.d.ts.map +1 -1
  54. package/resources/index.d.ts +4 -3
  55. package/resources/index.d.ts.map +1 -1
  56. package/resources/index.js +5 -3
  57. package/resources/index.js.map +1 -1
  58. package/resources/index.mjs +2 -1
  59. package/resources/index.mjs.map +1 -1
  60. package/resources/inference.d.ts +86 -1
  61. package/resources/inference.d.ts.map +1 -1
  62. package/resources/inference.js +6 -0
  63. package/resources/inference.js.map +1 -1
  64. package/resources/inference.mjs +6 -0
  65. package/resources/inference.mjs.map +1 -1
  66. package/resources/inspect.d.ts +2 -1
  67. package/resources/inspect.d.ts.map +1 -1
  68. package/resources/post-training/job.d.ts +1 -1
  69. package/resources/post-training/job.d.ts.map +1 -1
  70. package/resources/post-training/post-training.d.ts +19 -19
  71. package/resources/post-training/post-training.d.ts.map +1 -1
  72. package/resources/shared.d.ts +40 -1
  73. package/resources/shared.d.ts.map +1 -1
  74. package/resources/tool-runtime/index.d.ts +1 -1
  75. package/resources/tool-runtime/index.d.ts.map +1 -1
  76. package/resources/tool-runtime/index.js.map +1 -1
  77. package/resources/tool-runtime/index.mjs.map +1 -1
  78. package/resources/tool-runtime/tool-runtime.d.ts +4 -4
  79. package/resources/tool-runtime/tool-runtime.d.ts.map +1 -1
  80. package/resources/tool-runtime/tool-runtime.js +1 -9
  81. package/resources/tool-runtime/tool-runtime.js.map +1 -1
  82. package/resources/tool-runtime/tool-runtime.mjs +1 -9
  83. package/resources/tool-runtime/tool-runtime.mjs.map +1 -1
  84. package/src/_shims/index.d.ts +2 -0
  85. package/src/_shims/index.js +5 -1
  86. package/src/_shims/index.mjs +5 -1
  87. package/src/core.ts +24 -5
  88. package/src/index.ts +30 -15
  89. package/src/resources/chat/chat.ts +206 -0
  90. package/src/resources/chat/completions.ts +890 -0
  91. package/src/resources/chat/index.ts +10 -0
  92. package/src/resources/chat.ts +3 -0
  93. package/src/resources/completions.ts +268 -0
  94. package/src/resources/datasets.ts +13 -6
  95. package/src/resources/eval/eval.ts +1 -1
  96. package/src/resources/index.ts +12 -6
  97. package/src/resources/inference.ts +121 -0
  98. package/src/resources/inspect.ts +3 -1
  99. package/src/resources/post-training/job.ts +1 -1
  100. package/src/resources/post-training/post-training.ts +32 -32
  101. package/src/resources/shared.ts +42 -1
  102. package/src/resources/tool-runtime/index.ts +1 -0
  103. package/src/resources/tool-runtime/tool-runtime.ts +11 -12
  104. package/src/version.ts +1 -1
  105. package/version.d.ts +1 -1
  106. package/version.d.ts.map +1 -1
  107. package/version.js +1 -1
  108. package/version.js.map +1 -1
  109. package/version.mjs +1 -1
  110. package/version.mjs.map +1 -1
  111. package/internal/decoders/jsonl.d.ts +0 -12
  112. package/internal/decoders/jsonl.d.ts.map +0 -1
  113. package/internal/decoders/jsonl.js +0 -35
  114. package/internal/decoders/jsonl.js.map +0 -1
  115. package/internal/decoders/jsonl.mjs +0 -31
  116. package/internal/decoders/jsonl.mjs.map +0 -1
  117. package/resources/batch-inference.d.ts +0 -66
  118. package/resources/batch-inference.d.ts.map +0 -1
  119. package/resources/batch-inference.js +0 -15
  120. package/resources/batch-inference.js.map +0 -1
  121. package/resources/batch-inference.mjs +0 -11
  122. package/resources/batch-inference.mjs.map +0 -1
  123. package/src/internal/decoders/jsonl.ts +0 -41
  124. package/src/resources/batch-inference.ts +0 -103
@@ -3,5 +3,9 @@
  */
 import * as shims from './registry.mjs';
 import * as auto from "./auto/runtime";
-if (!shims.kind) shims.setShims(auto.getRuntime(), { auto: true });
+export const init = () => {
+  if (!shims.kind) shims.setShims(auto.getRuntime(), { auto: true });
+};
 export * from './registry.mjs';
+
+init();
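
The change above turns the shim installation from an import-time side effect into an exported init() that the module still calls once on evaluation, and that importers (see core.ts below) can call again explicitly. A minimal sketch of the pattern, with placeholder state standing in for the real shim registry:

// Sketch only: `kind` and the string 'node' stand in for the real registry internals.
let kind: string | undefined;

export const init = (): void => {
  // Idempotent: installs shims at most once, regardless of how many callers
  // invoke init() or how a bundler orders module evaluation.
  if (!kind) kind = 'node';
};

// The module still self-initializes when evaluated...
init();
// ...but consumers can call init() again to guarantee the side effect ran,
// which is the workaround for the Next.js issue referenced in core.ts below.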
package/src/core.ts CHANGED
@@ -17,7 +17,12 @@ import {
   type RequestInit,
   type Response,
   type HeadersInit,
+  init,
 } from './_shims/index';
+
+// try running side effects outside of _shims/index to workaround https://github.com/vercel/next.js/issues/76881
+init();
+
 export { type Response };
 import { BlobLike, isBlobLike, isMultipartBody } from './uploads';
 export {
@@ -29,6 +34,20 @@ export {
 
 export type Fetch = (url: RequestInfo, init?: RequestInit) => Promise<Response>;
 
+/**
+ * An alias to the builtin `Array` type so we can
+ * easily alias it in import statements if there are name clashes.
+ */
+type _Array<T> = Array<T>;
+
+/**
+ * An alias to the builtin `Record` type so we can
+ * easily alias it in import statements if there are name clashes.
+ */
+type _Record<K extends keyof any, T> = Record<K, T>;
+
+export type { _Array as Array, _Record as Record };
+
 type PromiseOrValue<T> = T | Promise<T>;
 
 type APIResponseProps = {
@@ -291,10 +310,10 @@ export abstract class APIClient {
   }
 
   buildRequest<Req>(
-    options: FinalRequestOptions<Req>,
+    inputOptions: FinalRequestOptions<Req>,
     { retryCount = 0 }: { retryCount?: number } = {},
   ): { req: RequestInit; url: string; timeout: number } {
-    options = { ...options };
+    const options = { ...inputOptions };
     const { method, path, query, headers: headers = {} } = options;
 
     const body =
@@ -322,8 +341,8 @@ export abstract class APIClient {
     }
 
     if (this.idempotencyHeader && method !== 'get') {
-      if (!options.idempotencyKey) options.idempotencyKey = this.defaultIdempotencyKey();
-      headers[this.idempotencyHeader] = options.idempotencyKey;
+      if (!inputOptions.idempotencyKey) inputOptions.idempotencyKey = this.defaultIdempotencyKey();
+      headers[this.idempotencyHeader] = inputOptions.idempotencyKey;
     }
 
     const reqHeaders = this.buildHeaders({ options, headers, contentLength, retryCount });
@@ -380,7 +399,7 @@ export abstract class APIClient {
       getHeader(headers, 'x-stainless-timeout') === undefined &&
      options.timeout
     ) {
-      reqHeaders['x-stainless-timeout'] = String(options.timeout);
+      reqHeaders['x-stainless-timeout'] = String(Math.trunc(options.timeout / 1000));
     }
 
     this.validateHeaders(reqHeaders, headers);
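
Two behavioral fixes land in core.ts: the x-stainless-timeout header now reports whole seconds instead of milliseconds (Math.trunc(options.timeout / 1000)), and buildRequest generates the idempotency key on the caller-owned inputOptions rather than on its per-attempt copy, so a retried request reuses the same key. A minimal sketch of that second point, with hypothetical names; only the inputOptions-vs-copy distinction is taken from the diff above:

type Options = { method: string; idempotencyKey?: string };

let n = 0;
const defaultIdempotencyKey = () => `stainless-retry-${n++}`; // hypothetical key format

function buildRequest(inputOptions: Options): Record<string, string> {
  const options = { ...inputOptions }; // per-attempt copy; mutations here vanish on retry
  const headers: Record<string, string> = {};
  if (options.method !== 'get') {
    // Write the generated key back to the original object so the next attempt sees it.
    if (!inputOptions.idempotencyKey) inputOptions.idempotencyKey = defaultIdempotencyKey();
    headers['Idempotency-Key'] = inputOptions.idempotencyKey;
  }
  return headers;
}

const opts: Options = { method: 'post' };
const first = buildRequest(opts);
const retry = buildRequest(opts);
console.assert(first['Idempotency-Key'] === retry['Idempotency-Key']); // same key reused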
package/src/index.ts CHANGED
@@ -8,12 +8,6 @@ import * as Pagination from './pagination';
 import { type DatasetsIterrowsParams, DatasetsIterrowsResponse } from './pagination';
 import * as Uploads from './uploads';
 import * as API from './resources/index';
-import {
-  BatchInference,
-  BatchInferenceChatCompletionParams,
-  BatchInferenceChatCompletionResponse,
-  BatchInferenceCompletionParams,
-} from './resources/batch-inference';
 import {
   Benchmark,
   BenchmarkListResponse,
@@ -21,6 +15,13 @@ import {
   Benchmarks,
   ListBenchmarksResponse,
 } from './resources/benchmarks';
+import {
+  CompletionCreateParams,
+  CompletionCreateParamsNonStreaming,
+  CompletionCreateParamsStreaming,
+  CompletionCreateResponse,
+  Completions,
+} from './resources/completions';
 import {
   DatasetIterrowsParams,
   DatasetIterrowsResponse,
@@ -36,6 +37,9 @@ import {
   CompletionResponse,
   EmbeddingsResponse,
   Inference,
+  InferenceBatchChatCompletionParams,
+  InferenceBatchChatCompletionResponse,
+  InferenceBatchCompletionParams,
   InferenceChatCompletionParams,
   InferenceChatCompletionParamsNonStreaming,
   InferenceChatCompletionParamsStreaming,
@@ -132,6 +136,7 @@ import {
   ToolExecutionStep,
   ToolResponse,
 } from './resources/agents/agents';
+import { Chat, ChatCompletionChunk } from './resources/chat/chat';
 import {
   BenchmarkConfig,
   Eval,
@@ -157,6 +162,7 @@ import {
   ToolRuntime,
   ToolRuntimeInvokeToolParams,
   ToolRuntimeListToolsParams,
+  ToolRuntimeListToolsResponse,
 } from './resources/tool-runtime/tool-runtime';
 
 export interface ClientOptions {
@@ -270,11 +276,12 @@ export class LlamaStackClient extends Core.APIClient {
   tools: API.Tools = new API.Tools(this);
   toolRuntime: API.ToolRuntime = new API.ToolRuntime(this);
   agents: API.Agents = new API.Agents(this);
-  batchInference: API.BatchInference = new API.BatchInference(this);
   datasets: API.Datasets = new API.Datasets(this);
   eval: API.Eval = new API.Eval(this);
   inspect: API.Inspect = new API.Inspect(this);
   inference: API.Inference = new API.Inference(this);
+  chat: API.Chat = new API.Chat(this);
+  completions: API.Completions = new API.Completions(this);
   vectorIo: API.VectorIo = new API.VectorIo(this);
   vectorDBs: API.VectorDBs = new API.VectorDBs(this);
   models: API.Models = new API.Models(this);
@@ -336,11 +343,12 @@ LlamaStackClient.Toolgroups = Toolgroups;
 LlamaStackClient.Tools = Tools;
 LlamaStackClient.ToolRuntime = ToolRuntime;
 LlamaStackClient.Agents = Agents;
-LlamaStackClient.BatchInference = BatchInference;
 LlamaStackClient.Datasets = Datasets;
 LlamaStackClient.Eval = Eval;
 LlamaStackClient.Inspect = Inspect;
 LlamaStackClient.Inference = Inference;
+LlamaStackClient.Chat = Chat;
+LlamaStackClient.Completions = Completions;
 LlamaStackClient.VectorIo = VectorIo;
 LlamaStackClient.VectorDBs = VectorDBs;
 LlamaStackClient.Models = Models;
@@ -383,6 +391,7 @@ export declare namespace LlamaStackClient {
     ToolRuntime as ToolRuntime,
     type ToolDef as ToolDef,
     type ToolInvocationResult as ToolInvocationResult,
+    type ToolRuntimeListToolsResponse as ToolRuntimeListToolsResponse,
     type ToolRuntimeInvokeToolParams as ToolRuntimeInvokeToolParams,
     type ToolRuntimeListToolsParams as ToolRuntimeListToolsParams,
   };
@@ -398,13 +407,6 @@ export declare namespace LlamaStackClient {
     type AgentCreateParams as AgentCreateParams,
   };
 
-  export {
-    BatchInference as BatchInference,
-    type BatchInferenceChatCompletionResponse as BatchInferenceChatCompletionResponse,
-    type BatchInferenceChatCompletionParams as BatchInferenceChatCompletionParams,
-    type BatchInferenceCompletionParams as BatchInferenceCompletionParams,
-  };
-
   export {
     Datasets as Datasets,
     type ListDatasetsResponse as ListDatasetsResponse,
@@ -442,6 +444,9 @@ export declare namespace LlamaStackClient {
     type CompletionResponse as CompletionResponse,
     type EmbeddingsResponse as EmbeddingsResponse,
     type TokenLogProbs as TokenLogProbs,
+    type InferenceBatchChatCompletionResponse as InferenceBatchChatCompletionResponse,
+    type InferenceBatchChatCompletionParams as InferenceBatchChatCompletionParams,
+    type InferenceBatchCompletionParams as InferenceBatchCompletionParams,
     type InferenceChatCompletionParams as InferenceChatCompletionParams,
     type InferenceChatCompletionParamsNonStreaming as InferenceChatCompletionParamsNonStreaming,
     type InferenceChatCompletionParamsStreaming as InferenceChatCompletionParamsStreaming,
@@ -451,6 +456,16 @@ export declare namespace LlamaStackClient {
     type InferenceEmbeddingsParams as InferenceEmbeddingsParams,
   };
 
+  export { Chat as Chat, type ChatCompletionChunk as ChatCompletionChunk };
+
+  export {
+    Completions as Completions,
+    type CompletionCreateResponse as CompletionCreateResponse,
+    type CompletionCreateParams as CompletionCreateParams,
+    type CompletionCreateParamsNonStreaming as CompletionCreateParamsNonStreaming,
+    type CompletionCreateParamsStreaming as CompletionCreateParamsStreaming,
+  };
+
   export {
     VectorIo as VectorIo,
     type QueryChunksResponse as QueryChunksResponse,
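
Net effect on the public client: the batchInference resource is removed, batch operations move onto Inference (the InferenceBatch*Params types above), and OpenAI-compatible chat and completions resources are added. A hedged usage sketch; the create() method name, model id, and message shape are assumptions implied by the CompletionCreateParams* types, not shown in this diff:

import LlamaStackClient from 'llama-stack-client';

const client = new LlamaStackClient();

// New in 0.2.x: OpenAI-compatible chat completions surface.
const completion = await client.chat.completions.create({
  model: 'meta-llama/Llama-3.2-3B-Instruct', // hypothetical model id
  messages: [{ role: 'user', content: 'Hello' }],
});

// Removed: client.batchInference.*. The renamed types above suggest the batch
// entry points now live on client.inference instead.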
package/src/resources/chat/chat.ts ADDED
@@ -0,0 +1,206 @@
+// File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+
+import { APIResource } from '../../resource';
+import * as CompletionsAPI from './completions';
+import {
+  CompletionCreateParams,
+  CompletionCreateParamsNonStreaming,
+  CompletionCreateParamsStreaming,
+  CompletionCreateResponse,
+  Completions,
+} from './completions';
+
+export class Chat extends APIResource {
+  completions: CompletionsAPI.Completions = new CompletionsAPI.Completions(this._client);
+}
+
+/**
+ * Chunk from a streaming response to an OpenAI-compatible chat completion request.
+ */
+export interface ChatCompletionChunk {
+  /**
+   * The ID of the chat completion
+   */
+  id: string;
+
+  /**
+   * List of choices
+   */
+  choices: Array<ChatCompletionChunk.Choice>;
+
+  /**
+   * The Unix timestamp in seconds when the chat completion was created
+   */
+  created: number;
+
+  /**
+   * The model that was used to generate the chat completion
+   */
+  model: string;
+
+  /**
+   * The object type, which will be "chat.completion.chunk"
+   */
+  object: 'chat.completion.chunk';
+}
+
+export namespace ChatCompletionChunk {
+  /**
+   * A chunk choice from an OpenAI-compatible chat completion streaming response.
+   */
+  export interface Choice {
+    /**
+     * The delta from the chunk
+     */
+    delta: Choice.Delta;
+
+    /**
+     * The reason the model stopped generating
+     */
+    finish_reason: string;
+
+    /**
+     * The index of the choice
+     */
+    index: number;
+
+    /**
+     * (Optional) The log probabilities for the tokens in the message
+     */
+    logprobs?: Choice.Logprobs;
+  }
+
+  export namespace Choice {
+    /**
+     * The delta from the chunk
+     */
+    export interface Delta {
+      /**
+       * (Optional) The content of the delta
+       */
+      content?: string;
+
+      /**
+       * (Optional) The refusal of the delta
+       */
+      refusal?: string;
+
+      /**
+       * (Optional) The role of the delta
+       */
+      role?: string;
+
+      /**
+       * (Optional) The tool calls of the delta
+       */
+      tool_calls?: Array<Delta.ToolCall>;
+    }
+
+    export namespace Delta {
+      export interface ToolCall {
+        type: 'function';
+
+        id?: string;
+
+        function?: ToolCall.Function;
+
+        index?: number;
+      }
+
+      export namespace ToolCall {
+        export interface Function {
+          arguments?: string;
+
+          name?: string;
+        }
+      }
+    }
+
+    /**
+     * (Optional) The log probabilities for the tokens in the message
+     */
+    export interface Logprobs {
+      /**
+       * (Optional) The log probabilities for the tokens in the message
+       */
+      content?: Array<Logprobs.Content>;
+
+      /**
+       * (Optional) The log probabilities for the tokens in the message
+       */
+      refusal?: Array<Logprobs.Refusal>;
+    }
+
+    export namespace Logprobs {
+      /**
+       * The log probability for a token from an OpenAI-compatible chat completion
+       * response.
+       */
+      export interface Content {
+        token: string;
+
+        logprob: number;
+
+        top_logprobs: Array<Content.TopLogprob>;
+
+        bytes?: Array<number>;
+      }
+
+      export namespace Content {
+        /**
+         * The top log probability for a token from an OpenAI-compatible chat completion
+         * response.
+         */
+        export interface TopLogprob {
+          token: string;
+
+          logprob: number;
+
+          bytes?: Array<number>;
+        }
+      }
+
+      /**
+       * The log probability for a token from an OpenAI-compatible chat completion
+       * response.
+       */
+      export interface Refusal {
+        token: string;
+
+        logprob: number;
+
+        top_logprobs: Array<Refusal.TopLogprob>;
+
+        bytes?: Array<number>;
+      }
+
+      export namespace Refusal {
+        /**
+         * The top log probability for a token from an OpenAI-compatible chat completion
+         * response.
+         */
+        export interface TopLogprob {
+          token: string;
+
+          logprob: number;
+
+          bytes?: Array<number>;
+        }
+      }
+    }
+  }
+}
+
+Chat.Completions = Completions;
+
+export declare namespace Chat {
+  export { type ChatCompletionChunk as ChatCompletionChunk };
+
+  export {
+    Completions as Completions,
+    type CompletionCreateResponse as CompletionCreateResponse,
+    type CompletionCreateParams as CompletionCreateParams,
+    type CompletionCreateParamsNonStreaming as CompletionCreateParamsNonStreaming,
+    type CompletionCreateParamsStreaming as CompletionCreateParamsStreaming,
+  };
+}
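
For orientation, a sketch of consuming the ChatCompletionChunk shape defined above, accumulating streamed content deltas into final text. The AsyncIterable source and the import path are assumptions; only the chunk/choice/delta field names come from this file:

import type { ChatCompletionChunk } from 'llama-stack-client/resources/chat/chat';

async function collectText(stream: AsyncIterable<ChatCompletionChunk>): Promise<string> {
  let text = '';
  for await (const chunk of stream) {
    for (const choice of chunk.choices) {
      // delta.content is optional: tool-call or role-only deltas carry no text.
      if (choice.delta.content) text += choice.delta.content;
    }
  }
  return text;
}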