@superlinked/sie-sdk 0.4.2 → 0.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.cjs +1 -1
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.cts +35 -2
- package/dist/index.d.ts +35 -2
- package/dist/index.js +1 -1
- package/dist/index.js.map +1 -1
- package/package.json +2 -2
package/dist/index.d.cts
CHANGED
|
@@ -108,6 +108,37 @@ interface ModelDims {
|
|
|
108
108
|
sparse?: number;
|
|
109
109
|
multivector?: number;
|
|
110
110
|
}
|
|
111
|
+
/**
|
|
112
|
+
* Advertised model capabilities.
|
|
113
|
+
*
|
|
114
|
+
* Mirrors the gateway `capabilities` object on each `/v1/models` entry
|
|
115
|
+
* (`ModelCapabilitiesWire`). All fields are optional; their presence
|
|
116
|
+
* depends on what the model config declares. `grammar` lists the
|
|
117
|
+
* supported grammar kinds ("json_schema" | "regex" | "ebnf").
|
|
118
|
+
* `code`/`sql`/`guard` are informational flags advertising validated
|
|
119
|
+
* generation jobs that back the model="code"/"sql"/"guard" aliases.
|
|
120
|
+
*
|
|
121
|
+
* These flags mean the model *supports* a task — they are NOT a
|
|
122
|
+
* precision-independent quality SLA. A flag is true at the model level even
|
|
123
|
+
* when quality is profile/precision-dependent (e.g. `sql` quality regresses
|
|
124
|
+
* under FP8; route SQL-critical traffic to a BF16 bundle via the `sql` alias).
|
|
125
|
+
*/
|
|
126
|
+
interface ModelCapabilities {
|
|
127
|
+
/** Supported grammar kinds: ["json_schema", "regex", "ebnf"] */
|
|
128
|
+
grammar?: string[];
|
|
129
|
+
/** Whether the model supports tool / function calling */
|
|
130
|
+
tools?: boolean;
|
|
131
|
+
/** Union of LoRA served-names across profiles (display summary) */
|
|
132
|
+
lora_adapters?: string[];
|
|
133
|
+
/** Per-profile LoRA served-names, keyed by profile name */
|
|
134
|
+
profile_lora_adapters?: Record<string, string[]>;
|
|
135
|
+
/** Validated for code generation; backs model="code" */
|
|
136
|
+
code?: boolean;
|
|
137
|
+
/** Supports text-to-SQL; backs model="sql". Precision-sensitive (FP8 regresses SQL) — a support flag, not a per-profile quality guarantee. */
|
|
138
|
+
sql?: boolean;
|
|
139
|
+
/** Generative guard model; backs model="guard" */
|
|
140
|
+
guard?: boolean;
|
|
141
|
+
}
|
|
111
142
|
/**
|
|
112
143
|
* Information about a model returned by listModels().
|
|
113
144
|
*/
|
|
@@ -124,6 +155,8 @@ interface ModelInfo {
|
|
|
124
155
|
dims?: ModelDims;
|
|
125
156
|
/** Maximum sequence length the model supports */
|
|
126
157
|
maxSequenceLength?: number;
|
|
158
|
+
/** Advertised model capabilities (grammar, tools, code/sql/guard, LoRA adapters) */
|
|
159
|
+
capabilities?: ModelCapabilities;
|
|
127
160
|
}
|
|
128
161
|
/**
|
|
129
162
|
* A single score entry from reranking.
|
|
@@ -1235,7 +1268,7 @@ declare class SIEClient {
|
|
|
1235
1268
|
private detectEndpointType;
|
|
1236
1269
|
}
|
|
1237
1270
|
|
|
1238
|
-
declare const SDK_VERSION = "0.4.2";
|
|
1271
|
+
declare const SDK_VERSION = "0.6.0";
|
|
1239
1272
|
|
|
1240
1273
|
/**
|
|
1241
1274
|
* Helpers for converting SIE encode results to plain JavaScript types.
|
|
@@ -1635,4 +1668,4 @@ declare function toImageWireFormat(input: ImageInput, format?: "jpeg" | "png" |
|
|
|
1635
1668
|
*/
|
|
1636
1669
|
declare function detectImageFormat(bytes: Uint8Array): "jpeg" | "png" | "webp" | "unknown";
|
|
1637
1670
|
|
|
1638
|
-
export { type CapacityInfo, type ChatChoice, type ChatChunkChoice, type ChatCompletion, type ChatCompletionChunk, type ChatCompletionRequest, type ChatDelta, type ChatFinishReason, type ChatMessage, type ChatUsage, type Classification, type ClusterStatusMessage, type ClusterSummary, type ClusterWorkerInfo, type DType, type DetectedObject, type EncodeOptions, type EncodeResult, type Entity, type ExtractOptions, type ExtractResult, type FinishReason, type GPUMetrics, type GenerateChunk, type GenerateOptions, type GenerateResult, type GenerationUsage, type ImageInput, type ImageWireFormat, InputTooLongError, type Item, LoraLoadingError, type ModelConfig, type ModelDims, type ModelInfo, ModelLoadFailedError, ModelLoadingError, type ModelState, type ModelStatus, type ModelSummary, type OutputType, PoolError, type PoolInfo, type PoolSpec, type PoolStatus, ProvisioningError, type Relation, RequestError, type ResponseFormat, SDK_VERSION, SIEClient, type SIEClientOptions, SIEConnectionError, SIEError, SIEStreamError, type ScoreEntry, type ScoreOptions, type ScoreResult, ServerError, type ServerInfo, type SparseResult, type SparseVector, type StatusMessage, type TimingInfo, type ToolCall, type ToolCallDelta, type ToolChoice, type ToolSpec, type WorkerInfo, type WorkerStatusMessage, denseEmbedding, detectImageFormat, multivectorEmbedding, normalizeSparseVector, packMessage, sparseEmbedding, sparseEmbeddingMap, toFloat32Array, toImageBytes, toImageWireFormat, toNumberArray, unpackMessage };
|
|
1671
|
+
export { type CapacityInfo, type ChatChoice, type ChatChunkChoice, type ChatCompletion, type ChatCompletionChunk, type ChatCompletionRequest, type ChatDelta, type ChatFinishReason, type ChatMessage, type ChatUsage, type Classification, type ClusterStatusMessage, type ClusterSummary, type ClusterWorkerInfo, type DType, type DetectedObject, type EncodeOptions, type EncodeResult, type Entity, type ExtractOptions, type ExtractResult, type FinishReason, type GPUMetrics, type GenerateChunk, type GenerateOptions, type GenerateResult, type GenerationUsage, type ImageInput, type ImageWireFormat, InputTooLongError, type Item, LoraLoadingError, type ModelCapabilities, type ModelConfig, type ModelDims, type ModelInfo, ModelLoadFailedError, ModelLoadingError, type ModelState, type ModelStatus, type ModelSummary, type OutputType, PoolError, type PoolInfo, type PoolSpec, type PoolStatus, ProvisioningError, type Relation, RequestError, type ResponseFormat, SDK_VERSION, SIEClient, type SIEClientOptions, SIEConnectionError, SIEError, SIEStreamError, type ScoreEntry, type ScoreOptions, type ScoreResult, ServerError, type ServerInfo, type SparseResult, type SparseVector, type StatusMessage, type TimingInfo, type ToolCall, type ToolCallDelta, type ToolChoice, type ToolSpec, type WorkerInfo, type WorkerStatusMessage, denseEmbedding, detectImageFormat, multivectorEmbedding, normalizeSparseVector, packMessage, sparseEmbedding, sparseEmbeddingMap, toFloat32Array, toImageBytes, toImageWireFormat, toNumberArray, unpackMessage };
|
package/dist/index.d.ts
CHANGED
|
@@ -108,6 +108,37 @@ interface ModelDims {
|
|
|
108
108
|
sparse?: number;
|
|
109
109
|
multivector?: number;
|
|
110
110
|
}
|
|
111
|
+
/**
|
|
112
|
+
* Advertised model capabilities.
|
|
113
|
+
*
|
|
114
|
+
* Mirrors the gateway `capabilities` object on each `/v1/models` entry
|
|
115
|
+
* (`ModelCapabilitiesWire`). All fields are optional; their presence
|
|
116
|
+
* depends on what the model config declares. `grammar` lists the
|
|
117
|
+
* supported grammar kinds ("json_schema" | "regex" | "ebnf").
|
|
118
|
+
* `code`/`sql`/`guard` are informational flags advertising validated
|
|
119
|
+
* generation jobs that back the model="code"/"sql"/"guard" aliases.
|
|
120
|
+
*
|
|
121
|
+
* These flags mean the model *supports* a task — they are NOT a
|
|
122
|
+
* precision-independent quality SLA. A flag is true at the model level even
|
|
123
|
+
* when quality is profile/precision-dependent (e.g. `sql` quality regresses
|
|
124
|
+
* under FP8; route SQL-critical traffic to a BF16 bundle via the `sql` alias).
|
|
125
|
+
*/
|
|
126
|
+
interface ModelCapabilities {
|
|
127
|
+
/** Supported grammar kinds: ["json_schema", "regex", "ebnf"] */
|
|
128
|
+
grammar?: string[];
|
|
129
|
+
/** Whether the model supports tool / function calling */
|
|
130
|
+
tools?: boolean;
|
|
131
|
+
/** Union of LoRA served-names across profiles (display summary) */
|
|
132
|
+
lora_adapters?: string[];
|
|
133
|
+
/** Per-profile LoRA served-names, keyed by profile name */
|
|
134
|
+
profile_lora_adapters?: Record<string, string[]>;
|
|
135
|
+
/** Validated for code generation; backs model="code" */
|
|
136
|
+
code?: boolean;
|
|
137
|
+
/** Supports text-to-SQL; backs model="sql". Precision-sensitive (FP8 regresses SQL) — a support flag, not a per-profile quality guarantee. */
|
|
138
|
+
sql?: boolean;
|
|
139
|
+
/** Generative guard model; backs model="guard" */
|
|
140
|
+
guard?: boolean;
|
|
141
|
+
}
|
|
111
142
|
/**
|
|
112
143
|
* Information about a model returned by listModels().
|
|
113
144
|
*/
|
|
@@ -124,6 +155,8 @@ interface ModelInfo {
|
|
|
124
155
|
dims?: ModelDims;
|
|
125
156
|
/** Maximum sequence length the model supports */
|
|
126
157
|
maxSequenceLength?: number;
|
|
158
|
+
/** Advertised model capabilities (grammar, tools, code/sql/guard, LoRA adapters) */
|
|
159
|
+
capabilities?: ModelCapabilities;
|
|
127
160
|
}
|
|
128
161
|
/**
|
|
129
162
|
* A single score entry from reranking.
|
|
@@ -1235,7 +1268,7 @@ declare class SIEClient {
|
|
|
1235
1268
|
private detectEndpointType;
|
|
1236
1269
|
}
|
|
1237
1270
|
|
|
1238
|
-
declare const SDK_VERSION = "0.4.2";
|
|
1271
|
+
declare const SDK_VERSION = "0.6.0";
|
|
1239
1272
|
|
|
1240
1273
|
/**
|
|
1241
1274
|
* Helpers for converting SIE encode results to plain JavaScript types.
|
|
@@ -1635,4 +1668,4 @@ declare function toImageWireFormat(input: ImageInput, format?: "jpeg" | "png" |
|
|
|
1635
1668
|
*/
|
|
1636
1669
|
declare function detectImageFormat(bytes: Uint8Array): "jpeg" | "png" | "webp" | "unknown";
|
|
1637
1670
|
|
|
1638
|
-
export { type CapacityInfo, type ChatChoice, type ChatChunkChoice, type ChatCompletion, type ChatCompletionChunk, type ChatCompletionRequest, type ChatDelta, type ChatFinishReason, type ChatMessage, type ChatUsage, type Classification, type ClusterStatusMessage, type ClusterSummary, type ClusterWorkerInfo, type DType, type DetectedObject, type EncodeOptions, type EncodeResult, type Entity, type ExtractOptions, type ExtractResult, type FinishReason, type GPUMetrics, type GenerateChunk, type GenerateOptions, type GenerateResult, type GenerationUsage, type ImageInput, type ImageWireFormat, InputTooLongError, type Item, LoraLoadingError, type ModelConfig, type ModelDims, type ModelInfo, ModelLoadFailedError, ModelLoadingError, type ModelState, type ModelStatus, type ModelSummary, type OutputType, PoolError, type PoolInfo, type PoolSpec, type PoolStatus, ProvisioningError, type Relation, RequestError, type ResponseFormat, SDK_VERSION, SIEClient, type SIEClientOptions, SIEConnectionError, SIEError, SIEStreamError, type ScoreEntry, type ScoreOptions, type ScoreResult, ServerError, type ServerInfo, type SparseResult, type SparseVector, type StatusMessage, type TimingInfo, type ToolCall, type ToolCallDelta, type ToolChoice, type ToolSpec, type WorkerInfo, type WorkerStatusMessage, denseEmbedding, detectImageFormat, multivectorEmbedding, normalizeSparseVector, packMessage, sparseEmbedding, sparseEmbeddingMap, toFloat32Array, toImageBytes, toImageWireFormat, toNumberArray, unpackMessage };
|
|
1671
|
+
export { type CapacityInfo, type ChatChoice, type ChatChunkChoice, type ChatCompletion, type ChatCompletionChunk, type ChatCompletionRequest, type ChatDelta, type ChatFinishReason, type ChatMessage, type ChatUsage, type Classification, type ClusterStatusMessage, type ClusterSummary, type ClusterWorkerInfo, type DType, type DetectedObject, type EncodeOptions, type EncodeResult, type Entity, type ExtractOptions, type ExtractResult, type FinishReason, type GPUMetrics, type GenerateChunk, type GenerateOptions, type GenerateResult, type GenerationUsage, type ImageInput, type ImageWireFormat, InputTooLongError, type Item, LoraLoadingError, type ModelCapabilities, type ModelConfig, type ModelDims, type ModelInfo, ModelLoadFailedError, ModelLoadingError, type ModelState, type ModelStatus, type ModelSummary, type OutputType, PoolError, type PoolInfo, type PoolSpec, type PoolStatus, ProvisioningError, type Relation, RequestError, type ResponseFormat, SDK_VERSION, SIEClient, type SIEClientOptions, SIEConnectionError, SIEError, SIEStreamError, type ScoreEntry, type ScoreOptions, type ScoreResult, ServerError, type ServerInfo, type SparseResult, type SparseVector, type StatusMessage, type TimingInfo, type ToolCall, type ToolCallDelta, type ToolChoice, type ToolSpec, type WorkerInfo, type WorkerStatusMessage, denseEmbedding, detectImageFormat, multivectorEmbedding, normalizeSparseVector, packMessage, sparseEmbedding, sparseEmbeddingMap, toFloat32Array, toImageBytes, toImageWireFormat, toNumberArray, unpackMessage };
|