node-llama-cpp 2.8.0 → 3.0.0-beta.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/dist/chatWrappers/generateContextTextFromConversationHistory.d.ts +0 -8
- package/dist/chatWrappers/generateContextTextFromConversationHistory.js +0 -8
- package/dist/chatWrappers/generateContextTextFromConversationHistory.js.map +1 -1
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +13 -0
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +49 -0
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +1 -0
- package/dist/cli/cli.js +1 -1
- package/dist/cli/cli.js.map +1 -1
- package/dist/cli/commands/ChatCommand.js +20 -10
- package/dist/cli/commands/ChatCommand.js.map +1 -1
- package/dist/index.d.ts +6 -4
- package/dist/index.js +5 -4
- package/dist/index.js.map +1 -1
- package/dist/llamaEvaluator/LlamaBins.d.ts +19 -4
- package/dist/llamaEvaluator/LlamaBins.js +3 -3
- package/dist/llamaEvaluator/LlamaChatSession.d.ts +24 -23
- package/dist/llamaEvaluator/LlamaChatSession.js +90 -36
- package/dist/llamaEvaluator/LlamaChatSession.js.map +1 -1
- package/dist/llamaEvaluator/LlamaContext/LlamaContext.d.ts +112 -0
- package/dist/llamaEvaluator/LlamaContext/LlamaContext.js +640 -0
- package/dist/llamaEvaluator/LlamaContext/LlamaContext.js.map +1 -0
- package/dist/llamaEvaluator/LlamaContext/types.d.ts +90 -0
- package/dist/llamaEvaluator/LlamaContext/types.js +2 -0
- package/dist/llamaEvaluator/LlamaContext/types.js.map +1 -0
- package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.d.ts +5 -0
- package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js +16 -0
- package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +1 -0
- package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.d.ts +5 -0
- package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js +42 -0
- package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +1 -0
- package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +2 -0
- package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js +13 -0
- package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +1 -0
- package/dist/llamaEvaluator/LlamaGrammar.d.ts +5 -5
- package/dist/llamaEvaluator/LlamaGrammar.js +7 -7
- package/dist/llamaEvaluator/LlamaGrammarEvaluationState.d.ts +6 -5
- package/dist/llamaEvaluator/LlamaGrammarEvaluationState.js +8 -7
- package/dist/llamaEvaluator/LlamaGrammarEvaluationState.js.map +1 -1
- package/dist/llamaEvaluator/LlamaModel.d.ts +93 -112
- package/dist/llamaEvaluator/LlamaModel.js +294 -59
- package/dist/llamaEvaluator/LlamaModel.js.map +1 -1
- package/dist/types.d.ts +3 -1
- package/dist/utils/ReplHistory.js +1 -1
- package/dist/utils/ReplHistory.js.map +1 -1
- package/dist/utils/getBin.d.ts +71 -39
- package/dist/utils/getBin.js.map +1 -1
- package/dist/utils/getReleaseInfo.d.ts +1 -1
- package/dist/utils/getReleaseInfo.js.map +1 -1
- package/dist/utils/parseModelFileName.d.ts +9 -0
- package/dist/utils/parseModelFileName.js +68 -0
- package/dist/utils/parseModelFileName.js.map +1 -0
- package/dist/utils/parseModelTypeDescription.d.ts +6 -0
- package/dist/utils/parseModelTypeDescription.js +9 -0
- package/dist/utils/parseModelTypeDescription.js.map +1 -0
- package/llama/.clang-format +10 -9
- package/llama/addon.cpp +689 -356
- package/llama/binariesGithubRelease.json +1 -1
- package/llama/gitRelease.bundle +0 -0
- package/llama/grammars/README.md +2 -2
- package/llamaBins/linux-arm64/llama-addon.node +0 -0
- package/llamaBins/linux-armv7l/llama-addon.node +0 -0
- package/llamaBins/linux-x64/llama-addon.node +0 -0
- package/llamaBins/mac-arm64/ggml-metal.metal +107 -1
- package/llamaBins/mac-arm64/llama-addon.node +0 -0
- package/llamaBins/mac-x64/ggml-metal.metal +107 -1
- package/llamaBins/mac-x64/llama-addon.node +0 -0
- package/llamaBins/win-x64/llama-addon.exp +0 -0
- package/llamaBins/win-x64/llama-addon.lib +0 -0
- package/llamaBins/win-x64/llama-addon.node +0 -0
- package/package.json +13 -7
- package/dist/chatWrappers/createChatWrapperByBos.d.ts +0 -2
- package/dist/chatWrappers/createChatWrapperByBos.js +0 -14
- package/dist/chatWrappers/createChatWrapperByBos.js.map +0 -1
- package/dist/llamaEvaluator/LlamaContext.d.ts +0 -100
- package/dist/llamaEvaluator/LlamaContext.js +0 -141
- package/dist/llamaEvaluator/LlamaContext.js.map +0 -1
- package/dist/utils/withLock.d.ts +0 -1
- package/dist/utils/withLock.js +0 -19
- package/dist/utils/withLock.js.map +0 -1
|
@@ -1,76 +1,311 @@
|
|
|
1
1
|
import process from "process";
|
|
2
2
|
import path from "path";
|
|
3
|
+
import { DisposedError, EventRelay } from "lifecycle-utils";
|
|
3
4
|
import { removeNullFields } from "../utils/removeNullFields.js";
|
|
4
|
-
import {
|
|
5
|
+
import { addonBinding, AddonModel } from "./LlamaBins.js";
|
|
5
6
|
export class LlamaModel {
|
|
6
|
-
/** @internal */
|
|
7
|
-
|
|
8
|
-
/** @internal */
|
|
9
|
-
|
|
10
|
-
/** @internal */
|
|
11
|
-
|
|
7
|
+
/** @internal */ _model;
|
|
8
|
+
/** @internal */ _tokens;
|
|
9
|
+
/** @internal */ _filename;
|
|
10
|
+
/** @internal */ _disposedState = { disposed: false };
|
|
11
|
+
/** @internal */ _typeDescription;
|
|
12
|
+
/** @internal */ _trainContextSize;
|
|
13
|
+
onDispose = new EventRelay();
|
|
12
14
|
/**
|
|
13
15
|
* > options source:
|
|
14
16
|
* > [github:ggerganov/llama.cpp/llama.h](
|
|
15
|
-
* > https://github.com/ggerganov/llama.cpp/blob/
|
|
16
|
-
* @param
|
|
17
|
-
* @param
|
|
18
|
-
* @param
|
|
19
|
-
* @param
|
|
20
|
-
* @param
|
|
21
|
-
* @param
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
* A higher temperature (e.g., 1.5) makes the output more random and creative,
|
|
26
|
-
* while a lower temperature (e.g., 0.5) makes the output more focused, deterministic, and conservative.
|
|
27
|
-
* The suggested temperature is 0.8, which provides a balance between randomness and determinism.
|
|
28
|
-
* At the extreme, a temperature of 0 will always pick the most likely next token, leading to identical outputs in each run.
|
|
29
|
-
*
|
|
30
|
-
* Set to `0` to disable.
|
|
31
|
-
* @param {number} [options.topK] - Limits the model to consider only the K most likely next tokens for sampling at each step of
|
|
32
|
-
* sequence generation.
|
|
33
|
-
* An integer number between `1` and the size of the vocabulary.
|
|
34
|
-
* Set to `0` to disable (which uses the full vocabulary).
|
|
35
|
-
*
|
|
36
|
-
* Only relevant when `temperature` is set to a value greater than 0.
|
|
37
|
-
* @param {number} [options.topP] - Dynamically selects the smallest set of tokens whose cumulative probability exceeds the threshold P,
|
|
38
|
-
* and samples the next token only from this set.
|
|
39
|
-
* A float number between `0` and `1`.
|
|
40
|
-
* Set to `1` to disable.
|
|
41
|
-
*
|
|
42
|
-
* Only relevant when `temperature` is set to a value greater than `0`.
|
|
43
|
-
* @param {boolean} [options.f16Kv] - use fp16 for KV cache
|
|
44
|
-
* @param {boolean} [options.logitsAll] - the llama_eval() call computes all logits, not just the last one
|
|
45
|
-
* @param {boolean} [options.vocabOnly] - only load the vocabulary, no weights
|
|
46
|
-
* @param {boolean} [options.useMmap] - use mmap if possible
|
|
47
|
-
* @param {boolean} [options.useMlock] - force system to keep model in RAM
|
|
48
|
-
* @param {boolean} [options.embedding] - embedding mode only
|
|
49
|
-
*/
|
|
50
|
-
constructor({ modelPath, seed = null, contextSize = 1024 * 4, batchSize, gpuLayers, threads = 6, temperature = 0, topK = 40, topP = 0.95, f16Kv, logitsAll, vocabOnly, useMmap, useMlock, embedding }) {
|
|
51
|
-
this._model = new LLAMAModel(path.resolve(process.cwd(), modelPath), removeNullFields({
|
|
17
|
+
* > https://github.com/ggerganov/llama.cpp/blob/05816027d649f977468fc804cdb54e99eac246d1/llama.h#L161) (`struct llama_model_params`)
|
|
18
|
+
* @param options
|
|
19
|
+
* @param options.modelPath - path to the model on the filesystem
|
|
20
|
+
* @param [options.gpuLayers] - number of layers to store in VRAM
|
|
21
|
+
* @param [options.vocabOnly] - only load the vocabulary, no weights
|
|
22
|
+
* @param [options.useMmap] - use mmap if possible
|
|
23
|
+
* @param [options.useMlock] - force system to keep model in RAM
|
|
24
|
+
*/
|
|
25
|
+
constructor({ modelPath, gpuLayers, vocabOnly, useMmap, useMlock }) {
|
|
26
|
+
this._model = new AddonModel(path.resolve(process.cwd(), modelPath), removeNullFields({
|
|
52
27
|
gpuLayers,
|
|
53
28
|
vocabOnly,
|
|
54
29
|
useMmap,
|
|
55
30
|
useMlock
|
|
56
31
|
}));
|
|
57
|
-
this.
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
32
|
+
this._tokens = LlamaModelTokens._create(this._model, this._disposedState);
|
|
33
|
+
this._filename = path.basename(modelPath);
|
|
34
|
+
}
|
|
35
|
+
dispose() {
|
|
36
|
+
if (this._disposedState.disposed)
|
|
37
|
+
return;
|
|
38
|
+
this.onDispose.dispatchEvent();
|
|
39
|
+
this._model.dispose();
|
|
40
|
+
this._disposedState.disposed = true;
|
|
41
|
+
}
|
|
42
|
+
/** @hidden */
|
|
43
|
+
[Symbol.dispose]() {
|
|
44
|
+
this.dispose();
|
|
45
|
+
}
|
|
46
|
+
get disposed() {
|
|
47
|
+
return this._disposedState.disposed;
|
|
48
|
+
}
|
|
49
|
+
get tokens() {
|
|
50
|
+
return this._tokens;
|
|
51
|
+
}
|
|
52
|
+
get filename() {
|
|
53
|
+
return this._filename;
|
|
54
|
+
}
|
|
55
|
+
/** Transform text into tokens that can be fed to the model */
|
|
56
|
+
tokenize(text) {
|
|
57
|
+
this._ensureNotDisposed();
|
|
58
|
+
if (text === "")
|
|
59
|
+
return [];
|
|
60
|
+
return Array.from(this._model.tokenize(text));
|
|
61
|
+
}
|
|
62
|
+
/** Transform tokens into text */
|
|
63
|
+
detokenize(tokens) {
|
|
64
|
+
this._ensureNotDisposed();
|
|
65
|
+
if (tokens.length === 0)
|
|
66
|
+
return "";
|
|
67
|
+
return this._model.detokenize(Uint32Array.from(tokens));
|
|
68
|
+
}
|
|
69
|
+
/** @hidden `ModelTypeDescription` type alias is too long in the documentation */
|
|
70
|
+
get typeDescription() {
|
|
71
|
+
this._ensureNotDisposed();
|
|
72
|
+
if (this._typeDescription == null)
|
|
73
|
+
this._typeDescription = this._model.getModelDescription();
|
|
74
|
+
return this._typeDescription;
|
|
75
|
+
}
|
|
76
|
+
/** The context size the model was trained on */
|
|
77
|
+
get trainContextSize() {
|
|
78
|
+
this._ensureNotDisposed();
|
|
79
|
+
if (this._trainContextSize == null)
|
|
80
|
+
this._trainContextSize = this._model.getTrainContextSize();
|
|
81
|
+
return this._trainContextSize;
|
|
82
|
+
}
|
|
83
|
+
/** @internal */
|
|
84
|
+
_ensureNotDisposed() {
|
|
85
|
+
if (this._disposedState.disposed)
|
|
86
|
+
throw new DisposedError();
|
|
71
87
|
}
|
|
72
88
|
static get systemInfo() {
|
|
73
|
-
return
|
|
89
|
+
return addonBinding.systemInfo();
|
|
90
|
+
}
|
|
91
|
+
}
|
|
92
|
+
export class LlamaModelTokens {
|
|
93
|
+
/** @internal */ _model;
|
|
94
|
+
/** @internal */ _disposedState;
|
|
95
|
+
/** @internal */ _infillTokens;
|
|
96
|
+
/** @internal */ _bosToken;
|
|
97
|
+
/** @internal */ _eosToken;
|
|
98
|
+
/** @internal */ _nlToken;
|
|
99
|
+
/** @internal */ _bosString;
|
|
100
|
+
/** @internal */ _eosString;
|
|
101
|
+
/** @internal */ _nlString;
|
|
102
|
+
constructor(model, disposedState) {
|
|
103
|
+
this._model = model;
|
|
104
|
+
this._disposedState = disposedState;
|
|
105
|
+
}
|
|
106
|
+
/**
|
|
107
|
+
* @returns infill tokens
|
|
108
|
+
*/
|
|
109
|
+
get infill() {
|
|
110
|
+
this._ensureNotDisposed();
|
|
111
|
+
if (this._infillTokens == null)
|
|
112
|
+
this._infillTokens = LlamaModelInfillTokens._create(this._model, this._disposedState);
|
|
113
|
+
return this._infillTokens;
|
|
114
|
+
}
|
|
115
|
+
/**
|
|
116
|
+
* @returns The BOS (Beginning Of Sequence) token.
|
|
117
|
+
*/
|
|
118
|
+
get bos() {
|
|
119
|
+
this._ensureNotDisposed();
|
|
120
|
+
if (this._bosToken == null)
|
|
121
|
+
this._bosToken = this._model.tokenBos();
|
|
122
|
+
if (this._bosToken === -1)
|
|
123
|
+
return null;
|
|
124
|
+
return this._bosToken;
|
|
125
|
+
}
|
|
126
|
+
/**
|
|
127
|
+
* @returns The EOS (End Of Sequence) token.
|
|
128
|
+
*/
|
|
129
|
+
get eos() {
|
|
130
|
+
this._ensureNotDisposed();
|
|
131
|
+
if (this._eosToken == null)
|
|
132
|
+
this._eosToken = this._model.tokenEos();
|
|
133
|
+
if (this._eosToken === -1)
|
|
134
|
+
return null;
|
|
135
|
+
return this._eosToken;
|
|
136
|
+
}
|
|
137
|
+
/**
|
|
138
|
+
* @returns The NL (New Line) token.
|
|
139
|
+
*/
|
|
140
|
+
get nl() {
|
|
141
|
+
this._ensureNotDisposed();
|
|
142
|
+
if (this._nlToken == null)
|
|
143
|
+
this._nlToken = this._model.tokenNl();
|
|
144
|
+
if (this._nlToken === -1)
|
|
145
|
+
return null;
|
|
146
|
+
return this._nlToken;
|
|
147
|
+
}
|
|
148
|
+
/**
|
|
149
|
+
* @returns The BOS (Beginning Of Sequence) token as a string.
|
|
150
|
+
*/
|
|
151
|
+
get bosString() {
|
|
152
|
+
this._ensureNotDisposed();
|
|
153
|
+
const bosToken = this.bos;
|
|
154
|
+
if (bosToken == null)
|
|
155
|
+
return null;
|
|
156
|
+
if (this._bosString == null)
|
|
157
|
+
this._bosString = this._model.getTokenString(bosToken);
|
|
158
|
+
return this._bosString;
|
|
159
|
+
}
|
|
160
|
+
/**
|
|
161
|
+
* @returns The EOS (End Of Sequence) token as a string.
|
|
162
|
+
*/
|
|
163
|
+
get eosString() {
|
|
164
|
+
this._ensureNotDisposed();
|
|
165
|
+
const eosToken = this.eos;
|
|
166
|
+
if (eosToken == null)
|
|
167
|
+
return null;
|
|
168
|
+
if (this._eosString == null)
|
|
169
|
+
this._eosString = this._model.getTokenString(eosToken);
|
|
170
|
+
return this._eosString;
|
|
171
|
+
}
|
|
172
|
+
/**
|
|
173
|
+
* @returns The NL (New Line) token as a string.
|
|
174
|
+
*/
|
|
175
|
+
get nlString() {
|
|
176
|
+
this._ensureNotDisposed();
|
|
177
|
+
const nlToken = this.nl;
|
|
178
|
+
if (nlToken == null)
|
|
179
|
+
return null;
|
|
180
|
+
if (this._nlString == null)
|
|
181
|
+
this._nlString = this._model.getTokenString(nlToken);
|
|
182
|
+
return this._nlString;
|
|
183
|
+
}
|
|
184
|
+
/** @internal */
|
|
185
|
+
_ensureNotDisposed() {
|
|
186
|
+
if (this._disposedState.disposed)
|
|
187
|
+
throw new DisposedError();
|
|
188
|
+
}
|
|
189
|
+
/** @internal */
|
|
190
|
+
static _create(model, disposedState) {
|
|
191
|
+
return new LlamaModelTokens(model, disposedState);
|
|
192
|
+
}
|
|
193
|
+
}
|
|
194
|
+
export class LlamaModelInfillTokens {
|
|
195
|
+
/** @internal */ _model;
|
|
196
|
+
/** @internal */ _disposedState;
|
|
197
|
+
/** @internal */ _prefixToken;
|
|
198
|
+
/** @internal */ _middleToken;
|
|
199
|
+
/** @internal */ _suffixToken;
|
|
200
|
+
/** @internal */ _eotToken;
|
|
201
|
+
/** @internal */ _prefixString;
|
|
202
|
+
/** @internal */ _middleString;
|
|
203
|
+
/** @internal */ _suffixString;
|
|
204
|
+
/** @internal */ _eotString;
|
|
205
|
+
constructor(model, disposedState) {
|
|
206
|
+
this._model = model;
|
|
207
|
+
this._disposedState = disposedState;
|
|
208
|
+
}
|
|
209
|
+
/**
|
|
210
|
+
* @returns The beginning of infill prefix token.
|
|
211
|
+
*/
|
|
212
|
+
get prefix() {
|
|
213
|
+
this._ensureNotDisposed();
|
|
214
|
+
if (this._prefixToken == null)
|
|
215
|
+
this._prefixToken = this._model.prefixToken();
|
|
216
|
+
if (this._prefixToken === -1)
|
|
217
|
+
return null;
|
|
218
|
+
return this._prefixToken;
|
|
219
|
+
}
|
|
220
|
+
/**
|
|
221
|
+
* @returns The beginning of infill middle token.
|
|
222
|
+
*/
|
|
223
|
+
get middle() {
|
|
224
|
+
this._ensureNotDisposed();
|
|
225
|
+
if (this._middleToken == null)
|
|
226
|
+
this._middleToken = this._model.middleToken();
|
|
227
|
+
if (this._middleToken === -1)
|
|
228
|
+
return null;
|
|
229
|
+
return this._middleToken;
|
|
230
|
+
}
|
|
231
|
+
/**
|
|
232
|
+
* @returns The beginning of infill suffix token.
|
|
233
|
+
*/
|
|
234
|
+
get suffix() {
|
|
235
|
+
this._ensureNotDisposed();
|
|
236
|
+
if (this._suffixToken == null)
|
|
237
|
+
this._suffixToken = this._model.suffixToken();
|
|
238
|
+
if (this._suffixToken === -1)
|
|
239
|
+
return null;
|
|
240
|
+
return this._suffixToken;
|
|
241
|
+
}
|
|
242
|
+
/**
|
|
243
|
+
* @returns End of infill middle token (End Of Text).
|
|
244
|
+
*/
|
|
245
|
+
get eot() {
|
|
246
|
+
this._ensureNotDisposed();
|
|
247
|
+
if (this._eotToken == null)
|
|
248
|
+
this._eotToken = this._model.eotToken();
|
|
249
|
+
if (this._eotToken === -1)
|
|
250
|
+
return null;
|
|
251
|
+
return this._eotToken;
|
|
252
|
+
}
|
|
253
|
+
/**
|
|
254
|
+
* @returns The beginning of infill prefix token as a string.
|
|
255
|
+
*/
|
|
256
|
+
get prefixString() {
|
|
257
|
+
this._ensureNotDisposed();
|
|
258
|
+
const prefixToken = this.prefix;
|
|
259
|
+
if (prefixToken == null)
|
|
260
|
+
return null;
|
|
261
|
+
if (this._prefixString == null)
|
|
262
|
+
this._prefixString = this._model.getTokenString(prefixToken);
|
|
263
|
+
return this._prefixString;
|
|
264
|
+
}
|
|
265
|
+
/**
|
|
266
|
+
* @returns The beginning of infill middle token as a string.
|
|
267
|
+
*/
|
|
268
|
+
get middleString() {
|
|
269
|
+
this._ensureNotDisposed();
|
|
270
|
+
const middleToken = this.middle;
|
|
271
|
+
if (middleToken == null)
|
|
272
|
+
return null;
|
|
273
|
+
if (this._middleString == null)
|
|
274
|
+
this._middleString = this._model.getTokenString(middleToken);
|
|
275
|
+
return this._middleString;
|
|
276
|
+
}
|
|
277
|
+
/**
|
|
278
|
+
* @returns The beginning of infill suffix token as a string.
|
|
279
|
+
*/
|
|
280
|
+
get suffixString() {
|
|
281
|
+
this._ensureNotDisposed();
|
|
282
|
+
const suffixToken = this.suffix;
|
|
283
|
+
if (suffixToken == null)
|
|
284
|
+
return null;
|
|
285
|
+
if (this._suffixString == null)
|
|
286
|
+
this._suffixString = this._model.getTokenString(suffixToken);
|
|
287
|
+
return this._suffixString;
|
|
288
|
+
}
|
|
289
|
+
/**
|
|
290
|
+
* @returns End of infill middle token (End Of Text) as a string.
|
|
291
|
+
*/
|
|
292
|
+
get eotString() {
|
|
293
|
+
this._ensureNotDisposed();
|
|
294
|
+
const eotToken = this.eot;
|
|
295
|
+
if (eotToken == null)
|
|
296
|
+
return null;
|
|
297
|
+
if (this._eotString == null)
|
|
298
|
+
this._eotString = this._model.getTokenString(eotToken);
|
|
299
|
+
return this._eotString;
|
|
300
|
+
}
|
|
301
|
+
/** @internal */
|
|
302
|
+
_ensureNotDisposed() {
|
|
303
|
+
if (this._disposedState.disposed)
|
|
304
|
+
throw new DisposedError();
|
|
305
|
+
}
|
|
306
|
+
/** @internal */
|
|
307
|
+
static _create(model, disposedState) {
|
|
308
|
+
return new LlamaModelInfillTokens(model, disposedState);
|
|
74
309
|
}
|
|
75
310
|
}
|
|
76
311
|
//# sourceMappingURL=LlamaModel.js.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"LlamaModel.js","sourceRoot":"","sources":["../../src/llamaEvaluator/LlamaModel.ts"],"names":[],"mappings":"AAAA,OAAO,OAAO,MAAM,SAAS,CAAC;AAC9B,OAAO,IAAI,MAAM,MAAM,CAAC;AACxB,OAAO,EAAC,gBAAgB,EAAC,MAAM,8BAA8B,CAAC;
|
|
1
|
+
{"version":3,"file":"LlamaModel.js","sourceRoot":"","sources":["../../src/llamaEvaluator/LlamaModel.ts"],"names":[],"mappings":"AAAA,OAAO,OAAO,MAAM,SAAS,CAAC;AAC9B,OAAO,IAAI,MAAM,MAAM,CAAC;AACxB,OAAO,EAAC,aAAa,EAAE,UAAU,EAAC,MAAM,iBAAiB,CAAC;AAC1D,OAAO,EAAC,gBAAgB,EAAC,MAAM,8BAA8B,CAAC;AAG9D,OAAO,EAAC,YAAY,EAAE,UAAU,EAAC,MAAM,gBAAgB,CAAC;AAoBxD,MAAM,OAAO,UAAU;IACnB,gBAAgB,CAAiB,MAAM,CAAa;IACpD,gBAAgB,CAAkB,OAAO,CAAmB;IAC5D,gBAAgB,CAAkB,SAAS,CAAU;IACrD,gBAAgB,CAAkB,cAAc,GAAkB,EAAC,QAAQ,EAAE,KAAK,EAAC,CAAC;IACpF,gBAAgB,CAAS,gBAAgB,CAAwB;IACjE,gBAAgB,CAAS,iBAAiB,CAAU;IAEpC,SAAS,GAAG,IAAI,UAAU,EAAQ,CAAC;IAEnD;;;;;;;;;;OAUG;IACH,YAAmB,EACf,SAAS,EAAE,SAAS,EAAE,SAAS,EAAE,OAAO,EAAE,QAAQ,EAClC;QAChB,IAAI,CAAC,MAAM,GAAG,IAAI,UAAU,CAAC,IAAI,CAAC,OAAO,CAAC,OAAO,CAAC,GAAG,EAAE,EAAE,SAAS,CAAC,EAAE,gBAAgB,CAAC;YAClF,SAAS;YACT,SAAS;YACT,OAAO;YACP,QAAQ;SACX,CAAC,CAAC,CAAC;QACJ,IAAI,CAAC,OAAO,GAAG,gBAAgB,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,cAAc,CAAC,CAAC;QAC1E,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,CAAC;IAC9C,CAAC;IAEM,OAAO;QACV,IAAI,IAAI,CAAC,cAAc,CAAC,QAAQ;YAC5B,OAAO;QAEX,IAAI,CAAC,SAAS,CAAC,aAAa,EAAE,CAAC;QAC/B,IAAI,CAAC,MAAM,CAAC,OAAO,EAAE,CAAC;QACtB,IAAI,CAAC,cAAc,CAAC,QAAQ,GAAG,IAAI,CAAC;IACxC,CAAC;IAED,cAAc;IACP,CAAC,MAAM,CAAC,OAAO,CAAC;QACnB,IAAI,CAAC,OAAO,EAAE,CAAC;IACnB,CAAC;IAED,IAAW,QAAQ;QACf,OAAO,IAAI,CAAC,cAAc,CAAC,QAAQ,CAAC;IACxC,CAAC;IAED,IAAW,MAAM;QACb,OAAO,IAAI,CAAC,OAAO,CAAC;IACxB,CAAC;IAED,IAAW,QAAQ;QACf,OAAO,IAAI,CAAC,SAAS,CAAC;IAC1B,CAAC;IAED,8DAA8D;IACvD,QAAQ,CAAC,IAAY;QACxB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,KAAK,EAAE;YACX,OAAO,EAAE,CAAC;QAEd,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAY,CAAC;IAC7D,CAAC;IAED,iCAAiC;IAC1B,UAAU,CAAC,MAAwB;QACtC,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC;YACnB,OAAO,EAAE,CAAC;QAEd,OAAO,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,WAAW,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC,CAAC;IAC5D,CAAC;IAED,iFAAiF;IACjF,IAAW,eAAe;QACtB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,gBAAgB,IAAI,IA
AI;YAC7B,IAAI,CAAC,gBAAgB,GAAG,IAAI,CAAC,MAAM,CAAC,mBAAmB,EAAE,CAAC;QAE9D,OAAO,IAAI,CAAC,gBAAgB,CAAC;IACjC,CAAC;IAED,gDAAgD;IAChD,IAAW,gBAAgB;QACvB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,iBAAiB,IAAI,IAAI;YAC9B,IAAI,CAAC,iBAAiB,GAAG,IAAI,CAAC,MAAM,CAAC,mBAAmB,EAAE,CAAC;QAE/D,OAAO,IAAI,CAAC,iBAAiB,CAAC;IAClC,CAAC;IAED,gBAAgB;IACR,kBAAkB;QACtB,IAAI,IAAI,CAAC,cAAc,CAAC,QAAQ;YAC5B,MAAM,IAAI,aAAa,EAAE,CAAC;IAClC,CAAC;IAEM,MAAM,KAAK,UAAU;QACxB,OAAO,YAAY,CAAC,UAAU,EAAE,CAAC;IACrC,CAAC;CACJ;AAED,MAAM,OAAO,gBAAgB;IACzB,gBAAgB,CAAkB,MAAM,CAAa;IACrD,gBAAgB,CAAkB,cAAc,CAAgB;IAChE,gBAAgB,CAAS,aAAa,CAA0B;IAChE,gBAAgB,CAAS,SAAS,CAAS;IAC3C,gBAAgB,CAAS,SAAS,CAAS;IAC3C,gBAAgB,CAAS,QAAQ,CAAS;IAC1C,gBAAgB,CAAS,UAAU,CAAU;IAC7C,gBAAgB,CAAS,UAAU,CAAU;IAC7C,gBAAgB,CAAS,SAAS,CAAU;IAE5C,YAAoB,KAAiB,EAAE,aAA4B;QAC/D,IAAI,CAAC,MAAM,GAAG,KAAK,CAAC;QACpB,IAAI,CAAC,cAAc,GAAG,aAAa,CAAC;IACxC,CAAC;IAED;;OAEG;IACH,IAAW,MAAM;QACb,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,aAAa,IAAI,IAAI;YAC1B,IAAI,CAAC,aAAa,GAAG,sBAAsB,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,cAAc,CAAC,CAAC;QAE1F,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,IAAW,GAAG;QACV,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,SAAS,IAAI,IAAI;YACtB,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,EAAE,CAAC;QAE5C,IAAI,IAAI,CAAC,SAAS,KAAK,CAAC,CAAC;YACrB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,SAAS,CAAC;IAC1B,CAAC;IAED;;OAEG;IACH,IAAW,GAAG;QACV,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,SAAS,IAAI,IAAI;YACtB,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,EAAE,CAAC;QAE5C,IAAI,IAAI,CAAC,SAAS,KAAK,CAAC,CAAC;YACrB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,SAAS,CAAC;IAC1B,CAAC;IAED;;OAEG;IACH,IAAW,EAAE;QACT,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,QAAQ,IAAI,IAAI;YACrB,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,EAAE,CAAC;QAE1C,IAAI,IAAI,CAAC,QAAQ,KAAK,CAAC,CAAC;YACpB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,QAAQ,CAAC;IACzB,CAAC;IAED;;OAEG;IACH,IAAW,SAAS;QAChB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC;QAE1B,IA
AI,QAAQ,IAAI,IAAI;YAChB,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,UAAU,IAAI,IAAI;YACvB,IAAI,CAAC,UAAU,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,QAAQ,CAAC,CAAC;QAE3D,OAAO,IAAI,CAAC,UAAU,CAAC;IAC3B,CAAC;IAED;;OAEG;IACH,IAAW,SAAS;QAChB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC;QAE1B,IAAI,QAAQ,IAAI,IAAI;YAChB,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,UAAU,IAAI,IAAI;YACvB,IAAI,CAAC,UAAU,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,QAAQ,CAAC,CAAC;QAE3D,OAAO,IAAI,CAAC,UAAU,CAAC;IAC3B,CAAC;IAED;;OAEG;IACH,IAAW,QAAQ;QACf,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,OAAO,GAAG,IAAI,CAAC,EAAE,CAAC;QAExB,IAAI,OAAO,IAAI,IAAI;YACf,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,SAAS,IAAI,IAAI;YACtB,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,OAAO,CAAC,CAAC;QAEzD,OAAO,IAAI,CAAC,SAAS,CAAC;IAC1B,CAAC;IAED,gBAAgB;IACR,kBAAkB;QACtB,IAAI,IAAI,CAAC,cAAc,CAAC,QAAQ;YAC5B,MAAM,IAAI,aAAa,EAAE,CAAC;IAClC,CAAC;IAED,gBAAgB;IACT,MAAM,CAAC,OAAO,CAAC,KAAiB,EAAE,aAA4B;QACjE,OAAO,IAAI,gBAAgB,CAAC,KAAK,EAAE,aAAa,CAAC,CAAC;IACtD,CAAC;CACJ;AAED,MAAM,OAAO,sBAAsB;IAC/B,gBAAgB,CAAkB,MAAM,CAAa;IACrD,gBAAgB,CAAkB,cAAc,CAAgB;IAChE,gBAAgB,CAAS,YAAY,CAAS;IAC9C,gBAAgB,CAAS,YAAY,CAAS;IAC9C,gBAAgB,CAAS,YAAY,CAAS;IAC9C,gBAAgB,CAAS,SAAS,CAAS;IAC3C,gBAAgB,CAAS,aAAa,CAAU;IAChD,gBAAgB,CAAS,aAAa,CAAU;IAChD,gBAAgB,CAAS,aAAa,CAAU;IAChD,gBAAgB,CAAS,UAAU,CAAU;IAE7C,YAAoB,KAAiB,EAAE,aAA4B;QAC/D,IAAI,CAAC,MAAM,GAAG,KAAK,CAAC;QACpB,IAAI,CAAC,cAAc,GAAG,aAAa,CAAC;IACxC,CAAC;IAED;;OAEG;IACH,IAAW,MAAM;QACb,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,YAAY,IAAI,IAAI;YACzB,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,MAAM,CAAC,WAAW,EAAE,CAAC;QAElD,IAAI,IAAI,CAAC,YAAY,KAAK,CAAC,CAAC;YACxB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,YAAY,CAAC;IAC7B,CAAC;IAED;;OAEG;IACH,IAAW,MAAM;QACb,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,YAAY,IAAI,IAAI;YACzB,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,MAAM,CAAC,WAAW,EAAE,CAAC;QAElD,IAAI,IAAI,CAAC,YAAY,KAAK,CAAC,CAAC;YACxB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,YAAY,CAAC;IAC7B,CAAC;IAED;;OAEG;IACH,IAAW,MAAM;QACb,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1
B,IAAI,IAAI,CAAC,YAAY,IAAI,IAAI;YACzB,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,MAAM,CAAC,WAAW,EAAE,CAAC;QAElD,IAAI,IAAI,CAAC,YAAY,KAAK,CAAC,CAAC;YACxB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,YAAY,CAAC;IAC7B,CAAC;IAED;;OAEG;IACH,IAAW,GAAG;QACV,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,IAAI,IAAI,CAAC,SAAS,IAAI,IAAI;YACtB,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,EAAE,CAAC;QAE5C,IAAI,IAAI,CAAC,SAAS,KAAK,CAAC,CAAC;YACrB,OAAO,IAAI,CAAC;QAEhB,OAAO,IAAI,CAAC,SAAS,CAAC;IAC1B,CAAC;IAED;;OAEG;IACH,IAAW,YAAY;QACnB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,WAAW,GAAG,IAAI,CAAC,MAAM,CAAC;QAEhC,IAAI,WAAW,IAAI,IAAI;YACnB,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,aAAa,IAAI,IAAI;YAC1B,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,WAAW,CAAC,CAAC;QAEjE,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,IAAW,YAAY;QACnB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,WAAW,GAAG,IAAI,CAAC,MAAM,CAAC;QAEhC,IAAI,WAAW,IAAI,IAAI;YACnB,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,aAAa,IAAI,IAAI;YAC1B,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,WAAW,CAAC,CAAC;QAEjE,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,IAAW,YAAY;QACnB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,WAAW,GAAG,IAAI,CAAC,MAAM,CAAC;QAEhC,IAAI,WAAW,IAAI,IAAI;YACnB,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,aAAa,IAAI,IAAI;YAC1B,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,WAAW,CAAC,CAAC;QAEjE,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,IAAW,SAAS;QAChB,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAE1B,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC;QAE1B,IAAI,QAAQ,IAAI,IAAI;YAChB,OAAO,IAAI,CAAC;QAEhB,IAAI,IAAI,CAAC,UAAU,IAAI,IAAI;YACvB,IAAI,CAAC,UAAU,GAAG,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,QAAQ,CAAC,CAAC;QAE3D,OAAO,IAAI,CAAC,UAAU,CAAC;IAC3B,CAAC;IAED,gBAAgB;IACR,kBAAkB;QACtB,IAAI,IAAI,CAAC,cAAc,CAAC,QAAQ;YAC5B,MAAM,IAAI,aAAa,EAAE,CAAC;IAClC,CAAC;IAED,gBAAgB;IACT,MAAM,CAAC,OAAO,CAAC,KAAiB,EAAE,aAA4B;QACjE,OAAO,IAAI,sBAAsB,CAAC,KAAK,EAAE,aAAa,CAAC,CAAC;IAC5D,CAAC;CACJ"}
|
package/dist/types.d.ts
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"ReplHistory.js","sourceRoot":"","sources":["../../src/utils/ReplHistory.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,UAAU,CAAC;AAC1B,OAAO,EAAC,QAAQ,EAAC,MAAM,
|
|
1
|
+
{"version":3,"file":"ReplHistory.js","sourceRoot":"","sources":["../../src/utils/ReplHistory.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,UAAU,CAAC;AAC1B,OAAO,EAAC,QAAQ,EAAC,MAAM,iBAAiB,CAAC;AAMzC,MAAM,YAAY,GAAqB;IACnC,OAAO,EAAE,EAAE;CACd,CAAC;AAEF,MAAM,OAAO,WAAW;IACH,SAAS,CAAgB;IAClC,YAAY,CAAmB;IAEvC,YAAoB,QAAuB,EAAE,WAA6B;QACtE,IAAI,CAAC,SAAS,GAAG,QAAQ,CAAC;QAC1B,IAAI,CAAC,YAAY,GAAG,WAAW,CAAC;IACpC,CAAC;IAEM,KAAK,CAAC,GAAG,CAAC,IAAY;QACzB,IAAI,IAAI,CAAC,SAAS,IAAI,IAAI,EAAE;YACxB,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,iBAAiB,CAAC,IAAI,EAAE,IAAI,CAAC,YAAY,CAAC,CAAC;YACpE,OAAO;SACV;QAED,MAAM,QAAQ,CAAC,IAAI,EAAE,MAAM,EAAE,KAAK,IAAI,EAAE;YACpC,IAAI;gBACA,MAAM,IAAI,GAAG,iBAAiB,CAAC,MAAM,EAAE,CAAC,QAAQ,CAAC,IAAI,CAAC,SAAU,CAAC,CAAC,CAAC;gBACnE,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,iBAAiB,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;gBAEvD,MAAM,EAAE,CAAC,SAAS,CAAC,IAAI,CAAC,SAAU,EAAE,IAAI,CAAC,YAAY,EAAE;oBACnD,MAAM,EAAE,CAAC;iBACZ,CAAC,CAAC;aACN;YAAC,OAAO,GAAG,EAAE,GAAE;QACpB,CAAC,CAAC,CAAC;IACP,CAAC;IAED,IAAW,OAAO;QACd,OAAO,IAAI,CAAC,YAAY,CAAC,OAAO,CAAC;IACrC,CAAC;IAEO,iBAAiB,CAAC,IAAY,EAAE,WAA6B;QACjE,MAAM,UAAU,GAAG,WAAW,CAAC,OAAO,CAAC,KAAK,EAAE,CAAC;QAC/C,MAAM,gBAAgB,GAAG,UAAU,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;QAElD,IAAI,gBAAgB,KAAK,CAAC,CAAC;YACvB,UAAU,CAAC,MAAM,CAAC,gBAAgB,EAAE,CAAC,CAAC,CAAC;QAE3C,UAAU,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;QAEzB,OAAO;YACH,GAAG,WAAW;YACd,OAAO,EAAE,UAAU;SACtB,CAAC;IACN,CAAC;IAEM,MAAM,CAAC,KAAK,CAAC,IAAI,CAAC,QAAgB,EAAE,qBAA8B,IAAI;QACzE,IAAI,CAAC,kBAAkB;YACnB,OAAO,IAAI,WAAW,CAAC,IAAI,EAAE;gBACzB,OAAO,EAAE,EAAE;aACd,CAAC,CAAC;QAEP,IAAI;YACA,IAAI,CAAC,CAAC,MAAM,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC;gBAChC,MAAM,EAAE,CAAC,SAAS,CAAC,QAAQ,EAAE,YAAY,EAAE;oBACvC,MAAM,EAAE,CAAC;iBACZ,CAAC,CAAC;YAEP,MAAM,IAAI,GAAG,iBAAiB,CAAC,MAAM,EAAE,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC,CAAC;YAC5D,OAAO,IAAI,WAAW,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;SAC1C;QAAC,OAAO,GAAG,EAAE;YACV,OAAO,IAAI,WAAW,CAAC,IAAI,EAAE;gBACzB,OAAO,EAAE,EAAE;aACd,CAAC,CAAC;SACN;IACL,CAAC;CACJ;AAED,SAAS,iBAAiB,CAAC,IAAa;IACpC,IAAI,OAAO,IAAI,KAAK
,QAAQ,IAAI,IAAI,IAAI,IAAI,IAAI,CAAC,CAAC,SAAS,IAAI,IAAI,CAAC,IAAI,CAAC,CAAC,IAAI,CAAC,OAAO,YAAY,KAAK,CAAC,IAAI,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,OAAO,IAAI,KAAK,QAAQ,CAAC;QAC7J,MAAM,IAAI,KAAK,CAAC,2BAA2B,CAAC,CAAC;IAEjD,OAAO,IAAwB,CAAC;AACpC,CAAC"}
|
package/dist/utils/getBin.d.ts
CHANGED
|
@@ -1,32 +1,60 @@
|
|
|
1
|
+
import { Token } from "../types.js";
|
|
1
2
|
export declare function getPrebuildBinPath(): Promise<string | null>;
|
|
2
|
-
export declare function loadBin(): Promise<
|
|
3
|
-
export type
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
3
|
+
export declare function loadBin(): Promise<BindingModule>;
|
|
4
|
+
export type BindingModule = {
|
|
5
|
+
AddonModel: {
|
|
6
|
+
new (modelPath: string, params: {
|
|
7
|
+
gpuLayers?: number;
|
|
8
|
+
vocabOnly?: boolean;
|
|
9
|
+
useMmap?: boolean;
|
|
10
|
+
useMlock?: boolean;
|
|
11
|
+
}): AddonModel;
|
|
12
|
+
};
|
|
13
|
+
AddonContext: {
|
|
14
|
+
new (model: AddonModel, params: {
|
|
15
|
+
seed?: number;
|
|
16
|
+
contextSize?: number;
|
|
17
|
+
batchSize?: number;
|
|
18
|
+
f16Kv?: boolean;
|
|
19
|
+
logitsAll?: boolean;
|
|
20
|
+
embedding?: boolean;
|
|
21
|
+
threads?: number;
|
|
22
|
+
}): AddonContext;
|
|
23
|
+
};
|
|
24
|
+
AddonGrammar: {
|
|
25
|
+
new (grammarPath: string, params?: {
|
|
26
|
+
printGrammar?: boolean;
|
|
27
|
+
}): AddonGrammar;
|
|
28
|
+
};
|
|
29
|
+
AddonGrammarEvaluationState: {
|
|
30
|
+
new (grammar: AddonGrammar): AddonGrammarEvaluationState;
|
|
31
|
+
};
|
|
8
32
|
systemInfo(): string;
|
|
9
33
|
};
|
|
10
|
-
export type
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
34
|
+
export type AddonModel = {
|
|
35
|
+
dispose(): void;
|
|
36
|
+
tokenize(text: string): Uint32Array;
|
|
37
|
+
detokenize(tokens: Uint32Array): string;
|
|
38
|
+
getTrainContextSize(): number;
|
|
39
|
+
getTotalSize(): number;
|
|
40
|
+
getTotalParameters(): number;
|
|
41
|
+
getModelDescription(): ModelTypeDescription;
|
|
42
|
+
tokenBos(): Token;
|
|
43
|
+
tokenEos(): Token;
|
|
44
|
+
tokenNl(): Token;
|
|
45
|
+
prefixToken(): Token;
|
|
46
|
+
middleToken(): Token;
|
|
47
|
+
suffixToken(): Token;
|
|
48
|
+
eotToken(): Token;
|
|
49
|
+
getTokenString(token: number): string;
|
|
17
50
|
};
|
|
18
|
-
export type
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
embedding?: boolean;
|
|
26
|
-
threads?: number;
|
|
27
|
-
}): LLAMAContext;
|
|
28
|
-
encode(text: string): Uint32Array;
|
|
29
|
-
eval(tokens: Uint32Array, options?: {
|
|
51
|
+
export type AddonContext = {
|
|
52
|
+
dispose(): void;
|
|
53
|
+
getContextSize(): number;
|
|
54
|
+
initBatch(size: number): void;
|
|
55
|
+
addToBatch(sequenceId: number, firstTokenSequenceIndex: number, tokens: Uint32Array, generateLogitAtTheEnd: boolean): BatchLogitIndex | undefined;
|
|
56
|
+
decodeBatch(): Promise<void>;
|
|
57
|
+
sampleToken(batchLogitIndex: BatchLogitIndex, options?: {
|
|
30
58
|
temperature?: number;
|
|
31
59
|
topK?: number;
|
|
32
60
|
topP?: number;
|
|
@@ -34,20 +62,24 @@ export type LLAMAContext = {
|
|
|
34
62
|
repeatPenaltyTokens?: Uint32Array;
|
|
35
63
|
repeatPenaltyPresencePenalty?: number;
|
|
36
64
|
repeatPenaltyFrequencyPenalty?: number;
|
|
37
|
-
grammarEvaluationState?:
|
|
38
|
-
}): Promise<
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
65
|
+
grammarEvaluationState?: AddonGrammarEvaluationState;
|
|
66
|
+
}): Promise<Token>;
|
|
67
|
+
disposeSequence(sequenceId: number): void;
|
|
68
|
+
removeTokenCellsFromSequence(sequenceId: number, startPos: number, endPos: number): void;
|
|
69
|
+
shiftSequenceTokenCells(sequenceId: number, startPos: number, endPos: number, shiftDelta: number): void;
|
|
70
|
+
};
|
|
71
|
+
/**
 * Branded number: a `number` intersected with a phantom `__batchLogitIndex`
 * property of type `never`, so a plain `number` is not assignable to it.
 * `AddonContext.addToBatch` returns this type and `AddonContext.sampleToken`
 * takes it as its first argument.
 */
export type BatchLogitIndex = number & {
    __batchLogitIndex: never;
};
|
|
46
|
-
export type
|
|
47
|
-
|
|
48
|
-
printGrammar?: boolean;
|
|
49
|
-
}): LLAMAGrammar;
|
|
74
|
+
/**
 * Branded type for values produced by `new BindingModule.AddonGrammar(...)`.
 * It is the string literal type "AddonGrammar" intersected with a phantom
 * `__brand: never` property, which leaves the type with no usable members.
 */
export type AddonGrammar = "AddonGrammar" & {
    __brand: never;
};
|
|
51
|
-
export type
|
|
52
|
-
|
|
77
|
+
/**
 * Branded type for values produced by
 * `new BindingModule.AddonGrammarEvaluationState(grammar)`.
 * It is the string literal type "AddonGrammarEvaluationState" intersected with
 * a phantom `__brand: never` property, which leaves the type with no usable members.
 */
export type AddonGrammarEvaluationState = "AddonGrammarEvaluationState" & {
    __brand: never;
};
|
|
80
|
+
/**
 * String returned by `AddonModel.getModelDescription()`: an architecture name,
 * a size name and a file type name, joined by single spaces.
 */
export type ModelTypeDescription = `${AddonModelArchName} ${AddonModelTypeName} ${AddonModelFileTypeName}`;

/** First component of a `ModelTypeDescription`. */
export type AddonModelArchName =
    | "unknown"
    | "llama"
    | "falcon"
    | "gpt2"
    | "gptj"
    | "gptneox"
    | "mpt"
    | "baichuan"
    | "starcoder"
    | "persimmon"
    | "refact"
    | "bloom"
    | "stablelm";

/** Second component of a `ModelTypeDescription`. */
export type AddonModelTypeName =
    | "1B"
    | "3B"
    | "7B"
    | "8B"
    | "13B"
    | "15B"
    | "30B"
    | "34B"
    | "40B"
    | "65B"
    | "70B"
    | "?B";

/** Third component of a `ModelTypeDescription`: a base file type name, optionally suffixed with " (guessed)". */
export type AddonModelFileTypeName =
    | _AddonModelFileTypeName
    | `${_AddonModelFileTypeName} (guessed)`;

/** Base file type names, without the optional " (guessed)" suffix. Not exported. */
type _AddonModelFileTypeName =
    | "all F32"
    | "mostly F16"
    | "mostly Q4_0"
    | "mostly Q4_1"
    | "mostly Q4_1, some F16"
    | "mostly Q5_0"
    | "mostly Q5_1"
    | "mostly Q8_0"
    | "mostly Q2_K"
    | "mostly Q3_K - Small"
    | "mostly Q3_K - Medium"
    | "mostly Q3_K - Large"
    | "mostly Q4_K - Small"
    | "mostly Q4_K - Medium"
    | "mostly Q5_K - Small"
    | "mostly Q5_K - Medium"
    | "mostly Q6_K"
    | "unknown, may not work";
|
|
85
|
+
export {};
|
package/dist/utils/getBin.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"getBin.js","sourceRoot":"","sources":["../../src/utils/getBin.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,aAAa,EAAC,MAAM,QAAQ,CAAC;AACrC,OAAO,KAAK,OAAO,MAAM,SAAS,CAAC;AACnC,OAAO,IAAI,MAAM,MAAM,CAAC;AACxB,OAAO,OAAO,MAAM,SAAS,CAAC;AAC9B,OAAO,EAAE,MAAM,UAAU,CAAC;AAC1B,OAAO,EACH,0BAA0B,EAAE,yBAAyB,EAAE,2BAA2B,EAAE,sBAAsB,EAAE,mBAAmB,EAC/H,kBAAkB,EACrB,MAAM,cAAc,CAAC;AACtB,OAAO,EAAC,uBAAuB,EAAC,MAAM,oCAAoC,CAAC;
|
|
1
|
+
{"version":3,"file":"getBin.js","sourceRoot":"","sources":["../../src/utils/getBin.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,aAAa,EAAC,MAAM,QAAQ,CAAC;AACrC,OAAO,KAAK,OAAO,MAAM,SAAS,CAAC;AACnC,OAAO,IAAI,MAAM,MAAM,CAAC;AACxB,OAAO,OAAO,MAAM,SAAS,CAAC;AAC9B,OAAO,EAAE,MAAM,UAAU,CAAC;AAC1B,OAAO,EACH,0BAA0B,EAAE,yBAAyB,EAAE,2BAA2B,EAAE,sBAAsB,EAAE,mBAAmB,EAC/H,kBAAkB,EACrB,MAAM,cAAc,CAAC;AACtB,OAAO,EAAC,uBAAuB,EAAC,MAAM,oCAAoC,CAAC;AAE3E,OAAO,EAAC,cAAc,EAAC,MAAM,kBAAkB,CAAC;AAChD,OAAO,EAAC,6BAA6B,EAAC,MAAM,sBAAsB,CAAC;AAEnE,MAAM,OAAO,GAAG,aAAa,CAAC,MAAM,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;AAE/C,MAAM,CAAC,KAAK,UAAU,kBAAkB;IACpC,SAAS,UAAU,CAAC,QAAgB,EAAE,IAAY;QAC9C,OAAO,IAAI,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,QAAQ,IAAI,IAAI,mBAAmB,CAAC,CAAC;IACjF,CAAC;IAED,KAAK,UAAU,WAAW,CAAC,QAAgB,EAAE,IAAY;QACrD,MAAM,OAAO,GAAG,UAAU,CAAC,QAAQ,EAAE,IAAI,CAAC,CAAC;QAE3C,IAAI,MAAM,EAAE,CAAC,UAAU,CAAC,OAAO,CAAC;YAC5B,OAAO,OAAO,CAAC;QAEnB,OAAO,IAAI,CAAC;IAChB,CAAC;IAED,KAAK,UAAU,OAAO;QAClB,QAAQ,OAAO,CAAC,QAAQ,EAAE;YACtB,KAAK,OAAO,CAAC;YACb,KAAK,QAAQ;gBACT,OAAO,WAAW,CAAC,KAAK,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;YAE5C,KAAK,OAAO,CAAC;YACb,KAAK,SAAS;gBACV,OAAO,WAAW,CAAC,OAAO,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;YAE9C,KAAK,QAAQ;gBACT,OAAO,WAAW,CAAC,KAAK,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;SAC/C;QAED,OAAO,IAAI,CAAC;IAChB,CAAC;IAED,OAAO,MAAM,OAAO,EAAE,CAAC;AAC3B,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,OAAO;IACzB,MAAM,WAAW,GAAG,MAAM,cAAc,EAAE,CAAC;IAE3C,IAAI,WAAW,KAAK,kBAAkB,EAAE;QACpC,MAAM,eAAe,GAAG,MAAM,kBAAkB,EAAE,CAAC;QAEnD,IAAI,eAAe,IAAI,IAAI,EAAE;YACzB,OAAO,CAAC,IAAI,CAAC,wEAAwE,CAAC,CAAC;SAC1F;aAAM;YACH,IAAI;gBACA,OAAO,OAAO,CAAC,eAAe,CAAC,CAAC;aACnC;YAAC,OAAO,GAAG,EAAE;gBACV,OAAO,CAAC,KAAK,CAAC,gDAAgD,OAAO,CAAC,QAAQ,MAAM,OAAO,CAAC,IAAI,WAAW,EAAE,GAAG,CAAC,CAAC;gBAClH,OAAO,CAAC,IAAI,CAAC,wCAAwC,CAAC,CAAC;gBAEvD,IAAI;oBACA,OAAO,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,OAAO,CAAC,eAAe,CAAC,CAAC,CAAC;iBAC1D;gBAAC,OAAO,GAAG,EAAE,GAAE;aACnB;SACJ;KACJ;IAED,MAAM,UAAU,GAAG,MAAM,6BAA6B,EAAE,CAAC;IAEzD,IAAI,UAAU,IAAI,IAAI,EAAE;QACpB,IAAI,mBAAmB,EAAE;YACrB
,MAAM,IAAI,KAAK,CAAC,oFAAoF,CAAC,CAAC;SACzG;aAAM;YACH,MAAM,uBAAuB,CAAC;gBAC1B,IAAI,EAAE,yBAAyB;gBAC/B,OAAO,EAAE,sBAAsB;gBAC/B,KAAK,EAAE,2BAA2B;gBAClC,IAAI,EAAE,0BAA0B;aACnC,CAAC,CAAC;YAEH,MAAM,UAAU,GAAG,MAAM,6BAA6B,EAAE,CAAC;YAEzD,IAAI,UAAU,IAAI,IAAI,EAAE;gBACpB,MAAM,IAAI,KAAK,CAAC,0CAA0C,CAAC,CAAC;aAC/D;YAED,OAAO,OAAO,CAAC,UAAU,CAAC,CAAC;SAC9B;KACJ;IAED,OAAO,OAAO,CAAC,UAAU,CAAC,CAAC;AAC/B,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"getReleaseInfo.js","sourceRoot":"","sources":["../../src/utils/getReleaseInfo.ts"],"names":[],"mappings":"AAAA,OAAO,IAAI,MAAM,MAAM,CAAC;AACxB,OAAO,EAAC,aAAa,EAAC,MAAM,KAAK,CAAC;AAClC,OAAO,EAAE,MAAM,UAAU,CAAC;AAC1B,OAAO,EAAC,cAAc,EAAC,MAAM,kBAAkB,CAAC;AAChD,OAAO,EAAC,+BAA+B,EAAC,MAAM,wBAAwB,CAAC;AACvE,OAAO,EAAC,wBAAwB,EAAC,MAAM,4BAA4B,CAAC;AAEpE,MAAM,SAAS,GAAG,IAAI,CAAC,OAAO,CAAC,aAAa,CAAC,MAAM,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC;AAE/D,MAAM,CAAC,KAAK,UAAU,cAAc;
|
|
1
|
+
{"version":3,"file":"getReleaseInfo.js","sourceRoot":"","sources":["../../src/utils/getReleaseInfo.ts"],"names":[],"mappings":"AAAA,OAAO,IAAI,MAAM,MAAM,CAAC;AACxB,OAAO,EAAC,aAAa,EAAC,MAAM,KAAK,CAAC;AAClC,OAAO,EAAE,MAAM,UAAU,CAAC;AAC1B,OAAO,EAAC,cAAc,EAAC,MAAM,kBAAkB,CAAC;AAChD,OAAO,EAAC,+BAA+B,EAAC,MAAM,wBAAwB,CAAC;AACvE,OAAO,EAAC,wBAAwB,EAAC,MAAM,4BAA4B,CAAC;AAEpE,MAAM,SAAS,GAAG,IAAI,CAAC,OAAO,CAAC,aAAa,CAAC,MAAM,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC;AAE/D,MAAM,CAAC,KAAK,UAAU,cAAc;IAOhC,MAAM,CAAC,WAAW,EAAE,aAAa,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;QACnD,cAAc,EAAE;QAChB,gBAAgB,EAAE;KACrB,CAAC,CAAC;IAEH,MAAM,OAAO,GAAG,WAAW,KAAK,kBAAkB;QAC9C,CAAC,CAAC,MAAM,wBAAwB,EAAE;QAClC,CAAC,CAAC,CAAC,MAAM,+BAA+B,EAAE,IAAI,MAAM,wBAAwB,EAAE,CAAC,CAAC;IAEpF,OAAO;QACH,QAAQ,EAAE;YACN,YAAY,EAAE,WAAW,KAAK,kBAAkB;gBAC5C,CAAC,CAAC,UAAU;gBACZ,CAAC,CAAC,cAAc;YACpB,OAAO;SACV;QACD,aAAa;KAChB,CAAC;AACN,CAAC;AAED,KAAK,UAAU,gBAAgB;IAC3B,MAAM,WAAW,GAAG,MAAM,EAAE,CAAC,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,IAAI,EAAE,IAAI,EAAE,cAAc,CAAC,CAAC,CAAC;IAExF,OAAO,WAAW,CAAC,OAAO,CAAC;AAC/B,CAAC"}
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
/**
 * Splits a model file name into descriptive fields.
 *
 * @param filename - The file name to parse.
 * @returns An object in which `subType` is always a string and every other
 * field may be `undefined`. `parameters`, when present, has the form `<number>B`.
 */
export declare function parseModelFileName(filename: string): {
    name: string | undefined;
    subType: string;
    quantization: string | undefined;
    fileType: string | undefined;
    version: string | undefined;
    contextSize: string | undefined;
    parameters: `${number}B` | undefined;
};
|
|
@@ -0,0 +1,68 @@
|
|
|
1
|
+
/**
 * Splits a model file name into descriptive fields.
 *
 * The name is split on "-". The last dash-separated segment is split again on
 * ".": its final piece becomes `fileType` and the piece before that becomes
 * `quantization`. Any pieces left over are re-joined with "." and kept as the
 * last segment; if nothing is left, the segment is dropped.
 *
 * The remaining segments are divided around the first segment that looks like
 * a parameter count. The first segment before it is `name`, the rest before it
 * form `subType` (joined with "-"). Segments after it are scanned for a
 * context size (upper-cased) and a version (lower-cased); when several
 * segments match, the last match wins.
 *
 * @param {string} filename - The file name to parse.
 * @returns {{name: (string|undefined), subType: string, quantization: (string|undefined),
 *     fileType: (string|undefined), version: (string|undefined),
 *     contextSize: (string|undefined), parameters: (string|undefined)}}
 */
export function parseModelFileName(filename) {
    const segments = filename.split("-");
    let quantization;
    let fileType;

    if (segments.length > 0) {
        const lastIndex = segments.length - 1;
        const dotPieces = segments[lastIndex].split(".");

        fileType = dotPieces.pop();
        quantization = dotPieces.pop();

        if (dotPieces.length === 0)
            segments.pop();
        else
            segments[lastIndex] = dotPieces.join(".");
    }

    const split = splitByModelParameters(segments);
    const [name, ...subTypeSegments] = split.previousParts;

    let version;
    let contextSize;

    // A context-size match takes precedence over a version match for the same segment.
    for (const segment of split.nextParts) {
        if (isContextSizeText(segment))
            contextSize = segment.toUpperCase();
        else if (isVersionText(segment))
            version = segment.toLowerCase();
    }

    return {
        name,
        subType: subTypeSegments.join("-"),
        quantization,
        fileType,
        version,
        contextSize,
        parameters: split.parameters
    };
}
|
|
42
|
+
/**
 * Tells whether a file name segment denotes a parameter count such as "7B",
 * "13b" or "1.5B".
 *
 * The count is one or more digits, optionally followed by a decimal fraction,
 * followed by a single "B" or "b". Fractional counts are accepted so that
 * sizes such as "1.1B" or "0.5b" are recognised as parameters and do not end
 * up in the model's sub type.
 *
 * @param {string} text - A single dash-separated segment of a model file name.
 * @returns {boolean} `true` when the whole segment is a parameter count.
 */
function isParametersText(text) {
    return /^[0-9]+(?:\.[0-9]+)?[Bb]$/.test(text);
}
|
|
45
|
+
/**
 * Tells whether a file name segment starts like a version: an optional "v" or
 * "V" followed immediately by a digit. Only the start of the segment is
 * checked; anything may follow.
 *
 * @param {string} text - A single dash-separated segment of a model file name.
 * @returns {boolean} `true` when the segment begins with a version prefix.
 */
function isVersionText(text) {
    const versionStart = /^[vV]?[0-9]/;

    return versionStart.test(text);
}
|
|
48
|
+
/**
 * Tells whether a file name segment denotes a context size: one or more
 * digits followed by exactly one of "k", "K", "m" or "M", and nothing else.
 *
 * @param {string} text - A single dash-separated segment of a model file name.
 * @returns {boolean} `true` when the whole segment is a context size.
 */
function isContextSizeText(text) {
    const contextSizePattern = /^[0-9]+[kKmM]$/;

    return contextSizePattern.test(text);
}
|
|
51
|
+
/**
 * Divides file name segments around the first segment that looks like a
 * parameter count.
 *
 * @param {string[]} parts - Dash-separated segments of a model file name.
 * @returns {{parameters: (string|undefined), previousParts: string[], nextParts: string[]}}
 * When a parameter segment is found: that segment upper-cased, a copy of the
 * segments before it, and a copy of the segments after it. Otherwise:
 * `parameters` is `undefined`, `previousParts` is the input array itself
 * (not a copy), and `nextParts` is empty.
 */
function splitByModelParameters(parts) {
    const parametersIndex = parts.findIndex((part) => isParametersText(part));

    if (parametersIndex === -1) {
        return {
            parameters: undefined,
            previousParts: parts,
            nextParts: []
        };
    }

    return {
        parameters: parts[parametersIndex].toUpperCase(),
        previousParts: parts.slice(0, parametersIndex),
        nextParts: parts.slice(parametersIndex + 1)
    };
}
|
|
68
|
+
//# sourceMappingURL=parseModelFileName.js.map
|