@appkit/llamacpp-cli 1.8.0 → 1.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (116) hide show
  1. package/CHANGELOG.md +58 -0
  2. package/README.md +249 -40
  3. package/dist/cli.js +154 -10
  4. package/dist/cli.js.map +1 -1
  5. package/dist/commands/completion.d.ts +9 -0
  6. package/dist/commands/completion.d.ts.map +1 -0
  7. package/dist/commands/completion.js +83 -0
  8. package/dist/commands/completion.js.map +1 -0
  9. package/dist/commands/monitor.js +1 -1
  10. package/dist/commands/monitor.js.map +1 -1
  11. package/dist/commands/ps.d.ts +1 -3
  12. package/dist/commands/ps.d.ts.map +1 -1
  13. package/dist/commands/ps.js +36 -115
  14. package/dist/commands/ps.js.map +1 -1
  15. package/dist/commands/router/config.d.ts +11 -0
  16. package/dist/commands/router/config.d.ts.map +1 -0
  17. package/dist/commands/router/config.js +100 -0
  18. package/dist/commands/router/config.js.map +1 -0
  19. package/dist/commands/router/logs.d.ts +12 -0
  20. package/dist/commands/router/logs.d.ts.map +1 -0
  21. package/dist/commands/router/logs.js +238 -0
  22. package/dist/commands/router/logs.js.map +1 -0
  23. package/dist/commands/router/restart.d.ts +2 -0
  24. package/dist/commands/router/restart.d.ts.map +1 -0
  25. package/dist/commands/router/restart.js +39 -0
  26. package/dist/commands/router/restart.js.map +1 -0
  27. package/dist/commands/router/start.d.ts +2 -0
  28. package/dist/commands/router/start.d.ts.map +1 -0
  29. package/dist/commands/router/start.js +60 -0
  30. package/dist/commands/router/start.js.map +1 -0
  31. package/dist/commands/router/status.d.ts +2 -0
  32. package/dist/commands/router/status.d.ts.map +1 -0
  33. package/dist/commands/router/status.js +116 -0
  34. package/dist/commands/router/status.js.map +1 -0
  35. package/dist/commands/router/stop.d.ts +2 -0
  36. package/dist/commands/router/stop.d.ts.map +1 -0
  37. package/dist/commands/router/stop.js +36 -0
  38. package/dist/commands/router/stop.js.map +1 -0
  39. package/dist/commands/tui.d.ts +2 -0
  40. package/dist/commands/tui.d.ts.map +1 -0
  41. package/dist/commands/tui.js +27 -0
  42. package/dist/commands/tui.js.map +1 -0
  43. package/dist/lib/completion.d.ts +5 -0
  44. package/dist/lib/completion.d.ts.map +1 -0
  45. package/dist/lib/completion.js +195 -0
  46. package/dist/lib/completion.js.map +1 -0
  47. package/dist/lib/model-downloader.d.ts +5 -1
  48. package/dist/lib/model-downloader.d.ts.map +1 -1
  49. package/dist/lib/model-downloader.js +53 -20
  50. package/dist/lib/model-downloader.js.map +1 -1
  51. package/dist/lib/router-logger.d.ts +61 -0
  52. package/dist/lib/router-logger.d.ts.map +1 -0
  53. package/dist/lib/router-logger.js +200 -0
  54. package/dist/lib/router-logger.js.map +1 -0
  55. package/dist/lib/router-manager.d.ts +103 -0
  56. package/dist/lib/router-manager.d.ts.map +1 -0
  57. package/dist/lib/router-manager.js +394 -0
  58. package/dist/lib/router-manager.js.map +1 -0
  59. package/dist/lib/router-server.d.ts +61 -0
  60. package/dist/lib/router-server.d.ts.map +1 -0
  61. package/dist/lib/router-server.js +485 -0
  62. package/dist/lib/router-server.js.map +1 -0
  63. package/dist/tui/ConfigApp.d.ts +7 -0
  64. package/dist/tui/ConfigApp.d.ts.map +1 -0
  65. package/dist/tui/ConfigApp.js +1002 -0
  66. package/dist/tui/ConfigApp.js.map +1 -0
  67. package/dist/tui/HistoricalMonitorApp.d.ts.map +1 -1
  68. package/dist/tui/HistoricalMonitorApp.js +85 -49
  69. package/dist/tui/HistoricalMonitorApp.js.map +1 -1
  70. package/dist/tui/ModelsApp.d.ts +7 -0
  71. package/dist/tui/ModelsApp.d.ts.map +1 -0
  72. package/dist/tui/ModelsApp.js +362 -0
  73. package/dist/tui/ModelsApp.js.map +1 -0
  74. package/dist/tui/MultiServerMonitorApp.d.ts +6 -1
  75. package/dist/tui/MultiServerMonitorApp.d.ts.map +1 -1
  76. package/dist/tui/MultiServerMonitorApp.js +1038 -122
  77. package/dist/tui/MultiServerMonitorApp.js.map +1 -1
  78. package/dist/tui/RootNavigator.d.ts +7 -0
  79. package/dist/tui/RootNavigator.d.ts.map +1 -0
  80. package/dist/tui/RootNavigator.js +55 -0
  81. package/dist/tui/RootNavigator.js.map +1 -0
  82. package/dist/tui/SearchApp.d.ts +6 -0
  83. package/dist/tui/SearchApp.d.ts.map +1 -0
  84. package/dist/tui/SearchApp.js +451 -0
  85. package/dist/tui/SearchApp.js.map +1 -0
  86. package/dist/tui/SplashScreen.d.ts +16 -0
  87. package/dist/tui/SplashScreen.d.ts.map +1 -0
  88. package/dist/tui/SplashScreen.js +129 -0
  89. package/dist/tui/SplashScreen.js.map +1 -0
  90. package/dist/types/router-config.d.ts +19 -0
  91. package/dist/types/router-config.d.ts.map +1 -0
  92. package/dist/types/router-config.js +3 -0
  93. package/dist/types/router-config.js.map +1 -0
  94. package/package.json +1 -1
  95. package/src/cli.ts +121 -10
  96. package/src/commands/monitor.ts +1 -1
  97. package/src/commands/ps.ts +44 -133
  98. package/src/commands/router/config.ts +116 -0
  99. package/src/commands/router/logs.ts +256 -0
  100. package/src/commands/router/restart.ts +36 -0
  101. package/src/commands/router/start.ts +60 -0
  102. package/src/commands/router/status.ts +119 -0
  103. package/src/commands/router/stop.ts +33 -0
  104. package/src/commands/tui.ts +25 -0
  105. package/src/lib/model-downloader.ts +57 -20
  106. package/src/lib/router-logger.ts +201 -0
  107. package/src/lib/router-manager.ts +414 -0
  108. package/src/lib/router-server.ts +538 -0
  109. package/src/tui/ConfigApp.ts +1085 -0
  110. package/src/tui/HistoricalMonitorApp.ts +88 -49
  111. package/src/tui/ModelsApp.ts +368 -0
  112. package/src/tui/MultiServerMonitorApp.ts +1163 -122
  113. package/src/tui/RootNavigator.ts +74 -0
  114. package/src/tui/SearchApp.ts +511 -0
  115. package/src/tui/SplashScreen.ts +149 -0
  116. package/src/types/router-config.ts +25 -0
@@ -0,0 +1,538 @@
1
+ #!/usr/bin/env node
2
+
3
+ import * as http from 'http';
4
+ import * as https from 'https';
5
+ import { URL } from 'url';
6
+ import * as fs from 'fs/promises';
7
+ import * as path from 'path';
8
+ import { RouterConfig } from '../types/router-config';
9
+ import { ServerConfig } from '../types/server-config';
10
+ import { readJson, fileExists, getConfigDir, getServersDir } from '../utils/file-utils';
11
+ import { RouterLogger, RequestTimer, RouterLogEntry } from './router-logger';
12
+
13
+ interface ErrorResponse {
14
+ error: string;
15
+ details?: string;
16
+ }
17
+
18
+ interface ModelInfo {
19
+ id: string;
20
+ object: 'model';
21
+ created: number;
22
+ owned_by: string;
23
+ }
24
+
25
+ interface ModelsResponse {
26
+ object: 'list';
27
+ data: ModelInfo[];
28
+ }
29
+
30
+ /**
31
+ * Router HTTP server - proxies requests to backend llama.cpp servers
32
+ */
33
+ class RouterServer {
34
+ private config!: RouterConfig;
35
+ private server!: http.Server;
36
+ private logger!: RouterLogger;
37
+
38
+ async initialize(): Promise<void> {
39
+ // Load router config
40
+ const configPath = path.join(getConfigDir(), 'router.json');
41
+ if (!(await fileExists(configPath))) {
42
+ throw new Error('Router configuration not found');
43
+ }
44
+ this.config = await readJson<RouterConfig>(configPath);
45
+
46
+ // Initialize logger with verbose setting
47
+ this.logger = new RouterLogger(this.config.verbose);
48
+
49
+ // Rotate log file if needed
50
+ await this.logger.rotateIfNeeded();
51
+
52
+ // Create HTTP server
53
+ this.server = http.createServer(async (req, res) => {
54
+ await this.handleRequest(req, res);
55
+ });
56
+
57
+ // Graceful shutdown
58
+ process.on('SIGTERM', async () => {
59
+ console.error('[Router] Received SIGTERM, shutting down gracefully...');
60
+ this.server.close(() => {
61
+ console.error('[Router] Server closed');
62
+ process.exit(0);
63
+ });
64
+ });
65
+
66
+ process.on('SIGINT', async () => {
67
+ console.error('[Router] Received SIGINT, shutting down gracefully...');
68
+ this.server.close(() => {
69
+ console.error('[Router] Server closed');
70
+ process.exit(0);
71
+ });
72
+ });
73
+ }
74
+
75
+ async start(): Promise<void> {
76
+ await this.initialize();
77
+
78
+ this.server.listen(this.config.port, this.config.host, () => {
79
+ console.error(`[Router] Listening on http://${this.config.host}:${this.config.port}`);
80
+ console.error(`[Router] PID: ${process.pid}`);
81
+ });
82
+ }
83
+
84
+ /**
85
+ * Main request handler
86
+ */
87
+ private async handleRequest(req: http.IncomingMessage, res: http.ServerResponse): Promise<void> {
88
+ // CORS headers
89
+ res.setHeader('Access-Control-Allow-Origin', '*');
90
+ res.setHeader('Access-Control-Allow-Methods', 'GET, POST, OPTIONS');
91
+ res.setHeader('Access-Control-Allow-Headers', 'Content-Type, Authorization');
92
+
93
+ // Handle OPTIONS preflight
94
+ if (req.method === 'OPTIONS') {
95
+ res.writeHead(200);
96
+ res.end();
97
+ return;
98
+ }
99
+
100
+ try {
101
+ // Route based on path
102
+ if (req.url === '/health' && req.method === 'GET') {
103
+ await this.handleHealth(req, res);
104
+ } else if (req.url === '/v1/models' && req.method === 'GET') {
105
+ await this.handleModels(req, res);
106
+ } else if (req.url === '/v1/chat/completions' && req.method === 'POST') {
107
+ await this.handleChatCompletions(req, res);
108
+ } else if (req.url === '/v1/embeddings' && req.method === 'POST') {
109
+ await this.handleEmbeddings(req, res);
110
+ } else {
111
+ this.sendError(res, 404, 'Not Found', `Unknown endpoint: ${req.url}`);
112
+ }
113
+ } catch (error) {
114
+ console.error('[Router] Error handling request:', error);
115
+ this.sendError(res, 500, 'Internal Server Error', (error as Error).message);
116
+ }
117
+ }
118
+
119
+ /**
120
+ * Health check endpoint
121
+ */
122
+ private async handleHealth(req: http.IncomingMessage, res: http.ServerResponse): Promise<void> {
123
+ res.writeHead(200, { 'Content-Type': 'application/json' });
124
+ res.end(JSON.stringify({
125
+ status: 'healthy',
126
+ uptime: process.uptime(),
127
+ timestamp: new Date().toISOString(),
128
+ }));
129
+ }
130
+
131
+ /**
132
+ * List models endpoint - aggregate from all running servers
133
+ */
134
+ private async handleModels(req: http.IncomingMessage, res: http.ServerResponse): Promise<void> {
135
+ const servers = await this.getAllServers();
136
+ const runningServers = servers.filter(s => s.status === 'running');
137
+
138
+ const models: ModelInfo[] = runningServers.map(server => ({
139
+ id: server.modelName,
140
+ object: 'model',
141
+ created: Math.floor(new Date(server.createdAt).getTime() / 1000),
142
+ owned_by: 'llamacpp',
143
+ }));
144
+
145
+ const response: ModelsResponse = {
146
+ object: 'list',
147
+ data: models,
148
+ };
149
+
150
+ res.writeHead(200, { 'Content-Type': 'application/json' });
151
+ res.end(JSON.stringify(response));
152
+ }
153
+
154
+ /**
155
+ * Chat completions endpoint - route to backend server
156
+ */
157
+ private async handleChatCompletions(req: http.IncomingMessage, res: http.ServerResponse): Promise<void> {
158
+ const timer = new RequestTimer();
159
+ let modelName = 'unknown';
160
+ let statusCode = 500;
161
+ let errorMsg: string | undefined;
162
+ let promptPreview: string | undefined;
163
+
164
+ try {
165
+ // Parse request body
166
+ const body = await this.readBody(req);
167
+ let requestData: any;
168
+ try {
169
+ requestData = JSON.parse(body);
170
+ } catch (error) {
171
+ statusCode = 400;
172
+ errorMsg = 'Invalid JSON in request body';
173
+ this.sendError(res, statusCode, 'Bad Request', errorMsg);
174
+ await this.logRequest(modelName, '/v1/chat/completions', statusCode, timer.elapsed(), errorMsg);
175
+ return;
176
+ }
177
+
178
+ // Extract model name and prompt preview
179
+ modelName = requestData.model || 'unknown';
180
+ promptPreview = this.extractPromptPreview(requestData);
181
+
182
+ if (!requestData.model) {
183
+ statusCode = 400;
184
+ errorMsg = 'Missing "model" field in request';
185
+ this.sendError(res, statusCode, 'Bad Request', errorMsg);
186
+ await this.logRequest(modelName, '/v1/chat/completions', statusCode, timer.elapsed(), errorMsg, undefined, promptPreview);
187
+ return;
188
+ }
189
+
190
+ // Find server for model
191
+ const server = await this.findServerForModel(modelName);
192
+ if (!server) {
193
+ statusCode = 404;
194
+ errorMsg = `No server found for model: ${modelName}`;
195
+ this.sendError(res, statusCode, 'Not Found', errorMsg);
196
+ await this.logRequest(modelName, '/v1/chat/completions', statusCode, timer.elapsed(), errorMsg, undefined, promptPreview);
197
+ return;
198
+ }
199
+
200
+ if (server.status !== 'running') {
201
+ statusCode = 503;
202
+ errorMsg = `Server for model "${modelName}" is not running`;
203
+ this.sendError(res, statusCode, 'Service Unavailable', errorMsg);
204
+ await this.logRequest(modelName, '/v1/chat/completions', statusCode, timer.elapsed(), errorMsg, `${server.host}:${server.port}`, promptPreview);
205
+ return;
206
+ }
207
+
208
+ // Proxy request to backend
209
+ const backendUrl = `http://${server.host}:${server.port}/v1/chat/completions`;
210
+ await this.proxyRequest(backendUrl, requestData, req, res);
211
+
212
+ // Log success
213
+ statusCode = 200;
214
+ await this.logRequest(modelName, '/v1/chat/completions', statusCode, timer.elapsed(), undefined, `${server.host}:${server.port}`, promptPreview);
215
+ } catch (error) {
216
+ errorMsg = (error as Error).message;
217
+ await this.logRequest(modelName, '/v1/chat/completions', statusCode, timer.elapsed(), errorMsg, undefined, promptPreview);
218
+ throw error;
219
+ }
220
+ }
221
+
222
+ /**
223
+ * Embeddings endpoint - route to backend server
224
+ */
225
+ private async handleEmbeddings(req: http.IncomingMessage, res: http.ServerResponse): Promise<void> {
226
+ const timer = new RequestTimer();
227
+ let modelName = 'unknown';
228
+ let statusCode = 500;
229
+ let errorMsg: string | undefined;
230
+ let promptPreview: string | undefined;
231
+
232
+ try {
233
+ // Parse request body
234
+ const body = await this.readBody(req);
235
+ let requestData: any;
236
+ try {
237
+ requestData = JSON.parse(body);
238
+ } catch (error) {
239
+ statusCode = 400;
240
+ errorMsg = 'Invalid JSON in request body';
241
+ this.sendError(res, statusCode, 'Bad Request', errorMsg);
242
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), errorMsg);
243
+ return;
244
+ }
245
+
246
+ // Extract model name and prompt preview
247
+ modelName = requestData.model || 'unknown';
248
+ promptPreview = this.extractPromptPreview(requestData);
249
+
250
+ if (!requestData.model) {
251
+ statusCode = 400;
252
+ errorMsg = 'Missing "model" field in request';
253
+ this.sendError(res, statusCode, 'Bad Request', errorMsg);
254
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), errorMsg, undefined, promptPreview);
255
+ return;
256
+ }
257
+
258
+ // Find server for model
259
+ const server = await this.findServerForModel(modelName);
260
+ if (!server) {
261
+ statusCode = 404;
262
+ errorMsg = `No server found for model: ${modelName}`;
263
+ this.sendError(res, statusCode, 'Not Found', errorMsg);
264
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), errorMsg, undefined, promptPreview);
265
+ return;
266
+ }
267
+
268
+ if (server.status !== 'running') {
269
+ statusCode = 503;
270
+ errorMsg = `Server for model "${modelName}" is not running`;
271
+ this.sendError(res, statusCode, 'Service Unavailable', errorMsg);
272
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), errorMsg, `${server.host}:${server.port}`, promptPreview);
273
+ return;
274
+ }
275
+
276
+ // Check if server has embeddings enabled
277
+ if (!server.embeddings) {
278
+ statusCode = 400;
279
+ errorMsg = `Server for model "${modelName}" does not have embeddings enabled`;
280
+ this.sendError(res, statusCode, 'Bad Request', errorMsg);
281
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), errorMsg, `${server.host}:${server.port}`, promptPreview);
282
+ return;
283
+ }
284
+
285
+ // Proxy request to backend
286
+ const backendUrl = `http://${server.host}:${server.port}/v1/embeddings`;
287
+ await this.proxyRequest(backendUrl, requestData, req, res);
288
+
289
+ // Log success
290
+ statusCode = 200;
291
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), undefined, `${server.host}:${server.port}`, promptPreview);
292
+ } catch (error) {
293
+ errorMsg = (error as Error).message;
294
+ await this.logRequest(modelName, '/v1/embeddings', statusCode, timer.elapsed(), errorMsg, undefined, promptPreview);
295
+ throw error;
296
+ }
297
+ }
298
+
299
+ /**
300
+ * Proxy a request to a backend server
301
+ */
302
+ private async proxyRequest(
303
+ backendUrl: string,
304
+ requestData: any,
305
+ originalReq: http.IncomingMessage,
306
+ res: http.ServerResponse
307
+ ): Promise<void> {
308
+ const url = new URL(backendUrl);
309
+ const isHttps = url.protocol === 'https:';
310
+ const httpModule = isHttps ? https : http;
311
+
312
+ const requestBody = JSON.stringify(requestData);
313
+
314
+ const options: http.RequestOptions = {
315
+ hostname: url.hostname,
316
+ port: url.port || (isHttps ? 443 : 80),
317
+ path: url.pathname + url.search,
318
+ method: 'POST',
319
+ headers: {
320
+ 'Content-Type': 'application/json',
321
+ 'Content-Length': Buffer.byteLength(requestBody),
322
+ },
323
+ timeout: this.config.requestTimeout,
324
+ };
325
+
326
+ return new Promise((resolve, reject) => {
327
+ const proxyReq = httpModule.request(options, (proxyRes) => {
328
+ // Forward status and headers
329
+ res.writeHead(proxyRes.statusCode || 200, proxyRes.headers);
330
+
331
+ // Stream response
332
+ proxyRes.pipe(res);
333
+
334
+ proxyRes.on('end', () => {
335
+ resolve();
336
+ });
337
+ });
338
+
339
+ proxyReq.on('error', (error) => {
340
+ console.error('[Router] Proxy request failed:', error);
341
+ if (!res.headersSent) {
342
+ this.sendError(res, 502, 'Bad Gateway', 'Failed to connect to backend server');
343
+ }
344
+ reject(error);
345
+ });
346
+
347
+ proxyReq.on('timeout', () => {
348
+ console.error('[Router] Proxy request timed out');
349
+ proxyReq.destroy();
350
+ if (!res.headersSent) {
351
+ this.sendError(res, 504, 'Gateway Timeout', 'Backend server did not respond in time');
352
+ }
353
+ reject(new Error('Request timeout'));
354
+ });
355
+
356
+ // Send request body
357
+ proxyReq.write(requestBody);
358
+ proxyReq.end();
359
+ });
360
+ }
361
+
362
+ /**
363
+ * Read request body as string
364
+ */
365
+ private async readBody(req: http.IncomingMessage): Promise<string> {
366
+ return new Promise((resolve, reject) => {
367
+ const chunks: Buffer[] = [];
368
+ req.on('data', (chunk: Buffer) => chunks.push(chunk));
369
+ req.on('end', () => resolve(Buffer.concat(chunks).toString('utf-8')));
370
+ req.on('error', reject);
371
+ });
372
+ }
373
+
374
+ /**
375
+ * Send error response
376
+ */
377
+ private sendError(res: http.ServerResponse, statusCode: number, error: string, details?: string): void {
378
+ if (res.headersSent) return;
379
+
380
+ const response: ErrorResponse = { error };
381
+ if (details) response.details = details;
382
+
383
+ res.writeHead(statusCode, { 'Content-Type': 'application/json' });
384
+ res.end(JSON.stringify(response));
385
+ }
386
+
387
+ /**
388
+ * Get all server configurations
389
+ */
390
+ private async getAllServers(): Promise<ServerConfig[]> {
391
+ const serversDir = getServersDir();
392
+ try {
393
+ const files = await fs.readdir(serversDir);
394
+ const configFiles = files.filter(f => f.endsWith('.json'));
395
+
396
+ const servers: ServerConfig[] = [];
397
+ for (const file of configFiles) {
398
+ const filePath = path.join(serversDir, file);
399
+ try {
400
+ const config = await readJson<ServerConfig>(filePath);
401
+ servers.push(config);
402
+ } catch (error) {
403
+ console.error(`[Router] Failed to load server config ${file}:`, error);
404
+ }
405
+ }
406
+
407
+ return servers;
408
+ } catch (error) {
409
+ console.error('[Router] Failed to read servers directory:', error);
410
+ return [];
411
+ }
412
+ }
413
+
414
+ /**
415
+ * Helper method to log a request
416
+ */
417
+ private async logRequest(
418
+ model: string,
419
+ endpoint: string,
420
+ statusCode: number,
421
+ durationMs: number,
422
+ error?: string,
423
+ backend?: string,
424
+ prompt?: string
425
+ ): Promise<void> {
426
+ const entry: RouterLogEntry = {
427
+ timestamp: RequestTimer.now(),
428
+ model,
429
+ endpoint,
430
+ method: 'POST',
431
+ status: statusCode >= 200 && statusCode < 300 ? 'success' : 'error',
432
+ statusCode,
433
+ durationMs,
434
+ error,
435
+ backend,
436
+ prompt,
437
+ };
438
+
439
+ await this.logger.logRequest(entry);
440
+ }
441
+
442
+ /**
443
+ * Extract prompt preview from request data (first 50 chars)
444
+ */
445
+ private extractPromptPreview(requestData: any): string | undefined {
446
+ try {
447
+ // For chat completions, get the last user message
448
+ if (requestData.messages && Array.isArray(requestData.messages)) {
449
+ const lastUserMessage = [...requestData.messages]
450
+ .reverse()
451
+ .find((msg: any) => msg.role === 'user');
452
+
453
+ if (lastUserMessage?.content) {
454
+ const content = typeof lastUserMessage.content === 'string'
455
+ ? lastUserMessage.content
456
+ : JSON.stringify(lastUserMessage.content);
457
+ return content.substring(0, 50).replace(/\n/g, ' ');
458
+ }
459
+ }
460
+
461
+ // For embeddings, get the input text
462
+ if (requestData.input) {
463
+ const input = typeof requestData.input === 'string'
464
+ ? requestData.input
465
+ : Array.isArray(requestData.input)
466
+ ? requestData.input[0]
467
+ : JSON.stringify(requestData.input);
468
+ return input.substring(0, 50).replace(/\n/g, ' ');
469
+ }
470
+
471
+ return undefined;
472
+ } catch {
473
+ return undefined;
474
+ }
475
+ }
476
+
477
+ /**
478
+ * Find a server by model name
479
+ */
480
+ private async findServerForModel(modelName: string): Promise<ServerConfig | null> {
481
+ const servers = await this.getAllServers();
482
+
483
+ // Normalize a model name for flexible matching (lowercase, no extension, normalize separators)
484
+ const normalize = (name: string): string => {
485
+ return name
486
+ .toLowerCase()
487
+ .replace(/\.gguf$/i, '')
488
+ .replace(/[_-]/g, '-'); // Normalize underscores and hyphens to hyphens
489
+ };
490
+
491
+ const normalizedRequest = normalize(modelName);
492
+
493
+ // Try exact match first
494
+ const exactMatch = servers.find(s => s.modelName === modelName);
495
+ if (exactMatch) return exactMatch;
496
+
497
+ // Try case-insensitive match
498
+ const caseInsensitiveMatch = servers.find(
499
+ s => s.modelName.toLowerCase() === modelName.toLowerCase()
500
+ );
501
+ if (caseInsensitiveMatch) return caseInsensitiveMatch;
502
+
503
+ // Try adding .gguf extension if not present
504
+ if (!modelName.endsWith('.gguf')) {
505
+ const withExtension = modelName + '.gguf';
506
+ const extensionMatch = servers.find(
507
+ s => s.modelName.toLowerCase() === withExtension.toLowerCase()
508
+ );
509
+ if (extensionMatch) return extensionMatch;
510
+ }
511
+
512
+ // Try normalized matching (handles case, extension, and underscore/hyphen variations)
513
+ const normalizedMatch = servers.find(
514
+ s => normalize(s.modelName) === normalizedRequest
515
+ );
516
+ if (normalizedMatch) return normalizedMatch;
517
+
518
+ return null;
519
+ }
520
+ }
521
+
522
+ // Main entry point
523
+ async function main() {
524
+ try {
525
+ const server = new RouterServer();
526
+ await server.start();
527
+ } catch (error) {
528
+ console.error('[Router] Failed to start:', error);
529
+ process.exit(1);
530
+ }
531
+ }
532
+
533
+ // Only run if this is the main module
534
+ if (require.main === module) {
535
+ main();
536
+ }
537
+
538
+ export { RouterServer };