vllm-sr 0.1.0b2.dev20260202094318__py3-none-any.whl → 0.1.0b2.dev20260202230157__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cli/templates/router-defaults.yaml +48 -0
- {vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/METADATA +1 -1
- {vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/RECORD +6 -6
- {vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/WHEEL +0 -0
- {vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/entry_points.txt +0 -0
- {vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/top_level.txt +0 -0
|
@@ -177,3 +177,51 @@ looper:
|
|
|
177
177
|
headers: {} # Optional headers (e.g., {"Authorization": "Bearer xxx"})
|
|
178
178
|
|
|
179
179
|
clear_route_cache: true
|
|
180
|
+
|
|
181
|
+
# Model Selection Configuration
|
|
182
|
+
# ML-based algorithms for intelligent model routing within decisions
|
|
183
|
+
# Reference: https://github.com/ulab-uiuc/LLMRouter
|
|
184
|
+
model_selection:
|
|
185
|
+
enabled: true
|
|
186
|
+
# Default algorithm: knn, kmeans, svm
|
|
187
|
+
default_algorithm: "knn"
|
|
188
|
+
|
|
189
|
+
# LLM candidates configuration
|
|
190
|
+
llm_candidates_path: "config/model_selection/llm_candidates.json"
|
|
191
|
+
|
|
192
|
+
# Pre-trained models path (contains saved model weights)
|
|
193
|
+
models_path: "models/model_selection"
|
|
194
|
+
|
|
195
|
+
# Training data path (for custom training)
|
|
196
|
+
training_data_path: "config/model_selection/routing_training_data.jsonl"
|
|
197
|
+
|
|
198
|
+
# Algorithm-specific configurations
|
|
199
|
+
knn:
|
|
200
|
+
k: 5 # Number of neighbors
|
|
201
|
+
weights: "distance" # "uniform" or "distance"
|
|
202
|
+
metric: "cosine" # "cosine", "euclidean", "manhattan"
|
|
203
|
+
# Pre-trained model file (relative to models_path)
|
|
204
|
+
model_file: "knn_model.json"
|
|
205
|
+
|
|
206
|
+
kmeans:
|
|
207
|
+
num_clusters: 8
|
|
208
|
+
efficiency_weight: 0.3 # Balance between quality (0) and efficiency (1)
|
|
209
|
+
max_iterations: 100
|
|
210
|
+
model_file: "kmeans_model.json"
|
|
211
|
+
|
|
212
|
+
svm:
|
|
213
|
+
kernel: "rbf" # "linear", "rbf", "poly"
|
|
214
|
+
c: 1.0 # Regularization parameter
|
|
215
|
+
gamma: "auto" # Kernel coefficient
|
|
216
|
+
model_file: "svm_model.json"
|
|
217
|
+
|
|
218
|
+
# Custom training options
|
|
219
|
+
# Allows customers to train on their own models
|
|
220
|
+
custom_training:
|
|
221
|
+
enabled: false
|
|
222
|
+
# Path to customer-provided training data
|
|
223
|
+
custom_data_path: ""
|
|
224
|
+
# Whether to merge with pre-trained data or replace
|
|
225
|
+
merge_with_pretrained: true
|
|
226
|
+
# Minimum training samples required
|
|
227
|
+
min_samples: 50
|
{vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/RECORD
RENAMED
|
@@ -28,10 +28,10 @@ cli/templates/grafana-datasource.serve.yaml,sha256=Cxjz1zVWoUdSzbSsS_iJhMHRrmRi6
|
|
|
28
28
|
cli/templates/grafana.serve.ini,sha256=x9bCkzxqm5gC4fKToY2lhNPdWhwAaJGVe5ABMW6Dv-c,1674
|
|
29
29
|
cli/templates/llm-router-dashboard.serve.json,sha256=pwnTjUh7z3_3LnIwtaLXjDWH4aHd2Mc57z0oekgt-Bk,60903
|
|
30
30
|
cli/templates/prometheus.serve.yaml,sha256=MGYq8dlRq_i2m5sogQ--kwTvJpkf44QQoCNoI7oyVT8,270
|
|
31
|
-
cli/templates/router-defaults.yaml,sha256=
|
|
31
|
+
cli/templates/router-defaults.yaml,sha256=IIiQWQAQ5KsCJMYbTOdOjwb98KSNbzcMS_VHby4y5Hs,9373
|
|
32
32
|
cli/templates/tools_db.json,sha256=CPqPBkd5nc966m1YEozz06frrmv3Pd5rrkxKkO3rTiA,4537
|
|
33
|
-
vllm_sr-0.1.0b2.
|
|
34
|
-
vllm_sr-0.1.0b2.
|
|
35
|
-
vllm_sr-0.1.0b2.
|
|
36
|
-
vllm_sr-0.1.0b2.
|
|
37
|
-
vllm_sr-0.1.0b2.
|
|
33
|
+
vllm_sr-0.1.0b2.dev20260202230157.dist-info/METADATA,sha256=iSZecpgzkF_9XSPSKQo1SldYguiA4j1EKaENEx6YOJY,7298
|
|
34
|
+
vllm_sr-0.1.0b2.dev20260202230157.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
|
|
35
|
+
vllm_sr-0.1.0b2.dev20260202230157.dist-info/entry_points.txt,sha256=WhlBPbLHUpWUsMuUQX9cnvsYMf0ih5i57vvJ1jJNi0k,42
|
|
36
|
+
vllm_sr-0.1.0b2.dev20260202230157.dist-info/top_level.txt,sha256=2ImG917oaVHlm0nP9oJE-Qrgs-fq_fGWgba2H1f8fpE,4
|
|
37
|
+
vllm_sr-0.1.0b2.dev20260202230157.dist-info/RECORD,,
|
{vllm_sr-0.1.0b2.dev20260202094318.dist-info → vllm_sr-0.1.0b2.dev20260202230157.dist-info}/WHEEL
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|