vllm-sr 0.1.0b2.dev20260202181733__tar.gz → 0.1.0b2.dev20260202230157__tar.gz

This diff shows the differences between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
Files changed (46)
  1. {vllm_sr-0.1.0b2.dev20260202181733/vllm_sr.egg-info → vllm_sr-0.1.0b2.dev20260202230157}/PKG-INFO +1 -1
  2. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/router-defaults.yaml +48 -0
  3. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/pyproject.toml +1 -1
  4. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157/vllm_sr.egg-info}/PKG-INFO +1 -1
  5. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/MANIFEST.in +0 -0
  6. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/README.md +0 -0
  7. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/__init__.py +0 -0
  8. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/__init__.py +0 -0
  9. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/config.py +0 -0
  10. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/generate.py +0 -0
  11. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/init.py +0 -0
  12. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/serve.py +0 -0
  13. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/show_config.py +0 -0
  14. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/show_defaults.py +0 -0
  15. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/commands/validate.py +0 -0
  16. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/config_generator.py +0 -0
  17. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/consts.py +0 -0
  18. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/core.py +0 -0
  19. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/defaults.py +0 -0
  20. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/docker_cli.py +0 -0
  21. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/logo.py +0 -0
  22. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/main.py +0 -0
  23. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/merger.py +0 -0
  24. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/models.py +0 -0
  25. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/parser.py +0 -0
  26. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/config.template.yaml +0 -0
  27. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/envoy.template.yaml +0 -0
  28. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/generate_dashboard.py +0 -0
  29. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/grafana-dashboard.serve.yaml +0 -0
  30. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/grafana-datasource-jaeger.serve.yaml +0 -0
  31. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/grafana-datasource.serve.yaml +0 -0
  32. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/grafana.serve.ini +0 -0
  33. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/llm-router-dashboard.serve.json +0 -0
  34. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/prometheus.serve.yaml +0 -0
  35. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/templates/tools_db.json +0 -0
  36. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/utils.py +0 -0
  37. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/cli/validator.py +0 -0
  38. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/requirements.txt +0 -0
  39. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/setup.cfg +0 -0
  40. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/tests/test_plugin_parsing.py +0 -0
  41. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/tests/test_plugin_yaml_generation.py +0 -0
  42. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/vllm_sr.egg-info/SOURCES.txt +0 -0
  43. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/vllm_sr.egg-info/dependency_links.txt +0 -0
  44. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/vllm_sr.egg-info/entry_points.txt +0 -0
  45. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/vllm_sr.egg-info/requires.txt +0 -0
  46. {vllm_sr-0.1.0b2.dev20260202181733 → vllm_sr-0.1.0b2.dev20260202230157}/vllm_sr.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: vllm-sr
3
- Version: 0.1.0b2.dev20260202181733
3
+ Version: 0.1.0b2.dev20260202230157
4
4
  Summary: vLLM Semantic Router - Intelligent routing for Mixture-of-Models
5
5
  Author: vLLM-SR Team
6
6
  License: Apache-2.0
@@ -177,3 +177,51 @@ looper:
177
177
  headers: {} # Optional headers (e.g., {"Authorization": "Bearer xxx"})
178
178
 
179
179
  clear_route_cache: true
180
+
181
+ # Model Selection Configuration
182
+ # ML-based algorithms for intelligent model routing within decisions
183
+ # Reference: https://github.com/ulab-uiuc/LLMRouter
184
+ model_selection:
185
+ enabled: true
186
+ # Default algorithm: knn, kmeans, svm
187
+ default_algorithm: "knn"
188
+
189
+ # LLM candidates configuration
190
+ llm_candidates_path: "config/model_selection/llm_candidates.json"
191
+
192
+ # Pre-trained models path (contains saved model weights)
193
+ models_path: "models/model_selection"
194
+
195
+ # Training data path (for custom training)
196
+ training_data_path: "config/model_selection/routing_training_data.jsonl"
197
+
198
+ # Algorithm-specific configurations
199
+ knn:
200
+ k: 5 # Number of neighbors
201
+ weights: "distance" # "uniform" or "distance"
202
+ metric: "cosine" # "cosine", "euclidean", "manhattan"
203
+ # Pre-trained model file (relative to models_path)
204
+ model_file: "knn_model.json"
205
+
206
+ kmeans:
207
+ num_clusters: 8
208
+ efficiency_weight: 0.3 # Balance between quality (0) and efficiency (1)
209
+ max_iterations: 100
210
+ model_file: "kmeans_model.json"
211
+
212
+ svm:
213
+ kernel: "rbf" # "linear", "rbf", "poly"
214
+ c: 1.0 # Regularization parameter
215
+ gamma: "auto" # Kernel coefficient
216
+ model_file: "svm_model.json"
217
+
218
+ # Custom training options
219
+ # Allows customers to train on their own models
220
+ custom_training:
221
+ enabled: false
222
+ # Path to customer-provided training data
223
+ custom_data_path: ""
224
+ # Whether to merge with pre-trained data or replace
225
+ merge_with_pretrained: true
226
+ # Minimum training samples required
227
+ min_samples: 50
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "vllm-sr"
7
- version = "0.1.0.beta.2.dev20260202181733"
7
+ version = "0.1.0.beta.2.dev20260202230157"
8
8
  description = "vLLM Semantic Router - Intelligent routing for Mixture-of-Models"
9
9
  authors = [{name = "vLLM-SR Team"}]
10
10
  readme = "README.md"
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: vllm-sr
3
- Version: 0.1.0b2.dev20260202181733
3
+ Version: 0.1.0b2.dev20260202230157
4
4
  Summary: vLLM Semantic Router - Intelligent routing for Mixture-of-Models
5
5
  Author: vLLM-SR Team
6
6
  License: Apache-2.0