vllm-sr 0.1.0b2.dev20260129021803__tar.gz → 0.1.0b2.dev20260129021916__tar.gz

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
Files changed (46) hide show
  1. {vllm_sr-0.1.0b2.dev20260129021803/vllm_sr.egg-info → vllm_sr-0.1.0b2.dev20260129021916}/PKG-INFO +1 -1
  2. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/router-defaults.yaml +10 -0
  3. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/pyproject.toml +1 -1
  4. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916/vllm_sr.egg-info}/PKG-INFO +1 -1
  5. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/MANIFEST.in +0 -0
  6. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/README.md +0 -0
  7. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/__init__.py +0 -0
  8. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/__init__.py +0 -0
  9. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/config.py +0 -0
  10. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/generate.py +0 -0
  11. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/init.py +0 -0
  12. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/serve.py +0 -0
  13. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/show_config.py +0 -0
  14. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/show_defaults.py +0 -0
  15. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/commands/validate.py +0 -0
  16. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/config_generator.py +0 -0
  17. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/consts.py +0 -0
  18. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/core.py +0 -0
  19. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/defaults.py +0 -0
  20. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/docker_cli.py +0 -0
  21. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/logo.py +0 -0
  22. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/main.py +0 -0
  23. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/merger.py +0 -0
  24. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/models.py +0 -0
  25. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/parser.py +0 -0
  26. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/config.template.yaml +0 -0
  27. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/envoy.template.yaml +0 -0
  28. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/generate_dashboard.py +0 -0
  29. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/grafana-dashboard.serve.yaml +0 -0
  30. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/grafana-datasource-jaeger.serve.yaml +0 -0
  31. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/grafana-datasource.serve.yaml +0 -0
  32. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/grafana.serve.ini +0 -0
  33. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/llm-router-dashboard.serve.json +0 -0
  34. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/prometheus.serve.yaml +0 -0
  35. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/templates/tools_db.json +0 -0
  36. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/utils.py +0 -0
  37. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/cli/validator.py +0 -0
  38. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/requirements.txt +0 -0
  39. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/setup.cfg +0 -0
  40. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/tests/test_plugin_parsing.py +0 -0
  41. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/tests/test_plugin_yaml_generation.py +0 -0
  42. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/vllm_sr.egg-info/SOURCES.txt +0 -0
  43. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/vllm_sr.egg-info/dependency_links.txt +0 -0
  44. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/vllm_sr.egg-info/entry_points.txt +0 -0
  45. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/vllm_sr.egg-info/requires.txt +0 -0
  46. {vllm_sr-0.1.0b2.dev20260129021803 → vllm_sr-0.1.0b2.dev20260129021916}/vllm_sr.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: vllm-sr
3
- Version: 0.1.0b2.dev20260129021803
3
+ Version: 0.1.0b2.dev20260129021916
4
4
  Summary: vLLM Semantic Router - Intelligent routing for Mixture-of-Models
5
5
  Author: vLLM-SR Team
6
6
  License: Apache-2.0
@@ -19,6 +19,16 @@ response_api:
19
19
  ttl_seconds: 86400 # 24 hours
20
20
  max_responses: 1000
21
21
 
22
+ # Router Replay Configuration
23
+ # Records all routing decisions for debugging and analysis
24
+ router_replay:
25
+   enabled: true
26
+   store_backend: "memory" # Options: "memory"
27
+   max_records: 1000
28
+   capture_request_body: true
29
+   capture_response_body: true
30
+   max_body_bytes: 4096
31
+
22
32
  semantic_cache:
23
33
  enabled: true
24
34
  backend_type: "memory" # Options: "memory", "milvus", or "hybrid"
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "vllm-sr"
7
- version = "0.1.0.beta.2.dev20260129021803"
7
+ version = "0.1.0.beta.2.dev20260129021916"
8
8
  description = "vLLM Semantic Router - Intelligent routing for Mixture-of-Models"
9
9
  authors = [{name = "vLLM-SR Team"}]
10
10
  readme = "README.md"
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: vllm-sr
3
- Version: 0.1.0b2.dev20260129021803
3
+ Version: 0.1.0b2.dev20260129021916
4
4
  Summary: vLLM Semantic Router - Intelligent routing for Mixture-of-Models
5
5
  Author: vLLM-SR Team
6
6
  License: Apache-2.0