lmcache 0.4.7__tar.gz → 0.4.8.dev24__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- lmcache-0.4.8.dev24/.buildkite/k3_tests/comprehensive/pipeline.yml +143 -0
- lmcache-0.4.8.dev24/.buildkite/k3_tests/multiprocess/pipeline.yml +221 -0
- lmcache-0.4.8.dev24/.buildkite/k3_tests/sglang/pipeline.yml +54 -0
- lmcache-0.4.8.dev24/.github/scripts/cpu_device_test.sh +156 -0
- lmcache-0.4.8.dev24/.github/scripts/cpu_server_bench_test.sh +139 -0
- lmcache-0.4.8.dev24/.github/scripts/cpu_vllm_e2e_test.sh +84 -0
- lmcache-0.4.8.dev24/.github/scripts/download_model.sh +87 -0
- lmcache-0.4.8.dev24/.github/scripts/run-cpu-e2e-validation.sh +635 -0
- lmcache-0.4.8.dev24/.github/workflows/aerospike_integration.yml +142 -0
- lmcache-0.4.8.dev24/.github/workflows/build_cli_artifacts.yml +95 -0
- lmcache-0.4.8.dev24/.github/workflows/code_quality_checks.yml +68 -0
- lmcache-0.4.8.dev24/.github/workflows/cpu_device.yml +168 -0
- lmcache-0.4.8.dev24/.github/workflows/publish.yml +467 -0
- lmcache-0.4.8.dev24/.github/workflows/test.yml +170 -0
- lmcache-0.4.8.dev24/.gitignore +153 -0
- lmcache-0.4.8.dev24/PKG-INFO +213 -0
- lmcache-0.4.8.dev24/benchmarks/musa/README.md +18 -0
- lmcache-0.4.8.dev24/benchmarks/musa/bench_inprocess_transfer.py +286 -0
- lmcache-0.4.8.dev24/csrc/mem_kernels.cu +1098 -0
- lmcache-0.4.8.dev24/csrc/mem_kernels.cuh +157 -0
- lmcache-0.4.8.dev24/csrc/mp_mem_kernels.cu +390 -0
- lmcache-0.4.8.dev24/csrc/mp_mem_kernels.cuh +90 -0
- lmcache-0.4.8.dev24/csrc/pybind.cpp +123 -0
- lmcache-0.4.8.dev24/csrc/storage_backends/README.md +311 -0
- lmcache-0.4.8.dev24/csrc/storage_backends/aerospike/connector.cpp +533 -0
- lmcache-0.4.8.dev24/csrc/storage_backends/aerospike/connector.h +103 -0
- lmcache-0.4.8.dev24/csrc/storage_backends/aerospike/pybind.cpp +25 -0
- lmcache-0.4.8.dev24/csrc/sycl/mem_kernels_sycl.cpp +1028 -0
- lmcache-0.4.8.dev24/csrc/sycl/mem_kernels_sycl.h +159 -0
- lmcache-0.4.8.dev24/csrc/sycl/pybind_sycl.cpp +77 -0
- lmcache-0.4.8.dev24/docker/Dockerfile +152 -0
- lmcache-0.4.8.dev24/docker/Dockerfile.standalone +151 -0
- lmcache-0.4.8.dev24/docs/design/cli/commands/describe.md +416 -0
- lmcache-0.4.8.dev24/docs/design/integration/vllm/hybrid-kv-cache-groups.md +177 -0
- lmcache-0.4.8.dev24/docs/design/v1/distributed/l2_adapters/l2_per_user_quota.md +850 -0
- lmcache-0.4.8.dev24/docs/design/v1/distributed/serde/README.md +269 -0
- lmcache-0.4.8.dev24/docs/design/v1/gpu_connector/layout-invariant.md +193 -0
- lmcache-0.4.8.dev24/docs/design/v1/mp_observability/EVENTS.md +243 -0
- lmcache-0.4.8.dev24/docs/design/v1/mp_observability/METRICS.md +526 -0
- lmcache-0.4.8.dev24/docs/design/v1/mp_observability/README.md +208 -0
- lmcache-0.4.8.dev24/docs/design/v1/mp_observability/blend_v3_observability.md +207 -0
- lmcache-0.4.8.dev24/docs/design/v1/mp_observability/event-bus.md +203 -0
- lmcache-0.4.8.dev24/docs/design/v1/mp_observability/trace.md +546 -0
- lmcache-0.4.8.dev24/docs/design/v1/multiprocess/engine_driven_transfer_design.md +264 -0
- lmcache-0.4.8.dev24/docs/design/v1/multiprocess/raw_cuda_ipc.md +70 -0
- lmcache-0.4.8.dev24/docs/design/v1/multiprocess/worker_liveness.md +193 -0
- lmcache-0.4.8.dev24/docs/source/_static/custom.css +126 -0
- lmcache-0.4.8.dev24/docs/source/_static/custom.js +283 -0
- lmcache-0.4.8.dev24/docs/source/_static/scroll.css +32 -0
- lmcache-0.4.8.dev24/docs/source/cli/bench.rst +1309 -0
- lmcache-0.4.8.dev24/docs/source/cli/index.rst +108 -0
- lmcache-0.4.8.dev24/docs/source/community/index.rst +11 -0
- lmcache-0.4.8.dev24/docs/source/developer_guide/cli.rst +96 -0
- lmcache-0.4.8.dev24/docs/source/developer_guide/extending_http_api.rst +109 -0
- lmcache-0.4.8.dev24/docs/source/developer_guide/extending_lmcache/native_connectors.rst +686 -0
- lmcache-0.4.8.dev24/docs/source/developer_guide/index.rst +13 -0
- lmcache-0.4.8.dev24/docs/source/developer_guide/usage/index.rst +7 -0
- lmcache-0.4.8.dev24/docs/source/distributed_kv_cache.rst +14 -0
- lmcache-0.4.8.dev24/docs/source/getting_started/benchmarking.rst +157 -0
- lmcache-0.4.8.dev24/docs/source/getting_started/index.rst +16 -0
- lmcache-0.4.8.dev24/docs/source/getting_started/installation.rst +256 -0
- lmcache-0.4.8.dev24/docs/source/getting_started/quickstart.rst +466 -0
- lmcache-0.4.8.dev24/docs/source/index.rst +145 -0
- lmcache-0.4.8.dev24/docs/source/interacting_with_server.rst +12 -0
- lmcache-0.4.8.dev24/docs/source/kv_cache/storage_backends/fs.rst +189 -0
- lmcache-0.4.8.dev24/docs/source/kv_cache_optimizations/cacheblend.rst +26 -0
- lmcache-0.4.8.dev24/docs/source/kv_cache_optimizations/index.rst +11 -0
- lmcache-0.4.8.dev24/docs/source/kv_cache_optimizations/segmented_prefill.rst +6 -0
- lmcache-0.4.8.dev24/docs/source/legacy/index.rst +58 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/cli/bench.po +1740 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/cli/coordinator.po +146 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/cli/describe.po +186 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/cli/index.po +239 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/cli/quota.po +239 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/cli/server.po +216 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/offload_kv_cache.po +349 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/bigtable.po +311 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/dax.po +390 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/fs.po +282 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/hfbucket.po +303 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/nixl.po +376 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/architecture.po +962 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/configuration.po +1058 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/coordinator.po +403 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/http_api.po +1099 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/hybrid_models.po +384 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/index.po +162 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/l2_storage.po +1570 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/observability.po +1638 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/operator.po +1212 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/quickstart.po +252 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/mp/tracing_and_debugging.po +517 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/deepseek_v4_flash.po +157 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/devstral.po +131 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/gemma3.po +163 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/gemma4.po +177 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/gpt_oss.po +135 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/index.po +312 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/llama.po +181 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/minimax_m2.po +159 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/mixtral.po +138 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/phi3.po +138 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/qwen3.po +159 -0
- lmcache-0.4.8.dev24/docs/source/locale/zh_CN/LC_MESSAGES/recipes/qwen3_5.po +220 -0
- lmcache-0.4.8.dev24/docs/source/mp/cachegen.rst +8 -0
- lmcache-0.4.8.dev24/docs/source/mp/configuration.rst +504 -0
- lmcache-0.4.8.dev24/docs/source/mp/coordinator.rst +209 -0
- lmcache-0.4.8.dev24/docs/source/mp/deployment.rst +270 -0
- lmcache-0.4.8.dev24/docs/source/mp/disaggregated_prefill.rst +13 -0
- lmcache-0.4.8.dev24/docs/source/mp/http_api.rst +840 -0
- lmcache-0.4.8.dev24/docs/source/mp/hybrid_models.rst +248 -0
- lmcache-0.4.8.dev24/docs/source/mp/index.rst +609 -0
- lmcache-0.4.8.dev24/docs/source/mp/kv_cache_management.rst +13 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/aerospike.rst +63 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/dax.rst +101 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/file_and_block.rst +13 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/fs.rst +32 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/fs_native.rst +82 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/hfbucket.rst +52 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/index.rst +343 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/mock.rst +14 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/mooncake_store.rst +111 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/nixl.rst +135 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/raw_block.rst +76 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/remote_and_distributed.rst +14 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/resp.rst +34 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/s3.rst +40 -0
- lmcache-0.4.8.dev24/docs/source/mp/l2_storage/supported_storages.rst +57 -0
- lmcache-0.4.8.dev24/docs/source/mp/observability/index.rst +104 -0
- lmcache-0.4.8.dev24/docs/source/mp/observability/logs.rst +34 -0
- lmcache-0.4.8.dev24/docs/source/mp/observability/metrics.rst +532 -0
- lmcache-0.4.8.dev24/docs/source/mp/observability/traces.rst +192 -0
- lmcache-0.4.8.dev24/docs/source/mp/operator.rst +841 -0
- lmcache-0.4.8.dev24/docs/source/mp/p2p.rst +12 -0
- lmcache-0.4.8.dev24/docs/source/mp/serde.rst +140 -0
- lmcache-0.4.8.dev24/docs/source/mp/tracing_and_debugging.rst +330 -0
- lmcache-0.4.8.dev24/docs/source/non_kv_cache/encodings.rst +9 -0
- lmcache-0.4.8.dev24/docs/source/non_kv_cache/hidden_states.rst +6 -0
- lmcache-0.4.8.dev24/docs/source/non_kv_cache/index.rst +10 -0
- lmcache-0.4.8.dev24/docs/source/production/dynamo_coordination.rst +7 -0
- lmcache-0.4.8.dev24/docs/source/production/index.rst +13 -0
- lmcache-0.4.8.dev24/docs/source/recipes/deepseek_v4_flash.rst +107 -0
- lmcache-0.4.8.dev24/docs/source/recipes/devstral.rst +80 -0
- lmcache-0.4.8.dev24/docs/source/recipes/gemma3.rst +95 -0
- lmcache-0.4.8.dev24/docs/source/recipes/gemma4.rst +100 -0
- lmcache-0.4.8.dev24/docs/source/recipes/gpt_oss.rst +93 -0
- lmcache-0.4.8.dev24/docs/source/recipes/index.rst +22 -0
- lmcache-0.4.8.dev24/docs/source/recipes/llama.rst +132 -0
- lmcache-0.4.8.dev24/docs/source/recipes/minimax_m2.rst +119 -0
- lmcache-0.4.8.dev24/docs/source/recipes/mixtral.rst +92 -0
- lmcache-0.4.8.dev24/docs/source/recipes/phi3.rst +90 -0
- lmcache-0.4.8.dev24/docs/source/recipes/qwen3.rst +124 -0
- lmcache-0.4.8.dev24/docs/source/recipes/qwen3_5.rst +124 -0
- lmcache-0.4.8.dev24/docs/source/recipes/uniform_attention_models.rst +116 -0
- lmcache-0.4.8.dev24/lmcache/_version.py +24 -0
- lmcache-0.4.8.dev24/lmcache/cli/commands/bench/server_bench/command.py +719 -0
- lmcache-0.4.8.dev24/lmcache/cli/commands/bench/server_bench/helpers.py +1125 -0
- lmcache-0.4.8.dev24/lmcache/cli/commands/describe.py +340 -0
- lmcache-0.4.8.dev24/lmcache/integration/sglang/multi_process_adapter.py +544 -0
- lmcache-0.4.8.dev24/lmcache/integration/sglang/sglang_adapter.py +376 -0
- lmcache-0.4.8.dev24/lmcache/integration/tensorrt_llm/tensorrt_mp_adapter.py +488 -0
- lmcache-0.4.8.dev24/lmcache/integration/vllm/kv_cache_groups.py +190 -0
- lmcache-0.4.8.dev24/lmcache/integration/vllm/lmcache_mp_connector_0180.py +1080 -0
- lmcache-0.4.8.dev24/lmcache/integration/vllm/lmcache_mp_connector_0201.py +1201 -0
- lmcache-0.4.8.dev24/lmcache/integration/vllm/vllm_multi_process_adapter.py +1634 -0
- lmcache-0.4.8.dev24/lmcache/python_ops_fallback.py +2629 -0
- lmcache-0.4.8.dev24/lmcache/v1/distributed/api.py +277 -0
- lmcache-0.4.8.dev24/lmcache/v1/distributed/l2_adapters/aerospike_l2_adapter.py +239 -0
- lmcache-0.4.8.dev24/lmcache/v1/distributed/serde/__init__.py +55 -0
- lmcache-0.4.8.dev24/lmcache/v1/distributed/serde/asym_k16_v8.py +537 -0
- lmcache-0.4.8.dev24/lmcache/v1/distributed/serde/async_processor.py +233 -0
- lmcache-0.4.8.dev24/lmcache/v1/distributed/serde/multi.py +293 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/__init__.py +247 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/gpu_connectors.py +2218 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/hpu_connector.py +337 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/musa_connectors.py +825 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/musa_native.py +218 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/utils.py +1613 -0
- lmcache-0.4.8.dev24/lmcache/v1/gpu_connector/xpu_connectors.py +1796 -0
- lmcache-0.4.8.dev24/lmcache/v1/kv_codec/__init__.py +63 -0
- lmcache-0.4.8.dev24/lmcache/v1/kv_codec/asym_k16_v8.py +473 -0
- lmcache-0.4.8.dev24/lmcache/v1/kv_codec/encoded_kv.py +403 -0
- lmcache-0.4.8.dev24/lmcache/v1/kv_codec/errors.py +39 -0
- lmcache-0.4.8.dev24/lmcache/v1/kv_layer_groups.py +817 -0
- lmcache-0.4.8.dev24/lmcache/v1/memory_management.py +2885 -0
- lmcache-0.4.8.dev24/lmcache/v1/metadata.py +118 -0
- lmcache-0.4.8.dev24/lmcache/v1/mp_coordinator/http_apis/instances_api.py +136 -0
- lmcache-0.4.8.dev24/lmcache/v1/mp_coordinator/registry.py +161 -0
- lmcache-0.4.8.dev24/lmcache/v1/mp_coordinator/schemas.py +286 -0
- lmcache-0.4.8.dev24/lmcache/v1/mp_observability/README.md +208 -0
- lmcache-0.4.8.dev24/lmcache/v1/mp_observability/otel_init.py +219 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/config.py +489 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/custom_types.py +428 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/engine_context.py +247 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/engine_module.py +65 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/http_apis/cache_api.py +263 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/blend.py +1185 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/blend_v3.py +1522 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/engine_driven_transfer.py +444 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/lmcache_driven_transfer.py +968 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/lookup.py +467 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/management.py +129 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/modules/server_transfer.py +440 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/native_completion.py +150 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/protocol.py +86 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/protocols/base.py +101 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/protocols/blend.py +109 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/protocols/blend_v2.py +57 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/protocols/blend_v3.py +69 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/protocols/engine.py +240 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/server.py +390 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/session.py +191 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/token_hasher.py +450 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/transfer_context/__init__.py +43 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/transfer_context/base.py +714 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/transfer_context/pickle.py +110 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/transfer_context/shm.py +218 -0
- lmcache-0.4.8.dev24/lmcache/v1/multiprocess/transfer_context/worker_transfer.py +550 -0
- lmcache-0.4.8.dev24/lmcache/v1/periodic_thread.py +584 -0
- lmcache-0.4.8.dev24/lmcache/v1/platform/__init__.py +69 -0
- lmcache-0.4.8.dev24/lmcache/v1/platform/base_cache_context.py +339 -0
- lmcache-0.4.8.dev24/lmcache/v1/platform/cache_context.py +205 -0
- lmcache-0.4.8.dev24/lmcache/v1/platform/cpu/cache_context.py +443 -0
- lmcache-0.4.8.dev24/lmcache/v1/platform/cuda/cache_context.py +631 -0
- lmcache-0.4.8.dev24/lmcache/v1/storage_backend/native_clients/aerospike_client.py +74 -0
- lmcache-0.4.8.dev24/lmcache/v1/utils/subclass_discovery.py +219 -0
- lmcache-0.4.8.dev24/lmcache.egg-info/PKG-INFO +213 -0
- lmcache-0.4.8.dev24/lmcache.egg-info/SOURCES.txt +1829 -0
- lmcache-0.4.8.dev24/lmcache.egg-info/requires.txt +35 -0
- lmcache-0.4.8.dev24/operator/DESIGN.md +499 -0
- lmcache-0.4.8.dev24/operator/Makefile +55 -0
- lmcache-0.4.8.dev24/operator/internal/controller/reconcile_helpers_test.go +741 -0
- lmcache-0.4.8.dev24/operator/make/dev.mk +17 -0
- lmcache-0.4.8.dev24/operator/make/unit.mk +47 -0
- lmcache-0.4.8.dev24/setup.py +52 -0
- lmcache-0.4.8.dev24/setup_extensions/__init__.py +24 -0
- lmcache-0.4.8.dev24/setup_extensions/build_profiles/__init__.py +151 -0
- lmcache-0.4.8.dev24/setup_extensions/build_profiles/cuda.py +93 -0
- lmcache-0.4.8.dev24/setup_extensions/build_profiles/musa.py +36 -0
- lmcache-0.4.8.dev24/setup_extensions/build_profiles/rocm.py +125 -0
- lmcache-0.4.8.dev24/setup_extensions/build_profiles/sycl.py +91 -0
- lmcache-0.4.8.dev24/setup_extensions/common_cpp.py +97 -0
- lmcache-0.4.8.dev24/setup_extensions/policy.py +249 -0
- lmcache-0.4.8.dev24/setup_extensions/storage_backend_profiles/__init__.py +59 -0
- lmcache-0.4.8.dev24/setup_extensions/storage_backend_profiles/aerospike.py +95 -0
- lmcache-0.4.8.dev24/setup_extensions/storage_backend_profiles/mooncake.py +65 -0
- lmcache-0.4.8.dev24/tests/aerospike_ce.conf.template +53 -0
- lmcache-0.4.8.dev24/tests/benchmarks/test_musa_inprocess_benchmark.py +37 -0
- lmcache-0.4.8.dev24/tests/cli/test_describe.py +385 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/serde/test_asym_k16_v8_multi.py +195 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/serde/test_asym_k16_v8_v_only.py +237 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/serde/test_async_processor.py +256 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/serde/test_multi.py +449 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/test_aerospike_l2_adapter_config.py +92 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/test_aerospike_l2_integration.py +149 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/test_fs_l2_adapter_keys.py +323 -0
- lmcache-0.4.8.dev24/tests/v1/distributed/test_object_key_parallel.py +734 -0
- lmcache-0.4.8.dev24/tests/v1/gpu_connector/test_blocks_first_fused_kv_format.py +182 -0
- lmcache-0.4.8.dev24/tests/v1/gpu_connector/test_concrete_shape.py +68 -0
- lmcache-0.4.8.dev24/tests/v1/gpu_connector/test_utils_shape_desc.py +236 -0
- lmcache-0.4.8.dev24/tests/v1/mp_coordinator/test_api.py +130 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/http_apis/test_common_api.py +156 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_batched_iteration_with_skip.py +112 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_cache_server.py +753 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_custom_types.py +285 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_engine_driven_transfer.py +1290 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_engine_passthroughs.py +56 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_free_locks.py +270 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_http_api_registry.py +195 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_http_server.py +305 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_lmcache_driven_layout_registry.py +126 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_mq.py +872 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_session.py +334 -0
- lmcache-0.4.8.dev24/tests/v1/multiprocess/test_unified_touch.py +335 -0
- lmcache-0.4.8.dev24/tests/v1/platform/test_cache_context_dispatch.py +192 -0
- lmcache-0.4.8.dev24/tests/v1/platform/test_gpu_cache_context.py +553 -0
- lmcache-0.4.8.dev24/tests/v1/storage_backend/test_dax_backend.py +2087 -0
- lmcache-0.4.8.dev24/tests/v1/test_gpu_connector.py +961 -0
- lmcache-0.4.8.dev24/tests/v1/test_kv_layer_groups_manager.py +556 -0
- lmcache-0.4.8.dev24/tests/v1/test_mem_kernels.py +971 -0
- lmcache-0.4.8.dev24/tests/v1/test_memory_management.py +1122 -0
- lmcache-0.4.8.dev24/tests/v1/test_mp_mem_kernels.py +471 -0
- lmcache-0.4.8.dev24/tests/v1/test_musa_connector.py +1023 -0
- lmcache-0.4.8.dev24/tests/v1/test_musa_native.py +200 -0
- lmcache-0.4.8.dev24/tests/v1/test_musa_support.py +279 -0
- lmcache-0.4.8.dev24/tests/v1/test_python_ops_fallback.py +2867 -0
- lmcache-0.4.8.dev24/tests/v1/test_subclass_discovery.py +612 -0
- lmcache-0.4.8.dev24/tests/v1/test_trtllm_integration.py +394 -0
- lmcache-0.4.8.dev24/tests/v1/test_vllm_mp_adapter.py +742 -0
- lmcache-0.4.8.dev24/tests/v1/test_xpu_connector.py +836 -0
- lmcache-0.4.8.dev24/tests/v1/test_xpu_sglang_connector.py +898 -0
- lmcache-0.4.8.dev24/tests/v1/utils.py +857 -0
- lmcache-0.4.7/.buildkite/k3_tests/comprehensive/pipeline.yml +0 -126
- lmcache-0.4.7/.buildkite/k3_tests/multiprocess/pipeline.yml +0 -221
- lmcache-0.4.7/.buildkite/k3_tests/sglang/pipeline.yml +0 -48
- lmcache-0.4.7/.github/scripts/cpu_device_test.sh +0 -156
- lmcache-0.4.7/.github/scripts/cpu_server_bench_test.sh +0 -138
- lmcache-0.4.7/.github/scripts/cpu_vllm_e2e_test.sh +0 -88
- lmcache-0.4.7/.github/scripts/download_model.sh +0 -79
- lmcache-0.4.7/.github/scripts/run-cpu-e2e-validation.sh +0 -626
- lmcache-0.4.7/.github/workflows/build_cli_artifacts.yml +0 -95
- lmcache-0.4.7/.github/workflows/code_quality_checks.yml +0 -69
- lmcache-0.4.7/.github/workflows/cpu_device.yml +0 -159
- lmcache-0.4.7/.github/workflows/publish.yml +0 -450
- lmcache-0.4.7/.github/workflows/test.yml +0 -171
- lmcache-0.4.7/.gitignore +0 -149
- lmcache-0.4.7/PKG-INFO +0 -215
- lmcache-0.4.7/csrc/mem_kernels.cu +0 -1089
- lmcache-0.4.7/csrc/mem_kernels.cuh +0 -157
- lmcache-0.4.7/csrc/mp_mem_kernels.cu +0 -390
- lmcache-0.4.7/csrc/mp_mem_kernels.cuh +0 -90
- lmcache-0.4.7/csrc/pybind.cpp +0 -121
- lmcache-0.4.7/csrc/storage_backends/README.md +0 -288
- lmcache-0.4.7/csrc/sycl/mem_kernels_sycl.cpp +0 -806
- lmcache-0.4.7/csrc/sycl/mem_kernels_sycl.h +0 -145
- lmcache-0.4.7/csrc/sycl/pybind_sycl.cpp +0 -64
- lmcache-0.4.7/docker/Dockerfile +0 -146
- lmcache-0.4.7/docker/Dockerfile.standalone +0 -150
- lmcache-0.4.7/docs/design/cli/commands/describe.md +0 -416
- lmcache-0.4.7/docs/design/integration/vllm/hybrid-kv-cache-groups.md +0 -177
- lmcache-0.4.7/docs/design/v1/distributed/l2_adapters/l2_per_user_quota.md +0 -850
- lmcache-0.4.7/docs/design/v1/distributed/serde/README.md +0 -177
- lmcache-0.4.7/docs/design/v1/gpu_connector/layout-invariant.md +0 -193
- lmcache-0.4.7/docs/design/v1/mp_observability/EVENTS.md +0 -243
- lmcache-0.4.7/docs/design/v1/mp_observability/METRICS.md +0 -526
- lmcache-0.4.7/docs/design/v1/mp_observability/README.md +0 -208
- lmcache-0.4.7/docs/design/v1/mp_observability/blend_v3_observability.md +0 -207
- lmcache-0.4.7/docs/design/v1/mp_observability/event-bus.md +0 -203
- lmcache-0.4.7/docs/design/v1/mp_observability/trace.md +0 -546
- lmcache-0.4.7/docs/design/v1/multiprocess/non_gpu_context_design.md +0 -260
- lmcache-0.4.7/docs/design/v1/multiprocess/raw_cuda_ipc.md +0 -70
- lmcache-0.4.7/docs/source/_static/custom.css +0 -110
- lmcache-0.4.7/docs/source/_static/custom.js +0 -167
- lmcache-0.4.7/docs/source/_static/scroll.css +0 -17
- lmcache-0.4.7/docs/source/cli/bench.rst +0 -1232
- lmcache-0.4.7/docs/source/cli/index.rst +0 -107
- lmcache-0.4.7/docs/source/developer_guide/cli.rst +0 -129
- lmcache-0.4.7/docs/source/developer_guide/docker_file.rst +0 -24
- lmcache-0.4.7/docs/source/developer_guide/extending_lmcache/index.rst +0 -130
- lmcache-0.4.7/docs/source/developer_guide/extending_lmcache/native_connectors.rst +0 -642
- lmcache-0.4.7/docs/source/developer_guide/usage/index.rst +0 -8
- lmcache-0.4.7/docs/source/getting_started/benchmarking.rst +0 -157
- lmcache-0.4.7/docs/source/getting_started/faq.rst +0 -41
- lmcache-0.4.7/docs/source/getting_started/installation.rst +0 -251
- lmcache-0.4.7/docs/source/getting_started/quickstart.rst +0 -441
- lmcache-0.4.7/docs/source/getting_started/troubleshoot.rst +0 -4
- lmcache-0.4.7/docs/source/index.rst +0 -214
- lmcache-0.4.7/docs/source/kv_cache/storage_backends/fs.rst +0 -189
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/cli/bench.po +0 -1679
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/cli/coordinator.po +0 -111
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/cli/describe.po +0 -183
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/cli/index.po +0 -233
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/cli/server.po +0 -196
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/offload_kv_cache.po +0 -301
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/dax.po +0 -274
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/hfbucket.po +0 -168
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/nixl.po +0 -329
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/architecture.po +0 -912
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/configuration.po +0 -999
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/coordinator.po +0 -222
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/http_api.po +0 -955
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/hybrid_models.po +0 -180
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/index.po +0 -158
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/l2_storage.po +0 -1272
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/observability.po +0 -1643
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/operator.po +0 -978
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/quickstart.po +0 -201
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/mp/tracing_and_debugging.po +0 -469
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/devstral.po +0 -124
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/gemma3.po +0 -151
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/gemma4.po +0 -163
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/gpt_oss.po +0 -130
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/index.po +0 -276
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/llama.po +0 -165
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/minimax_m2.po +0 -150
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/mixtral.po +0 -131
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/phi3.po +0 -131
- lmcache-0.4.7/docs/source/locale/zh_CN/LC_MESSAGES/recipes/qwen3.po +0 -150
- lmcache-0.4.7/docs/source/mp/architecture.rst +0 -484
- lmcache-0.4.7/docs/source/mp/configuration.rst +0 -563
- lmcache-0.4.7/docs/source/mp/coordinator.rst +0 -208
- lmcache-0.4.7/docs/source/mp/deployment.rst +0 -269
- lmcache-0.4.7/docs/source/mp/http_api.rst +0 -840
- lmcache-0.4.7/docs/source/mp/hybrid_models.rst +0 -210
- lmcache-0.4.7/docs/source/mp/index.rst +0 -67
- lmcache-0.4.7/docs/source/mp/l2_storage.rst +0 -971
- lmcache-0.4.7/docs/source/mp/observability.rst +0 -857
- lmcache-0.4.7/docs/source/mp/operator.rst +0 -841
- lmcache-0.4.7/docs/source/mp/quickstart.rst +0 -244
- lmcache-0.4.7/docs/source/mp/serde.rst +0 -129
- lmcache-0.4.7/docs/source/mp/tracing_and_debugging.rst +0 -330
- lmcache-0.4.7/docs/source/recipes/deepseek_v4_flash.rst +0 -107
- lmcache-0.4.7/docs/source/recipes/devstral.rst +0 -80
- lmcache-0.4.7/docs/source/recipes/gemma3.rst +0 -95
- lmcache-0.4.7/docs/source/recipes/gemma4.rst +0 -100
- lmcache-0.4.7/docs/source/recipes/gpt_oss.rst +0 -93
- lmcache-0.4.7/docs/source/recipes/index.rst +0 -160
- lmcache-0.4.7/docs/source/recipes/llama.rst +0 -132
- lmcache-0.4.7/docs/source/recipes/minimax_m2.rst +0 -119
- lmcache-0.4.7/docs/source/recipes/mixtral.rst +0 -92
- lmcache-0.4.7/docs/source/recipes/phi3.rst +0 -90
- lmcache-0.4.7/docs/source/recipes/qwen3.rst +0 -124
- lmcache-0.4.7/docs/source/recipes/qwen3_5.rst +0 -124
- lmcache-0.4.7/lmcache/_version.py +0 -24
- lmcache-0.4.7/lmcache/cli/commands/bench/server_bench/command.py +0 -575
- lmcache-0.4.7/lmcache/cli/commands/bench/server_bench/helpers.py +0 -1093
- lmcache-0.4.7/lmcache/cli/commands/describe.py +0 -340
- lmcache-0.4.7/lmcache/integration/sglang/multi_process_adapter.py +0 -544
- lmcache-0.4.7/lmcache/integration/sglang/sglang_adapter.py +0 -346
- lmcache-0.4.7/lmcache/integration/tensorrt_llm/tensorrt_mp_adapter.py +0 -488
- lmcache-0.4.7/lmcache/integration/vllm/kv_cache_groups.py +0 -190
- lmcache-0.4.7/lmcache/integration/vllm/lmcache_mp_connector_0180.py +0 -1080
- lmcache-0.4.7/lmcache/integration/vllm/lmcache_mp_connector_0201.py +0 -1201
- lmcache-0.4.7/lmcache/integration/vllm/vllm_multi_process_adapter.py +0 -1534
- lmcache-0.4.7/lmcache/python_ops_fallback.py +0 -2625
- lmcache-0.4.7/lmcache/v1/distributed/api.py +0 -277
- lmcache-0.4.7/lmcache/v1/distributed/serde/__init__.py +0 -39
- lmcache-0.4.7/lmcache/v1/distributed/serde/async_processor.py +0 -218
- lmcache-0.4.7/lmcache/v1/gpu_connector/__init__.py +0 -208
- lmcache-0.4.7/lmcache/v1/gpu_connector/gpu_connectors.py +0 -2212
- lmcache-0.4.7/lmcache/v1/gpu_connector/hpu_connector.py +0 -337
- lmcache-0.4.7/lmcache/v1/gpu_connector/musa_connectors.py +0 -346
- lmcache-0.4.7/lmcache/v1/gpu_connector/utils.py +0 -1600
- lmcache-0.4.7/lmcache/v1/gpu_connector/xpu_connectors.py +0 -1229
- lmcache-0.4.7/lmcache/v1/kv_layer_groups.py +0 -817
- lmcache-0.4.7/lmcache/v1/memory_management.py +0 -2810
- lmcache-0.4.7/lmcache/v1/metadata.py +0 -118
- lmcache-0.4.7/lmcache/v1/mp_coordinator/http_apis/instances_api.py +0 -134
- lmcache-0.4.7/lmcache/v1/mp_coordinator/registry.py +0 -158
- lmcache-0.4.7/lmcache/v1/mp_coordinator/schemas.py +0 -282
- lmcache-0.4.7/lmcache/v1/mp_observability/README.md +0 -208
- lmcache-0.4.7/lmcache/v1/mp_observability/otel_init.py +0 -219
- lmcache-0.4.7/lmcache/v1/multiprocess/config.py +0 -489
- lmcache-0.4.7/lmcache/v1/multiprocess/custom_types.py +0 -428
- lmcache-0.4.7/lmcache/v1/multiprocess/engine_context.py +0 -247
- lmcache-0.4.7/lmcache/v1/multiprocess/engine_module.py +0 -65
- lmcache-0.4.7/lmcache/v1/multiprocess/gpu_context.py +0 -841
- lmcache-0.4.7/lmcache/v1/multiprocess/http_apis/cache_api.py +0 -263
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/blend.py +0 -1185
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/blend_v3.py +0 -1522
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/gpu_transfer.py +0 -968
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/lookup.py +0 -467
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/management.py +0 -129
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/non_gpu_transfer.py +0 -440
- lmcache-0.4.7/lmcache/v1/multiprocess/modules/server_transfer.py +0 -440
- lmcache-0.4.7/lmcache/v1/multiprocess/native_completion.py +0 -150
- lmcache-0.4.7/lmcache/v1/multiprocess/protocol.py +0 -86
- lmcache-0.4.7/lmcache/v1/multiprocess/protocols/base.py +0 -101
- lmcache-0.4.7/lmcache/v1/multiprocess/protocols/blend.py +0 -109
- lmcache-0.4.7/lmcache/v1/multiprocess/protocols/blend_v2.py +0 -57
- lmcache-0.4.7/lmcache/v1/multiprocess/protocols/blend_v3.py +0 -69
- lmcache-0.4.7/lmcache/v1/multiprocess/protocols/engine.py +0 -240
- lmcache-0.4.7/lmcache/v1/multiprocess/server.py +0 -375
- lmcache-0.4.7/lmcache/v1/multiprocess/session.py +0 -191
- lmcache-0.4.7/lmcache/v1/multiprocess/token_hasher.py +0 -450
- lmcache-0.4.7/lmcache/v1/multiprocess/transfer_context/__init__.py +0 -43
- lmcache-0.4.7/lmcache/v1/multiprocess/transfer_context/base.py +0 -714
- lmcache-0.4.7/lmcache/v1/multiprocess/transfer_context/pickle.py +0 -110
- lmcache-0.4.7/lmcache/v1/multiprocess/transfer_context/shm.py +0 -218
- lmcache-0.4.7/lmcache/v1/multiprocess/transfer_context/worker_transfer.py +0 -536
- lmcache-0.4.7/lmcache/v1/periodic_thread.py +0 -579
- lmcache-0.4.7/lmcache/v1/platform/__init__.py +0 -33
- lmcache-0.4.7/lmcache/v1/platform/cache_context.py +0 -85
- lmcache-0.4.7/lmcache/v1/platform/cpu/cache_context.py +0 -642
- lmcache-0.4.7/lmcache/v1/utils/subclass_discovery.py +0 -106
- lmcache-0.4.7/lmcache.egg-info/PKG-INFO +0 -215
- lmcache-0.4.7/lmcache.egg-info/SOURCES.txt +0 -1754
- lmcache-0.4.7/lmcache.egg-info/requires.txt +0 -39
- lmcache-0.4.7/operator/DESIGN.md +0 -499
- lmcache-0.4.7/operator/Makefile +0 -54
- lmcache-0.4.7/operator/internal/controller/reconcile_helpers_test.go +0 -47
- lmcache-0.4.7/operator/make/dev.mk +0 -21
- lmcache-0.4.7/setup.py +0 -480
- lmcache-0.4.7/tests/cli/test_describe.py +0 -385
- lmcache-0.4.7/tests/v1/distributed/serde/test_async_processor.py +0 -141
- lmcache-0.4.7/tests/v1/distributed/test_fs_l2_adapter_keys.py +0 -323
- lmcache-0.4.7/tests/v1/distributed/test_object_key_parallel.py +0 -734
- lmcache-0.4.7/tests/v1/gpu_connector/test_blocks_first_fused_kv_format.py +0 -182
- lmcache-0.4.7/tests/v1/gpu_connector/test_concrete_shape.py +0 -68
- lmcache-0.4.7/tests/v1/gpu_connector/test_utils_shape_desc.py +0 -236
- lmcache-0.4.7/tests/v1/mp_coordinator/test_api.py +0 -104
- lmcache-0.4.7/tests/v1/multiprocess/http_apis/test_common_api.py +0 -156
- lmcache-0.4.7/tests/v1/multiprocess/test_batched_iteration_with_skip.py +0 -112
- lmcache-0.4.7/tests/v1/multiprocess/test_cache_server.py +0 -753
- lmcache-0.4.7/tests/v1/multiprocess/test_custom_types.py +0 -285
- lmcache-0.4.7/tests/v1/multiprocess/test_engine_passthroughs.py +0 -56
- lmcache-0.4.7/tests/v1/multiprocess/test_free_locks.py +0 -270
- lmcache-0.4.7/tests/v1/multiprocess/test_gpu_context.py +0 -551
- lmcache-0.4.7/tests/v1/multiprocess/test_gpu_transfer_layout_registry.py +0 -118
- lmcache-0.4.7/tests/v1/multiprocess/test_http_api_registry.py +0 -195
- lmcache-0.4.7/tests/v1/multiprocess/test_http_server.py +0 -302
- lmcache-0.4.7/tests/v1/multiprocess/test_mq.py +0 -872
- lmcache-0.4.7/tests/v1/multiprocess/test_non_cuda_data_transfer.py +0 -1254
- lmcache-0.4.7/tests/v1/multiprocess/test_session.py +0 -334
- lmcache-0.4.7/tests/v1/multiprocess/test_unified_touch.py +0 -335
- lmcache-0.4.7/tests/v1/storage_backend/test_dax_backend.py +0 -2087
- lmcache-0.4.7/tests/v1/test_gpu_connector.py +0 -958
- lmcache-0.4.7/tests/v1/test_kv_layer_groups_manager.py +0 -556
- lmcache-0.4.7/tests/v1/test_mem_kernels.py +0 -970
- lmcache-0.4.7/tests/v1/test_memory_management.py +0 -958
- lmcache-0.4.7/tests/v1/test_mp_mem_kernels.py +0 -465
- lmcache-0.4.7/tests/v1/test_musa_connector.py +0 -537
- lmcache-0.4.7/tests/v1/test_musa_support.py +0 -250
- lmcache-0.4.7/tests/v1/test_python_ops_fallback.py +0 -2861
- lmcache-0.4.7/tests/v1/test_subclass_discovery.py +0 -330
- lmcache-0.4.7/tests/v1/test_trtllm_integration.py +0 -390
- lmcache-0.4.7/tests/v1/test_vllm_mp_adapter.py +0 -293
- lmcache-0.4.7/tests/v1/test_xpu_connector.py +0 -833
- lmcache-0.4.7/tests/v1/utils.py +0 -856
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/cases/comprehensive-cases.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/cases/integration-cases.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/async.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/dummy.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/layerwise.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/lmcache_configs/local_cpu_mla.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/local_cpu.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/local_cpu_mla.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/local_cpu_with_v3.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/local_disk.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/local_disk_with_v3.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/multi_device.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/p2p.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/p2p_with_v3.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/configs/pd.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/async_request.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/compare_files.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/mmlu-test.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/pipeline.correctness.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/pipeline.mmlu.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/setup.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/sharegpt2openai.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/correctness/summarize-results.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/ARCHITECTURE.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/ci-base.Dockerfile +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/gpu-monitor.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/install-agent-stack.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/setup-cluster.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/setup-env.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/setup-gpu-monitor.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/setup-lmcache-only-env.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/setup-sglang-env.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/smoke-test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/teardown.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_harness/values.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/common_scripts/helpers.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/common_scripts/path-filter.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/common_scripts/upload-pipeline.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/comprehensive/BK_WEB_SETUP.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/comprehensive/buildkite-pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/comprehensive/run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/comprehensive/scripts/run-single-config.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/comprehensive/scripts/upload-baselines.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/correctness/BK_WEB_SETUP.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/correctness/buildkite-pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/correctness/pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/correctness/run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/correctness/scripts/run-correctness.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/integration/BK_WEB_SETUP.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/integration/buildkite-pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/integration/pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/integration/run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/integration/scripts/run-integration.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/BK_WEB_SETUP.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/buildkite-pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/cleanup.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/launch-processes.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-cache-stats.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-deadlock.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-fault-tolerance.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-gds-smoke.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-hma-lm-eval.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-http-api.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-lm-eval.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-long-doc-qa-l2.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-long-doc-qa.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-mp-test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-restart-recovery.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-single-test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/run-vllm-bench.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/multiprocess/scripts/wait-for-servers.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/sglang/BK_WEB_SETUP.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/sglang/buildkite-pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/sglang/run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/sglang/scripts/common.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/sglang/scripts/run-correctness.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/sglang/scripts/run-perf.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/unit/buildkite-pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/unit/pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/k3_tests/unit/run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/operator/integration/pipeline.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/operator/integration/tests.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/pipeline.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/pipelines/clean.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/pipelines/comprehensive-tests.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/pipelines/end-to-end-tests.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/pipelines/multiprocessing-test.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/bare-machine-cleanup.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/clean.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/end-to-end-test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/gpu_zombie_killer.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multi-round-qa.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/build-mp-docker-image.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/cleanup.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/common.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/launch-containers.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/run-fault-tolerance.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/run-lm-eval.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/run-long-doc-qa.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/run-mp-test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/run-vllm-bench.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/test-launch.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/multiprocessing-test/wait-for-vllm.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/pick-free-gpu-amd.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/pick-free-gpu.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/should-run-comprehensive.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/vllm-correctness.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/scripts/vllm-integration-tests.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.buildkite/vllm-integration-tests.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.clang-format +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.claude/skills/create-pr/SKILL.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.claude/skills/pr-review/SKILL.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.claude/skills/pre-pr-check/SKILL.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.cursor/BUGBOT.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.gemini/styleguide.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/CODEOWNERS +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/ISSUE_TEMPLATE/blank_issue.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/PULL_REQUEST_TEMPLATE.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/actions/free-disk-space/action.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/dependabot.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/scripts/install_lmcache_cpu.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/scripts/install_vllm_cpu.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/actionlint.dockerfile +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/actionlint.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/automerge-labeler.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/build_cpu_artifacts.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/build_cu129_artifacts.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/build_doc.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/build_main_artifacts.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/codeql.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/matchers/actionlint.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/matchers/mypy.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/nightly_build.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/operator_ci.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/operator_nightly.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/operator_release.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/pr_full_build.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/scorecard.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/stale_bot.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/sync_torch_version.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.github/workflows/translate_doc_zh.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.isort.cfg +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/.pre-commit-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/AGENTS.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/CLAUDE.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/CMakeLists.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/CODE_OF_CONDUCT.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/CONTRIBUTING.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/DCO +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/LICENSE +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/MAINTAINERS.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/MANIFEST.in +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/SECURITY.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/asset/deployment_modes_dark.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/asset/deployment_modes_light.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/asset/ecosystem.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/asset/logo.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/asset/partner_dark.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/asset/partner_light.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/long_doc_qa/long_doc_qa.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/long_doc_qa/long_doc_qa_recommender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/microbenchmark/ttl_lock_benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_doc_qa/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_doc_qa/lmcache.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_doc_qa/lmcache_blend.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_doc_qa/multi_doc_qa.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_doc_qa/shuffle_doc_qa.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_round_qa/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_round_qa/data_preprocessing.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_round_qa/multi-round-qa.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_round_qa/prepare_sharegpt_data.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_round_qa/requirements.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/multi_round_qa/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/launch_lmcache.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/launch_vllm.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/precompute.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/rag.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/requirements.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/rag/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/storage_backend_io/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/storage_backend_io/storage_backend_io_benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/ttft-estimator/llama-h100-example.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/benchmarks/ttft-estimator/ttft-estimator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/ac_dec.cu +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/ac_enc.cu +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/cachegen_kernels.cuh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/cal_cdf.cu +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/completion_recorder.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/completion_recorder.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/cuda_compat.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/dispatch_utils.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/event_recorder.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/event_recorder.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/mem_alloc.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/mem_alloc.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/pos_kernels.cu +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/pos_kernels.cuh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/connector_base.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/connector_interface.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/connector_pybind_utils.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/connector_types.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/event_notifier.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/fs/connector.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/fs/connector.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/fs/pybind.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/mooncake/connector.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/mooncake/connector.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/mooncake/pybind.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/redis/connector.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/redis/connector.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_backends/redis/pybind.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/bitmap.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/bitmap.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/periodic_event_notifier.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/periodic_event_notifier.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/pybind.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/ttl_lock.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/ttl_lock.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/utils.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/storage_manager/utils.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/sycl/ac_dec_sycl.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/sycl/ac_enc_sycl.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/sycl/cachegen_kernels_sycl.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/sycl/cal_cdf_sycl.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/sycl/pos_kernels_sycl.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/utils.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/csrc/utils.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docker/Dockerfile.lightweight +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docker/Dockerfile.rocm +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docker/Dockerfile.rocm-lightweight +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docker/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docker/example_build.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docker/example_run.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/Makefile +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/coding_standards.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/ARCHITECTURE_MULTI_HARDWARE.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/cli/commands/bench/engine_bench/bench-engine.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/cli/commands/kvcache-command.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/cli/commands/ping.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/cli/commands/query-command.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/cli/commands.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/cli/framework-and-metrics.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/integration/tensorrt_llm/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/integration/vllm/kv_cache_group_edits.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/observability/request-event-span.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/tools/controller_benchmark/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/dax.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/l2_eviction.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/nixl_store.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/overall.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/plugin.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/raw_block.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/distributed/l2_adapters/serde_wrapper.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/encoder-cache.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/mp_coordinator/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/mp_coordinator/blend_lookup.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/mp_coordinator/l2_usage_and_eviction.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/mp_observability/DEBUG.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/multiprocess/http_api_extension.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/multiprocess/mp_runtime_plugin.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/multiprocess/protocols/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/pd_async_reservation_design.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/design/v1/platform/event_notifier.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/make.bat +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/.nojekyll +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_static/basic_codepath.svg +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_static/bench_interactive_demo.gif +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_static/full_layerwise_diagram.svg +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_static/kv_cache_calculator.html +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_static/modelconfig.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_templates/custom.html +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/_templates/versioning.html +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/api_reference/configurations.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/api_reference/dynamic_connector.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/api_reference/multimodality.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/api_reference/storage_backends.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/assets/InfiniStore-usage.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/assets/lmcache-controller.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/assets/lmcache-logo.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/assets/lmcache-logo_crop.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/assets/maru-kvcache.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/assets/mooncake-store-preview.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/coordinator.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/describe.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/kvcache.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/ping.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/query.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/quota.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/server.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/tool.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/cli/trace.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/community/blogs.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/community/meetings.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/conf.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/controller/freeze_mode.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/controller/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/architecture.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/contributing.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/extending_lmcache/remote_storage_plugins.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/extending_lmcache/runtime_plugins.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/extending_lmcache/storage_plugins.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/integration.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/usage/basic_check.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/developer_guide/usage/usage_stats_collection.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/disaggregated_prefill/nixl/1p1d.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/disaggregated_prefill/nixl/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/disaggregated_prefill/nixl/xpyd.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/disaggregated_prefill/shared_storage.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/Installation_compatibility_matrix.csv +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/kv_cache_calculator.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/quickstart/disaggregated_prefill.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/quickstart/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/quickstart/multimodality.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/quickstart/offload_kv_cache.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/quickstart/share_kv_cache.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/getting_started/quickstart/standalone_starter.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/internal_api_server/common_apis.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/internal_api_server/controller_apis.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/internal_api_server/dynamic_backend_management.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/internal_api_server/internal_api_server.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/internal_api_server/vllm_apis.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/async_loading.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/caching_policies.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/multiprocess_mode.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/p2p_sharing.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/3fs.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/bigtable.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/cpu_ram.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/custom_backend.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/dax.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/eic.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/gds.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/hfbucket.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/infinistore.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/local_storage.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/maru.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/mock.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/mooncake.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/nixl.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/redis.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/resp.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/s3.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/sagemaker_hyperpod.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/valkey.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache/storage_backends/weka.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/check_finish.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/clear.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/compress.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/health.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/lookup.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/move.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/pin.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_management/query_worker_info.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_optimizations/blending.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_optimizations/compression/cachegen.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_optimizations/compression/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/kv_cache_optimizations/layerwise.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/api_reference/configurations.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/api_reference/dynamic_connector.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/api_reference/multimodality.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/api_reference/storage_backends.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/cli/kvcache.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/cli/ping.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/cli/query.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/cli/tool.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/cli/trace.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/community/blogs.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/community/meetings.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/controller/freeze_mode.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/controller/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/architecture.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/cli.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/contributing.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/docker_file.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/extending_lmcache/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/extending_lmcache/native_connectors.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/extending_lmcache/remote_storage_plugins.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/extending_lmcache/runtime_plugins.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/extending_lmcache/storage_plugins.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/integration.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/usage/basic_check.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/usage/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/developer_guide/usage/usage_stats_collection.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/disaggregated_prefill/nixl/1p1d.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/disaggregated_prefill/nixl/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/disaggregated_prefill/nixl/xpyd.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/disaggregated_prefill/shared_storage.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/benchmarking.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/faq.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/installation.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/kv_cache_calculator.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/disaggregated_prefill.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/multimodality.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/share_kv_cache.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart/standalone_starter.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/quickstart.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/getting_started/troubleshoot.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/internal_api_server/common_apis.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/internal_api_server/controller_apis.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/internal_api_server/dynamic_backend_management.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/internal_api_server/internal_api_server.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/internal_api_server/vllm_apis.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/async_loading.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/caching_policies.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/multiprocess_mode.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/p2p_sharing.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/3fs.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/cpu_ram.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/custom_backend.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/eic.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/gds.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/infinistore.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/local_storage.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/maru.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/mock.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/mooncake.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/redis.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/resp.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/s3.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/sagemaker_hyperpod.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/valkey.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache/storage_backends/weka.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/check_finish.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/clear.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/compress.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/health.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/lookup.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/move.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/pin.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_management/query_worker_info.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_optimizations/blending.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_optimizations/compression/cachegen.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_optimizations/compression/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/kv_cache_optimizations/layerwise.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/mp/deployment.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/mp/frontend_dashboard.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/mp/serde.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/non_kv_cache/encoder_cache.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/docker_deployment.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/kubernetes_deployment.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/kv_cache_events.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/chunk_statistics.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/frontend.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/health_monitor.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/index.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/internal_api_server.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/metrics.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/periodic_thread_api.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/observability/vllm_endpoint.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/locale/zh_CN/LC_MESSAGES/production/performance_tuning.po +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/mp/architecture.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/mp/frontend_dashboard.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/non_kv_cache/encoder_cache.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/docker_deployment.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/kubernetes_deployment.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/kv_cache_events.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/chunk_statistics.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/frontend.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/health_monitor.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/index.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/internal_api_server.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/metrics.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/periodic_thread_api.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/observability/vllm_endpoint.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/docs/source/production/performance_tuning.rst +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/agents/prefix_analysis.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/agents/requirements.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/basic_check/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/basic_check/example_config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/batched_kv.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/batched_tp_kv.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/blend_kv.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/chunk1.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/chunk2.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/example_blending.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/online_kv.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv/tp_kv.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv_v1/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/blend_kv_v1/blend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/clear/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/clear/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/compress/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/compress/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/health/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/health/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/lookup/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/lookup/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/move/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/move/instance1.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/move/instance2.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/pin/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_controller/pin/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_interface/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_interface/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_with_configs/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/cache_with_configs/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/chunk_statistics/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/chunk_statistics/analyze_chunk_hashes.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/chunk_statistics/auto_stop.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/chunk_statistics/file_hash.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/chunk_statistics/memory_bloom_filter.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/configs/lmcache-decoder-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/configs/lmcache-decoder-pd-with-remote-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/configs/lmcache-prefiller-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/configs/lmcache-prefiller-pd-with-remote-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/disagg_example_1p1d.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/1p1d/disagg_vllm_launcher.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/disagg_proxy_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/configs/lmcache-decoder-1-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/configs/lmcache-decoder-1-pd-with-remote-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/configs/lmcache-decoder-2-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/configs/lmcache-decoder-2-pd-with-remote-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/configs/lmcache-prefiller-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/configs/lmcache-prefiller-pd-with-remote-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/disagg_example_xpyd.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill/xpyd/disagg_vllm_launcher.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill_mp/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill_mp/architecture.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/disagg_prefill_mp/disagg_proxy_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/frontend/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/frontend/chat_session.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/frontend/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/frontend/ffmpeg.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/frontend/frontend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kubernetes/health_probe.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_calculator/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_calculator/generate_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_calculator/kv_cache_calculator.html +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_calculator/modelconfig.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_calculator/requirement.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/local_backends/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/local_backends/offload.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/local_backends/rust_backend_offload.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/external/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/external/backend_type.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/fs/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/infinistore/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/infinistore/backend_type.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/mock/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/mock/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/mooncakestore/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/mooncakestore/mooncake.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/resp/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/resp/benchmark_resp_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/resp/resp.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/s3/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/s3/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/valkey/VALKEY_CONNECTOR_BENCHMARKING.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/valkey/benchmark_l2.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/remote_backends/valkey/valkey.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/share_across_instances/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/share_across_instances/centralized_sharing/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/share_across_instances/centralized_sharing/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/share_across_instances/p2p_sharing/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/share_across_instances/p2p_sharing/example1.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/kv_cache_reuse/share_across_instances/p2p_sharing/example2.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_l2_adapter/pyproject.toml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_l2_adapter/scripts/install_and_test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_l2_adapter/src/lmc_external_l2_adapter/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_l2_adapter/src/lmc_external_l2_adapter/adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_l2_adapter/tests/test_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/csrc/connector.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/csrc/connector.h +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/csrc/pybind.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/pyproject.toml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/setup.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/src/lmc_external_native_connector/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/lmc_external_native_connector/src/lmc_external_native_connector/connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/mp_runtime_plugins/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/mp_runtime_plugins/mp_heartbeat.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/mp_runtime_plugins/mp_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/multi_process/lmcache-daemonset.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/multi_process/vllm-deployment.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/docker-compose.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/grafana/provisioning/dashboards/dashboards.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/grafana/provisioning/dashboards/lmcache.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/grafana/provisioning/datasources/datasources.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/otel-collector.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/prometheus.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/start-server.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/observability/tempo.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/online_session/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/online_session/bench_ttft_sweep.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/online_session/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/online_session/ffmpeg.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/online_session/openai_chat_completion_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/redis_lookup/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/remote_config_server/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/remote_config_server/config_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/remote_config_server/example.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/runtime_plugins/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/runtime_plugins/all_plugin.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/runtime_plugins/scheduler_foo_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/runtime_plugins/worker_0_test.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/serde/fp8/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/serde/fp8/run_serde_fp8_example.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/examples/sgl_integration/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/format.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/banner.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/interactive/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/interactive/config.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/interactive/schema.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/interactive/state.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/interactive/terminal.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/progress.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/request_sender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/stats.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/long_doc_permutator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/long_doc_qa.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/multi_round_chat.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/prefix_suffix_tuner.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/engine_bench/workloads/random_prefill.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/l2_adapter_bench/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/l2_adapter_bench/command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/l2_adapter_bench/data.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/l2_adapter_bench/result.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/l2_adapter_bench/runner.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/bench/server_bench/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/coordinator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/kvcache.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/mock.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/ping.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/query/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/query/engine_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/query/kvcache_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/query/prompt.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/query/request.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/quota/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/quota/delete_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/quota/get_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/quota/helpers.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/quota/list_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/quota/set_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/tool/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/tool/cache_simulator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/trace/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/trace/dispatch.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/trace/driver.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/trace/info_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/trace/replay_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/commands/trace/stats.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/documents/lmcache.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/main.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/metrics/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/metrics/formatter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/metrics/handler.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/metrics/metrics.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/cli/metrics/section.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/connections.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/base_service_factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/request_telemetry/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/request_telemetry/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/request_telemetry/factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/request_telemetry/fastapi.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/request_telemetry/noop.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/sglang/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/sglang/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/tensorrt_llm/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/tensorrt_llm/tensorrt_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/tensorrt_llm/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/kv_cache_group_edits.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/lmcache_connector_v1.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/lmcache_connector_v1_085.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/lmcache_mp_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/tests/test_mm_hash_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/vllm_ec_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/vllm_service_factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/integration/vllm/vllm_v1_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/app.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/config.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/heartbeat.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/lmcache_mp_plugin/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/lmcache_mp_plugin/lmcache_mp_frontend_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/run_mp_server_with_frontend.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/static/css/style.css +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/static/img/logo.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/static/index.html +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/lmcache_frontend/static/js/app.js +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/logging.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/native_storage_ops.pyi +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/observability.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/storage_backend/serde/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/storage_backend/serde/cachegen_basics.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/storage_backend/serde/cachegen_decoder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/storage_backend/serde/cachegen_encoder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/storage_backend/serde/serde.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/docs/simulate_example.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/docs/sweep_example.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/gen_bench_dataset.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/lru_cache.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/plot_hit_rate.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/cache_simulator/simulator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/__main__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/constants.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/admit.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/deregister.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/evict.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/heartbeat.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/p2p_lookup.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/controller_benchmark/handlers/register.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/mp_status_viewer/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/mp_status_viewer/__main__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/tools/simple_discover_service.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/usage_context.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/api_server/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/api_server/__main__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/basic_check.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/commands/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/commands/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/commands/full_sync.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/controller_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/controllers/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/controllers/full_sync_tracker.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/controllers/kv_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/controllers/registration_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/executor.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/frontend/static/css/style.css +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/frontend/static/img/logo.png +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/frontend/static/index.html +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/frontend/static/js/controller_app.js +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/full_sync_sender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/locks.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/message.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/observability.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_controller/worker.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_engine.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/cache_interface.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/check/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/check/check_mode_gen.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/check/check_mode_test_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/check/check_mode_test_remote.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/check/check_mode_test_storage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/check/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/abstract.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/flash_attn.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/flash_infer_sparse.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/metadata.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/triton_kernels/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/triton_kernels/block_sparse_attention.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/triton_sparse.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/attention/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/blend/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/blend/blender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/blend/metadata.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/blend/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/models/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/models/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/models/llama.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/models/qwen3.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/models/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/compute/positional_encoding.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/config_base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/error.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/eviction.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/eviction_policy/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/eviction_policy/factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/eviction_policy/isolated_lru.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/eviction_policy/lru.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/eviction_policy/noop.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/internal_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l1_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/dax_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/fs_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/fs_native_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/hfbucket_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/mock_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/mooncake_store_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/native_connector_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/native_plugin_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/nixl_store_dynamic_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/nixl_store_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/plugin_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/raw_block_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/reconfiguration.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/resp_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/s3_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/l2_adapters/serde_wrapper.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/memory_manager/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/memory_manager/gds_l1_memory_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/memory_manager/l1_manager_protocol.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/memory_manager/l1_memory_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/quota_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/serde/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/serde/factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/serde/fp8.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/serde/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controllers/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controllers/eviction_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controllers/prefetch_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controllers/prefetch_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controllers/store_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_controllers/store_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/distributed/storage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/ec_engine.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/event_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/exceptions/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/gpu_connector/_cufile_async.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/gpu_connector/gds_context.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/gpu_connector/gpu_ops.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/gpu_connector/mock_gpu_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/health_monitor/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/health_monitor/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/health_monitor/checks/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/health_monitor/checks/remote_backend_check.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/health_monitor/constants.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/api_registry.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/api_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/env_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/loglevel_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/metrics_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/periodic_thread_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/run_script_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/common/thread_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/controller/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/controller/key_stats_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/controller/worker_info_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/backend_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/bypass_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/cache_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/chunk_statistics_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/conf_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/freeze_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/hot_cache_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/inference_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/load_fs_chunks_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/lookup_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/internal_api_server/vllm/version_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lazy_memory_allocator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/abstract_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/async_lookup_message.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/chunk_statistics_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/hit_limit_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/lmcache_async_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/lmcache_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/lmcache_lookup_client_bypass.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/mooncake_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/record_strategies/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/record_strategies/base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/record_strategies/file_hash.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/lookup_client/record_strategies/memory_bloom_filter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/__main__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/app.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/blend_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/blend_directory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/http_apis/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/http_apis/blend_directory_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/http_apis/health_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/http_apis/l2_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/l2/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/l2/event_listener.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/l2/eviction_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/l2/usage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_coordinator/registrar.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/AGENTS.override.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/event.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/event_bus.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/cb_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/l1.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/l2.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/lookup_hash.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/mp_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/logging/sm.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/cb_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/engine.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/event_bus.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l0_l1_throughput.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l0_lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l1.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l1_eviction_loop.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l1_failures.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l1_lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l2.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l2_failures.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/l2_throughput.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/lookup.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/sm_lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/metrics/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/tracing/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/tracing/cb_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/tracing/mp_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/subscribers/tracing/span_registry.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/codecs.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/decorator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/format.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/reader.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/mp_observability/trace/recorder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/affinity_pool.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/futures.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/group_view.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_api_registry.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/common_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/conf_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/healthcheck_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/quota_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/reconfigure_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/root_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/status_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_apis/version_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/http_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/modules/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/mp_runtime_plugin_launcher.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/mq.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/posix_shm.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/protocols/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/protocols/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/protocols/controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/protocols/debug.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/multiprocess/protocols/observability.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/offload_server/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/offload_server/abstract_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/offload_server/message.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/offload_server/zmq_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/pin_monitor.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/platform/_registry.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/platform/cpu/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/platform/cpu/shm.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/platform/cpu/stub_cpu_device.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/platform/cuda/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/platform/event_notifier.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/plugin/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/plugin/runtime_plugin_launcher.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/protocol.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/rpc/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/rpc/transport.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/rpc/zmq_transport.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/rpc_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/server/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/server/__main__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/server/storage_backend/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/server/storage_backend/abstract_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/server/storage_backend/local_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/server/utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/standalone/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/standalone/__main__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/standalone/manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/standalone/standalone_service_factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/abstract_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/audit_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/batched_message_sender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/cache_policy/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/cache_policy/base_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/cache_policy/fifo.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/cache_policy/lfu.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/cache_policy/lru.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/cache_policy/mru.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/audit_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/audit_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/base_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/bigtable_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/bigtable_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/bigtable_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/bigtable_schema.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/blackhole_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/blackhole_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/eic_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/eic_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/external_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/fs_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/fs_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/hf3fs_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/hf3fs_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/hfbucket_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/hfbucket_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/infinistore_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/infinistore_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/instrumented_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/lm_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/lm_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/mock_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/mock_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/mooncakestore_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/mooncakestore_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/redis_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/redis_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/s3_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/s3_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/sagemaker_hyperpod_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/sagemaker_hyperpod_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/valkey_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/connector/valkey_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/dax/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/dax/core.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/gds_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/hipfile_shim.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/job_executor/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/job_executor/base_executor.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/job_executor/pq_executor.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/local_cpu_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/local_disk_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/maru_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/cachegen_basics.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/cachegen_decoder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/cachegen_encoder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/kivi_serde.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/naive_serde.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/naive_serde/serde.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/native_clients/connector_client_base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/native_clients/resp_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/nixl_storage_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/p2p_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/path_sharder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/pd_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/pd_backend_async.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/plugins/dax_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/plugins/rust_raw_block_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/raw_block/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/raw_block/core.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/raw_block/key_codec.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/remote_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/resp_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/storage_backend_listener.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/storage_backend/storage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/system_detection.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/token_database.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/transfer_channel/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/transfer_channel/abstract.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/transfer_channel/mock_memory_channel.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/transfer_channel/nixl_channel.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/transfer_channel/py_socket_channel.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/transfer_channel/transfer_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/utils/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/utils/bloom_filter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/utils/cache_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/utils/json_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache/v1/utils/router_discovery.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache.egg-info/dependency_links.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache.egg-info/entry_points.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/lmcache.egg-info/top_level.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/.custom-gcl.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/.devcontainer/devcontainer.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/.devcontainer/post-install.sh +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/.dockerignore +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/.golangci.yml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/.pre-commit-config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/AGENTS.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/Dockerfile +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/PROJECT +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/cacheblendengine_defaults.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/cacheblendengine_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/cacheblendengine_types.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/cacheblendengine_validation.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/groupversion_info.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/lmcacheengine_defaults.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/lmcacheengine_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/lmcacheengine_types.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/lmcacheengine_validation.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/api/v1alpha1/zz_generated.deepcopy.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/cmd/main.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/certmanager/certificate.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/certmanager/issuer.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/certmanager/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/certmanager/kustomizeconfig.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/crd/bases/lmcache.lmcache.ai_cacheblendengines.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/crd/bases/lmcache.lmcache.ai_lmcacheengines.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/crd/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/crd/kustomizeconfig.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/default/cert_metrics_manager_patch.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/default/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/default/manager_metrics_patch.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/default/manager_webhook_patch.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/default/metrics_service.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/manager/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/manager/manager.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/network-policy/allow-metrics-traffic.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/network-policy/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/prometheus/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/prometheus/monitor.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/prometheus/monitor_tls_patch.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/leader_election_role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/leader_election_role_binding.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/lmcacheengine_admin_role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/lmcacheengine_editor_role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/lmcacheengine_viewer_role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/metrics_auth_role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/metrics_auth_role_binding.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/metrics_reader_role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/role.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/role_binding.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/rbac/service_account.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/lmcache_v1alpha1_cacheblendengine.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/lmcache_v1alpha1_lmcacheengine.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/lmcache_v1alpha1_lmcacheengine_amd.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/lmcache_v1alpha1_lmcacheengine_l2_redis.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/lmcache_v1alpha1_lmcacheengine_production.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/vllm_cacheblend_deployment.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/samples/vllm_deployment.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/webhook/kustomization.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/webhook/kustomizeconfig.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/webhook/manifests.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/webhook/mutating_webhook_selectors_patch.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/config/webhook/service.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/go.mod +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/go.sum +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/hack/boilerplate.go.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/hack/pre-commit +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/cacheblend_reconcile_helpers.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/cacheblendengine_controller.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/cacheblendengine_controller_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/lmcacheengine_controller.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/lmcacheengine_controller_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/reconcile_helpers.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/controller/suite_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/cacheblend_engine.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/cacheblend_engine_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/compute.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/configmap.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/daemonset.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/helpers.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/labels.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/resources_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/service.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/resources/servicemonitor.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/webhook/cacheblend_inject_builders.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/webhook/pod_injector.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/webhook/pod_injector_envtest_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/webhook/pod_injector_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/internal/webhook/webhook_suite_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/make/build.mk +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/make/deploy.mk +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/make/e2e-gpu.mk +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/make/e2e.mk +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/make/lint.mk +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/make/tools.mk +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/auth_smoke_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/crd_smoke_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/e2e_suite_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/e2e_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/field_coverage_smoke_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/lifecycle_smoke_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/runtime_smoke_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/smoke_helpers_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/e2e/vllm_integration_smoke_test.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/golden/kv_transfer_config_minimal.json +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/lmc_custom_port.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/lmc_minimal.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/lmc_runtime.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/lmc_servicemonitor.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/lmc_with_redis_l2_authsecret.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures/vllm_deployment.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/fixtures.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/http.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/lmc.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/portforward.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/runner.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/utils.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/operator/test/utils/wait.go +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/pyproject.toml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/pyproject_cli.toml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/pytest.ini +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/bench.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/build.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/cli.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/common.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/cuda.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/cuda12_core.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/cuda13_core.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/docs.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/lint.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/rocm_core.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/requirements/test.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/rust/raw_block/.gitignore +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/rust/raw_block/Cargo.toml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/rust/raw_block/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/rust/raw_block/pyproject.toml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/rust/raw_block/src/lib.rs +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/setup.cfg +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/benchmarks/test_benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/benchmarks/test_cachegen.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/benchmarks/test_xpu_connector_benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/benchmarks/test_xpu_kernels_microbench.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/benchmarks/test_xpu_layerwise_connector_benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/interactive/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/interactive/test_schema.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/interactive/test_state.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/test_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/test_progress.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/test_request_sender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/test_stats.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_base_workload.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_create_workload.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_long_doc_permutator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_long_doc_qa.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_multi_round_chat.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_prefix_suffix_tuner.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/engine_bench/workloads/test_random_prefill.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/l2_adapter_bench/test_data.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/test_bench_command.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/bench/test_server_bench.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/test_query.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/test_quota.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/test_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/trace/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/trace/test_dispatch.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/trace/test_driver.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/commands/trace/test_stats.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/conftest.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/cli/test_ping.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/conftest.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/data/test_creation_from_file/disk.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/data/test_creation_from_file/fail.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/data/test_creation_from_file/hybrid.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/data/test_creation_from_file/local.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/data/test_creation_from_file/remote.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/disagg/README.md +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/disagg/test_nixl_cache_engine.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/disagg/test_nixl_channel.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/disagg/test_nixl_storage_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/lmcache_frontend/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/lmcache_frontend/lmcache_mp_plugin/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/lmcache_frontend/lmcache_mp_plugin/test_lmcache_mp_frontend_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/lmcache_frontend/test_heartbeat.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/test_banner.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/test_observability.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/test_serde.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/test_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/tools/test_cache_simulator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/tools/test_controller_zmq_benchmark.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/conftest.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/pytest.ini +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_full_sync.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_full_sync_sender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_kv_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_locks.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_messages.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_registration_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/cache_controller/test_registry_tree.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/compute/attention/test_triton_kernels.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/compute/attention/test_triton_sparse_e2e.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/data/gds.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/data/hipfile.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/data/hipfile_gds.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/data/nixl.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/data/nixl_multipath.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/data/test_config.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/conftest.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/memory_manager/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/memory_manager/test_gds_l1_memory_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/serde/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/serde/test_factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/serde/test_fp8.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/serde/test_serde_e2e.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/serde/test_serde_fs_e2e.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/serde/test_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_cache_salt_l2_eviction.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_dax_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_distributed_storage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_hfbucket_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_isolated_lru_eviction_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_l1_l2_state_metrics.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_l1_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_l1_memory_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_l2_adapter_base.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_l2_adapter_factory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_lru_eviction_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_mock_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_mooncake_store_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_multimodel.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_native_connector_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_nixl_store_dynamic_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_nixl_store_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_prefetch_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_prefetch_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_quota_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_raw_block_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_report_status.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_resp_env_vars.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_resp_l2_adapter_integration.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_s3_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_store_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/distributed/test_store_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/gpu_connector/test_gds_context.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_backend_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_cache_clear.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_hot_cache_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_kvcache_check_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_load_fs_chunks.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_lookup_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_per_instance_app.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_run_script.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/allowed_imports.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/basic.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/builtin_functions.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/default_result.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/empty_allowed_imports.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/exception.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/invalid_module.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/math_module.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/multiple_imports.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/os_module.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_scripts/without_allowed_imports.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/internal_api_server/test_worker_info_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/lookup_client/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/lookup_client/test_chunk_statistics_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/lookup_client/test_lmcache_lookup_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_blend_client.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_blend_directory.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_blend_directory_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_eviction_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_health.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_integration.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_l2_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_registrar.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_registry.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_coordinator/test_usage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/logging/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/logging/test_cb_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/logging/test_lookup_hash_logger.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/logging/test_mp_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/counter_helpers.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/otel_setup.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_cb_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_engine.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_event_bus_self_metrics.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l0_l1_throughput.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l0_lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l1.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l1_eviction_loop.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l1_failures.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l1_lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l2.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l2_failures.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_l2_throughput.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_lookup.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/metrics/test_sm_lifecycle.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/tracing/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/tracing/test_cb_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/subscribers/tracing/test_mp_server.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/test_event_bus.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/test_event_recorder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/test_otel_init.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/test_register_gauge.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/trace/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/trace/test_codecs.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/trace/test_decorator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/mp_observability/trace/test_recorder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/http_apis/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/http_apis/test_conf_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/http_apis/test_reconfigure_api.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_affinity_pool.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_blend_v3_load_store_opts.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_completion_recorder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_compute_mp_checksums.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_futures.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_http_quota_endpoints.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_mp_runtime_plugin_launcher.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_mq_handler_helpers.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_optimized_lookup_v3.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_posix_shm.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_query_lookup_hits.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_raw_block_l2_adapter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_skip_first_n_tokens.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/multiprocess/test_token_hasher.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/native_storage_ops/test_bitmap.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/native_storage_ops/test_pattern_matcher.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/native_storage_ops/test_periodic_event_notifier.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/native_storage_ops/test_ttl_lock.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/platform/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/platform/test_cpu_shm.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/plugin/test_runtime_plugin_launcher.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/csrc/.gitignore +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/csrc/CMakeLists.txt +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/csrc/shm_file_worker.cpp +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/shmfile_basic_check.yaml +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/shmfile_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/test_shm_allocator.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/shm_allocator/verify_shmfile_tcp.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/__init__.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/raw_block_test_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_audit_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_batched_message_sender.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_bigtable_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_bigtable_integration.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_eic.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_fs_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_gds_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_hf3fs_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_hfbucket_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_local_cpu_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_local_cpu_backend_nixl_paged.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_local_disk_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_maru_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_nixl_shared_pool.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_p2p_backend_with_controller.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_path_sharder.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_pd_backend_async.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_pd_backend_bidirectional.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_pd_backend_buffer_alignment.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_raw_block_core.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_raw_block_device.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_raw_block_key_codec.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_raw_block_uring_cmd.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_remote_storage_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_resp_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_rust_raw_block_backend.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_storage_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_storage_plugin.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/storage_backend/test_valkey_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_address_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_basic_check.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_bloom_filter.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_c_ops_fallback_parity.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_cache_engine.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_cache_engine_cleanup.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_cache_interface.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_cache_policy.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_config.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_connector_discovery.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_decode_save_and_preemption.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_device_id_race.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_ec_connector.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_event_notifier.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_freeze_mode_integration.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_gds.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_health_monitor.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_health_monitor_fallback_recovery.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_impl_completeness.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_json_utils.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_kv_cache_groups.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_manager.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_nixl_batched_contains.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_nixl_doca_memos.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_nixl_multipath.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_nixl_storage.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_pos_kernels.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_remote_metadata.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_remote_mla_worker_id_as0.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_token_database.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_v1_adapter_state_desync.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_vllm_integration.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_vllm_kv_cache_groups.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tests/v1/test_vllm_layerwise_wait_for_save.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tools/check_spdx_header.py +0 -0
- {lmcache-0.4.7 → lmcache-0.4.8.dev24}/tools/translate_docs_zh.py +0 -0
|
@@ -0,0 +1,143 @@
|
|
|
1
|
+
# Comprehensive integration tests — one step per config, run in parallel.
|
|
2
|
+
# Each step gets its own K8s pod with the exact GPU count it needs.
|
|
3
|
+
# 2-GPU group is listed first so these heavier jobs get scheduled before 1-GPU jobs.
|
|
4
|
+
|
|
5
|
+
x-perf-retry: &perf-retry
|
|
6
|
+
automatic:
|
|
7
|
+
- exit_status: -1
|
|
8
|
+
limit: 2
|
|
9
|
+
- exit_status: 1
|
|
10
|
+
limit: 2
|
|
11
|
+
|
|
12
|
+
steps:
|
|
13
|
+
- group: ":test_tube: Comprehensive (2-GPU)"
|
|
14
|
+
steps:
|
|
15
|
+
- label: ":test_tube: pd"
|
|
16
|
+
command: .buildkite/k3_tests/comprehensive/run.sh pd.yaml
|
|
17
|
+
timeout_in_minutes: 30
|
|
18
|
+
retry: *perf-retry
|
|
19
|
+
agents: { queue: "k8s" }
|
|
20
|
+
plugins:
|
|
21
|
+
- kubernetes:
|
|
22
|
+
podSpec: &pod-2gpu
|
|
23
|
+
containers:
|
|
24
|
+
- name: container-0
|
|
25
|
+
image: lmcache/ci-base:latest
|
|
26
|
+
imagePullPolicy: Never
|
|
27
|
+
resources: { limits: { "nvidia.com/gpu": "2" } }
|
|
28
|
+
volumeMounts: &vol-mounts
|
|
29
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
30
|
+
- { name: datasets, mountPath: /root/correctness }
|
|
31
|
+
volumes: &vols
|
|
32
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
33
|
+
- { name: datasets, hostPath: { path: /data/datasets, type: DirectoryOrCreate } }
|
|
34
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
35
|
+
|
|
36
|
+
- label: ":test_tube: p2p"
|
|
37
|
+
command: .buildkite/k3_tests/comprehensive/run.sh p2p.yaml
|
|
38
|
+
timeout_in_minutes: 30
|
|
39
|
+
retry: *perf-retry
|
|
40
|
+
agents: { queue: "k8s" }
|
|
41
|
+
plugins: [{ kubernetes: { podSpec: *pod-2gpu } }]
|
|
42
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
43
|
+
|
|
44
|
+
- label: ":test_tube: p2p_with_v3"
|
|
45
|
+
command: .buildkite/k3_tests/comprehensive/run.sh p2p_with_v3.yaml
|
|
46
|
+
timeout_in_minutes: 30
|
|
47
|
+
retry: *perf-retry
|
|
48
|
+
agents: { queue: "k8s" }
|
|
49
|
+
plugins: [{ kubernetes: { podSpec: *pod-2gpu } }]
|
|
50
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
51
|
+
|
|
52
|
+
- group: ":test_tube: Comprehensive (1-GPU)"
|
|
53
|
+
steps:
|
|
54
|
+
- label: ":test_tube: local_cpu"
|
|
55
|
+
command: .buildkite/k3_tests/comprehensive/run.sh local_cpu.yaml
|
|
56
|
+
timeout_in_minutes: 30
|
|
57
|
+
retry: *perf-retry
|
|
58
|
+
agents: { queue: "k8s" }
|
|
59
|
+
plugins:
|
|
60
|
+
- kubernetes:
|
|
61
|
+
podSpec: &pod-1gpu
|
|
62
|
+
containers:
|
|
63
|
+
- name: container-0
|
|
64
|
+
image: lmcache/ci-base:latest
|
|
65
|
+
imagePullPolicy: Never
|
|
66
|
+
resources: { limits: { "nvidia.com/gpu": "1" } }
|
|
67
|
+
volumeMounts: *vol-mounts
|
|
68
|
+
volumes: *vols
|
|
69
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
70
|
+
|
|
71
|
+
- label: ":test_tube: local_disk"
|
|
72
|
+
command: .buildkite/k3_tests/comprehensive/run.sh local_disk.yaml
|
|
73
|
+
timeout_in_minutes: 30
|
|
74
|
+
retry: *perf-retry
|
|
75
|
+
agents: { queue: "k8s" }
|
|
76
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
77
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
78
|
+
|
|
79
|
+
- label: ":test_tube: async"
|
|
80
|
+
command: .buildkite/k3_tests/comprehensive/run.sh async.yaml
|
|
81
|
+
timeout_in_minutes: 30
|
|
82
|
+
retry: *perf-retry
|
|
83
|
+
agents: { queue: "k8s" }
|
|
84
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
85
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
86
|
+
|
|
87
|
+
- label: ":test_tube: local_cpu_with_v3"
|
|
88
|
+
command: .buildkite/k3_tests/comprehensive/run.sh local_cpu_with_v3.yaml
|
|
89
|
+
timeout_in_minutes: 30
|
|
90
|
+
retry: *perf-retry
|
|
91
|
+
agents: { queue: "k8s" }
|
|
92
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
93
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
94
|
+
|
|
95
|
+
- label: ":test_tube: local_disk_with_v3"
|
|
96
|
+
command: .buildkite/k3_tests/comprehensive/run.sh local_disk_with_v3.yaml
|
|
97
|
+
timeout_in_minutes: 30
|
|
98
|
+
retry: *perf-retry
|
|
99
|
+
agents: { queue: "k8s" }
|
|
100
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
101
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
102
|
+
|
|
103
|
+
- label: ":test_tube: multi_device"
|
|
104
|
+
command: .buildkite/k3_tests/comprehensive/run.sh multi_device.yaml
|
|
105
|
+
timeout_in_minutes: 30
|
|
106
|
+
retry: *perf-retry
|
|
107
|
+
agents: { queue: "k8s" }
|
|
108
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
109
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
110
|
+
|
|
111
|
+
- label: ":test_tube: layerwise"
|
|
112
|
+
command: .buildkite/k3_tests/comprehensive/run.sh layerwise.yaml
|
|
113
|
+
timeout_in_minutes: 30
|
|
114
|
+
retry: *perf-retry
|
|
115
|
+
agents: { queue: "k8s" }
|
|
116
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
117
|
+
artifact_paths: ["*.log", "benchmarks/long_doc_qa/*.json"]
|
|
118
|
+
|
|
119
|
+
# Nightly baseline upload: only runs when NEED_UPLOAD=true (scheduled build).
|
|
120
|
+
# Collects date-stamped baseline artifacts from all config steps,
|
|
121
|
+
# prunes files older than 5 days, and pushes a single commit to benchmarks-main.
|
|
122
|
+
- wait: ~
|
|
123
|
+
if: build.env("NEED_UPLOAD") == "true"
|
|
124
|
+
|
|
125
|
+
- label: ":arrow_up: Upload rolling baselines"
|
|
126
|
+
if: build.env("NEED_UPLOAD") == "true"
|
|
127
|
+
command: .buildkite/k3_tests/comprehensive/scripts/upload-baselines.sh
|
|
128
|
+
timeout_in_minutes: 5
|
|
129
|
+
agents: { queue: "k8s" }
|
|
130
|
+
plugins:
|
|
131
|
+
- kubernetes:
|
|
132
|
+
podSpec:
|
|
133
|
+
containers:
|
|
134
|
+
- name: container-0
|
|
135
|
+
image: lmcache/ci-base:latest
|
|
136
|
+
imagePullPolicy: Never
|
|
137
|
+
resources: { limits: { cpu: "1", memory: "2Gi" } }
|
|
138
|
+
env:
|
|
139
|
+
- name: GITHUB_TOKEN
|
|
140
|
+
valueFrom:
|
|
141
|
+
secretKeyRef:
|
|
142
|
+
name: buildkite-git-creds
|
|
143
|
+
key: GITHUB_TOKEN
|
|
@@ -0,0 +1,221 @@
|
|
|
1
|
+
# Multiprocess tests — one step per test, run in parallel.
|
|
2
|
+
# Each step gets its own K8s pod with the exact GPU count it needs.
|
|
3
|
+
# Tests are grouped by GPU requirement; the 2-GPU group is listed first so
|
|
4
|
+
# these heavier jobs get scheduled before 1-GPU jobs.
|
|
5
|
+
# 2-GPU: LMCache+vLLM on GPU 0, baseline on GPU 1 (or TP=2 across both).
|
|
6
|
+
# 1-GPU: LMCache+vLLM on GPU 0 only (no baseline server).
|
|
7
|
+
|
|
8
|
+
steps:
|
|
9
|
+
- group: ":compression: Multiprocess (2-GPU)"
|
|
10
|
+
steps:
|
|
11
|
+
- label: ":compression: vllm_bench"
|
|
12
|
+
command: .buildkite/k3_tests/multiprocess/run.sh vllm_bench
|
|
13
|
+
timeout_in_minutes: 30
|
|
14
|
+
agents: { queue: "k8s" }
|
|
15
|
+
plugins:
|
|
16
|
+
- kubernetes:
|
|
17
|
+
podSpec: &pod-2gpu
|
|
18
|
+
containers:
|
|
19
|
+
- name: container-0
|
|
20
|
+
image: lmcache/ci-base:latest
|
|
21
|
+
imagePullPolicy: Never
|
|
22
|
+
resources: { limits: { "nvidia.com/gpu": "2" } }
|
|
23
|
+
volumeMounts: &vol-mounts
|
|
24
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
25
|
+
volumes: &vols
|
|
26
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
27
|
+
artifact_paths: ["*.log"]
|
|
28
|
+
|
|
29
|
+
- label: ":compression: long_doc_qa"
|
|
30
|
+
command: .buildkite/k3_tests/multiprocess/run.sh long_doc_qa
|
|
31
|
+
timeout_in_minutes: 30
|
|
32
|
+
agents: { queue: "k8s" }
|
|
33
|
+
plugins: [{ kubernetes: { podSpec: *pod-2gpu } }]
|
|
34
|
+
artifact_paths: ["*.log"]
|
|
35
|
+
|
|
36
|
+
- label: ":compression: long_doc_qa_l2"
|
|
37
|
+
command: .buildkite/k3_tests/multiprocess/run.sh long_doc_qa_l2
|
|
38
|
+
timeout_in_minutes: 30
|
|
39
|
+
agents: { queue: "k8s" }
|
|
40
|
+
plugins: [{ kubernetes: { podSpec: *pod-2gpu } }]
|
|
41
|
+
artifact_paths: ["*.log"]
|
|
42
|
+
|
|
43
|
+
- label: ":compression: deadlock"
|
|
44
|
+
command: .buildkite/k3_tests/multiprocess/run.sh deadlock
|
|
45
|
+
timeout_in_minutes: 30
|
|
46
|
+
agents: { queue: "k8s" }
|
|
47
|
+
plugins: [{ kubernetes: { podSpec: *pod-2gpu } }]
|
|
48
|
+
artifact_paths: ["*.log"]
|
|
49
|
+
|
|
50
|
+
- group: ":compression: Multiprocess (1-GPU)"
|
|
51
|
+
steps:
|
|
52
|
+
- label: ":compression: lm_eval"
|
|
53
|
+
command: .buildkite/k3_tests/multiprocess/run.sh lm_eval
|
|
54
|
+
timeout_in_minutes: 30
|
|
55
|
+
agents: { queue: "k8s" }
|
|
56
|
+
plugins:
|
|
57
|
+
- kubernetes:
|
|
58
|
+
podSpec: &pod-1gpu
|
|
59
|
+
containers:
|
|
60
|
+
- name: container-0
|
|
61
|
+
image: lmcache/ci-base:latest
|
|
62
|
+
imagePullPolicy: Never
|
|
63
|
+
resources: { limits: { "nvidia.com/gpu": "1" } }
|
|
64
|
+
volumeMounts: *vol-mounts
|
|
65
|
+
volumes: *vols
|
|
66
|
+
artifact_paths: ["*.log"]
|
|
67
|
+
|
|
68
|
+
# HMA correctness check on google/gemma-4-31B-it (a hybrid model whose KV
|
|
69
|
+
# cache groups get different block sizes). Runs gsm8k, resets vLLM's prefix
|
|
70
|
+
# cache (LMCache preserved), reruns served by LMCache, and asserts the two
|
|
71
|
+
# runs' scores match. Single GPU, no baseline.
|
|
72
|
+
- label: ":compression: hma_lm_eval_gemma4"
|
|
73
|
+
command: .buildkite/k3_tests/multiprocess/run.sh hma_lm_eval_gemma4
|
|
74
|
+
timeout_in_minutes: 60
|
|
75
|
+
env:
|
|
76
|
+
MODEL: "google/gemma-4-31B-it"
|
|
77
|
+
# Allow a small score difference between the two runs.
|
|
78
|
+
SCORE_TOLERANCE: "0.03"
|
|
79
|
+
ATTENTION_BACKEND: "auto"
|
|
80
|
+
GPU_MEMORY_UTILIZATION: "0.85"
|
|
81
|
+
# 31B load + CUDA-graph capture is slow; raise the readiness timeout
|
|
82
|
+
# above the 300s default.
|
|
83
|
+
MAX_WAIT_SECONDS: "600"
|
|
84
|
+
# Cap samples and enlarge the CPU pool so the retrieve run stays
|
|
85
|
+
# cache-served (31B's per-token KV is large).
|
|
86
|
+
LIMIT: "100"
|
|
87
|
+
CPU_BUFFER_SIZE: "200"
|
|
88
|
+
agents: { queue: "k8s" }
|
|
89
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
90
|
+
artifact_paths: ["*.log"]
|
|
91
|
+
|
|
92
|
+
- label: ":compression: fault_tolerance"
|
|
93
|
+
command: .buildkite/k3_tests/multiprocess/run.sh fault_tolerance
|
|
94
|
+
timeout_in_minutes: 30
|
|
95
|
+
agents: { queue: "k8s" }
|
|
96
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
97
|
+
artifact_paths: ["*.log"]
|
|
98
|
+
|
|
99
|
+
- label: ":compression: restart_recovery"
|
|
100
|
+
command: .buildkite/k3_tests/multiprocess/run.sh restart_recovery
|
|
101
|
+
timeout_in_minutes: 30
|
|
102
|
+
agents: { queue: "k8s" }
|
|
103
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
104
|
+
artifact_paths: ["*.log"]
|
|
105
|
+
|
|
106
|
+
- label: ":compression: cache_stats"
|
|
107
|
+
command: .buildkite/k3_tests/multiprocess/run.sh cache_stats
|
|
108
|
+
timeout_in_minutes: 30
|
|
109
|
+
agents: { queue: "k8s" }
|
|
110
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
111
|
+
artifact_paths: ["*.log"]
|
|
112
|
+
|
|
113
|
+
- label: ":compression: http_api"
|
|
114
|
+
command: .buildkite/k3_tests/multiprocess/run.sh http_api
|
|
115
|
+
timeout_in_minutes: 30
|
|
116
|
+
agents: { queue: "k8s" }
|
|
117
|
+
plugins: [{ kubernetes: { podSpec: *pod-1gpu } }]
|
|
118
|
+
artifact_paths: ["*.log"]
|
|
119
|
+
|
|
120
|
+
- label: ":compression: gds_smoke_test"
|
|
121
|
+
command: .buildkite/k3_tests/multiprocess/run.sh gds_smoke_test
|
|
122
|
+
timeout_in_minutes: 30
|
|
123
|
+
agents: { queue: "k8s" }
|
|
124
|
+
plugins:
|
|
125
|
+
- kubernetes:
|
|
126
|
+
podSpec:
|
|
127
|
+
containers:
|
|
128
|
+
- name: container-0
|
|
129
|
+
image: lmcache/ci-base:latest
|
|
130
|
+
imagePullPolicy: Never
|
|
131
|
+
resources: { limits: { "nvidia.com/gpu": "1" } }
|
|
132
|
+
volumeMounts:
|
|
133
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
134
|
+
- { name: scratch, mountPath: /scratch }
|
|
135
|
+
- { name: udev, mountPath: /run/udev, readOnly: true }
|
|
136
|
+
volumes:
|
|
137
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
138
|
+
- { name: scratch, hostPath: { path: /data/gds-scratch, type: DirectoryOrCreate } }
|
|
139
|
+
- { name: udev, hostPath: { path: /run/udev, type: Directory } }
|
|
140
|
+
artifact_paths: ["*.log"]
|
|
141
|
+
|
|
142
|
+
- group: ":compression: Multiprocess (CPU-only)"
|
|
143
|
+
steps:
|
|
144
|
+
- label: ":compression: cpu_e2e_validation (shm)"
|
|
145
|
+
command: bash .github/scripts/run-cpu-e2e-validation.sh
|
|
146
|
+
timeout_in_minutes: 30
|
|
147
|
+
agents: { queue: "k8s" }
|
|
148
|
+
plugins:
|
|
149
|
+
- kubernetes:
|
|
150
|
+
podSpec:
|
|
151
|
+
containers:
|
|
152
|
+
- name: container-0
|
|
153
|
+
image: lmcache/ci-base:latest
|
|
154
|
+
imagePullPolicy: Never
|
|
155
|
+
resources:
|
|
156
|
+
requests:
|
|
157
|
+
cpu: "8"
|
|
158
|
+
memory: "256Gi"
|
|
159
|
+
limits:
|
|
160
|
+
cpu: "8"
|
|
161
|
+
memory: "256Gi"
|
|
162
|
+
volumeMounts:
|
|
163
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
164
|
+
- { name: dshm, mountPath: /dev/shm }
|
|
165
|
+
volumes:
|
|
166
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
167
|
+
- { name: dshm, emptyDir: { medium: Memory, sizeLimit: 4Gi } }
|
|
168
|
+
|
|
169
|
+
- label: ":compression: cpu_e2e_validation (pickle)"
|
|
170
|
+
command: bash .github/scripts/run-cpu-e2e-validation.sh
|
|
171
|
+
env:
|
|
172
|
+
LMCACHE_SHM_NAME: ""
|
|
173
|
+
timeout_in_minutes: 30
|
|
174
|
+
agents: { queue: "k8s" }
|
|
175
|
+
plugins:
|
|
176
|
+
- kubernetes:
|
|
177
|
+
podSpec:
|
|
178
|
+
containers:
|
|
179
|
+
- name: container-0
|
|
180
|
+
image: lmcache/ci-base:latest
|
|
181
|
+
imagePullPolicy: Never
|
|
182
|
+
resources:
|
|
183
|
+
requests:
|
|
184
|
+
cpu: "8"
|
|
185
|
+
memory: "256Gi"
|
|
186
|
+
limits:
|
|
187
|
+
cpu: "8"
|
|
188
|
+
memory: "256Gi"
|
|
189
|
+
volumeMounts:
|
|
190
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
191
|
+
- { name: dshm, mountPath: /dev/shm }
|
|
192
|
+
volumes:
|
|
193
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
194
|
+
- { name: dshm, emptyDir: { medium: Memory, sizeLimit: 4Gi } }
|
|
195
|
+
|
|
196
|
+
- label: ":compression: cpu_e2e_validation (server-side copy)"
|
|
197
|
+
command: bash .github/scripts/run-cpu-e2e-validation.sh
|
|
198
|
+
env:
|
|
199
|
+
LMCACHE_MP_TRANSFER_MODE: "lmcache_driven"
|
|
200
|
+
timeout_in_minutes: 30
|
|
201
|
+
agents: { queue: "k8s" }
|
|
202
|
+
plugins:
|
|
203
|
+
- kubernetes:
|
|
204
|
+
podSpec:
|
|
205
|
+
containers:
|
|
206
|
+
- name: container-0
|
|
207
|
+
image: lmcache/ci-base:latest
|
|
208
|
+
imagePullPolicy: Never
|
|
209
|
+
resources:
|
|
210
|
+
requests:
|
|
211
|
+
cpu: "8"
|
|
212
|
+
memory: "256Gi"
|
|
213
|
+
limits:
|
|
214
|
+
cpu: "8"
|
|
215
|
+
memory: "256Gi"
|
|
216
|
+
volumeMounts:
|
|
217
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
218
|
+
- { name: dshm, mountPath: /dev/shm }
|
|
219
|
+
volumes:
|
|
220
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
221
|
+
- { name: dshm, emptyDir: { medium: Memory, sizeLimit: 4Gi } }
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
# SGLang + LMCache MP integration tests.
|
|
2
|
+
# 1) Correctness: LMCache does not change output, and is actually exercised.
|
|
3
|
+
# 2) Performance: LMCache makes TTFT smaller.
|
|
4
|
+
|
|
5
|
+
steps:
|
|
6
|
+
- label: ":test_tube: SGLang+LMCache — Correctness"
|
|
7
|
+
command: .buildkite/k3_tests/sglang/run.sh correctness
|
|
8
|
+
timeout_in_minutes: 15
|
|
9
|
+
agents: { queue: "k8s" }
|
|
10
|
+
plugins:
|
|
11
|
+
- kubernetes:
|
|
12
|
+
podSpec:
|
|
13
|
+
containers:
|
|
14
|
+
- name: container-0
|
|
15
|
+
image: lmcache/ci-base:latest
|
|
16
|
+
imagePullPolicy: Never
|
|
17
|
+
resources:
|
|
18
|
+
limits:
|
|
19
|
+
nvidia.com/gpu: "1"
|
|
20
|
+
volumeMounts:
|
|
21
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
22
|
+
volumes:
|
|
23
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
24
|
+
artifact_paths:
|
|
25
|
+
- "*.log"
|
|
26
|
+
- "*.json"
|
|
27
|
+
|
|
28
|
+
- label: ":zap: SGLang+LMCache — Performance"
|
|
29
|
+
command: .buildkite/k3_tests/sglang/run.sh perf
|
|
30
|
+
timeout_in_minutes: 15
|
|
31
|
+
retry:
|
|
32
|
+
automatic:
|
|
33
|
+
- exit_status: -1
|
|
34
|
+
limit: 2
|
|
35
|
+
- exit_status: 1
|
|
36
|
+
limit: 2
|
|
37
|
+
agents: { queue: "k8s" }
|
|
38
|
+
plugins:
|
|
39
|
+
- kubernetes:
|
|
40
|
+
podSpec:
|
|
41
|
+
containers:
|
|
42
|
+
- name: container-0
|
|
43
|
+
image: lmcache/ci-base:latest
|
|
44
|
+
imagePullPolicy: Never
|
|
45
|
+
resources:
|
|
46
|
+
limits:
|
|
47
|
+
nvidia.com/gpu: "1"
|
|
48
|
+
volumeMounts:
|
|
49
|
+
- { name: hf-cache, mountPath: /root/.cache/huggingface }
|
|
50
|
+
volumes:
|
|
51
|
+
- { name: hf-cache, hostPath: { path: /data/huggingface, type: DirectoryOrCreate } }
|
|
52
|
+
artifact_paths:
|
|
53
|
+
- "*.log"
|
|
54
|
+
- "*.json"
|
|
@@ -0,0 +1,156 @@
|
|
|
1
|
+
#!/usr/bin/env bash
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# CPU device test: runs both server bench and vLLM e2e tests
|
|
5
|
+
# in the same environment to avoid repeated vLLM installation.
|
|
6
|
+
#
|
|
7
|
+
# Usage: cpu_device_test.sh [mode]
|
|
8
|
+
# mode: server_bench, vllm_e2e, or all (default)
|
|
9
|
+
#
|
|
10
|
+
# Environment variables:
|
|
11
|
+
# LMCACHE_BENCH_TRANSFER_MODE engine_driven|lmcache_driven
|
|
12
|
+
# (default: engine_driven)
|
|
13
|
+
# LMCACHE_E2E_TRANSPORT_MODE engine_driven|lmcache_driven|shm|pickle
|
|
14
|
+
# (default: engine_driven)
|
|
15
|
+
# LMCACHE_E2E_DATA_MODE shm|pickle (default: shm)
|
|
16
|
+
# LMCACHE_HTTP_PORT_BENCH HTTP port for bench (default: 18080)
|
|
17
|
+
# LMCACHE_ZMQ_PORT_BENCH ZMQ port for bench (default: 15555)
|
|
18
|
+
# LMCACHE_HTTP_PORT_E2E HTTP port for e2e (default: 18081)
|
|
19
|
+
# LMCACHE_ZMQ_PORT_E2E ZMQ port for e2e (default: 15557)
|
|
20
|
+
# VLLM_PORT_E2E HTTP port for vLLM (default: 18000)
|
|
21
|
+
|
|
22
|
+
# Strict mode: stop on command failure, unset variables, and failed pipeline stages.
set -euo pipefail

# Absolute directory of this script; the per-test scripts are resolved against it.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
OS="$(uname -s)"
# First positional argument selects which tests run (default: all).
TEST_MODE="${1:-all}"

echo "==> CPU device test (OS: ${OS}, Mode: ${TEST_MODE})"
echo " Python: $(python3 --version 2>&1 || true)"

# Configuration: every knob comes from the environment, with the defaults
# documented in the header of this file.
BENCH_TRANSFER_MODE="${LMCACHE_BENCH_TRANSFER_MODE:-engine_driven}"
E2E_TRANSPORT_MODE="${LMCACHE_E2E_TRANSPORT_MODE:-engine_driven}"
E2E_DATA_MODE="${LMCACHE_E2E_DATA_MODE:-shm}"
HTTP_PORT_BENCH="${LMCACHE_HTTP_PORT_BENCH:-18080}"
ZMQ_PORT_BENCH="${LMCACHE_ZMQ_PORT_BENCH:-15555}"
HTTP_PORT_E2E="${LMCACHE_HTTP_PORT_E2E:-18081}"
ZMQ_PORT_E2E="${LMCACHE_ZMQ_PORT_E2E:-15557}"
VLLM_PORT_E2E="${VLLM_PORT_E2E:-18000}"

# Validate modes
case "${BENCH_TRANSFER_MODE}" in
  lmcache_driven|engine_driven) ;;
  *)
    echo "!! Unknown LMCACHE_BENCH_TRANSFER_MODE='${BENCH_TRANSFER_MODE}'" >&2
    exit 1
    ;;
esac

# Map user-facing LMCACHE_E2E_TRANSPORT_MODE to internal representation.
# engine_driven/lmcache_driven are passed through and paired with
# LMCACHE_E2E_DATA_MODE. shm/pickle are shorthand for the engine_driven
# transport with the data mode forced to that value; LMCACHE_E2E_DATA_MODE
# is ignored for those two aliases.
case "${E2E_TRANSPORT_MODE}" in
  lmcache_driven|engine_driven)
    MAPPED_TRANSPORT_MODE="${E2E_TRANSPORT_MODE}"
    MAPPED_DATA_MODE="${E2E_DATA_MODE}"
    ;;
  shm)
    MAPPED_TRANSPORT_MODE="engine_driven"
    MAPPED_DATA_MODE="shm"
    ;;
  pickle)
    MAPPED_TRANSPORT_MODE="engine_driven"
    MAPPED_DATA_MODE="pickle"
    ;;
  *)
    echo "!! Unknown LMCACHE_E2E_TRANSPORT_MODE='${E2E_TRANSPORT_MODE}'" >&2
    echo " Valid values: engine_driven, lmcache_driven, shm, pickle" >&2
    exit 1
    ;;
esac

# Fail fast on a bad data mode, like the two mode checks above, instead of
# handing an undocumented value to the e2e script.
case "${MAPPED_DATA_MODE}" in
  shm|pickle) ;;
  *)
    echo "!! Unknown LMCACHE_E2E_DATA_MODE='${MAPPED_DATA_MODE}'" >&2
    echo " Valid values: shm, pickle" >&2
    exit 1
    ;;
esac

echo " Bench transfer mode: ${BENCH_TRANSFER_MODE}"
echo " E2E transport mode: ${E2E_TRANSPORT_MODE}"
echo " Ports: bench=${HTTP_PORT_BENCH}/${ZMQ_PORT_BENCH}, e2e=${HTTP_PORT_E2E}/${ZMQ_PORT_E2E}/${VLLM_PORT_E2E}"
|
|
75
|
+
|
|
76
|
+
# EXIT-trap handler. Signals the direct children of this shell (for example
# an LMCache server left in the background by a test script) so that a later
# workflow step does not find the default ZMQ/HTTP ports still in use.
# The exit status that was current when the handler started is handed back
# unchanged.
cleanup_processes_safe() {
  # Must be the first statement: captures the status of whatever ran last.
  local saved_status=$?
  # Cleanup is best-effort; a failing pkill must not abort the handler.
  set +e
  # Polite request first ...
  pkill -TERM -P $$ 2>/dev/null
  # ... a short grace period ...
  sleep 1
  # ... then force-kill whatever is still a child of this shell.
  pkill -KILL -P $$ 2>/dev/null
  return $saved_status
}
trap cleanup_processes_safe EXIT
|
|
89
|
+
|
|
90
|
+
# Run the CPU server bench test.
# Globals read: BENCH_TRANSFER_MODE, HTTP_PORT_BENCH, ZMQ_PORT_BENCH, SCRIPT_DIR.
# Exports the settings below into the environment and then runs
# cpu_server_bench_test.sh from SCRIPT_DIR with bash.
run_server_bench() {
  # Shared prefix of the two log paths written for this bench mode.
  local log_stem="/tmp/cpu_device_bench_${BENCH_TRANSFER_MODE}"

  printf '\n%s\n' "==> Running CPU server bench test"

  # Environment for the bench script: transfer mode, ports, log locations,
  # health-check timeout and workload size.
  export \
    LMCACHE_BENCH_TRANSFER_MODE="${BENCH_TRANSFER_MODE}" \
    LMCACHE_HTTP_PORT="${HTTP_PORT_BENCH}" \
    LMCACHE_ZMQ_PORT="${ZMQ_PORT_BENCH}" \
    LMCACHE_LOG_FILE="${log_stem}_lmcache.log" \
    BENCH_OUTPUT_LOG="${log_stem}_output.log" \
    LMCACHE_HEALTHCHECK_TIMEOUT="30" \
    BENCH_NUM_REQUESTS="3" \
    BENCH_NUM_TOKENS="512"

  bash "${SCRIPT_DIR}/cpu_server_bench_test.sh"

  printf '%s\n' "==> CPU server bench test completed successfully"
}
|
|
110
|
+
|
|
111
|
+
# Run the CPU vLLM end-to-end test.
# Globals read: MAPPED_TRANSPORT_MODE, MAPPED_DATA_MODE, E2E_TRANSPORT_MODE,
#               HTTP_PORT_E2E, ZMQ_PORT_E2E, VLLM_PORT_E2E, SCRIPT_DIR.
# Exports the settings below into the environment and then runs
# cpu_vllm_e2e_test.sh from SCRIPT_DIR with bash.
run_vllm_e2e() {
  # Log names carry the user-facing transport mode, not the mapped one.
  local log_stem="/tmp/cpu_device_e2e_${E2E_TRANSPORT_MODE}"

  printf '\n%s\n' "==> Running CPU vLLM e2e test"

  # Environment for the e2e script: resolved transport/data modes, ports,
  # log locations and readiness timeouts.
  export \
    LMCACHE_TRANSPORT_MODE="${MAPPED_TRANSPORT_MODE}" \
    LMCACHE_DATA_MODE="${MAPPED_DATA_MODE}" \
    LMCACHE_HTTP_PORT="${HTTP_PORT_E2E}" \
    LMCACHE_ZMQ_PORT="${ZMQ_PORT_E2E}" \
    VLLM_PORT="${VLLM_PORT_E2E}" \
    LMCACHE_LOG_FILE="${log_stem}_lmcache.log" \
    VLLM_LOG_FILE="${log_stem}_vllm.log" \
    LMCACHE_HEALTHCHECK_TIMEOUT="30" \
    VLLM_READY_TIMEOUT="300"

  bash "${SCRIPT_DIR}/cpu_vllm_e2e_test.sh"

  printf '%s\n' "==> CPU vLLM e2e test completed successfully"
}
|
|
132
|
+
|
|
133
|
+
# Select the tests from TEST_MODE. An unrecognised mode is rejected before
# anything runs.
case "${TEST_MODE}" in
  server_bench|vllm_e2e|all) ;;
  *)
    echo "!! Unknown test mode: ${TEST_MODE}"
    echo " Supported modes: server_bench, vllm_e2e, all"
    exit 1
    ;;
esac

# The bench test runs for every mode except vllm_e2e; "all" runs it first.
if [[ "${TEST_MODE}" != "vllm_e2e" ]]; then
  run_server_bench
fi

# The e2e test runs for every mode except server_bench.
if [[ "${TEST_MODE}" != "server_bench" ]]; then
  run_vllm_e2e
fi

# Final summary; only reached when every selected test succeeded, because
# the script runs under `set -e`.
printf '%s\n' \
  "" \
  "==> CPU device test passed for modes:" \
  " Test mode: ${TEST_MODE}" \
  " Server bench: ${BENCH_TRANSFER_MODE}" \
  " vLLM e2e: ${E2E_TRANSPORT_MODE}"
|