PyPI - vllm-cpu - Versions diffs - 0.11.0.post2__cp312-cp312-manylinux_2_17_x86_64.whl - Mend

@@ -0,0 +1,19 @@
+# SPDX-License-Identifier: Apache-2.0
+# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
+# Adapted from llama.py
+"""Inference-only Phi3 model code inherit from Llama.py"""
+from vllm.model_executor.models.llama import LlamaForCausalLM
+class Phi3ForCausalLM(LlamaForCausalLM):
+    packed_modules_mapping = {
+        "qkv_proj": [
+            "qkv_proj",
+        ],
+        "gate_up_proj": [
+            "gate_up_proj",
+        ],
+    }

vllm-cpu 0.11.0.post2__cp312-cp312-manylinux_2_17_x86_64.whl