From e7ebd71b2c515c86a2f2b2b2091ef6b8143672a5 Mon Sep 17 00:00:00 2001
From: Divakar Verma <137818590+divakar-amd@users.noreply.github.com>
Date: Mon, 20 May 2024 19:29:03 -0500
Subject: [PATCH] Update setup.py

Keeping in sync with upstream vllm - Preventing breakage for intel.
---
 setup.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/setup.py b/setup.py
index a4f7a61e8ef71..c0c6d1821fd0f 100644
--- a/setup.py
+++ b/setup.py
@@ -365,10 +365,12 @@ def _read_requirements(filename: str) -> List[str]:
 if _is_cuda() and _install_punica():
     ext_modules.append(CMakeExtension(name="vllm._punica_C"))
 
+if _is_cuda() or _is_hip():
+    ext_modules.append(CMakeExtension(name="vllm._moe_C"))
+
 if not _is_neuron():
     ext_modules.append(CMakeExtension(name="vllm._C"))
     ext_modules.append(CMakeExtension(name="vllm._custom_C"))
-    ext_modules.append(CMakeExtension(name="vllm._moe_C"))
 
 package_data = {
     "vllm": ["py.typed", "model_executor/layers/fused_moe/configs/*.json"]