Don't build punica kernels by default (#2605)

This commit is contained in:
Philipp Moritz
2024-01-26 15:19:19 -08:00
committed by GitHub
parent 3a0e1fc070
commit 390b495ff3
4 changed files with 11 additions and 4 deletions

View File

@@ -265,7 +265,7 @@ if _is_cuda():
with contextlib.suppress(ValueError):
torch_cpp_ext.COMMON_NVCC_FLAGS.remove(flag)
-install_punica = bool(int(os.getenv("VLLM_INSTALL_PUNICA_KERNELS", "1")))
+install_punica = bool(int(os.getenv("VLLM_INSTALL_PUNICA_KERNELS", "0")))
device_count = torch.cuda.device_count()
for i in range(device_count):
major, minor = torch.cuda.get_device_capability(i)