From dc5e4a653c859573dfcca99f1b0141c2db9f94cc Mon Sep 17 00:00:00 2001 From: "Po-Han Huang (NVIDIA)" <53919306+nvpohanh@users.noreply.github.com> Date: Tue, 12 Aug 2025 10:58:41 +0800 Subject: [PATCH] Upgrade FlashInfer to v0.2.11 (#22613) Signed-off-by: Po-Han Huang Co-authored-by: mgoin --- docker/Dockerfile | 2 +- setup.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/Dockerfile b/docker/Dockerfile index 85f55cac8d..b96d50f0a1 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -387,7 +387,7 @@ RUN --mount=type=bind,from=build,src=/workspace/dist,target=/vllm-workspace/dist ARG FLASHINFER_GIT_REPO="https://github.com/flashinfer-ai/flashinfer.git" # Keep this in sync with https://github.com/vllm-project/vllm/blob/main/requirements/cuda.txt # We use `--force-reinstall --no-deps` to avoid issues with the existing FlashInfer wheel. -ARG FLASHINFER_GIT_REF="v0.2.10" +ARG FLASHINFER_GIT_REF="v0.2.11" RUN --mount=type=cache,target=/root/.cache/uv bash - <<'BASH' . /etc/environment git clone --depth 1 --recursive --shallow-submodules \ diff --git a/setup.py b/setup.py index 7f6c787129..919300e143 100644 --- a/setup.py +++ b/setup.py @@ -684,7 +684,7 @@ setup( "mistral_common[audio]"], # Required for audio processing "video": [], # Kept for backwards compatibility # FlashInfer should be updated together with the Dockerfile - "flashinfer": ["flashinfer-python==0.2.10"], + "flashinfer": ["flashinfer-python==0.2.11"], }, cmdclass=cmdclass, package_data=package_data,