From 5e3168be42b043d274b9a3522f97b246551aafbe Mon Sep 17 00:00:00 2001 From: Shang Wang Date: Tue, 10 Feb 2026 03:36:17 -0500 Subject: [PATCH] Pin FlashInfer version to RC2 --- docker/Dockerfile | 2 +- docker/versions.json | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/Dockerfile b/docker/Dockerfile index 9064ea51632b..16dacddb5fe9 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -495,7 +495,7 @@ RUN --mount=type=cache,target=/root/.cache/uv \ # Install FlashInfer from CentML fork # https://github.com/CentML/flashinfer/tree/mlperf-inf-mm-q3vl-v6.0 ARG FLASHINFER_REPO=https://github.com/CentML/flashinfer.git -ARG FLASHINFER_BRANCH=mlperf-inf-mm-q3vl-v6.0 +ARG FLASHINFER_BRANCH=mlperf-inf-mm-q3vl-v6.0-rc2 ARG FLASHINFER_CUBIN_VERSION=0.5.3 ARG FLASHINFER_JIT_CACHE_VERSION=0.5.3 RUN --mount=type=cache,target=/root/.cache/uv \ diff --git a/docker/versions.json b/docker/versions.json index 3bb174eea948..72b7e487e099 100644 --- a/docker/versions.json +++ b/docker/versions.json @@ -71,7 +71,7 @@ "default": "https://github.com/CentML/flashinfer.git" }, "FLASHINFER_BRANCH": { - "default": "mlperf-inf-mm-q3vl-v6.0" + "default": "mlperf-inf-mm-q3vl-v6.0-rc2" }, "FLASHINFER_CUBIN_VERSION": { "default": "0.5.3"