From dfa6d462c8b252c5dfe71a0906816f25a1bf26c7 Mon Sep 17 00:00:00 2001
From: Siddharth Venkatesan
Date: Thu, 6 Feb 2025 15:17:46 -0800
Subject: [PATCH] [vllm] add flashinfer wheel for 0.2.0.post2

---
 serving/docker/requirements-vllm.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/serving/docker/requirements-vllm.txt b/serving/docker/requirements-vllm.txt
index 0c5ace26d..3e3a8f428 100644
--- a/serving/docker/requirements-vllm.txt
+++ b/serving/docker/requirements-vllm.txt
@@ -1,3 +1,4 @@
 peft==0.14.0
 llmcompressor==0.4.0
 vllm==0.7.1
+https://github.com/flashinfer-ai/flashinfer/releases/download/v0.2.0.post2/flashinfer_python-0.2.0.post2+cu124torch2.5-cp311-cp311-linux_x86_64.whl