Skip to content

Commit b32a814

Browse files
youkaichao authored and shreyankg committed
[ci/build] update flashinfer (vllm-project#13323)
1 parent 66739f7 commit b32a814

File tree

1 file changed

+5
-2
lines changed

1 file changed

+5
-2
lines changed

Dockerfile

Lines changed: 5 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -195,19 +195,22 @@ RUN --mount=type=bind,from=build,src=/workspace/dist,target=/vllm-workspace/dist
195195
--mount=type=cache,target=/root/.cache/pip \
196196
python3 -m pip install dist/*.whl --verbose
197197

198-
# How to build this FlashInfer wheel:
198+
# If we need to build FlashInfer wheel before its release:
199199
# $ export FLASHINFER_ENABLE_AOT=1
200200
# $ # Note we remove 7.0 from the arch list compared to the list below, since FlashInfer only supports sm75+
201201
# $ export TORCH_CUDA_ARCH_LIST='7.5 8.0 8.6 8.9 9.0+PTX'
202202
# $ git clone https://github.com/flashinfer-ai/flashinfer.git --recursive
203203
# $ cd flashinfer
204204
# $ git checkout 524304395bd1d8cd7d07db083859523fcaa246a4
205+
# $ rm -rf build
205206
# $ python3 setup.py bdist_wheel --dist-dir=dist --verbose
207+
# $ ls dist
208+
# $ # upload the wheel to a public location, e.g. https://wheels.vllm.ai/flashinfer/524304395bd1d8cd7d07db083859523fcaa246a4/flashinfer_python-0.2.1.post1+cu124torch2.5-cp38-abi3-linux_x86_64.whl
206209

207210
RUN --mount=type=cache,target=/root/.cache/pip \
208211
. /etc/environment && \
209212
if [ "$TARGETPLATFORM" != "linux/arm64" ]; then \
210-
python3 -m pip install https://wheels.vllm.ai/flashinfer/524304395bd1d8cd7d07db083859523fcaa246a4/flashinfer_python-0.2.0.post1-cp${PYTHON_VERSION_STR}-cp${PYTHON_VERSION_STR}-linux_x86_64.whl; \
213+
python3 -m pip install https://github.com/flashinfer-ai/flashinfer/releases/download/v0.2.1.post1/flashinfer_python-0.2.1.post1+cu124torch2.5-cp38-abi3-linux_x86_64.whl ; \
211214
fi
212215
COPY examples examples
213216

0 commit comments

Comments
 (0)