# Mirror of https://github.com/vllm-project/vllm
# Date stamp of the nightly torch_xla TPU VM image to build on.
# Override with `--build-arg NIGHTLY_DATE=<stamp>` to select another nightly.
ARG NIGHTLY_DATE="20240808"
# Full base image reference, derived from NIGHTLY_DATE by default.
# Override with `--build-arg BASE_IMAGE=<ref>` to use a different image entirely.
ARG BASE_IMAGE="us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla:nightly_3.10_tpuvm_${NIGHTLY_DATE}"

FROM ${BASE_IMAGE}

WORKDIR /workspace

# Install the TPU and Pallas dependencies.
# The extras specifiers are quoted so the shell can never expand the brackets
# as a glob pattern, and --no-cache-dir keeps pip's download cache out of the
# image layers.
RUN python3 -m pip install --no-cache-dir "torch_xla[tpu]" \
        -f https://storage.googleapis.com/libtpu-releases/index.html
RUN python3 -m pip install --no-cache-dir "torch_xla[pallas]" \
        -f https://storage.googleapis.com/jax-releases/jax_nightly_releases.html \
        -f https://storage.googleapis.com/jax-releases/jaxlib_nightly_releases.html

# Build vLLM.
COPY . /workspace/vllm
# Set before the install steps so it is visible to them; as an ENV it also
# persists into the running container.
# NOTE(review): presumably read by vLLM's setup.py to pick the TPU backend - confirm.
ENV VLLM_TARGET_DEVICE="tpu"

# Run the build steps from the source tree via WORKDIR rather than `cd`.
WORKDIR /workspace/vllm
RUN python3 -m pip install --no-cache-dir -r requirements-tpu.txt
RUN python3 setup.py develop

# Switch back so containers still start in /workspace, as before.
WORKDIR /workspace

CMD ["/bin/bash"]