Skip to content

Commit

Permalink
update vllm container
Browse files (browse the repository at this point in the history)
  • Loading branch information
mmoskal committed Jan 12, 2024
1 parent 2dd3375 commit baa1da0
Showing 1 changed file with 12 additions and 0 deletions.
12 changes: 12 additions & 0 deletions .devcontainer/Dockerfile-vllm
Original file line number Diff line number Diff line change
@@ -1,6 +1,8 @@
# syntax = edrevo/dockerfile-plus
# ^^^ this line enables the INCLUDE+ directive
# (it is a parser directive, so it has to remain the very first line of the file)

# Base image: the PyTorch container published on NVIDIA's registry (nvcr.io),
# pinned to the 23.09-py3 tag.
FROM nvcr.io/nvidia/pytorch:23.09-py3

# Pull in Dockerfile fragments that live in separate files, in this order.
# Their contents are not visible from this file; presumably the paths are
# resolved relative to the build context -- confirm against the build setup.
INCLUDE+ cuda-settings.dockerfile
INCLUDE+ common.dockerfile

Expand All @@ -17,3 +19,13 @@ RUN pip install git+https://github.com/NVIDIA/TransformerEngine.git@stable
# RUN pip install typing_extensions==4.5.0

# Install flash-attn, upgrading to the newest available release if an older one
# is already present. --no-cache-dir keeps pip's download/wheel cache out of
# the image layer.
RUN pip install --no-cache-dir --upgrade flash-attn


# RUN pip install torch==2.1.0 nvidia-cuda-runtime
# The unversioned libcudart.so seems to be missing from the nvidia/cuda_runtime
# package directory, so create it as a symlink to libcudart.so.12.
# Both paths are spelled out instead of relying on bash brace expansion
# (`libcudart.so{.12,}`): RUN uses /bin/sh unless SHELL is overridden, and a
# POSIX sh passes the braces through literally, producing a wrongly named link
# without failing the build.
RUN cudart_dir=/usr/local/lib/python3.10/dist-packages/nvidia/cuda_runtime/lib \
    && ln -s "${cudart_dir}/libcudart.so.12" "${cudart_dir}/libcudart.so"

# perf tool
# NOTE: $(uname -r) is evaluated while the image is being built, so it names
# the kernel of the machine running the build; a matching linux-tools package
# has to exist in the configured apt repositories for that kernel.
# update + install + list cleanup share one layer so the package index is never
# stale and the downloaded lists do not stay in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends "linux-tools-$(uname -r)" \
    && rm -rf /var/lib/apt/lists/*

# Load nvm into the build shell (presumably this is what puts node/npm on PATH
# -- confirm against the file that installs nvm), then install yarn globally.
# `.` is the POSIX spelling of `source`, so the step also works when RUN is
# executed by a plain /bin/sh. The npm cache is cleared in the same layer so it
# does not end up in the image.
RUN . /usr/local/nvm/nvm.sh && npm install -g yarn && npm cache clean --force

0 comments on commit baa1da0

Please sign in to comment.