Skip to content

Commit

Permalink
Build test image with ray included
Browse files Browse the repository at this point in the history
  • Loading branch information
njhill committed Mar 31, 2024
1 parent 87300e2 commit ad7cda6
Show file tree
Hide file tree
Showing 3 changed files with 7 additions and 1 deletion.
1 change: 1 addition & 0 deletions .github/workflows/build.yml
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ on:
push:
branches:
- release
- ray-test
paths-ignore:
- "**.md"
- "proto/**"
Expand Down
6 changes: 5 additions & 1 deletion Dockerfile.ubi
Original file line number Diff line number Diff line change
Expand Up @@ -150,6 +150,8 @@ RUN --mount=type=cache,target=/root/.cache/pip \
# copy input files
COPY csrc csrc
COPY setup.py setup.py
COPY cmake cmake
COPY CMakeLists.txt CMakeLists.txt
COPY requirements.txt requirements.txt
COPY pyproject.toml pyproject.toml
COPY vllm/__init__.py vllm/__init__.py
Expand Down Expand Up @@ -224,7 +226,7 @@ RUN --mount=type=bind,from=flash-attn-builder,src=/usr/src/flash-attention-v2,ta
# ignore build dependencies installation because we are using pre-compiled extensions
RUN rm pyproject.toml
RUN --mount=type=cache,target=/root/.cache/pip \
VLLM_USE_PRECOMPILED=1 pip install . --verbose
VLLM_USE_PRECOMPILED=1 pip install .[ray] --verbose


## Proto Compilation ###########################################################
Expand Down Expand Up @@ -304,5 +306,7 @@ RUN microdnf install -y shadow-utils \
&& microdnf clean all \
&& chmod g+rwx $HOME /usr/src /workspace

# Place the repository's LICENSE file in the image at /licenses/vllm.md
COPY LICENSE /licenses/vllm.md

# Run the container process as numeric UID 2000 rather than root
USER 2000
# Exec-form entrypoint: start the vllm.entrypoints.openai.api_server module with python3
ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]
1 change: 1 addition & 0 deletions requirements.txt
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
cmake>=3.21
ninja # For faster builds.
psutil
ray >= 2.9
sentencepiece # Required for LLaMA tokenizer.
numpy
torch == 2.1.2
Expand Down

0 comments on commit ad7cda6

Please sign in to comment.