Skip to content

Commit

Permalink
♻️ try VLLM_USE_PRECOMPILED
Browse files Browse the repository at this point in the history
Signed-off-by: Prashant Gupta <prashantgupta@us.ibm.com>
  • Loading branch information
prashantgupta24 committed Apr 29, 2024
1 parent 9b3e80d commit 36eee72
Showing 1 changed file with 6 additions and 6 deletions.
12 changes: 6 additions & 6 deletions Dockerfile.ubi
Original file line number Diff line number Diff line change
Expand Up @@ -205,24 +205,24 @@ ENV VLLM_INSTALL_PUNICA_KERNELS=1
# Put the CUDA toolchain first on the executable and shared-library search paths.
ENV PATH=/usr/local/cuda/bin:$PATH \
    LD_LIBRARY_PATH=/usr/local/cuda/lib64:$LD_LIBRARY_PATH



# Copy the entire vllm directory from the build context into the image
# before building the wheel. --link (BuildKit) keeps this layer independent
# of the layers that precede it.
COPY --link vllm vllm

# Comment if building *.so files from scratch
##################################################
# Copy the prebuilt *.so files
# The source glob can match several files, so the destination must be a
# directory ending in "/". Wildcards are never expanded in a destination:
# "/workspace/vllm/*.so" would be taken as a path literally named "*.so".
COPY --from=prebuilt-wheel --link /workspace/vllm/*.so /workspace/vllm/
##################################################

# Build the extension modules in place via setup.py.
# NOTE(review): this runs before the second COPY of vllm below and next to a
# wheel build that sets VLLM_USE_PRECOMPILED; it may be the pre-change side of
# the diff -- confirm whether this step should still be present.
RUN python3 setup.py build_ext --inplace

# Copy the entire directory before building wheel
# NOTE(review): this repeats the identical `COPY --link vllm vllm` that appears
# earlier in this section -- confirm which of the two copies should remain.
COPY --link vllm vllm

# Copy over the generated *.pb2 files from the gen-protos stage into the
# package's gRPC entrypoint directory so they are present when the wheel is built.
COPY --from=gen-protos --link /workspace/vllm/entrypoints/grpc/pb vllm/entrypoints/grpc/pb

# Point ccache at the directory backed by the cache mount below.
ENV CCACHE_DIR=/root/.cache/ccache

# Build the wheel into ./dist. The ccache and pip cache directories are
# BuildKit cache mounts, so they persist across builds without being written
# into an image layer.
# The whole command must be a single continued RUN: a line without a trailing
# backslash ends the instruction, and the following line would be parsed as an
# (unknown) Dockerfile instruction.
# NOTE(review): VLLM_USE_PRECOMPILED=1 presumably makes setup.py reuse the
# prebuilt *.so files instead of compiling them -- confirm against setup.py.
RUN --mount=type=cache,target=/root/.cache/ccache \
    --mount=type=cache,target=/root/.cache/pip \
    VLLM_USE_PRECOMPILED=1 python3 setup.py bdist_wheel --dist-dir=dist

#################### FLASH_ATTENTION Build IMAGE ####################
FROM dev as flash-attn-builder
Expand Down

0 comments on commit 36eee72

Please sign in to comment.