Skip to content

Commit

Permalink
Merge pull request #6 from z103cb/ibm_main_docker_ubi_updates
Browse files Browse the repository at this point in the history
[CI/Build] Dockerfile.ubi : Remove test stage
  • Loading branch information
z103cb authored Apr 26, 2024
2 parents 1e44f5e + 769521f commit 91e4a51
Showing 1 changed file with 0 additions and 21 deletions.
21 changes: 0 additions & 21 deletions Dockerfile.ubi
Original file line number Diff line number Diff line change
Expand Up @@ -219,27 +219,6 @@ WORKDIR /usr/src/flash-attention-v2
# Produce a flash-attn wheel pinned to ${FLASH_ATTN_VERSION} in the current
# WORKDIR so later stages can install it from there.
# --no-build-isolation: use the packages already installed in this stage for
# the build; --no-deps: do not produce wheels for dependencies;
# --no-cache-dir: keep pip's cache out of the layer.
RUN pip --verbose wheel flash-attn==${FLASH_ATTN_VERSION} \
--no-build-isolation --no-deps --no-cache-dir


## Test ########################################################################
# Test image layered on top of the dev stage; it installs vllm from the build
# context using the extensions compiled in the build stage.
FROM dev AS test

WORKDIR /vllm-workspace
# Copy the whole build context. COPY preserves the directory structure of a
# local directory exactly like ADD, without ADD's archive/URL special cases.
# NB: Could leak secrets from local context, the test image should not be pushed
# to a registry
COPY . /vllm-workspace/
# copy pytorch extensions separately to avoid having to rebuild
# when python code changes
COPY --from=build /workspace/vllm/*.so /vllm-workspace/vllm/
# Install flash attention (from pre-built wheel)
RUN --mount=type=bind,from=flash-attn-builder,src=/usr/src/flash-attention-v2,target=/usr/src/flash-attention-v2 \
    pip install /usr/src/flash-attention-v2/*.whl --no-cache-dir
# Remove pyproject.toml so pip ignores build dependencies installation (we are
# using pre-compiled extensions), then install vllm in the same layer.
RUN --mount=type=cache,target=/root/.cache/pip \
    rm pyproject.toml \
    && VLLM_USE_PRECOMPILED=1 pip install . --verbose


## Proto Compilation ###########################################################
FROM python-base AS gen-protos

Expand Down

0 comments on commit 91e4a51

Please sign in to comment.