Skip to content

Commit

Permalink
Merge pull request #278 from nvonpentz/dockerfile
Browse files Browse the repository at this point in the history
Add vLLM Dockerfile
  • Loading branch information
jeffreymeetkai authored Jan 13, 2025
2 parents dfd08d3 + 37332ed commit 7cbe866
Showing 1 changed file with 25 additions and 0 deletions.
25 changes: 25 additions & 0 deletions dockerfiles/Dockerfile.vllm
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# syntax=docker/dockerfile:1
# The directive above must remain the very first line. It selects the BuildKit
# Dockerfile frontend, which the `RUN --mount=type=cache` step in this file
# requires.

# Use vLLM's vllm-openai server image as the base
FROM vllm/vllm-openai:v0.6.3.post1

# Define a build argument for the working directory, defaulting to /workspace.
# Override with: docker build --build-arg WORKDIR_ARG=/some/absolute/path ...
ARG WORKDIR_ARG=/workspace

# Set the working directory (created if missing). Relative paths used by later
# instructions, including the entrypoint script, resolve against it.
WORKDIR ${WORKDIR_ARG}

# Install necessary build dependencies for sentencepiece.
# --no-install-recommends keeps optional packages out of the image, and the
# apt package lists are deleted in the same layer so they are never committed.
# Packages are listed one per line in alphabetical order for clean diffs.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        cmake \
        pkg-config \
    && rm -rf /var/lib/apt/lists/*

# Copy functionary code and requirements into workspace
COPY . .

# Install the copied project together with its "vllm" extra.
# pip's download cache lives in a BuildKit cache mount, so it is reused across
# builds without being stored in any image layer.
# The requirement is quoted so the shell cannot interpret "[vllm]" as a glob
# character class and expand it against files copied into the workspace.
RUN --mount=type=cache,target=/root/.cache/pip \
    python3 -m pip install ".[vllm]"

# Replace the base image's entrypoint with the functionary server.
# Exec (JSON-array) form: the process is started directly, without a shell.
# server_vllm.py is a relative path, so it is looked up in the working
# directory set earlier in this file.
ENTRYPOINT ["python3", "server_vllm.py", \
            "--model", "meetkai/functionary-small-v3.2", \
            "--host", "0.0.0.0", \
            "--max-model-len", "8192"]

# No default extra arguments. Anything given after the image name on
# `docker run` is appended to the ENTRYPOINT argument list above.
CMD []

0 comments on commit 7cbe866

Please sign in to comment.