-
Notifications
You must be signed in to change notification settings - Fork 14
Expand file tree
/
Copy pathDockerfile
More file actions
61 lines (49 loc) · 2.05 KB
/
Dockerfile
File metadata and controls
61 lines (49 loc) · 2.05 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
FROM nvidia/cuda:13.0.1-devel-ubuntu24.04 AS rvllm-builder
RUN apt-get update && apt-get install -y curl build-essential pkg-config libssl-dev && \
curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y
ENV PATH="/root/.cargo/bin:${PATH}"
WORKDIR /build/rvllm
COPY rvllm /build/rvllm
RUN bash kernels/build.sh
RUN cargo build --release --features cuda -p rvllm-server
FROM nvidia/cuda:13.0.1-runtime-ubuntu24.04 AS runtime
RUN apt-get update && apt-get install -y \
python3 \
python3-pip \
python3-venv \
libssl3t64 \
ca-certificates \
&& rm -rf /var/lib/apt/lists/*
COPY rvLLM-serverless/builder/requirements.txt /tmp/requirements.txt
RUN python3 -m venv /opt/venv && \
/opt/venv/bin/python -m pip install --upgrade pip && \
/opt/venv/bin/python -m pip install --no-cache-dir -r /tmp/requirements.txt
COPY --from=rvllm-builder /build/rvllm/target/release/rvllm /usr/local/bin/rvllm
COPY --from=rvllm-builder /build/rvllm/kernels/*.ptx /usr/local/share/rvllm/kernels/
ARG BAKE_MODEL=false
ARG MODEL_ID=""
ARG MODEL_REVISION="main"
ARG MODEL_DIR="/models/default"
ENV PYTHONUNBUFFERED=1 \
PATH=/opt/venv/bin:${PATH} \
RVLLM_KERNEL_DIR=/usr/local/share/rvllm/kernels \
HF_HOME=/runpod-volume/huggingface \
HUGGINGFACE_HUB_CACHE=/runpod-volume/huggingface/hub \
MODEL_ID=${MODEL_ID} \
SERVED_MODEL_NAME=${MODEL_ID}
COPY rvLLM-serverless/builder /opt/rvllm-serverless/builder
RUN --mount=type=secret,id=HF_TOKEN,required=false \
if [ "${BAKE_MODEL}" = "true" ] && [ -n "${MODEL_ID}" ]; then \
export HF_TOKEN=""; \
if [ -f /run/secrets/HF_TOKEN ]; then \
export HF_TOKEN="$(cat /run/secrets/HF_TOKEN)"; \
fi; \
python3 /opt/rvllm-serverless/builder/download_model.py \
--model-id "${MODEL_ID}" \
--revision "${MODEL_REVISION}" \
--target-dir "${MODEL_DIR}"; \
fi
ENV MODEL_DIR=${MODEL_DIR}
COPY rvLLM-serverless/src /opt/rvllm-serverless/src
WORKDIR /opt/rvllm-serverless
CMD ["python3", "/opt/rvllm-serverless/src/handler.py"]