Skip to content

Commit c18aabb

Browse files
committed
Downgrade Ray to 2.43.0, update vec-inf version, use base image NCCL instead of fixing vllm_nccl version
1 parent 631c0e4 commit c18aabb

File tree

3 files changed: +37 additions, -140 deletions (lines changed)

Dockerfile

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -54,9 +54,9 @@ COPY . /vec-inf
 RUN PIP_INDEX_URL="https://download.pytorch.org/whl/cu128" uv pip install --system -e .[dev]
 
 # Final configuration
-RUN mkdir -p /vec-inf/nccl && \
-mv /root/.config/vllm/nccl/cu12/libnccl.so.2.18.1 /vec-inf/nccl/libnccl.so.2.18.1
-ENV VLLM_NCCL_SO_PATH=/vec-inf/nccl/libnccl.so.2.18.1
+# RUN mkdir -p /vec-inf/nccl && \
+# mv /root/.config/vllm/nccl/cu12/libnccl.so.2.18.1 /vec-inf/nccl/libnccl.so.2.18.1
+# ENV VLLM_NCCL_SO_PATH=/vec-inf/nccl/libnccl.so.2.18.1
 ENV NCCL_DEBUG=INFO
 
 # Set the default command to start an interactive shell

pyproject.toml

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
 [project]
 name = "vec-inf"
-version = "0.7.0"
+version = "0.7.1"
 description = "Efficient LLM inference on Slurm clusters using vLLM."
 readme = "README.md"
 authors = [{name = "Marshall Wang", email = "[email protected]"}]
@@ -42,8 +42,7 @@ dev = [
 "xgrammar>=0.1.11",
 "torch>=2.7.0",
 "vllm>=0.10.0",
-"vllm-nccl-cu12>=2.18,<2.19",
-"ray>=2.40.0",
+"ray==2.43.0",
 "cupy-cuda12x==12.1.0"
 ]
 
0 commit comments

Comments
 (0)