Skip to content

Commit 2a6b980

Browse files
committed
Update ray to 2.50.0 for prepackaged click version ban, install additional packages for RDMA support, add additional env vars for RDMA, remove UCX
1 parent 9087b94 commit 2a6b980

File tree

3 files changed

+1041
-887
lines changed

3 files changed

+1041
-887
lines changed

Dockerfile

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -35,17 +35,21 @@ RUN wget https://bootstrap.pypa.io/get-pip.py && \
3535
rm get-pip.py && \
3636
python3.10 -m pip install --upgrade pip setuptools wheel uv
3737

38-
# Install Infiniband/RDMA support
38+
# Install RDMA support
3939
RUN apt-get update && apt-get install -y \
4040
libibverbs1 libibverbs-dev ibverbs-utils \
4141
librdmacm1 librdmacm-dev rdmacm-utils \
42+
rdma-core ibverbs-providers infiniband-diags perftest \
4243
&& rm -rf /var/lib/apt/lists/*
4344

4445
# Set up RDMA environment (these will persist in the final container)
4546
ENV LD_LIBRARY_PATH="/usr/lib/x86_64-linux-gnu:$LD_LIBRARY_PATH"
46-
ENV UCX_NET_DEVICES=all
4747
ENV NCCL_IB_DISABLE=0
48-
ENV NCCL_SOCKET_IFNAME=ib0
48+
ENV NCCL_SOCKET_IFNAME="^lo,docker0"
49+
ENV NCCL_NET_GDR_LEVEL=PHB
50+
ENV NCCL_IB_TIMEOUT=22
51+
ENV NCCL_IB_RETRY_CNT=7
52+
ENV NCCL_DEBUG=WARN
4953

5054
# Set up project
5155
WORKDIR /vec-inf
@@ -59,8 +63,5 @@ RUN apt-get update && apt-get install -y --allow-change-held-packages\
5963
libnccl2 libnccl-dev \
6064
&& rm -rf /var/lib/apt/lists/*
6165

62-
# Final configuration
63-
ENV NCCL_DEBUG=INFO
64-
6566
# Set the default command to start an interactive shell
6667
CMD ["bash"]

pyproject.toml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ license = "MIT"
88
requires-python = ">=3.10"
99
dependencies = [
1010
"requests>=2.31.0",
11-
"click>=8.1.0,!=8.3.0",
11+
"click>=8.1.0",
1212
"rich>=13.7.0",
1313
"pydantic>=2.10.6",
1414
"pyyaml>=6.0.2",
@@ -42,7 +42,7 @@ dev = [
4242
"xgrammar>=0.1.11",
4343
"torch>=2.7.0",
4444
"vllm>=0.10.0",
45-
"ray>=2.40.0,<2.46.0",
45+
"ray>=2.50.0",
4646
"cupy-cuda12x==12.1.0"
4747
]
4848

0 commit comments

Comments
 (0)