File tree Expand file tree Collapse file tree 3 files changed +1041
-887
lines changed Expand file tree Collapse file tree 3 files changed +1041
-887
lines changed Original file line number Diff line number Diff line change @@ -35,17 +35,21 @@ RUN wget https://bootstrap.pypa.io/get-pip.py && \
3535 rm get-pip.py && \
3636 python3.10 -m pip install --upgrade pip setuptools wheel uv
3737
38- # Install Infiniband/ RDMA support
38+ # Install RDMA support
3939RUN apt-get update && apt-get install -y \
4040 libibverbs1 libibverbs-dev ibverbs-utils \
4141 librdmacm1 librdmacm-dev rdmacm-utils \
42+ rdma-core ibverbs-providers infiniband-diags perftest \
4243 && rm -rf /var/lib/apt/lists/*
4344
4445# Set up RDMA environment (these will persist in the final container)
4546ENV LD_LIBRARY_PATH="/usr/lib/x86_64-linux-gnu:$LD_LIBRARY_PATH"
46- ENV UCX_NET_DEVICES=all
4747ENV NCCL_IB_DISABLE=0
48- ENV NCCL_SOCKET_IFNAME=ib0
48+ ENV NCCL_SOCKET_IFNAME="^lo,docker0"
49+ ENV NCCL_NET_GDR_LEVEL=PHB
50+ ENV NCCL_IB_TIMEOUT=22
51+ ENV NCCL_IB_RETRY_CNT=7
52+ ENV NCCL_DEBUG=WARN
4953
5054# Set up project
5155WORKDIR /vec-inf
@@ -59,8 +63,5 @@ RUN apt-get update && apt-get install -y --allow-change-held-packages\
5963 libnccl2 libnccl-dev \
6064 && rm -rf /var/lib/apt/lists/*
6165
62- # Final configuration
63- ENV NCCL_DEBUG=INFO
64-
6566# Set the default command to start an interactive shell
6667CMD ["bash"]
Original file line number Diff line number Diff line change @@ -8,7 +8,7 @@ license = "MIT"
88requires-python = ">=3.10"
99dependencies = [
1010 "requests>=2.31.0",
11- "click>=8.1.0,!=8.3.0",
11+ "click>=8.1.0",
1212 "rich>=13.7.0",
1313 "pydantic>=2.10.6",
1414 "pyyaml>=6.0.2",
@@ -42,7 +42,7 @@ dev = [
4242 "xgrammar>=0.1.11",
4343 "torch>=2.7.0",
4444 "vllm>=0.10.0",
45- "ray>=2.40.0,<2.46.0",
45+ "ray>=2.50.0",
4646 "cupy-cuda12x==12.1.0"
4747]
4848
You can’t perform that action at this time.
0 commit comments