diff --git a/.azure-pipelines/templates/sglang-test.yaml b/.azure-pipelines/templates/sglang-test.yaml index d5a8cccc..1b2d0768 100644 --- a/.azure-pipelines/templates/sglang-test.yaml +++ b/.azure-pipelines/templates/sglang-test.yaml @@ -78,6 +78,8 @@ steps: parallel-ssh -o . -t 0 -h ${HOSTFILE} -x "-i ${KeyFilePath}" \ -O $SSH_OPTION 'sudo docker run -itd --name=mscclpp-sglang-test --privileged --net=host --ipc=host --gpus=all -w /root -v /mnt:/mnt lmsysorg/sglang:latest bash && \ sudo docker exec -t mscclpp-sglang-test bash -c " \ + python3 -m venv /root/venv && \ + export PATH=/root/venv/bin:\\\$PATH && \ git clone https://github.com/microsoft/mscclpp.git && \ cd mscclpp && \ mkdir build && \ @@ -85,7 +87,6 @@ steps: cmake -DCMAKE_BUILD_TYPE=Release .. && \ make -j && \ cd .. && \ - hostname pip install . && \ pip install -r ./python/requirements_cuda12.txt \ "' diff --git a/docker/build.sh b/docker/build.sh index fcb03704..46a107a5 100755 --- a/docker/build.sh +++ b/docker/build.sh @@ -10,7 +10,7 @@ baseImageTable=( ["cuda12.9"]="nvidia/cuda:12.9.1-devel-ubuntu24.04" ["cuda13.0"]="nvidia/cuda:13.0.2-devel-ubuntu24.04" ["rocm6.2"]="rocm/dev-ubuntu-22.04:6.2.2" - ["sglang"]="nvidia/cuda:13.0.2-devel-ubuntu24.04" + ["sglang"]="nvidia/cuda:12.9.1-devel-ubuntu24.04" ) declare -A extraLdPathTable @@ -21,7 +21,7 @@ extraLdPathTable=( ["cuda12.9"]="/usr/local/cuda-12.9/compat" ["cuda13.0"]="/usr/local/cuda-13.0/compat" ["rocm6.2"]="/opt/rocm/lib" - ["sglang"]="/usr/local/cuda-13.0/compat" + ["sglang"]="/usr/local/cuda-12.9/compat" ) declare -A ofedVersionTable @@ -32,7 +32,7 @@ ofedVersionTable=( ["cuda12.9"]="24.10-1.1.4.0" ["cuda13.0"]="24.10-3.2.5.0" ["rocm6.2"]="24.10-1.1.4.0" - ["sglang"]="24.10-3.2.5.0" + ["sglang"]="24.10-1.1.4.0" ) TARGET=${1}