diff --git a/.azure-pipelines/templates/sglang-test.yml b/.azure-pipelines/templates/sglang-test.yml index 85a945aa..be889f08 100644 --- a/.azure-pipelines/templates/sglang-test.yml +++ b/.azure-pipelines/templates/sglang-test.yml @@ -87,8 +87,8 @@ steps: export RANK=0 export MASTER_ADDR=127.0.0.1 export MASTER_PORT=12345 - - ls -la + + cd sglang torchrun --nproc_per_node gpu \ --nnodes $WORLD_SIZE \ diff --git a/test/deploy/run-remote.sh b/test/deploy/run-remote.sh index e18221ba..a3b25358 100755 --- a/test/deploy/run-remote.sh +++ b/test/deploy/run-remote.sh @@ -103,7 +103,6 @@ if $USE_DOCKER; then # If using the sglang container, launch it first if [ "${CONTAINER_NAME}" = "mscclpp-sglang-test" ]; then parallel-ssh -i "${PSSH_COMMON[@]}" \ - "sudo docker rm -f ${CONTAINER_NAME} 2>/dev/null; \ sudo docker run -itd --name=${CONTAINER_NAME} --privileged --net=host --ipc=host --gpus=all -w /root -v /mnt:/mnt lmsysorg/sglang:latest bash" INNER="set -euxo pipefail;"