Skip to content

Commit 02eb7ca

Browse files
committed
fix nvshmem
1 parent e9e9046 commit 02eb7ca

File tree

2 files changed

+4
-3
lines changed

2 files changed

+4
-3
lines changed

scripts/ci/ci_install_deepep.sh

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -46,9 +46,6 @@ if [ ! -e "$LIB_PATH/libmlx5.so" ]; then
46 46
fi
47 47
apt-get update && apt-get install -y libfabric-dev
48 48

49-
# Install NVSHMEM
50-
pip install nvidia-nvshmem-cu12==3.4.5 --force-reinstall
51-
52 49
# Install DeepEP
53 50
DEEPEP_DIR=/root/.cache/deepep
54 51
rm -rf ${DEEPEP_DIR}

scripts/ci/ci_install_dependency.sh

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -134,6 +134,10 @@ if [ "$IS_BLACKWELL" != "1" ]; then
134 134
git clone --branch v0.5 --depth 1 https://github.com/EvolvingLMMs-Lab/lmms-eval.git
135 135
$PIP_CMD install -e lmms-eval/ $PIP_INSTALL_SUFFIX
136 136
fi
137+
138+
# DeepEP depends on nvshmem 3.4.5
139+
$PIP_CMD install nvidia-nvshmem-cu12==3.4.5 --force-reinstall $PIP_INSTALL_SUFFIX
140+
137 141
# Cudnn with version less than 9.16.0.29 will cause performance regression on Conv3D kernel
138 142
$PIP_CMD install nvidia-cudnn-cu12==9.16.0.29 --force-reinstall $PIP_INSTALL_SUFFIX
139 143
$PIP_CMD uninstall xformers || true

0 commit comments

Comments
 (0)