Skip to content

Commit 799804d

Browse files
Bump nvshmem to 3.3.24 and fix CUDA 13 installation (#30149)
Signed-off-by: Dmitry Tokarev <dtokarev@nvidia.com> Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
1 parent 0d402d2 commit 799804d

File tree

1 file changed

+6
-12
lines changed

1 file changed

+6
-12
lines changed

tools/ep_kernels/install_python_libraries.sh

Lines changed: 6 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -10,9 +10,10 @@ set -ex
1010
CUDA_HOME=${CUDA_HOME:-/usr/local/cuda}
1111
PPLX_COMMIT_HASH=${PPLX_COMMIT_HASH:-"12cecfd"}
1212
DEEPEP_COMMIT_HASH=${DEEPEP_COMMIT_HASH:-"73b6ea4"}
13-
NVSHMEM_VER=3.3.9
13+
NVSHMEM_VER=3.3.24 # Supports both CUDA 12 and 13
1414
WORKSPACE=${WORKSPACE:-$(pwd)/ep_kernels_workspace}
1515
MODE=${MODE:-install}
16+
CUDA_VERSION_MAJOR=$(${CUDA_HOME}/bin/nvcc --version | egrep -o "release [0-9]+" | cut -d ' ' -f 2)
1617

1718
# Parse arguments
1819
while [[ $# -gt 0 ]]; do
@@ -75,18 +76,17 @@ ARCH=$(uname -m)
7576
case "${ARCH,,}" in
7677
x86_64|amd64)
7778
NVSHMEM_SUBDIR="linux-x86_64"
78-
NVSHMEM_FILE="libnvshmem-linux-x86_64-${NVSHMEM_VER}_cuda12-archive.tar.xz"
7979
;;
8080
aarch64|arm64)
8181
NVSHMEM_SUBDIR="linux-sbsa"
82-
NVSHMEM_FILE="libnvshmem-linux-sbsa-${NVSHMEM_VER}_cuda12-archive.tar.xz"
8382
;;
8483
*)
8584
echo "Unsupported architecture: ${ARCH}" >&2
8685
exit 1
8786
;;
8887
esac
8988

89+
NVSHMEM_FILE="libnvshmem-${NVSHMEM_SUBDIR}-${NVSHMEM_VER}_cuda${CUDA_VERSION_MAJOR}-archive.tar.xz"
9090
NVSHMEM_URL="https://developer.download.nvidia.com/compute/nvshmem/redist/libnvshmem/${NVSHMEM_SUBDIR}/${NVSHMEM_FILE}"
9191

9292
pushd "$WORKSPACE"
@@ -142,13 +142,6 @@ clone_repo() {
142142
fi
143143
}
144144

145-
deepep_cuda13_patch() {
146-
cuda_version_major=$(${CUDA_HOME}/bin/nvcc --version | egrep -o "release [0-9]+" | cut -d ' ' -f 2)
147-
if [ ${cuda_version_major} -ge 13 ]; then
148-
sed -i "s|f'{nvshmem_dir}/include']|f'{nvshmem_dir}/include', '${CUDA_HOME}/include/cccl']|" "setup.py"
149-
fi
150-
}
151-
152145
do_build() {
153146
local repo=$1
154147
local name=$2
@@ -160,8 +153,9 @@ do_build() {
160153
clone_repo "$repo" "$name" "$key" "$commit"
161154
cd "$name"
162155

163-
if [ "$name" == "DeepEP" ]; then
164-
deepep_cuda13_patch
156+
# DeepEP CUDA 13 patch
157+
if [[ "$name" == "DeepEP" && "${CUDA_VERSION_MAJOR}" -ge 13 ]]; then
158+
sed -i "s|f'{nvshmem_dir}/include']|f'{nvshmem_dir}/include', '${CUDA_HOME}/include/cccl']|" "setup.py"
165159
fi
166160

167161
if [ "$MODE" = "install" ]; then

0 commit comments

Comments
 (0)