Skip to content

Commit e40ab7c

Browse files
authored
add sm_90 to CUDA11.8 builds (pytorch#1278)
1 parent 1380f48 commit e40ab7c

File tree

6 files changed

+13
-18
lines changed

6 files changed

+13
-18
lines changed

common/install_cuda.sh

+2 -2
Original file line number | Diff line number | Diff line change
@@ -155,8 +155,8 @@ function prune_118 {
155155
export NVPRUNE="/usr/local/cuda-11.8/bin/nvprune"
156156
export CUDA_LIB_DIR="/usr/local/cuda-11.8/lib64"
157157

158-
export GENCODE="-gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=sm_75 -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86"
159-
export GENCODE_CUDNN="-gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=sm_75 -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86"
158+
export GENCODE="-gencode arch=compute_35,code=sm_35 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=sm_75 -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86 -gencode arch=compute_90,code=sm_90"
159+
export GENCODE_CUDNN="-gencode arch=compute_35,code=sm_35 -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_61,code=sm_61 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_75,code=sm_75 -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86 -gencode arch=compute_90,code=sm_90"
160160

161161
if [[ -n "$OVERRIDE_GENCODE" ]]; then
162162
export GENCODE=$OVERRIDE_GENCODE

conda/pytorch-nightly/bld.bat

+2 -5
Original file line number | Diff line number | Diff line change
@@ -20,21 +20,18 @@ if "%build_with_cuda%" == "" goto cuda_flags_end
2020
set CUDA_PATH=C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v%desired_cuda%
2121
set CUDA_BIN_PATH=%CUDA_PATH%\bin
2222
set TORCH_NVCC_FLAGS=-Xfatbin -compress-all
23-
set TORCH_CUDA_ARCH_LIST=3.7+PTX;5.0
23+
set TORCH_CUDA_ARCH_LIST=3.7+PTX;5.0;6.0;6.1;7.0;7.5;8.0;8.6
2424
if "%desired_cuda%" == "11.5" (
25-
set TORCH_CUDA_ARCH_LIST=%TORCH_CUDA_ARCH_LIST%;6.0;6.1;7.0;7.5;8.0;8.6
2625
set TORCH_NVCC_FLAGS=-Xfatbin -compress-all --threads 2
2726
)
2827
if "%desired_cuda%" == "11.6" (
29-
set TORCH_CUDA_ARCH_LIST=%TORCH_CUDA_ARCH_LIST%;6.0;6.1;7.0;7.5;8.0;8.6
3028
set TORCH_NVCC_FLAGS=-Xfatbin -compress-all --threads 2
3129
)
3230
if "%desired_cuda%" == "11.7" (
33-
set TORCH_CUDA_ARCH_LIST=%TORCH_CUDA_ARCH_LIST%;6.0;6.1;7.0;7.5;8.0;8.6
3431
set TORCH_NVCC_FLAGS=-Xfatbin -compress-all --threads 2
3532
)
3633
if "%desired_cuda%" == "11.8" (
37-
set TORCH_CUDA_ARCH_LIST=%TORCH_CUDA_ARCH_LIST%;6.0;6.1;7.0;7.5;8.0;8.6
34+
set TORCH_CUDA_ARCH_LIST=%TORCH_CUDA_ARCH_LIST%;9.0
3835
set TORCH_NVCC_FLAGS=-Xfatbin -compress-all --threads 2
3936
)
4037

conda/pytorch-nightly/build.sh

+1 -1
Original file line number | Diff line number | Diff line change
@@ -70,7 +70,7 @@ if [[ -n "$build_with_cuda" ]]; then
7070
#for cuda 11.7 include all dynamic loading libraries
7171
DEPS_LIST=(/usr/local/cuda/lib64/libcudnn*.so.8 /usr/local/cuda-11.7/extras/CUPTI/lib64/libcupti.so.11.7)
7272
elif [[ $CUDA_VERSION == 11.8* ]]; then
73-
export TORCH_CUDA_ARCH_LIST="$TORCH_CUDA_ARCH_LIST;6.0;6.1;7.0;7.5;8.0;8.6"
73+
export TORCH_CUDA_ARCH_LIST="$TORCH_CUDA_ARCH_LIST;6.0;6.1;7.0;7.5;8.0;8.6;9.0"
7474
#for cuda 11.8 we use cudnn 8.5
7575
#which does not have single static libcudnn_static.a deliverable to link with
7676
export USE_STATIC_CUDNN=0

magma/Makefile

+2 -4
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ SHELL=/usr/bin/env bash
22

33
DESIRED_CUDA ?= 11.6
44
PACKAGE_NAME ?= magma-cuda116
5-
CUDA_ARCH_LIST ?= -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_70,code=sm_70
5+
CUDA_ARCH_LIST ?= -gencode arch=compute_37,code=sm_37 -gencode arch=compute_50,code=sm_50 -gencode arch=compute_60,code=sm_60 -gencode arch=compute_70,code=sm_70 -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86
66

77
DOCKER_RUN = set -eou pipefail; docker run --rm -i \
88
-v $(shell git rev-parse --show-toplevel):/builder \
@@ -26,20 +26,18 @@ clean:
2626
.PHONY: magma-cuda118
2727
magma-cuda118: DESIRED_CUDA := 11.8
2828
magma-cuda118: PACKAGE_NAME := magma-cuda118
29-
magma-cuda118: CUDA_ARCH_LIST += -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86
29+
magma-cuda118: CUDA_ARCH_LIST += -gencode arch=compute_90,code=sm_90
3030
magma-cuda118:
3131
$(DOCKER_RUN)
3232

3333
.PHONY: magma-cuda117
3434
magma-cuda117: DESIRED_CUDA := 11.7
3535
magma-cuda117: PACKAGE_NAME := magma-cuda117
36-
magma-cuda117: CUDA_ARCH_LIST += -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86
3736
magma-cuda117:
3837
$(DOCKER_RUN)
3938

4039
.PHONY: magma-cuda116
4140
magma-cuda116: DESIRED_CUDA := 11.6
4241
magma-cuda116: PACKAGE_NAME := magma-cuda116
43-
magma-cuda116: CUDA_ARCH_LIST += -gencode arch=compute_80,code=sm_80 -gencode arch=compute_86,code=sm_86
4442
magma-cuda116:
4543
$(DOCKER_RUN)

manywheel/build_cuda.sh

+4 -4
Original file line number | Diff line number | Diff line change
@@ -58,12 +58,12 @@ cuda_version_nodot=$(echo $CUDA_VERSION | tr -d '.')
5858

5959
TORCH_CUDA_ARCH_LIST="3.7;5.0;6.0;7.0"
6060
case ${CUDA_VERSION} in
61-
11.[678])
62-
TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST};7.5;8.0;8.6"
61+
11.8)
62+
TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST};7.5;8.0;8.6;9.0"
6363
EXTRA_CAFFE2_CMAKE_FLAGS+=("-DATEN_NO_TEST=ON")
6464
;;
65-
10.*)
66-
TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST}"
65+
11.[67])
66+
TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST};7.5;8.0;8.6"
6767
EXTRA_CAFFE2_CMAKE_FLAGS+=("-DATEN_NO_TEST=ON")
6868
;;
6969
*)

windows/cuda118.bat

+2 -2
Original file line number | Diff line number | Diff line change
@@ -37,10 +37,10 @@ IF "%CUDA_PATH_V118%"=="" (
3737
)
3838

3939
IF "%BUILD_VISION%" == "" (
40-
set TORCH_CUDA_ARCH_LIST=3.7+PTX;5.0;6.0;6.1;7.0;7.5;8.0;8.6
40+
set TORCH_CUDA_ARCH_LIST=3.7+PTX;5.0;6.0;6.1;7.0;7.5;8.0;8.6;9.0
4141
set TORCH_NVCC_FLAGS=-Xfatbin -compress-all
4242
) ELSE (
43-
set NVCC_FLAGS=-D__CUDA_NO_HALF_OPERATORS__ --expt-relaxed-constexpr -gencode=arch=compute_35,code=sm_35 -gencode=arch=compute_50,code=sm_50 -gencode=arch=compute_60,code=sm_60 -gencode=arch=compute_70,code=sm_70 -gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_80,code=compute_80 -gencode=arch=compute_86,code=compute_86
43+
set NVCC_FLAGS=-D__CUDA_NO_HALF_OPERATORS__ --expt-relaxed-constexpr -gencode=arch=compute_35,code=sm_35 -gencode=arch=compute_50,code=sm_50 -gencode=arch=compute_60,code=sm_60 -gencode=arch=compute_70,code=sm_70 -gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_80,code=compute_80 -gencode=arch=compute_86,code=compute_86 -gencode=arch=compute_90,code=compute_90
4444
)
4545

4646
set "CUDA_PATH=%CUDA_PATH_V118%"

0 commit comments

Comments
 (0)