Skip to content

Commit db90eff

Browse files
Initial support blackwell (#1481)
* initial support blackwell * Update CHANGELOG.md Co-authored-by: Matthew Douglas <[email protected]> * Update CMakeLists.txt * Update CHANGELOG.md * fix build-cuda.sh * fix build-cuda.sh * fix cuda 12.7 build-cuda.sh * Update build-cuda.sh * Update cuda from 12.6.2 to 12.6.3 * Update .github/workflows/python-package.yml Co-authored-by: Matthew Douglas <[email protected]> * Update install_cuda.py Co-authored-by: Matthew Douglas <[email protected]> * Update install_cuda.sh Co-authored-by: Matthew Douglas <[email protected]> * Update .github/scripts/build-cuda.sh * Update install_cuda.sh --------- Co-authored-by: Matthew Douglas <[email protected]>
1 parent a9cfd1b commit db90eff

File tree

3 files changed

+25
-4
lines changed

3 files changed

+25
-4
lines changed

.github/scripts/build-cuda.sh

+7-3
Original file line numberDiff line numberDiff line change
@@ -4,9 +4,13 @@ declare build_os
44
declare cuda_version
55

66
set -xeuo pipefail
7-
build_capability="50;52;60;61;70;75;80;86;89;90"
8-
[[ "${cuda_version}" == 11.7.* ]] && build_capability=${build_capability%??????}
9-
[[ "${cuda_version}" == 11.8.* ]] && build_capability=${build_capability%???}
7+
build_capability="50;52;60;61;70;75;80;86;89;90;100;120"
8+
remove_for_11_7=";89;90;100;120"
9+
remove_for_11_8=";89;90;100;120"
10+
remove_for_lt_12_7=";100;120"
11+
# CUDA 11.7.x builds: delete the ";89;90;100;120" tail held in remove_for_11_7
# from the semicolon-separated capability list.
if [[ "${cuda_version}" == 11.7.* ]]; then
    build_capability=${build_capability//"${remove_for_11_7}"/}
fi
12+
# CUDA 11.8.x builds: delete the ";89;90;100;120" tail held in remove_for_11_8
# from the semicolon-separated capability list.
if [[ "${cuda_version}" == 11.8.* ]]; then
    build_capability=${build_capability//"${remove_for_11_8}"/}
fi
13+
# Drop the Blackwell targets (100, 120) when the toolkit is older than CUDA 12.7.
# The comparison is done numerically on major/minor: a string test such as
# `[[ "$v" < 12.7 ]]` is lexicographic, so "12.10.0" would sort before "12.7"
# and lose the Blackwell targets by mistake.
IFS=. read -r cuda_major cuda_minor cuda_rest <<< "${cuda_version}"
# `10#` forces base 10 so a zero-padded component is never parsed as octal;
# `:-0` keeps the arithmetic valid when a component is missing (e.g. "12").
if (( 10#${cuda_major:-0} < 12 || (10#${cuda_major:-0} == 12 && 10#${cuda_minor:-0} < 7) )); then
    # First expression removes ";100;120"; the second removes "100;120;" in case
    # the entries are not preceded by a semicolon.
    build_capability=$(sed 's|'"$remove_for_lt_12_7"'||g; s|'"${remove_for_lt_12_7#;}"';||g' <<< "$build_capability")
fi
1014
[[ "${build_os}" = windows-* ]] && python3 -m pip install ninja
1115

1216
if [ "${build_os:0:6}" == ubuntu ]; then

CHANGELOG.md

+6
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,9 @@
1+
### 0.45.1
2+
3+
#### Improvements:
4+
5+
- Initial support for Blackwell B100 GPUs, RTX 50 series Blackwell GPUs, and Jetson Thor (Blackwell)
6+
17
### 0.43.3
28

39
#### Improvements:

CMakeLists.txt

+12-1
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
77
# - CUDA_VERSION: The expected CUDA version, for sanity checking. The actual version
88
# is whatever CMake finds on your path.
99
# - COMPUTE_CAPABILITY: Which GPU Arch/Compute codes to provide to NVCC.
10-
# Separate by semicolons, i.e. `-DCOMPUTE_CAPABILITY=89;90`
10+
# Separate by semicolons, e.g. `-DCOMPUTE_CAPABILITY="89;90;100;120"` (quote the list so the shell does not split it at `;`)
1111
# Check your compute capability here: https://developer.nvidia.com/cuda-gpus
1212
# - PTXAS_VERBOSE: Pass the `-v` option to the PTX Assembler
1313
cmake_minimum_required(VERSION 3.22.1)
@@ -122,6 +122,17 @@ if(BUILD_CUDA)
122122
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 89 90)
123123
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 90)
124124
endif()
125+
# CUDA 12.7 adds support for Blackwell B100.
126+
if (CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "12.7")
127+
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 100)
128+
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 100)
129+
endif()
130+
131+
# CUDA 12.8 adds support for RTX 50 Blackwell.
132+
if (CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "12.8")
133+
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 101 120)
134+
# Only major architectures go into the ALL_MAJOR list (compare 89/90 above, where
# just 90 is added). 101 is not a major architecture, so it is listed in
# CMAKE_CUDA_ARCHITECTURES_ALL only.
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 120)
135+
endif()
125136
endif()
126137

127138
string(APPEND CMAKE_CUDA_FLAGS " --use_fast_math")

0 commit comments

Comments
 (0)