Skip to content

Commit

Permalink
initial support blackwell
Browse files Browse the repository at this point in the history
  • Loading branch information
johnnynunez committed Jan 22, 2025
1 parent a9cfd1b commit a9c63ee
Show file tree
Hide file tree
Showing 3 changed files with 19 additions and 2 deletions.
2 changes: 1 addition & 1 deletion .github/scripts/build-cuda.sh
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@ declare build_os
declare cuda_version

set -xeuo pipefail
build_capability="50;52;60;61;70;75;80;86;89;90"
build_capability="50;52;60;61;70;75;80;86;89;90;100;120"
# Trim the architectures that are not built for older CUDA toolkits. The suffix
# is matched by architecture name (not by a fixed character count) so the trim
# stays correct when new capabilities are appended to build_capability.
#   11.7.x        -> drop 89 and everything after it
#   11.8.x        -> drop 90 and everything after it
#   12.0.x-12.7.x -> drop the Blackwell entries (100 and later), which need CUDA 12.8
[[ "${cuda_version}" == 11.7.* ]] && build_capability=${build_capability%%;89;*}
[[ "${cuda_version}" == 11.8.* ]] && build_capability=${build_capability%%;90*}
[[ "${cuda_version}" == 12.[0-7].* ]] && build_capability=${build_capability%%;100*}
[[ "${build_os}" = windows-* ]] && python3 -m pip install ninja
Expand Down
6 changes: 6 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
@@ -1,3 +1,9 @@
### 0.43.4

#### Improvements:

- Initial support for Blackwell B100 GPUs and RTX 50 series GPUs

### 0.43.3

#### Improvements:
Expand Down
13 changes: 12 additions & 1 deletion CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
# - CUDA_VERSION: The expected CUDA version, for sanity checking. The actual version
# is whatever CMake finds on your path.
# - COMPUTE_CAPABILITY: Which GPU Arch/Compute codes to provide to NVCC.
# Separate by semicolons, i.e. `-DCOMPUTE_CAPABILITY=89;90`
# Separate by semicolons, e.g. `-DCOMPUTE_CAPABILITY=89;90;100;120`
# Check your compute capability here: https://developer.nvidia.com/cuda-gpus
# - PTXAS_VERBOSE: Pass the `-v` option to the PTX Assembler
cmake_minimum_required(VERSION 3.22.1)
Expand Down Expand Up @@ -122,6 +122,17 @@ if(BUILD_CUDA)
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 89 90)
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 90)
endif()
# CUDA 12.8 is the first toolkit whose nvcc can target Blackwell:
# compute capability 100 (B100-class data-center GPUs) and 120 (RTX 50 series).
# Gate both on 12.8 so that older compilers are never asked to build them.
if (CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "12.8")
    list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 100 120)
    list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 100 120)
endif()
endif()

string(APPEND CMAKE_CUDA_FLAGS " --use_fast_math")
Expand Down

0 comments on commit a9c63ee

Please sign in to comment.