Skip to content

Commit 263d38a

Browse files
committed
Merge branch 'main' into install_cmake
2 parents ec188d7 + 7882c23 commit 263d38a

File tree

2 files changed

+39
-32
lines changed

2 files changed

+39
-32
lines changed

install.md

+38-32
Original file line numberDiff line numberDiff line change
@@ -324,14 +324,14 @@ They can be deduced from the device if present at CMake configuration time.
324324

325325
</summary>
326326

327-
| Option | Architecture |
328-
|--------------------------------|-----------------------|
329-
| `-DKokkos_ARCH_INTEL_GEN=ON` | Generic JIT |
330-
| `-DKokkos_ARCH_INTEL_XEHP=ON` | Xe-HP |
331-
| `-DKokkos_ARCH_INTEL_PVC=ON` | GPU Max/Ponte Vecchio |
332-
| `-DKokkos_ARCH_INTEL_DG1=ON` | Iris XeMAX |
333-
| `-DKokkos_ARCH_INTEL_GEN12=ON` | Gen12 |
334-
| `-DKokkos_ARCH_INTEL_GEN11=ON` | Gen11 |
327+
| Option | Architecture |
328+
|--------------------------------|-------------------------|
329+
| `-DKokkos_ARCH_INTEL_GEN=ON` | Generic JIT |
330+
| `-DKokkos_ARCH_INTEL_XEHP=ON` | Xe-HP |
331+
| `-DKokkos_ARCH_INTEL_PVC=ON` | GPU Max (Ponte Vecchio) |
332+
| `-DKokkos_ARCH_INTEL_DG1=ON` | Iris XeMAX |
333+
| `-DKokkos_ARCH_INTEL_GEN12=ON` | Gen12 |
334+
| `-DKokkos_ARCH_INTEL_GEN11=ON` | Gen11 |
335335

336336
<!--#ifndef PRINT-->
337337

@@ -364,10 +364,6 @@ They can be deduced from the device if present at CMake configuration time.
364364
| `-DKokkos_ARCH_MAXWELL53=ON` | Maxwell | 5.3 | |
365365
| `-DKokkos_ARCH_MAXWELL52=ON` | Maxwell | 5.2 | M6, M60, M4, M40 |
366366
| `-DKokkos_ARCH_MAXWELL50=ON` | Maxwell | 5.0 | M10 |
367-
| `-DKokkos_ARCH_KEPLER37=ON` | Kepler | 3.7 | K80 |
368-
| `-DKokkos_ARCH_KEPLER35=ON` | Kepler | 3.5 | K40, K20 |
369-
| `-DKokkos_ARCH_KEPLER32=ON` | Kepler | 3.2 | |
370-
| `-DKokkos_ARCH_KEPLER30=ON` | Kepler | 3.0 | K10 |
371367

372368
<!--#ifndef PRINT-->
373369

@@ -399,58 +395,68 @@ They can be deduced from the device if present at CMake configuration time.
399395
cmake \
400396
-B build \
401397
-DCMAKE_BUILD_TYPE=Release \
402-
-DKokkos_ARCH_NATIVE=ON \
403-
-DKokkos_ENABLE_OPENMP=ON
398+
-DKokkos_ENABLE_OPENMP=ON \
399+
-DKokkos_ARCH_NATIVE=ON
404400
```
405401

406-
#### AMD MI250 GPU with HIP and OpenMP
402+
#### AMD MI300A APU with HIP
407403

408404
```sh
405+
export HSA_XNACK=1
409406
cmake \
410407
-B build \
411408
-DCMAKE_CXX_COMPILER=hipcc \
412409
-DCMAKE_BUILD_TYPE=Release \
413410
-DKokkos_ENABLE_HIP=ON \
414-
-DKokkos_ARCH_AMD_GFX90A=ON \
415-
-DKokkos_ENABLE_OPENMP=ON
411+
-DKokkos_ARCH_AMD_GFX942_APU=ON
416412
```
417413

418-
#### NVIDIA A100 GPU with CUDA and OpenMP
414+
The `HSA_XNACK=1` environment variable is required to access host allocations from the device.
415+
416+
#### AMD MI250 GPU with HIP
419417

420418
```sh
421419
cmake \
422420
-B build \
421+
-DCMAKE_CXX_COMPILER=hipcc \
423422
-DCMAKE_BUILD_TYPE=Release \
424-
-DKokkos_ENABLE_CUDA=ON \
425-
-DKokkos_ARCH_AMPERE80=ON \
426-
-DKokkos_ENABLE_OPENMP=ON
423+
-DKokkos_ENABLE_HIP=ON \
424+
-DKokkos_ARCH_AMD_GFX90A=ON
427425
```
428426

429-
#### NVIDIA V100 GPU with CUDA and OpenMP
427+
#### Intel GPU Max 1550 (Ponte Vecchio) with SYCL
430428

431429
```sh
432430
cmake \
433431
-B build \
432+
-DCMAKE_CXX_COMPILER=icpx \
434433
-DCMAKE_BUILD_TYPE=Release \
435-
-DKokkos_ENABLE_CUDA=ON \
436-
-DKokkos_ARCH_VOLTA70=ON \
437-
-DKokkos_ENABLE_OPENMP=ON
434+
-DKokkos_ENABLE_SYCL=ON \
435+
-DKokkos_ARCH_INTEL_PVC=ON \
436+
-DCMAKE_CXX_FLAGS="-fp-model=precise"
438437
```
439438

440-
#### Intel GPU Max/Ponte Vecchio GPU with SYCL and OpenMP
439+
The last option (`-fp-model=precise`) is for the precision of math operators.
440+
441+
#### NVIDIA H100 GPU with CUDA
441442

442443
```sh
443444
cmake \
444445
-B build \
445-
-DCMAKE_CXX_COMPILER=icpx \
446446
-DCMAKE_BUILD_TYPE=Release \
447-
-DKokkos_ENABLE_SYCL=ON \
448-
-DKokkos_ARCH_INTEL_PVC=ON \
449-
-DKokkos_ENABLE_OPENMP=ON \
450-
-DCMAKE_CXX_FLAGS="-fp-model=precise"
447+
-DKokkos_ENABLE_CUDA=ON \
448+
-DKokkos_ARCH_HOPPER90=ON
451449
```
452450

453-
Last option is for math operators precision.
451+
#### NVIDIA A100 GPU with CUDA
452+
453+
```sh
454+
cmake \
455+
-B build \
456+
-DCMAKE_BUILD_TYPE=Release \
457+
-DKokkos_ENABLE_CUDA=ON \
458+
-DKokkos_ARCH_AMPERE80=ON
459+
```
454460

455461
<!--#ifndef PRINT-->
456462
<img title="Code" alt="Code" src="./images/code_txt.svg" height="25"> For more code examples:

typos.toml

+1
Original file line numberDiff line numberDiff line change
@@ -5,3 +5,4 @@ extend-exclude = [
55

66
[default.extend-words]
77
ND = "ND"
8+
HSA = "HSA"

0 commit comments

Comments
 (0)