Skip to content

Commit 844096b

Browse files
committed
[CUDA] Make NVVM builtins available with CUDA-11/PTX6.5
Differential Revision: https://reviews.llvm.org/D79449
1 parent 67175d8 commit 844096b

File tree

2 files changed

+12
-2
lines changed

2 files changed

+12
-2
lines changed

clang/include/clang/Basic/BuiltinsNVPTX.def

Lines changed: 8 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,9 @@
20 20   #pragma push_macro("SM_70")
21 21   #pragma push_macro("SM_72")
22 22   #pragma push_macro("SM_75")
23    - #define SM_75 "sm_75"
   23 + #pragma push_macro("SM_80")
   24 + #define SM_80 "sm_80"
   25 + #define SM_75 "sm_75|" SM_80
24 26   #define SM_72 "sm_72|" SM_75
25 27   #define SM_70 "sm_70|" SM_72
26 28

@@ -31,7 +33,9 @@
31 33   #pragma push_macro("PTX61")
32 34   #pragma push_macro("PTX63")
33 35   #pragma push_macro("PTX64")
34    - #define PTX64 "ptx64"
   36 + #pragma push_macro("PTX65")
   37 + #define PTX65 "ptx65"
   38 + #define PTX64 "ptx64|" PTX65
35 39   #define PTX63 "ptx63|" PTX64
36 40   #define PTX61 "ptx61|" PTX63
37 41   #define PTX60 "ptx60|" PTX61
@@ -721,7 +725,9 @@ TARGET_BUILTIN(__imma_m8n8k32_st_c_i32, "vi*iC*UiIi", "", AND(SM_75,PTX63))
721 725   #pragma pop_macro("SM_70")
722 726   #pragma pop_macro("SM_72")
723 727   #pragma pop_macro("SM_75")
    728 + #pragma pop_macro("SM_80")
724 729   #pragma pop_macro("PTX60")
725 730   #pragma pop_macro("PTX61")
726 731   #pragma pop_macro("PTX63")
727 732   #pragma pop_macro("PTX64")
    733 + #pragma pop_macro("PTX65")

clang/test/CodeGen/builtins-nvptx-ptx60.cu

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -2,6 +2,10 @@
 2  2   // RUN: -fcuda-is-device -target-feature +ptx60 \
 3  3   // RUN: -S -emit-llvm -o - -x cuda %s \
 4  4   // RUN: | FileCheck -check-prefix=CHECK %s
    5 + // RUN: %clang_cc1 -triple nvptx64-unknown-unknown -target-cpu sm_80 \
    6 + // RUN: -fcuda-is-device -target-feature +ptx65 \
    7 + // RUN: -S -emit-llvm -o - -x cuda %s \
    8 + // RUN: | FileCheck -check-prefix=CHECK %s
 5  9   // RUN: %clang_cc1 -triple nvptx-unknown-unknown -target-cpu sm_60 \
 6 10   // RUN: -fcuda-is-device -S -o /dev/null -x cuda -verify %s
 7 11

0 commit comments

Comments
 (0)