Skip to content

Commit 001db64

Browse files
author
git apple-llvm automerger
committed
Merge commit '6b2cf8100088' from apple/master into swift/master-next
2 parents 915213c + 6b2cf81 commit 001db64

File tree

8 files changed

+86
-27
lines changed

8 files changed

+86
-27
lines changed

clang/lib/CodeGen/CGBuiltin.cpp

Lines changed: 29 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -6433,14 +6433,20 @@ Value *CodeGenFunction::GetValueForARMHint(unsigned BuiltinID) {
64336433
llvm::ConstantInt::get(Int32Ty, Value));
64346434
}
64356435

6436+
enum SpecialRegisterAccessKind {
6437+
NormalRead,
6438+
VolatileRead,
6439+
Write,
6440+
};
6441+
64366442
// Generates the IR for the read/write special register builtin,
64376443
// ValueType is the type of the value that is to be written or read,
64386444
// RegisterType is the type of the register being written to or read from.
64396445
static Value *EmitSpecialRegisterBuiltin(CodeGenFunction &CGF,
64406446
const CallExpr *E,
64416447
llvm::Type *RegisterType,
64426448
llvm::Type *ValueType,
6443-
bool IsRead,
6449+
SpecialRegisterAccessKind AccessKind,
64446450
StringRef SysReg = "") {
64456451
// write and register intrinsics only support 32 and 64 bit operations.
64466452
assert((RegisterType->isIntegerTy(32) || RegisterType->isIntegerTy(64))
@@ -6465,8 +6471,12 @@ static Value *EmitSpecialRegisterBuiltin(CodeGenFunction &CGF,
64656471
assert(!(RegisterType->isIntegerTy(32) && ValueType->isIntegerTy(64))
64666472
&& "Can't fit 64-bit value in 32-bit register");
64676473

6468-
if (IsRead) {
6469-
llvm::Function *F = CGM.getIntrinsic(llvm::Intrinsic::read_register, Types);
6474+
if (AccessKind != Write) {
6475+
assert(AccesKind == NormalRead || AccessKind == VolatileRead);
6476+
llvm::Function *F = CGM.getIntrinsic(
6477+
AccessKind == VolatileRead ? llvm::Intrinsic::read_volatile_register
6478+
: llvm::Intrinsic::read_register,
6479+
Types);
64706480
llvm::Value *Call = Builder.CreateCall(F, Metadata);
64716481

64726482
if (MixedTypes)
@@ -6845,9 +6855,11 @@ Value *CodeGenFunction::EmitARMBuiltinExpr(unsigned BuiltinID,
68456855
BuiltinID == ARM::BI__builtin_arm_wsr64 ||
68466856
BuiltinID == ARM::BI__builtin_arm_wsrp) {
68476857

6848-
bool IsRead = BuiltinID == ARM::BI__builtin_arm_rsr ||
6849-
BuiltinID == ARM::BI__builtin_arm_rsr64 ||
6850-
BuiltinID == ARM::BI__builtin_arm_rsrp;
6858+
SpecialRegisterAccessKind AccessKind = Write;
6859+
if (BuiltinID == ARM::BI__builtin_arm_rsr ||
6860+
BuiltinID == ARM::BI__builtin_arm_rsr64 ||
6861+
BuiltinID == ARM::BI__builtin_arm_rsrp)
6862+
AccessKind = VolatileRead;
68516863

68526864
bool IsPointerBuiltin = BuiltinID == ARM::BI__builtin_arm_rsrp ||
68536865
BuiltinID == ARM::BI__builtin_arm_wsrp;
@@ -6866,7 +6878,8 @@ Value *CodeGenFunction::EmitARMBuiltinExpr(unsigned BuiltinID,
68666878
ValueType = RegisterType = Int32Ty;
68676879
}
68686880

6869-
return EmitSpecialRegisterBuiltin(*this, E, RegisterType, ValueType, IsRead);
6881+
return EmitSpecialRegisterBuiltin(*this, E, RegisterType, ValueType,
6882+
AccessKind);
68706883
}
68716884

68726885
// Deal with MVE builtins
@@ -8906,9 +8919,11 @@ Value *CodeGenFunction::EmitAArch64BuiltinExpr(unsigned BuiltinID,
89068919
BuiltinID == AArch64::BI__builtin_arm_wsr64 ||
89078920
BuiltinID == AArch64::BI__builtin_arm_wsrp) {
89088921

8909-
bool IsRead = BuiltinID == AArch64::BI__builtin_arm_rsr ||
8910-
BuiltinID == AArch64::BI__builtin_arm_rsr64 ||
8911-
BuiltinID == AArch64::BI__builtin_arm_rsrp;
8922+
SpecialRegisterAccessKind AccessKind = Write;
8923+
if (BuiltinID == AArch64::BI__builtin_arm_rsr ||
8924+
BuiltinID == AArch64::BI__builtin_arm_rsr64 ||
8925+
BuiltinID == AArch64::BI__builtin_arm_rsrp)
8926+
AccessKind = VolatileRead;
89128927

89138928
bool IsPointerBuiltin = BuiltinID == AArch64::BI__builtin_arm_rsrp ||
89148929
BuiltinID == AArch64::BI__builtin_arm_wsrp;
@@ -8926,7 +8941,8 @@ Value *CodeGenFunction::EmitAArch64BuiltinExpr(unsigned BuiltinID,
89268941
ValueType = Int32Ty;
89278942
}
89288943

8929-
return EmitSpecialRegisterBuiltin(*this, E, RegisterType, ValueType, IsRead);
8944+
return EmitSpecialRegisterBuiltin(*this, E, RegisterType, ValueType,
8945+
AccessKind);
89308946
}
89318947

89328948
if (BuiltinID == AArch64::BI_ReadStatusReg ||
@@ -14869,7 +14885,7 @@ Value *CodeGenFunction::EmitAMDGPUBuiltinExpr(unsigned BuiltinID,
1486914885
}
1487014886
case AMDGPU::BI__builtin_amdgcn_read_exec: {
1487114887
CallInst *CI = cast<CallInst>(
14872-
EmitSpecialRegisterBuiltin(*this, E, Int64Ty, Int64Ty, true, "exec"));
14888+
EmitSpecialRegisterBuiltin(*this, E, Int64Ty, Int64Ty, NormalRead, "exec"));
1487314889
CI->setConvergent();
1487414890
return CI;
1487514891
}
@@ -14878,7 +14894,7 @@ Value *CodeGenFunction::EmitAMDGPUBuiltinExpr(unsigned BuiltinID,
1487814894
StringRef RegName = BuiltinID == AMDGPU::BI__builtin_amdgcn_read_exec_lo ?
1487914895
"exec_lo" : "exec_hi";
1488014896
CallInst *CI = cast<CallInst>(
14881-
EmitSpecialRegisterBuiltin(*this, E, Int32Ty, Int32Ty, true, RegName));
14897+
EmitSpecialRegisterBuiltin(*this, E, Int32Ty, Int32Ty, NormalRead, RegName));
1488214898
CI->setConvergent();
1488314899
return CI;
1488414900
}

clang/test/CodeGen/builtins-arm.c

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -222,19 +222,19 @@ uint64_t mrrc2() {
222222
}
223223

224224
unsigned rsr() {
225-
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i32 @llvm.read_register.i32(metadata ![[M0:.*]])
225+
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i32 @llvm.read_volatile_register.i32(metadata ![[M0:.*]])
226226
// CHECK-NEXT: ret i32 [[V0]]
227227
return __builtin_arm_rsr("cp1:2:c3:c4:5");
228228
}
229229

230230
unsigned long long rsr64() {
231-
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i64 @llvm.read_register.i64(metadata ![[M1:.*]])
231+
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i64 @llvm.read_volatile_register.i64(metadata ![[M1:.*]])
232232
// CHECK-NEXT: ret i64 [[V0]]
233233
return __builtin_arm_rsr64("cp1:2:c3");
234234
}
235235

236236
void *rsrp() {
237-
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i32 @llvm.read_register.i32(metadata ![[M2:.*]])
237+
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i32 @llvm.read_volatile_register.i32(metadata ![[M2:.*]])
238238
// CHECK-NEXT: [[V1:[%A-Za-z0-9.]+]] = inttoptr i32 [[V0]] to i8*
239239
// CHECK-NEXT: ret i8* [[V1]]
240240
return __builtin_arm_rsrp("sysreg");

clang/test/CodeGen/builtins-arm64.c

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -68,20 +68,20 @@ int32_t jcvt(double v) {
6868
__typeof__(__builtin_arm_rsr("1:2:3:4:5")) rsr(void);
6969

7070
uint32_t rsr() {
71-
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i64 @llvm.read_register.i64(metadata ![[M0:[0-9]]])
71+
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i64 @llvm.read_volatile_register.i64(metadata ![[M0:[0-9]]])
7272
// CHECK-NEXT: trunc i64 [[V0]] to i32
7373
return __builtin_arm_rsr("1:2:3:4:5");
7474
}
7575

7676
__typeof__(__builtin_arm_rsr64("1:2:3:4:5")) rsr64(void);
7777

7878
uint64_t rsr64(void) {
79-
// CHECK: call i64 @llvm.read_register.i64(metadata ![[M0:[0-9]]])
79+
// CHECK: call i64 @llvm.read_volatile_register.i64(metadata ![[M0:[0-9]]])
8080
return __builtin_arm_rsr64("1:2:3:4:5");
8181
}
8282

8383
void *rsrp() {
84-
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i64 @llvm.read_register.i64(metadata ![[M0:[0-9]]])
84+
// CHECK: [[V0:[%A-Za-z0-9.]+]] = call i64 @llvm.read_volatile_register.i64(metadata ![[M0:[0-9]]])
8585
// CHECK-NEXT: inttoptr i64 [[V0]] to i8*
8686
return __builtin_arm_rsrp("1:2:3:4:5");
8787
}

llvm/docs/LangRef.rst

Lines changed: 16 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -11650,9 +11650,11 @@ the escaped allocas are allocated, which would break attempts to use
1165011650
'``llvm.localrecover``'.
1165111651

1165211652
.. _int_read_register:
11653+
.. _int_read_volatile_register:
1165311654
.. _int_write_register:
1165411655

11655-
'``llvm.read_register``' and '``llvm.write_register``' Intrinsics
11656+
'``llvm.read_register``', '``llvm.read_volatile_register``', and
11657+
'``llvm.write_register``' Intrinsics
1165611658
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
1165711659

1165811660
Syntax:
@@ -11662,24 +11664,30 @@ Syntax:
1166211664

1166311665
declare i32 @llvm.read_register.i32(metadata)
1166411666
declare i64 @llvm.read_register.i64(metadata)
11667+
declare i32 @llvm.read_volatile_register.i32(metadata)
11668+
declare i64 @llvm.read_volatile_register.i64(metadata)
1166511669
declare void @llvm.write_register.i32(metadata, i32 @value)
1166611670
declare void @llvm.write_register.i64(metadata, i64 @value)
1166711671
!0 = !{!"sp\00"}
1166811672

1166911673
Overview:
1167011674
"""""""""
1167111675

11672-
The '``llvm.read_register``' and '``llvm.write_register``' intrinsics
11673-
provides access to the named register. The register must be valid on
11674-
the architecture being compiled to. The type needs to be compatible
11675-
with the register being read.
11676+
The '``llvm.read_register``', '``llvm.read_volatile_register``', and
11677+
'``llvm.write_register``' intrinsics provide access to the named register.
11678+
The register must be valid on the architecture being compiled to. The type
11679+
needs to be compatible with the register being read.
1167611680

1167711681
Semantics:
1167811682
""""""""""
1167911683

11680-
The '``llvm.read_register``' intrinsic returns the current value of the
11681-
register, where possible. The '``llvm.write_register``' intrinsic sets
11682-
the current value of the register, where possible.
11684+
The '``llvm.read_register``' and '``llvm.read_volatile_register``' intrinsics
11685+
return the current value of the register, where possible. The
11686+
'``llvm.write_register``' intrinsic sets the current value of the register,
11687+
where possible.
11688+
11689+
A call to '``llvm.read_volatile_register``' is assumed to have side-effects
11690+
and possibly return a different value each time (e.g. for a timer register).
1168311691

1168411692
This is useful to implement named register global variables that need
1168511693
to always be mapped to a specific register, as is common practice on

llvm/include/llvm/IR/Intrinsics.td

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -458,6 +458,9 @@ def int_read_register : Intrinsic<[llvm_anyint_ty], [llvm_metadata_ty],
458458
[IntrReadMem], "llvm.read_register">;
459459
def int_write_register : Intrinsic<[], [llvm_metadata_ty, llvm_anyint_ty],
460460
[], "llvm.write_register">;
461+
def int_read_volatile_register : Intrinsic<[llvm_anyint_ty], [llvm_metadata_ty],
462+
[IntrHasSideEffects],
463+
"llvm.read_volatile_register">;
461464

462465
// Gets the address of the local variable area. This is typically a copy of the
463466
// stack, frame, or base pointer depending on the type of prologue.

llvm/lib/CodeGen/GlobalISel/IRTranslator.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1598,6 +1598,7 @@ bool IRTranslator::translateKnownIntrinsic(const CallInst &CI, Intrinsic::ID ID,
15981598
case Intrinsic::sideeffect:
15991599
// Discard annotate attributes, assumptions, and artificial side-effects.
16001600
return true;
1601+
case Intrinsic::read_volatile_register:
16011602
case Intrinsic::read_register: {
16021603
Value *Arg = CI.getArgOperand(0);
16031604
MIRBuilder

llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5715,6 +5715,7 @@ void SelectionDAGBuilder::visitIntrinsicCall(const CallInst &I,
57155715
TLI.getFrameIndexTy(DAG.getDataLayout()),
57165716
getValue(I.getArgOperand(0))));
57175717
return;
5718+
case Intrinsic::read_volatile_register:
57185719
case Intrinsic::read_register: {
57195720
Value *Reg = I.getArgOperand(0);
57205721
SDValue Chain = getRoot();
Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,30 @@
1+
; RUN: opt -S -licm %s | FileCheck %s
2+
3+
; Volatile register shouldn't be hoisted ourside loops.
4+
define i32 @test_read() {
5+
; CHECK-LABEL: define i32 @test_read()
6+
; CHECK: br label %loop
7+
; CHECK: loop:
8+
; CHECK: %counter = tail call i64 @llvm.read_volatile_register
9+
10+
entry:
11+
br label %loop
12+
13+
loop:
14+
%i = phi i32 [ 0, %entry ], [ %i.next, %inc ]
15+
%counter = tail call i64 @llvm.read_volatile_register.i64(metadata !1)
16+
%tst = icmp ult i64 %counter, 1000
17+
br i1 %tst, label %inc, label %done
18+
19+
inc:
20+
%i.next = add nuw nsw i32 %i, 1
21+
br label %loop
22+
23+
done:
24+
ret i32 %i
25+
}
26+
27+
declare i64 @llvm.read_register.i64(metadata)
28+
declare i64 @llvm.read_volatile_register.i64(metadata)
29+
30+
!1 = !{!"cntpct_el0"}

0 commit comments

Comments
 (0)