Skip to content

Commit bad0290

Browse files
author
Thomas Preud'homme
committed
Improve STRICT_FSETCC codegen in absence of NaN
As for SETCC, use a less expensive condition code when generating STRICT_FSETCC if the node is known not to have NaN. Reviewed By: SjoerdMeijer Differential Revision: https://reviews.llvm.org/D91972
1 parent a56e574 commit bad0290

File tree

2 files changed

+116
-1
lines changed

2 files changed

+116
-1
lines changed

llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7126,7 +7126,10 @@ void SelectionDAGBuilder::visitConstrainedFPIntrinsic(
71267126
case ISD::STRICT_FSETCC:
71277127
case ISD::STRICT_FSETCCS: {
71287128
auto *FPCmp = dyn_cast<ConstrainedFPCmpIntrinsic>(&FPI);
7129-
Opers.push_back(DAG.getCondCode(getFCmpCondCode(FPCmp->getPredicate())));
7129+
ISD::CondCode Condition = getFCmpCondCode(FPCmp->getPredicate());
7130+
if (TM.Options.NoNaNsFPMath)
7131+
Condition = getFCmpCodeWithoutNaN(Condition);
7132+
Opers.push_back(DAG.getCondCode(Condition));
71307133
break;
71317134
}
71327135
}
Lines changed: 112 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,112 @@
1+
; RUN: llc < %s -mtriple=arm64-eabi -mattr=+fullfp16 -enable-no-nans-fp-math | FileCheck %s
2+
3+
declare i1 @llvm.experimental.constrained.fcmp.f32(float, float, metadata, metadata)
4+
declare i1 @llvm.experimental.constrained.fcmp.f64(double, double, metadata, metadata)
5+
6+
; CHECK-LABEL: @f32_constrained_fcmp_ueq
7+
; CHECK: fcmp s0, s1
8+
; CHECK-NEXT: cset w0, eq
9+
; CHECK-NEXT: ret
10+
define i1 @f32_constrained_fcmp_ueq(float %a, float %b) nounwind ssp {
11+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f32(float %a, float %b, metadata !"ueq", metadata !"fpexcept.strict")
12+
ret i1 %cmp
13+
}
14+
15+
; CHECK-LABEL: @f32_constrained_fcmp_une
16+
; CHECK: fcmp s0, s1
17+
; CHECK-NEXT: cset w0, ne
18+
; CHECK-NEXT: ret
19+
define i1 @f32_constrained_fcmp_une(float %a, float %b) nounwind ssp {
20+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f32(float %a, float %b, metadata !"une", metadata !"fpexcept.strict")
21+
ret i1 %cmp
22+
}
23+
24+
; CHECK-LABEL: @f32_constrained_fcmp_ugt
25+
; CHECK: fcmp s0, s1
26+
; CHECK-NEXT: cset w0, gt
27+
; CHECK-NEXT: ret
28+
define i1 @f32_constrained_fcmp_ugt(float %a, float %b) nounwind ssp {
29+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f32(float %a, float %b, metadata !"ugt", metadata !"fpexcept.strict")
30+
ret i1 %cmp
31+
}
32+
33+
; CHECK-LABEL: @f32_constrained_fcmp_uge
34+
; CHECK: fcmp s0, s1
35+
; CHECK-NEXT: cset w0, ge
36+
; CHECK-NEXT: ret
37+
define i1 @f32_constrained_fcmp_uge(float %a, float %b) nounwind ssp {
38+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f32(float %a, float %b, metadata !"uge", metadata !"fpexcept.strict")
39+
ret i1 %cmp
40+
}
41+
42+
; CHECK-LABEL: @f32_constrained_fcmp_ult
43+
; CHECK: fcmp s0, s1
44+
; CHECK-NEXT: cset w0, lt
45+
; CHECK-NEXT: ret
46+
define i1 @f32_constrained_fcmp_ult(float %a, float %b) nounwind ssp {
47+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f32(float %a, float %b, metadata !"ult", metadata !"fpexcept.strict")
48+
ret i1 %cmp
49+
}
50+
51+
; CHECK-LABEL: @f32_constrained_fcmp_ule
52+
; CHECK: fcmp s0, s1
53+
; CHECK-NEXT: cset w0, le
54+
; CHECK-NEXT: ret
55+
define i1 @f32_constrained_fcmp_ule(float %a, float %b) nounwind ssp {
56+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f32(float %a, float %b, metadata !"ule", metadata !"fpexcept.strict")
57+
ret i1 %cmp
58+
}
59+
60+
; CHECK-LABEL: @f64_constrained_fcmp_ueq
61+
; CHECK: fcmp d0, d1
62+
; CHECK-NEXT: cset w0, eq
63+
; CHECK-NEXT: ret
64+
define i1 @f64_constrained_fcmp_ueq(double %a, double %b) nounwind ssp {
65+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %a, double %b, metadata !"ueq", metadata !"fpexcept.strict")
66+
ret i1 %cmp
67+
}
68+
69+
; CHECK-LABEL: @f64_constrained_fcmp_une
70+
; CHECK: fcmp d0, d1
71+
; CHECK-NEXT: cset w0, ne
72+
; CHECK-NEXT: ret
73+
define i1 @f64_constrained_fcmp_une(double %a, double %b) nounwind ssp {
74+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %a, double %b, metadata !"une", metadata !"fpexcept.strict")
75+
ret i1 %cmp
76+
}
77+
78+
; CHECK-LABEL: @f64_constrained_fcmp_ugt
79+
; CHECK: fcmp d0, d1
80+
; CHECK-NEXT: cset w0, gt
81+
; CHECK-NEXT: ret
82+
define i1 @f64_constrained_fcmp_ugt(double %a, double %b) nounwind ssp {
83+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %a, double %b, metadata !"ugt", metadata !"fpexcept.strict")
84+
ret i1 %cmp
85+
}
86+
87+
; CHECK-LABEL: @f64_constrained_fcmp_uge
88+
; CHECK: fcmp d0, d1
89+
; CHECK-NEXT: cset w0, ge
90+
; CHECK-NEXT: ret
91+
define i1 @f64_constrained_fcmp_uge(double %a, double %b) nounwind ssp {
92+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %a, double %b, metadata !"uge", metadata !"fpexcept.strict")
93+
ret i1 %cmp
94+
}
95+
96+
; CHECK-LABEL: @f64_constrained_fcmp_ult
97+
; CHECK: fcmp d0, d1
98+
; CHECK-NEXT: cset w0, lt
99+
; CHECK-NEXT: ret
100+
define i1 @f64_constrained_fcmp_ult(double %a, double %b) nounwind ssp {
101+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %a, double %b, metadata !"ult", metadata !"fpexcept.strict")
102+
ret i1 %cmp
103+
}
104+
105+
; CHECK-LABEL: @f64_constrained_fcmp_ule
106+
; CHECK: fcmp d0, d1
107+
; CHECK-NEXT: cset w0, le
108+
; CHECK-NEXT: ret
109+
define i1 @f64_constrained_fcmp_ule(double %a, double %b) nounwind ssp {
110+
%cmp = tail call i1 @llvm.experimental.constrained.fcmp.f64(double %a, double %b, metadata !"ule", metadata !"fpexcept.strict")
111+
ret i1 %cmp
112+
}

0 commit comments

Comments
 (0)