[x86] add tests for fma folds with fast-math-flags; NFC

rotateright · rotateright · commit 9b59a61cfc4e · 2021-05-19T14:28:57.000-04:00
Part of prep work for D90901
diff --git a/llvm/test/CodeGen/X86/fma-fneg-combine.ll b/llvm/test/CodeGen/X86/fma-fneg-combine.ll
@@ -38,6 +38,16 @@ define <16 x float> @test2(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
   ret <16 x float> %neg
 }
 
+define <16 x float> @test2_nsz(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
+; CHECK-LABEL: test2_nsz:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vfnmsub213ps {{.*#+}} zmm0 = -(zmm1 * zmm0) - zmm2
+; CHECK-NEXT:    retq
+  %fma = call nsz <16 x float> @llvm.fma.v16f32(<16 x float> %a, <16 x float> %b, <16 x float> %c)
+  %neg = fneg <16 x float> %fma
+  ret <16 x float> %neg
+}
+
 define <16 x float> @test3(<16 x float> %a, <16 x float> %b, <16 x float> %c)  {
 ; CHECK-LABEL: test3:
 ; CHECK:       # %bb.0:
@@ -49,6 +59,17 @@ define <16 x float> @test3(<16 x float> %a, <16 x float> %b, <16 x float> %c)  {
   ret <16 x float> %sub.i
 }
 
+define <16 x float> @test3_nsz(<16 x float> %a, <16 x float> %b, <16 x float> %c)  {
+; CHECK-LABEL: test3_nsz:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vfmsub213ps {{.*#+}} zmm0 = (zmm1 * zmm0) - zmm2
+; CHECK-NEXT:    retq
+  %t0 = fneg <16 x float> %b
+  %t1 = call nsz <16 x float> @llvm.fma.v16f32(<16 x float> %a, <16 x float> %t0, <16 x float> %c)
+  %sub.i = fneg <16 x float> %t1
+  ret <16 x float> %sub.i
+}
+
 define <16 x float> @test4(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
 ; CHECK-LABEL: test4:
 ; CHECK:       # %bb.0:
@@ -61,6 +82,18 @@ define <16 x float> @test4(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
   ret <16 x float> %sub.i
 }
 
+define <16 x float> @test4_nsz(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
+; CHECK-LABEL: test4_nsz:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vfmadd213ps {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2
+; CHECK-NEXT:    retq
+  %t0 = fneg <16 x float> %b
+  %t1 = fneg <16 x float> %c
+  %t2 = call nsz <16 x float> @llvm.fma.v16f32(<16 x float> %a, <16 x float> %t0, <16 x float> %t1)
+  %sub.i = fsub <16 x float> <float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0>, %t2
+  ret <16 x float> %sub.i
+}
+
 define <16 x float> @test5(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
 ; CHECK-LABEL: test5:
 ; CHECK:       # %bb.0: # %entry
@@ -84,6 +117,18 @@ define <16 x float> @test6(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
   ret <16 x float> %sub.i
 }
 
+define <16 x float> @test6_nsz(<16 x float> %a, <16 x float> %b, <16 x float> %c) {
+; CHECK-LABEL: test6_nsz:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vfmadd213ps {ru-sae}, %zmm2, %zmm1, %zmm0
+; CHECK-NEXT:    retq
+  %t0 = fneg <16 x float> %b
+  %t1 = fneg <16 x float> %c
+  %t2 = call nsz <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %a, <16 x float> %t0, <16 x float> %t1, i32 10)
+  %sub.i = fsub <16 x float> <float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0>, %t2
+  ret <16 x float> %sub.i
+}
+
 define <8 x float> @test7(<8 x float> %a, <8 x float> %b, <8 x float> %c) {
 ; CHECK-LABEL: test7:
 ; CHECK:       # %bb.0:
@@ -95,6 +140,17 @@ define <8 x float> @test7(<8 x float> %a, <8 x float> %b, <8 x float> %c) {
   ret <8 x float> %sub.i
 }
 
+define <8 x float> @test7_nsz(<8 x float> %a, <8 x float> %b, <8 x float> %c) {
+; CHECK-LABEL: test7_nsz:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vfnmadd213ps {{.*#+}} ymm0 = -(ymm1 * ymm0) + ymm2
+; CHECK-NEXT:    retq
+  %t0 = fneg <8 x float> %c
+  %t1 = call nsz <8 x float> @llvm.fma.v8f32(<8 x float> %a, <8 x float> %b, <8 x float> %t0)
+  %sub.i = fsub <8 x float> <float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0, float -0.0>, %t1
+  ret <8 x float> %sub.i
+}
+
 define <8 x float> @test8(<8 x float> %a, <8 x float> %b, <8 x float> %c) {
 ; CHECK-LABEL: test8:
 ; CHECK:       # %bb.0: # %entry
@@ -116,6 +172,16 @@ define <8 x double> @test9(<8 x double> %a, <8 x double> %b, <8 x double> %c) {
   ret <8 x double> %sub.i
 }
 
+define <8 x double> @test9_nsz(<8 x double> %a, <8 x double> %b, <8 x double> %c) {
+; CHECK-LABEL: test9_nsz:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vfnmsub213pd {{.*#+}} zmm0 = -(zmm1 * zmm0) - zmm2
+; CHECK-NEXT:    retq
+  %t0 = tail call nsz <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %a, <8 x double> %b, <8 x double> %c, i32 4)
+  %sub.i = fneg <8 x double> %t0
+  ret <8 x double> %sub.i
+}
+
 define <2 x double> @test10(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
 ; CHECK-LABEL: test10:
 ; CHECK:       # %bb.0: # %entry