@@ -77,6 +77,7 @@ declare float @llvm.exp2.f32(float) #0
77
77
78
78
define void @sin_f64 (ptr nocapture %varray ) {
79
79
; CHECK-LABEL: @sin_f64(
80
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_sin(<2 x double> [[TMP4:%.*]])
80
81
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_sin(<4 x double> [[TMP4:%.*]])
81
82
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_sin(<8 x double> [[TMP4:%.*]])
82
83
; CHECK: ret void
@@ -102,6 +103,7 @@ for.end:
102
103
define void @sin_f32 (ptr nocapture %varray ) {
103
104
; CHECK-LABEL: @sin_f32(
104
105
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_sinf(<4 x float> [[TMP4:%.*]])
106
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_sinf(<8 x float> [[TMP4:%.*]])
105
107
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_sinf(<16 x float> [[TMP4:%.*]])
106
108
; CHECK: ret void
107
109
;
@@ -125,6 +127,7 @@ for.end:
125
127
126
128
define void @sin_f64_intrinsic (ptr nocapture %varray ) {
127
129
; CHECK-LABEL: @sin_f64_intrinsic(
130
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_sin(<2 x double> [[TMP4:%.*]])
128
131
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_sin(<4 x double> [[TMP4:%.*]])
129
132
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_sin(<8 x double> [[TMP4:%.*]])
130
133
; CHECK: ret void
@@ -150,6 +153,7 @@ for.end:
150
153
define void @sin_f32_intrinsic (ptr nocapture %varray ) {
151
154
; CHECK-LABEL: @sin_f32_intrinsic(
152
155
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_sinf(<4 x float> [[TMP4:%.*]])
156
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_sinf(<8 x float> [[TMP4:%.*]])
153
157
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_sinf(<16 x float> [[TMP4:%.*]])
154
158
; CHECK: ret void
155
159
;
@@ -173,6 +177,7 @@ for.end:
173
177
174
178
define void @cos_f64 (ptr nocapture %varray ) {
175
179
; CHECK-LABEL: @cos_f64(
180
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_cos(<2 x double> [[TMP4:%.*]])
176
181
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_cos(<4 x double> [[TMP4:%.*]])
177
182
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_cos(<8 x double> [[TMP4:%.*]])
178
183
; CHECK: ret void
@@ -198,6 +203,7 @@ for.end:
198
203
define void @cos_f32 (ptr nocapture %varray ) {
199
204
; CHECK-LABEL: @cos_f32(
200
205
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_cosf(<4 x float> [[TMP4:%.*]])
206
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_cosf(<8 x float> [[TMP4:%.*]])
201
207
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_cosf(<16 x float> [[TMP4:%.*]])
202
208
; CHECK: ret void
203
209
;
@@ -221,6 +227,7 @@ for.end:
221
227
222
228
define void @cos_f64_intrinsic (ptr nocapture %varray ) {
223
229
; CHECK-LABEL: @cos_f64_intrinsic(
230
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_cos(<2 x double> [[TMP4:%.*]])
224
231
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_cos(<4 x double> [[TMP4:%.*]])
225
232
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_cos(<8 x double> [[TMP4:%.*]])
226
233
; CHECK: ret void
@@ -246,6 +253,7 @@ for.end:
246
253
define void @cos_f32_intrinsic (ptr nocapture %varray ) {
247
254
; CHECK-LABEL: @cos_f32_intrinsic(
248
255
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_cosf(<4 x float> [[TMP4:%.*]])
256
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_cosf(<8 x float> [[TMP4:%.*]])
249
257
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_cosf(<16 x float> [[TMP4:%.*]])
250
258
; CHECK: ret void
251
259
;
@@ -295,6 +303,7 @@ for.end:
295
303
define void @tan_f32 (ptr nocapture %varray ) {
296
304
; CHECK-LABEL: @tan_f32(
297
305
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_tanf(<4 x float> [[TMP4:%.*]])
306
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_tanf(<8 x float> [[TMP4:%.*]])
298
307
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_tanf(<16 x float> [[TMP4:%.*]])
299
308
; CHECK: ret void
300
309
;
@@ -344,6 +353,7 @@ for.end:
344
353
define void @tan_f32_intrinsic (ptr nocapture %varray ) {
345
354
; CHECK-LABEL: @tan_f32_intrinsic(
346
355
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_tanf(<4 x float> [[TMP4:%.*]])
356
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_tanf(<8 x float> [[TMP4:%.*]])
347
357
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_tanf(<16 x float> [[TMP4:%.*]])
348
358
; CHECK: ret void
349
359
;
@@ -368,6 +378,7 @@ for.end:
368
378
define void @acos_f32 (ptr nocapture %varray ) {
369
379
; CHECK-LABEL: @acos_f32(
370
380
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_acosf(<4 x float> [[TMP4:%.*]])
381
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_acosf(<8 x float> [[TMP4:%.*]])
371
382
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_acosf(<16 x float> [[TMP4:%.*]])
372
383
; CHECK: ret void
373
384
;
@@ -392,6 +403,7 @@ for.end:
392
403
define void @acos_f32_intrinsic (ptr nocapture %varray ) {
393
404
; CHECK-LABEL: @acos_f32_intrinsic(
394
405
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_acosf(<4 x float> [[TMP4:%.*]])
406
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_acosf(<8 x float> [[TMP4:%.*]])
395
407
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_acosf(<16 x float> [[TMP4:%.*]])
396
408
; CHECK: ret void
397
409
;
@@ -439,6 +451,7 @@ for.end:
439
451
define void @asin_f32 (ptr nocapture %varray ) {
440
452
; CHECK-LABEL: @asin_f32(
441
453
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_asinf(<4 x float> [[TMP4:%.*]])
454
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_asinf(<8 x float> [[TMP4:%.*]])
442
455
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_asinf(<16 x float> [[TMP4:%.*]])
443
456
; CHECK: ret void
444
457
;
@@ -486,6 +499,7 @@ for.end:
486
499
define void @asin_f32_intrinsic (ptr nocapture %varray ) {
487
500
; CHECK-LABEL: @asin_f32_intrinsic(
488
501
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_asinf(<4 x float> [[TMP4:%.*]])
502
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_asinf(<8 x float> [[TMP4:%.*]])
489
503
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_asinf(<16 x float> [[TMP4:%.*]])
490
504
; CHECK: ret void
491
505
;
@@ -535,6 +549,7 @@ for.end:
535
549
define void @atan_f32 (ptr nocapture %varray ) {
536
550
; CHECK-LABEL: @atan_f32(
537
551
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_atanf(<4 x float> [[TMP4:%.*]])
552
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_atanf(<8 x float> [[TMP4:%.*]])
538
553
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_atanf(<16 x float> [[TMP4:%.*]])
539
554
; CHECK: ret void
540
555
;
@@ -584,6 +599,7 @@ for.end:
584
599
define void @atan_f32_intrinsic (ptr nocapture %varray ) {
585
600
; CHECK-LABEL: @atan_f32_intrinsic(
586
601
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_atanf(<4 x float> [[TMP4:%.*]])
602
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_atanf(<8 x float> [[TMP4:%.*]])
587
603
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_atanf(<16 x float> [[TMP4:%.*]])
588
604
; CHECK: ret void
589
605
;
@@ -631,6 +647,7 @@ for.end:
631
647
define void @cosh_f32 (ptr nocapture %varray ) {
632
648
; CHECK-LABEL: @cosh_f32(
633
649
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_coshf(<4 x float> [[TMP4:%.*]])
650
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_coshf(<8 x float> [[TMP4:%.*]])
634
651
; CHECK: ret void
635
652
;
636
653
entry:
@@ -677,6 +694,7 @@ for.end:
677
694
define void @cosh_f32_intrinsic (ptr nocapture %varray ) {
678
695
; CHECK-LABEL: @cosh_f32_intrinsic(
679
696
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_coshf(<4 x float> [[TMP4:%.*]])
697
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_coshf(<8 x float> [[TMP4:%.*]])
680
698
; CHECK: ret void
681
699
;
682
700
entry:
@@ -700,6 +718,7 @@ for.end:
700
718
define void @tanh_f32 (ptr nocapture %varray ) {
701
719
; CHECK-LABEL: @tanh_f32(
702
720
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_tanhf(<4 x float> [[TMP4:%.*]])
721
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_tanhf(<8 x float> [[TMP4:%.*]])
703
722
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_tanhf(<16 x float> [[TMP4:%.*]])
704
723
; CHECK: ret void
705
724
;
@@ -724,6 +743,7 @@ for.end:
724
743
define void @tanh_f32_intrinsic (ptr nocapture %varray ) {
725
744
; CHECK-LABEL: @tanh_f32_intrinsic(
726
745
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_tanhf(<4 x float> [[TMP4:%.*]])
746
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_tanhf(<8 x float> [[TMP4:%.*]])
727
747
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_tanhf(<16 x float> [[TMP4:%.*]])
728
748
; CHECK: ret void
729
749
;
@@ -747,6 +767,7 @@ for.end:
747
767
748
768
define void @pow_f64 (ptr nocapture %varray , ptr nocapture readonly %exp ) {
749
769
; CHECK-LABEL: @pow_f64(
770
+ ; CHECK-VF2: [[TMP8:%.*]] = call <2 x double> @amd_vrd2_pow(<2 x double> [[TMP4:%.*]], <2 x double> [[WIDE_LOAD:%.*]])
750
771
; CHECK-VF4: [[TMP8:%.*]] = call <4 x double> @amd_vrd4_pow(<4 x double> [[TMP4:%.*]], <4 x double> [[WIDE_LOAD:%.*]])
751
772
; CHECK-VF8: [[TMP8:%.*]] = call <8 x double> @amd_vrd8_pow(<8 x double> [[TMP4:%.*]], <8 x double> [[WIDE_LOAD:%.*]])
752
773
; CHECK: ret void
@@ -773,6 +794,7 @@ for.end:
773
794
774
795
define void @pow_f64_intrinsic (ptr nocapture %varray , ptr nocapture readonly %exp ) {
775
796
; CHECK-LABEL: @pow_f64_intrinsic(
797
+ ; CHECK-VF2: [[TMP8:%.*]] = call <2 x double> @amd_vrd2_pow(<2 x double> [[TMP4:%.*]], <2 x double> [[WIDE_LOAD:%.*]])
776
798
; CHECK-VF4: [[TMP8:%.*]] = call <4 x double> @amd_vrd4_pow(<4 x double> [[TMP4:%.*]], <4 x double> [[WIDE_LOAD:%.*]])
777
799
; CHECK-VF8: [[TMP8:%.*]] = call <8 x double> @amd_vrd8_pow(<8 x double> [[TMP4:%.*]], <8 x double> [[WIDE_LOAD:%.*]])
778
800
; CHECK: ret void
@@ -800,6 +822,7 @@ for.end:
800
822
define void @pow_f32 (ptr nocapture %varray , ptr nocapture readonly %exp ) {
801
823
; CHECK-LABEL: @pow_f32(
802
824
; CHECK-VF4: [[TMP8:%.*]] = call <4 x float> @amd_vrs4_powf(<4 x float> [[TMP4:%.*]], <4 x float> [[WIDE_LOAD:%.*]])
825
+ ; CHECK-VF8: [[TMP8:%.*]] = call <8 x float> @amd_vrs8_powf(<8 x float> [[TMP4:%.*]], <8 x float> [[WIDE_LOAD:%.*]])
803
826
; CHECK-VF16: [[TMP8:%.*]] = call <16 x float> @amd_vrs16_powf(<16 x float> [[TMP4:%.*]], <16 x float> [[WIDE_LOAD:%.*]])
804
827
; CHECK: ret void
805
828
;
@@ -826,6 +849,7 @@ for.end:
826
849
define void @pow_f32_intrinsic (ptr nocapture %varray , ptr nocapture readonly %exp ) {
827
850
; CHECK-LABEL: @pow_f32_intrinsic(
828
851
; CHECK-VF4: [[TMP8:%.*]] = call <4 x float> @amd_vrs4_powf(<4 x float> [[TMP4:%.*]], <4 x float> [[WIDE_LOAD:%.*]])
852
+ ; CHECK-VF8: [[TMP8:%.*]] = call <8 x float> @amd_vrs8_powf(<8 x float> [[TMP4:%.*]], <8 x float> [[WIDE_LOAD:%.*]])
829
853
; CHECK-VF16: [[TMP8:%.*]] = call <16 x float> @amd_vrs16_powf(<16 x float> [[TMP4:%.*]], <16 x float> [[WIDE_LOAD:%.*]])
830
854
; CHECK: ret void
831
855
;
@@ -851,6 +875,7 @@ for.end:
851
875
852
876
define void @exp_f64 (ptr nocapture %varray ) {
853
877
; CHECK-LABEL: @exp_f64(
878
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_exp(<2 x double> [[TMP4:%.*]])
854
879
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_exp(<4 x double> [[TMP4:%.*]])
855
880
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_exp(<8 x double> [[TMP4:%.*]])
856
881
; CHECK: ret void
@@ -876,6 +901,7 @@ for.end:
876
901
define void @exp_f32 (ptr nocapture %varray ) {
877
902
; CHECK-LABEL: @exp_f32(
878
903
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_expf(<4 x float> [[TMP4:%.*]])
904
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_expf(<8 x float> [[TMP4:%.*]])
879
905
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_expf(<16 x float> [[TMP4:%.*]])
880
906
; CHECK: ret void
881
907
;
@@ -899,6 +925,7 @@ for.end:
899
925
900
926
define void @exp_f64_intrinsic (ptr nocapture %varray ) {
901
927
; CHECK-LABEL: @exp_f64_intrinsic(
928
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_exp(<2 x double> [[TMP4:%.*]])
902
929
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_exp(<4 x double> [[TMP4:%.*]])
903
930
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_exp(<8 x double> [[TMP4:%.*]])
904
931
; CHECK: ret void
@@ -924,6 +951,7 @@ for.end:
924
951
define void @exp_f32_intrinsic (ptr nocapture %varray ) {
925
952
; CHECK-LABEL: @exp_f32_intrinsic(
926
953
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_expf(<4 x float> [[TMP4:%.*]])
954
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_expf(<8 x float> [[TMP4:%.*]])
927
955
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_expf(<16 x float> [[TMP4:%.*]])
928
956
; CHECK: ret void
929
957
;
@@ -947,6 +975,7 @@ for.end:
947
975
948
976
define void @log_f64 (ptr nocapture %varray ) {
949
977
; CHECK-LABEL: @log_f64(
978
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_log(<2 x double> [[TMP4:%.*]])
950
979
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_log(<4 x double> [[TMP4:%.*]])
951
980
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_log(<8 x double> [[TMP4:%.*]])
952
981
; CHECK: ret void
@@ -972,6 +1001,7 @@ for.end:
972
1001
define void @log_f32 (ptr nocapture %varray ) {
973
1002
; CHECK-LABEL: @log_f32(
974
1003
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_logf(<4 x float> [[TMP4:%.*]])
1004
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_logf(<8 x float> [[TMP4:%.*]])
975
1005
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_logf(<16 x float> [[TMP4:%.*]])
976
1006
; CHECK: ret void
977
1007
;
@@ -995,6 +1025,7 @@ for.end:
995
1025
996
1026
define void @log_f64_intrinsic (ptr nocapture %varray ) {
997
1027
; CHECK-LABEL: @log_f64_intrinsic(
1028
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_log(<2 x double> [[TMP4:%.*]])
998
1029
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_log(<4 x double> [[TMP4:%.*]])
999
1030
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_log(<8 x double> [[TMP4:%.*]])
1000
1031
; CHECK: ret void
@@ -1020,6 +1051,7 @@ for.end:
1020
1051
define void @log_f32_intrinsic (ptr nocapture %varray ) {
1021
1052
; CHECK-LABEL: @log_f32_intrinsic(
1022
1053
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_logf(<4 x float> [[TMP4:%.*]])
1054
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_logf(<8 x float> [[TMP4:%.*]])
1023
1055
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_logf(<16 x float> [[TMP4:%.*]])
1024
1056
; CHECK: ret void
1025
1057
;
@@ -1043,6 +1075,7 @@ for.end:
1043
1075
1044
1076
define void @log2_f64 (ptr nocapture %varray ) {
1045
1077
; CHECK-LABEL: @log2_f64(
1078
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_log2(<2 x double> [[TMP4:%.*]])
1046
1079
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_log2(<4 x double> [[TMP4:%.*]])
1047
1080
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_log2(<8 x double> [[TMP4:%.*]])
1048
1081
; CHECK: ret void
@@ -1068,6 +1101,7 @@ for.end:
1068
1101
define void @log2_f32 (ptr nocapture %varray ) {
1069
1102
; CHECK-LABEL: @log2_f32(
1070
1103
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_log2f(<4 x float> [[TMP4:%.*]])
1104
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_log2f(<8 x float> [[TMP4:%.*]])
1071
1105
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_log2f(<16 x float> [[TMP4:%.*]])
1072
1106
; CHECK: ret void
1073
1107
;
@@ -1091,6 +1125,7 @@ for.end:
1091
1125
1092
1126
define void @log2_f64_intrinsic (ptr nocapture %varray ) {
1093
1127
; CHECK-LABEL: @log2_f64_intrinsic(
1128
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_log2(<2 x double> [[TMP4:%.*]])
1094
1129
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_log2(<4 x double> [[TMP4:%.*]])
1095
1130
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_log2(<8 x double> [[TMP4:%.*]])
1096
1131
; CHECK: ret void
@@ -1116,6 +1151,7 @@ for.end:
1116
1151
define void @log2_f32_intrinsic (ptr nocapture %varray ) {
1117
1152
; CHECK-LABEL: @log2_f32_intrinsic(
1118
1153
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_log2f(<4 x float> [[TMP4:%.*]])
1154
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_log2f(<8 x float> [[TMP4:%.*]])
1119
1155
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_log2f(<16 x float> [[TMP4:%.*]])
1120
1156
; CHECK: ret void
1121
1157
;
@@ -1140,6 +1176,7 @@ for.end:
1140
1176
define void @log10_f32 (ptr nocapture %varray ) {
1141
1177
; CHECK-LABEL: @log10_f32(
1142
1178
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_log10f(<4 x float> [[TMP4:%.*]])
1179
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_log10f(<8 x float> [[TMP4:%.*]])
1143
1180
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_log10f(<16 x float> [[TMP4:%.*]])
1144
1181
; CHECK: ret void
1145
1182
;
@@ -1164,6 +1201,7 @@ for.end:
1164
1201
define void @log10_f32_intrinsic (ptr nocapture %varray ) {
1165
1202
; CHECK-LABEL: @log10_f32_intrinsic(
1166
1203
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_log10f(<4 x float> [[TMP4:%.*]])
1204
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_log10f(<8 x float> [[TMP4:%.*]])
1167
1205
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_log10f(<16 x float> [[TMP4:%.*]])
1168
1206
; CHECK: ret void
1169
1207
;
@@ -1187,6 +1225,7 @@ for.end:
1187
1225
1188
1226
define void @exp2_f64 (ptr nocapture %varray ) {
1189
1227
; CHECK-LABEL: @exp2_f64(
1228
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_exp2(<2 x double> [[TMP4:%.*]])
1190
1229
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_exp2(<4 x double> [[TMP4:%.*]])
1191
1230
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_exp2(<8 x double> [[TMP4:%.*]])
1192
1231
; CHECK: ret void
@@ -1212,6 +1251,7 @@ for.end:
1212
1251
define void @exp2_f32 (ptr nocapture %varray ) {
1213
1252
; CHECK-LABEL: @exp2_f32(
1214
1253
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_exp2f(<4 x float> [[TMP4:%.*]])
1254
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_exp2f(<8 x float> [[TMP4:%.*]])
1215
1255
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_exp2f(<16 x float> [[TMP4:%.*]])
1216
1256
; CHECK: ret void
1217
1257
;
@@ -1235,6 +1275,7 @@ for.end:
1235
1275
1236
1276
define void @exp2_f64_intrinsic (ptr nocapture %varray ) {
1237
1277
; CHECK-LABEL: @exp2_f64_intrinsic(
1278
+ ; CHECK-VF2: [[TMP5:%.*]] = call <2 x double> @amd_vrd2_exp2(<2 x double> [[TMP4:%.*]])
1238
1279
; CHECK-VF4: [[TMP5:%.*]] = call <4 x double> @amd_vrd4_exp2(<4 x double> [[TMP4:%.*]])
1239
1280
; CHECK-VF8: [[TMP5:%.*]] = call <8 x double> @amd_vrd8_exp2(<8 x double> [[TMP4:%.*]])
1240
1281
; CHECK: ret void
@@ -1260,6 +1301,7 @@ for.end:
1260
1301
define void @exp2_f32_intrinsic (ptr nocapture %varray ) {
1261
1302
; CHECK-LABEL: @exp2_f32_intrinsic(
1262
1303
; CHECK-VF4: [[TMP5:%.*]] = call <4 x float> @amd_vrs4_exp2f(<4 x float> [[TMP4:%.*]])
1304
+ ; CHECK-VF8: [[TMP5:%.*]] = call <8 x float> @amd_vrs8_exp2f(<8 x float> [[TMP4:%.*]])
1263
1305
; CHECK-VF16: [[TMP5:%.*]] = call <16 x float> @amd_vrs16_exp2f(<16 x float> [[TMP4:%.*]])
1264
1306
; CHECK: ret void
1265
1307
;
0 commit comments