@@ -795,17 +795,17 @@ define amdgpu_kernel void @shl_i64(ptr addrspace(1) %out, ptr addrspace(1) %in)
795
795
; EG-NEXT: ALU clause starting at 8:
796
796
; EG-NEXT: MOV * T0.X, KC0[2].Z,
797
797
; EG-NEXT: ALU clause starting at 9:
798
- ; EG-NEXT: AND_INT T1.Y, T0.Z, literal.x ,
799
- ; EG-NEXT: LSHR T1.Z, T0.Y, 1 ,
798
+ ; EG-NEXT: LSHR T1.Y, T0.Y, 1 ,
799
+ ; EG-NEXT: NOT_INT T1.Z, T0.Z ,
800
800
; EG-NEXT: BIT_ALIGN_INT T0.W, T0.Y, T0.X, 1,
801
- ; EG-NEXT: NOT_INT * T1.W, T0.Z,
801
+ ; EG-NEXT: AND_INT * T1.W, T0.Z, literal.x ,
802
802
; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
803
- ; EG-NEXT: BIT_ALIGN_INT T1 .Z, PV.Z, PV.W , PS,
804
- ; EG-NEXT: LSHL T0.W, T0.X , PV.Y ,
803
+ ; EG-NEXT: LSHL T2 .Z, T0.X , PS,
804
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, PV.Y , PV.W, PV.Z ,
805
805
; EG-NEXT: AND_INT * T1.W, T0.Z, literal.x,
806
806
; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
807
- ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.Z , PV.W ,
808
- ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.W , 0.0,
807
+ ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.W , PV.Z ,
808
+ ; EG-NEXT: CNDE_INT T0.X, T1.W, T2.Z , 0.0,
809
809
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
810
810
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
811
811
%b_ptr = getelementptr i64 , ptr addrspace (1 ) %in , i64 1
@@ -858,8 +858,8 @@ define amdgpu_kernel void @shl_v2i64(ptr addrspace(1) %out, ptr addrspace(1) %in
858
858
; EG: ; %bb.0:
859
859
; EG-NEXT: ALU 0, @10, KC0[CB0:0-32], KC1[]
860
860
; EG-NEXT: TEX 1 @6
861
- ; EG-NEXT: ALU 22 , @11, KC0[CB0:0-32], KC1[]
862
- ; EG-NEXT: MEM_RAT_CACHELESS STORE_RAW T3 .XYZW, T0.X, 1
861
+ ; EG-NEXT: ALU 23 , @11, KC0[CB0:0-32], KC1[]
862
+ ; EG-NEXT: MEM_RAT_CACHELESS STORE_RAW T2 .XYZW, T0.X, 1
863
863
; EG-NEXT: CF_END
864
864
; EG-NEXT: PAD
865
865
; EG-NEXT: Fetch clause starting at 6:
@@ -868,27 +868,28 @@ define amdgpu_kernel void @shl_v2i64(ptr addrspace(1) %out, ptr addrspace(1) %in
868
868
; EG-NEXT: ALU clause starting at 10:
869
869
; EG-NEXT: MOV * T0.X, KC0[2].Z,
870
870
; EG-NEXT: ALU clause starting at 11:
871
- ; EG-NEXT: AND_INT T1.Y, T1.Z, literal.x,
871
+ ; EG-NEXT: AND_INT * T1.W, T1.Z, literal.x,
872
+ ; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
873
+ ; EG-NEXT: LSHL T2.X, T0.Z, PV.W,
874
+ ; EG-NEXT: AND_INT T1.Y, T1.Z, literal.x, BS:VEC_120/SCL_212
872
875
; EG-NEXT: LSHR T2.Z, T0.W, 1,
873
- ; EG-NEXT: BIT_ALIGN_INT T0.W, T0.W, T0.Z, 1,
876
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, T0.W, T0.Z, 1, BS:VEC_102/SCL_221
874
877
; EG-NEXT: NOT_INT * T1.W, T1.Z,
878
+ ; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
879
+ ; EG-NEXT: BIT_ALIGN_INT T3.X, PV.Z, PV.W, PS,
880
+ ; EG-NEXT: LSHR T2.Y, T0.Y, 1,
881
+ ; EG-NEXT: NOT_INT T0.Z, T1.X,
882
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, T0.Y, T0.X, 1,
883
+ ; EG-NEXT: AND_INT * T1.W, T1.X, literal.x,
875
884
; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
876
- ; EG-NEXT: BIT_ALIGN_INT T0.W, PV.Z, PV.W, PS,
877
- ; EG-NEXT: LSHL * T1.W, T0.Z, PV.Y,
878
- ; EG-NEXT: AND_INT T2.X, T1.Z, literal.x,
879
- ; EG-NEXT: AND_INT T1.Y, T1.X, literal.y,
880
- ; EG-NEXT: LSHR T0.Z, T0.Y, 1,
881
- ; EG-NEXT: BIT_ALIGN_INT T2.W, T0.Y, T0.X, 1,
882
- ; EG-NEXT: NOT_INT * T3.W, T1.X,
883
- ; EG-NEXT: 32(4.484155e-44), 31(4.344025e-44)
884
- ; EG-NEXT: BIT_ALIGN_INT T0.Y, PV.Z, PV.W, PS,
885
- ; EG-NEXT: LSHL T0.Z, T0.X, PV.Y,
886
- ; EG-NEXT: AND_INT T2.W, T1.X, literal.x, BS:VEC_120/SCL_212
887
- ; EG-NEXT: CNDE_INT * T3.W, PV.X, T0.W, T1.W,
885
+ ; EG-NEXT: LSHL T0.Y, T0.X, PS, BS:VEC_120/SCL_212
886
+ ; EG-NEXT: AND_INT T1.Z, T1.X, literal.x, BS:VEC_201
887
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, PV.Y, PV.W, PV.Z,
888
+ ; EG-NEXT: CNDE_INT * T2.W, T1.Y, PV.X, T2.X,
888
889
; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
889
- ; EG-NEXT: CNDE_INT T3 .Y, PV.W , PV.Y , PV.Z ,
890
- ; EG-NEXT: CNDE_INT * T3 .Z, T2.X, T1.W , 0.0,
891
- ; EG-NEXT: CNDE_INT T3 .X, T2.W , T0.Z , 0.0,
890
+ ; EG-NEXT: CNDE_INT T2 .Y, PV.Z , PV.W , PV.Y ,
891
+ ; EG-NEXT: CNDE_INT * T2 .Z, T1.Y, T2.X , 0.0,
892
+ ; EG-NEXT: CNDE_INT T2 .X, T1.Z , T0.Y , 0.0,
892
893
; EG-NEXT: LSHR * T0.X, KC0[2].Y, literal.x,
893
894
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
894
895
%b_ptr = getelementptr <2 x i64 >, ptr addrspace (1 ) %in , i64 1
@@ -955,65 +956,66 @@ define amdgpu_kernel void @shl_v4i64(ptr addrspace(1) %out, ptr addrspace(1) %in
955
956
; EG: ; %bb.0:
956
957
; EG-NEXT: ALU 0, @14, KC0[CB0:0-32], KC1[]
957
958
; EG-NEXT: TEX 3 @6
958
- ; EG-NEXT: ALU 47 , @15, KC0[CB0:0-32], KC1[]
959
- ; EG-NEXT: MEM_RAT_CACHELESS STORE_RAW T1 .XYZW, T2 .X, 0
960
- ; EG-NEXT: MEM_RAT_CACHELESS STORE_RAW T4 .XYZW, T0 .X, 1
959
+ ; EG-NEXT: ALU 48 , @15, KC0[CB0:0-32], KC1[]
960
+ ; EG-NEXT: MEM_RAT_CACHELESS STORE_RAW T2 .XYZW, T0 .X, 0
961
+ ; EG-NEXT: MEM_RAT_CACHELESS STORE_RAW T3 .XYZW, T1 .X, 1
961
962
; EG-NEXT: CF_END
962
963
; EG-NEXT: Fetch clause starting at 6:
963
- ; EG-NEXT: VTX_READ_128 T1.XYZW, T0.X, 48 , #1
964
- ; EG-NEXT: VTX_READ_128 T2.XYZW, T0.X, 0 , #1
965
- ; EG-NEXT: VTX_READ_128 T3.XYZW, T0.X, 32 , #1
966
- ; EG-NEXT: VTX_READ_128 T0.XYZW, T0.X, 16 , #1
964
+ ; EG-NEXT: VTX_READ_128 T1.XYZW, T0.X, 32 , #1
965
+ ; EG-NEXT: VTX_READ_128 T2.XYZW, T0.X, 48 , #1
966
+ ; EG-NEXT: VTX_READ_128 T3.XYZW, T0.X, 16 , #1
967
+ ; EG-NEXT: VTX_READ_128 T0.XYZW, T0.X, 0 , #1
967
968
; EG-NEXT: ALU clause starting at 14:
968
969
; EG-NEXT: MOV * T0.X, KC0[2].Z,
969
970
; EG-NEXT: ALU clause starting at 15:
970
- ; EG-NEXT: AND_INT T4.Z, T1.Z, literal.x,
971
- ; EG-NEXT: LSHR T1.W, T0.W, 1,
972
- ; EG-NEXT: NOT_INT * T3.W, T1.Z,
971
+ ; EG-NEXT: AND_INT * T1.W, T1.Z, literal.x,
973
972
; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
974
- ; EG-NEXT: BIT_ALIGN_INT T4.X, T0.W, T0.Z, 1,
975
- ; EG-NEXT: AND_INT T1.Y, T3.Z, literal.x, BS:VEC_201
976
- ; EG-NEXT: LSHR T5.Z, T2.W, 1, BS:VEC_120/SCL_212
977
- ; EG-NEXT: BIT_ALIGN_INT T0.W, T2.W, T2.Z, 1, BS:VEC_102/SCL_221
978
- ; EG-NEXT: NOT_INT * T2.W, T3.Z,
979
- ; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
980
- ; EG-NEXT: BIT_ALIGN_INT T3.Y, PV.Z, PV.W, PS,
981
- ; EG-NEXT: LSHL T2.Z, T2.Z, PV.Y,
982
- ; EG-NEXT: BIT_ALIGN_INT T0.W, T1.W, PV.X, T3.W,
983
- ; EG-NEXT: LSHL * T1.W, T0.Z, T4.Z,
973
+ ; EG-NEXT: LSHL * T1.W, T0.Z, PV.W,
984
974
; EG-NEXT: AND_INT T4.X, T1.Z, literal.x,
985
- ; EG-NEXT: AND_INT T1.Y, T1.X, literal.y ,
986
- ; EG-NEXT: LSHR T0 .Z, T0.Y, 1,
987
- ; EG-NEXT: BIT_ALIGN_INT T2.W, T0.Y, T0.X , 1,
988
- ; EG-NEXT: NOT_INT * T3.W, T1.X ,
975
+ ; EG-NEXT: LSHR T1.Y, T3.W, 1 ,
976
+ ; EG-NEXT: NOT_INT T4 .Z, T2.Z, BS:VEC_201
977
+ ; EG-NEXT: BIT_ALIGN_INT T2.W, T3.W, T3.Z , 1,
978
+ ; EG-NEXT: AND_INT * T3.W, T2.Z, literal.y ,
989
979
; EG-NEXT: 32(4.484155e-44), 31(4.344025e-44)
990
- ; EG-NEXT: AND_INT T5.X, T3.Z, literal.x,
991
- ; EG-NEXT: BIT_ALIGN_INT T0.Y, PV.Z, PV.W, PS,
992
- ; EG-NEXT: LSHL T0.Z, T0.X, PV.Y,
993
- ; EG-NEXT: AND_INT T2.W, T1.X, literal.x, BS:VEC_120/SCL_212
994
- ; EG-NEXT: CNDE_INT * T4.W, PV.X, T0.W, T1.W,
980
+ ; EG-NEXT: LSHL T5.X, T3.Z, PS,
981
+ ; EG-NEXT: AND_INT T2.Y, T2.Z, literal.x, BS:VEC_120/SCL_212
982
+ ; EG-NEXT: BIT_ALIGN_INT T2.Z, PV.Y, PV.W, PV.Z,
983
+ ; EG-NEXT: LSHR T2.W, T3.Y, 1,
984
+ ; EG-NEXT: NOT_INT * T3.W, T2.X,
985
+ ; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
986
+ ; EG-NEXT: BIT_ALIGN_INT T6.X, T3.Y, T3.X, 1,
987
+ ; EG-NEXT: AND_INT T1.Y, T2.X, literal.x,
988
+ ; EG-NEXT: LSHR T3.Z, T0.W, 1,
989
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, T0.W, T0.Z, 1,
990
+ ; EG-NEXT: NOT_INT * T4.W, T1.Z,
991
+ ; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
992
+ ; EG-NEXT: BIT_ALIGN_INT T7.X, PV.Z, PV.W, PS,
993
+ ; EG-NEXT: LSHL T1.Y, T3.X, PV.Y, BS:VEC_120/SCL_212
994
+ ; EG-NEXT: AND_INT T0.Z, T2.X, literal.x, BS:VEC_201
995
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, T2.W, PV.X, T3.W,
996
+ ; EG-NEXT: CNDE_INT * T3.W, T2.Y, T2.Z, T5.X,
995
997
; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
996
- ; EG-NEXT: AND_INT T0 .X, T3.X, literal.x ,
997
- ; EG-NEXT: CNDE_INT T4 .Y, PV.W , PV.Y , PV.Z ,
998
- ; EG-NEXT: LSHR T1.Z, T2.Y, 1 ,
999
- ; EG-NEXT: BIT_ALIGN_INT T0.W, T2 .Y, T2 .X, 1,
1000
- ; EG-NEXT: NOT_INT * T3 .W, T3.X ,
998
+ ; EG-NEXT: LSHR T2 .X, T0.Y, 1 ,
999
+ ; EG-NEXT: CNDE_INT T3 .Y, PV.Z , PV.W , PV.Y ,
1000
+ ; EG-NEXT: NOT_INT T1.Z, T1.X ,
1001
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, T0 .Y, T0 .X, 1,
1002
+ ; EG-NEXT: AND_INT * T2 .W, T1.X, literal.x ,
1001
1003
; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
1002
- ; EG-NEXT: BIT_ALIGN_INT T1 .X, PV.Z, PV.W , PS,
1003
- ; EG-NEXT: LSHL T0.Y, T2 .X, PV.X,
1004
- ; EG-NEXT: CNDE_INT T4 .Z, T4.X, T1.W , 0.0, BS:VEC_120/SCL_212
1005
- ; EG-NEXT: AND_INT * T0.W, T3 .X, literal.x, BS:VEC_201
1004
+ ; EG-NEXT: LSHL T0 .X, T0.X , PS,
1005
+ ; EG-NEXT: AND_INT T0.Y, T1 .X, literal.x, BS:VEC_120/SCL_212
1006
+ ; EG-NEXT: CNDE_INT T3 .Z, T2.Y, T5.X , 0.0, BS:VEC_021/SCL_122
1007
+ ; EG-NEXT: BIT_ALIGN_INT * T0.W, PV .X, PV.W, PV.Z,
1006
1008
; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
1007
- ; EG-NEXT: CNDE_INT * T1 .W, T5 .X, T3.Y, T2.Z ,
1008
- ; EG-NEXT: CNDE_INT T4 .X, T2.W, T0.Z , 0.0,
1009
- ; EG-NEXT: CNDE_INT T1 .Y, T0.W, T1.X , T0.Y, BS:VEC_120/SCL_212
1010
- ; EG-NEXT: ADD_INT * T2 .W, KC0[2].Y, literal.x,
1009
+ ; EG-NEXT: CNDE_INT * T2 .W, T4 .X, T7.X, T1.W ,
1010
+ ; EG-NEXT: CNDE_INT T3 .X, T0.Z, T1.Y , 0.0,
1011
+ ; EG-NEXT: CNDE_INT T2 .Y, T0.Y, T0.W , T0.X,
1012
+ ; EG-NEXT: ADD_INT * T0 .W, KC0[2].Y, literal.x,
1011
1013
; EG-NEXT: 16(2.242078e-44), 0(0.000000e+00)
1012
- ; EG-NEXT: LSHR T0 .X, PV.W, literal.x,
1013
- ; EG-NEXT: CNDE_INT T1 .Z, T5 .X, T2.Z , 0.0,
1014
- ; EG-NEXT: CNDE_INT * T1 .X, T0.W , T0.Y , 0.0,
1014
+ ; EG-NEXT: LSHR T1 .X, PV.W, literal.x,
1015
+ ; EG-NEXT: CNDE_INT T2 .Z, T4 .X, T1.W , 0.0,
1016
+ ; EG-NEXT: CNDE_INT * T2 .X, T0.Y , T0.X , 0.0,
1015
1017
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1016
- ; EG-NEXT: LSHR * T2 .X, KC0[2].Y, literal.x,
1018
+ ; EG-NEXT: LSHR * T0 .X, KC0[2].Y, literal.x,
1017
1019
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1018
1020
%b_ptr = getelementptr <4 x i64 >, ptr addrspace (1 ) %in , i64 1
1019
1021
%a = load <4 x i64 >, ptr addrspace (1 ) %in
@@ -1172,17 +1174,17 @@ define amdgpu_kernel void @s_shl_constant_i64(ptr addrspace(1) %out, i64 %a) {
1172
1174
; EG-NEXT: CF_END
1173
1175
; EG-NEXT: PAD
1174
1176
; EG-NEXT: ALU clause starting at 4:
1175
- ; EG-NEXT: AND_INT T0.Z, KC0[2].W , literal.x,
1176
- ; EG-NEXT: MOV T0.W, literal.y ,
1177
- ; EG-NEXT: NOT_INT * T1.W, KC0[2].W,
1178
- ; EG-NEXT: 31(4.344025e-44), -1(nan )
1179
- ; EG-NEXT: BIT_ALIGN_INT T1.Z, literal.x, PV.W , PS,
1180
- ; EG-NEXT: LSHL T0.W, literal.y, PV.Z,
1177
+ ; EG-NEXT: MOV T0.Z, literal.x,
1178
+ ; EG-NEXT: NOT_INT T0.W, KC0[2].W ,
1179
+ ; EG-NEXT: AND_INT * T1.W, KC0[2].W, literal.y ,
1180
+ ; EG-NEXT: -1(nan), 31(4.344025e-44)
1181
+ ; EG-NEXT: LSHL T1.Z, literal.x, PS,
1182
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, literal.y, PV.Z, PV.W ,
1181
1183
; EG-NEXT: AND_INT * T1.W, KC0[2].W, literal.z,
1182
- ; EG-NEXT: 32767(4.591635e-41), -1(nan )
1184
+ ; EG-NEXT: -1(nan), 32767(4.591635e-41)
1183
1185
; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
1184
- ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.Z , PV.W ,
1185
- ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.W , 0.0,
1186
+ ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.W , PV.Z ,
1187
+ ; EG-NEXT: CNDE_INT T0.X, T1.W, T1.Z , 0.0,
1186
1188
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
1187
1189
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1188
1190
%shl = shl i64 281474976710655 , %a
@@ -1423,15 +1425,15 @@ define amdgpu_kernel void @s_shl_inline_imm_64_i64(ptr addrspace(1) %out, ptr ad
1423
1425
; EG-NEXT: CF_END
1424
1426
; EG-NEXT: PAD
1425
1427
; EG-NEXT: ALU clause starting at 4:
1426
- ; EG-NEXT: NOT_INT T0.W, KC0[2].W,
1427
- ; EG-NEXT: AND_INT * T1.W, KC0[2].W, literal.x ,
1428
+ ; EG-NEXT: AND_INT T0.W, KC0[2].W, literal.x ,
1429
+ ; EG-NEXT: NOT_INT * T1.W, KC0[2].W,
1428
1430
; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
1429
- ; EG-NEXT: LSHL T0.Z, literal.x, PS,
1430
- ; EG-NEXT: BIT_ALIGN_INT T0 .W, 0.0 , literal.y, PV.W ,
1431
- ; EG-NEXT: AND_INT * T1 .W, KC0[2].W, literal.y ,
1432
- ; EG-NEXT: 64(8.968310e -44), 32(4.484155e -44)
1433
- ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.W, PV.Z,
1434
- ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.Z , 0.0,
1431
+ ; EG-NEXT: BIT_ALIGN_INT T0.Z, 0.0 , literal.x, PS,
1432
+ ; EG-NEXT: AND_INT T1 .W, KC0[2].W , literal.x ,
1433
+ ; EG-NEXT: LSHL * T0 .W, literal.y, PV.W ,
1434
+ ; EG-NEXT: 32(4.484155e -44), 64(8.968310e -44)
1435
+ ; EG-NEXT: CNDE_INT * T0.Y, PV.W, PV.Z, PS ,
1436
+ ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.W , 0.0,
1435
1437
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
1436
1438
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1437
1439
%shl = shl i64 64 , %a
@@ -1903,16 +1905,16 @@ define amdgpu_kernel void @s_shl_inline_imm_f32_4_0_i64(ptr addrspace(1) %out, p
1903
1905
; EG-NEXT: CF_END
1904
1906
; EG-NEXT: PAD
1905
1907
; EG-NEXT: ALU clause starting at 4:
1906
- ; EG-NEXT: NOT_INT T0.W, KC0[2].W,
1907
- ; EG-NEXT: AND_INT * T1.W, KC0[2].W, literal.x ,
1908
+ ; EG-NEXT: AND_INT T0.W, KC0[2].W, literal.x ,
1909
+ ; EG-NEXT: NOT_INT * T1.W, KC0[2].W,
1908
1910
; EG-NEXT: 31(4.344025e-44), 0(0.000000e+00)
1909
- ; EG-NEXT: LSHL T0.Z, literal.x, PS,
1910
- ; EG-NEXT: BIT_ALIGN_INT T0 .W, 0.0 , literal.y, PV.W ,
1911
- ; EG-NEXT: AND_INT * T1 .W, KC0[2].W, literal.z ,
1912
- ; EG-NEXT: 1082130432(4.000000e+00 ), 541065216(1.626303e-19 )
1913
- ; EG-NEXT: 32 (4.484155e-44 ), 0(0.000000e+00)
1914
- ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.W, PV.Z,
1915
- ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.Z , 0.0,
1911
+ ; EG-NEXT: BIT_ALIGN_INT T0.Z, 0.0 , literal.x, PS,
1912
+ ; EG-NEXT: AND_INT T1 .W, KC0[2].W , literal.y,
1913
+ ; EG-NEXT: LSHL * T0 .W, literal.z, PV.W ,
1914
+ ; EG-NEXT: 541065216(1.626303e-19 ), 32(4.484155e-44 )
1915
+ ; EG-NEXT: 1082130432 (4.000000e+00 ), 0(0.000000e+00)
1916
+ ; EG-NEXT: CNDE_INT * T0.Y, PV.W, PV.Z, PS ,
1917
+ ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.W , 0.0,
1916
1918
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
1917
1919
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1918
1920
%shl = shl i64 1082130432 , %a
@@ -1959,17 +1961,17 @@ define amdgpu_kernel void @s_shl_inline_imm_f32_neg_4_0_i64(ptr addrspace(1) %ou
1959
1961
; EG-NEXT: CF_END
1960
1962
; EG-NEXT: PAD
1961
1963
; EG-NEXT: ALU clause starting at 4:
1962
- ; EG-NEXT: AND_INT T0.Z, KC0[2].W , literal.x,
1963
- ; EG-NEXT: MOV T0.W, literal.y ,
1964
- ; EG-NEXT: NOT_INT * T1.W, KC0[2].W,
1965
- ; EG-NEXT: 31(4.344025e-44), - 532676608(-5.534023e+19)
1966
- ; EG-NEXT: BIT_ALIGN_INT T1.Z, literal.x, PV.W , PS,
1967
- ; EG-NEXT: LSHL T0.W, literal.y, PV.Z,
1964
+ ; EG-NEXT: MOV T0.Z, literal.x,
1965
+ ; EG-NEXT: NOT_INT T0.W, KC0[2].W ,
1966
+ ; EG-NEXT: AND_INT * T1.W, KC0[2].W, literal.y ,
1967
+ ; EG-NEXT: - 532676608(-5.534023e+19), 31(4.344025e-44 )
1968
+ ; EG-NEXT: LSHL T1.Z, literal.x, PS,
1969
+ ; EG-NEXT: BIT_ALIGN_INT T0.W, literal.y, PV.Z, PV.W ,
1968
1970
; EG-NEXT: AND_INT * T1.W, KC0[2].W, literal.z,
1969
- ; EG-NEXT: 2147483647(nan), -1065353216(-4.000000e+00)
1971
+ ; EG-NEXT: -1065353216(-4.000000e+00), 2147483647(nan )
1970
1972
; EG-NEXT: 32(4.484155e-44), 0(0.000000e+00)
1971
- ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.Z , PV.W ,
1972
- ; EG-NEXT: CNDE_INT T0.X, T1.W, T0.W , 0.0,
1973
+ ; EG-NEXT: CNDE_INT * T0.Y, PS, PV.W , PV.Z ,
1974
+ ; EG-NEXT: CNDE_INT T0.X, T1.W, T1.Z , 0.0,
1973
1975
; EG-NEXT: LSHR * T1.X, KC0[2].Y, literal.x,
1974
1976
; EG-NEXT: 2(2.802597e-45), 0(0.000000e+00)
1975
1977
%shl = shl i64 -1065353216 , %a
0 commit comments