@@ -339,7 +339,7 @@ define void @v_shuffle_v2f32_v4f32__7_0(ptr addrspace(1) inreg %ptr) {
339
339
; GFX90A-NEXT: ;;#ASMSTART
340
340
; GFX90A-NEXT: ; def v[2:5]
341
341
; GFX90A-NEXT: ;;#ASMEND
342
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
342
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[0:1] op_sel:[1,0]
343
343
; GFX90A-NEXT: global_store_dwordx2 v6, v[0:1], s[16:17]
344
344
; GFX90A-NEXT: s_waitcnt vmcnt(0)
345
345
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -355,7 +355,7 @@ define void @v_shuffle_v2f32_v4f32__7_0(ptr addrspace(1) inreg %ptr) {
355
355
; GFX940-NEXT: ; def v[2:5]
356
356
; GFX940-NEXT: ;;#ASMEND
357
357
; GFX940-NEXT: s_nop 0
358
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
358
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[0:1] op_sel:[1,0]
359
359
; GFX940-NEXT: global_store_dwordx2 v6, v[0:1], s[0:1] sc0 sc1
360
360
; GFX940-NEXT: s_waitcnt vmcnt(0)
361
361
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -445,7 +445,7 @@ define void @v_shuffle_v2f32_v4f32__7_2(ptr addrspace(1) inreg %ptr) {
445
445
; GFX90A-NEXT: ;;#ASMSTART
446
446
; GFX90A-NEXT: ; def v[4:7]
447
447
; GFX90A-NEXT: ;;#ASMEND
448
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[6:7], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
448
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[6:7], v[2:3] op_sel:[1,0]
449
449
; GFX90A-NEXT: global_store_dwordx2 v8, v[0:1], s[16:17]
450
450
; GFX90A-NEXT: s_waitcnt vmcnt(0)
451
451
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -461,7 +461,7 @@ define void @v_shuffle_v2f32_v4f32__7_2(ptr addrspace(1) inreg %ptr) {
461
461
; GFX940-NEXT: ; def v[4:7]
462
462
; GFX940-NEXT: ;;#ASMEND
463
463
; GFX940-NEXT: s_nop 0
464
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[6:7], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
464
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[6:7], v[2:3] op_sel:[1,0]
465
465
; GFX940-NEXT: global_store_dwordx2 v8, v[0:1], s[0:1] sc0 sc1
466
466
; GFX940-NEXT: s_waitcnt vmcnt(0)
467
467
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -634,7 +634,7 @@ define void @v_shuffle_v2f32_v4f32__7_6(ptr addrspace(1) inreg %ptr) {
634
634
; GFX90A-NEXT: ; def v[0:3]
635
635
; GFX90A-NEXT: ;;#ASMEND
636
636
; GFX90A-NEXT: v_mov_b32_e32 v4, 0
637
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
637
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0]
638
638
; GFX90A-NEXT: global_store_dwordx2 v4, v[0:1], s[16:17]
639
639
; GFX90A-NEXT: s_waitcnt vmcnt(0)
640
640
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -646,7 +646,7 @@ define void @v_shuffle_v2f32_v4f32__7_6(ptr addrspace(1) inreg %ptr) {
646
646
; GFX940-NEXT: ; def v[0:3]
647
647
; GFX940-NEXT: ;;#ASMEND
648
648
; GFX940-NEXT: v_mov_b32_e32 v4, 0
649
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
649
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0]
650
650
; GFX940-NEXT: global_store_dwordx2 v4, v[0:1], s[0:1] sc0 sc1
651
651
; GFX940-NEXT: s_waitcnt vmcnt(0)
652
652
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -804,7 +804,7 @@ define void @v_shuffle_v2f32_v4f32__1_0(ptr addrspace(1) inreg %ptr) {
804
804
; GFX90A-NEXT: ; def v[0:3]
805
805
; GFX90A-NEXT: ;;#ASMEND
806
806
; GFX90A-NEXT: v_mov_b32_e32 v4, 0
807
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
807
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0]
808
808
; GFX90A-NEXT: global_store_dwordx2 v4, v[0:1], s[16:17]
809
809
; GFX90A-NEXT: s_waitcnt vmcnt(0)
810
810
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -816,7 +816,7 @@ define void @v_shuffle_v2f32_v4f32__1_0(ptr addrspace(1) inreg %ptr) {
816
816
; GFX940-NEXT: ; def v[0:3]
817
817
; GFX940-NEXT: ;;#ASMEND
818
818
; GFX940-NEXT: v_mov_b32_e32 v4, 0
819
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
819
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0]
820
820
; GFX940-NEXT: global_store_dwordx2 v4, v[0:1], s[0:1] sc0 sc1
821
821
; GFX940-NEXT: s_waitcnt vmcnt(0)
822
822
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -981,7 +981,7 @@ define void @v_shuffle_v2f32_v4f32__5_0(ptr addrspace(1) inreg %ptr) {
981
981
; GFX90A-NEXT: ;;#ASMSTART
982
982
; GFX90A-NEXT: ; def v[2:5]
983
983
; GFX90A-NEXT: ;;#ASMEND
984
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
984
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[0:1] op_sel:[1,0]
985
985
; GFX90A-NEXT: global_store_dwordx2 v6, v[0:1], s[16:17]
986
986
; GFX90A-NEXT: s_waitcnt vmcnt(0)
987
987
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -997,7 +997,7 @@ define void @v_shuffle_v2f32_v4f32__5_0(ptr addrspace(1) inreg %ptr) {
997
997
; GFX940-NEXT: ; def v[2:5]
998
998
; GFX940-NEXT: ;;#ASMEND
999
999
; GFX940-NEXT: s_nop 0
1000
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
1000
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[0:1] op_sel:[1,0]
1001
1001
; GFX940-NEXT: global_store_dwordx2 v6, v[0:1], s[0:1] sc0 sc1
1002
1002
; GFX940-NEXT: s_waitcnt vmcnt(0)
1003
1003
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -1598,7 +1598,7 @@ define void @v_shuffle_v2f32_v4f32__3_2(ptr addrspace(1) inreg %ptr) {
1598
1598
; GFX90A-NEXT: ; def v[0:3]
1599
1599
; GFX90A-NEXT: ;;#ASMEND
1600
1600
; GFX90A-NEXT: v_mov_b32_e32 v4, 0
1601
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
1601
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0]
1602
1602
; GFX90A-NEXT: global_store_dwordx2 v4, v[0:1], s[16:17]
1603
1603
; GFX90A-NEXT: s_waitcnt vmcnt(0)
1604
1604
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -1610,7 +1610,7 @@ define void @v_shuffle_v2f32_v4f32__3_2(ptr addrspace(1) inreg %ptr) {
1610
1610
; GFX940-NEXT: ; def v[0:3]
1611
1611
; GFX940-NEXT: ;;#ASMEND
1612
1612
; GFX940-NEXT: v_mov_b32_e32 v4, 0
1613
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
1613
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[2:3] op_sel:[1,0]
1614
1614
; GFX940-NEXT: global_store_dwordx2 v4, v[0:1], s[0:1] sc0 sc1
1615
1615
; GFX940-NEXT: s_waitcnt vmcnt(0)
1616
1616
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -1687,7 +1687,7 @@ define void @v_shuffle_v2f32_v4f32__5_2(ptr addrspace(1) inreg %ptr) {
1687
1687
; GFX90A-NEXT: ;;#ASMSTART
1688
1688
; GFX90A-NEXT: ; def v[4:7]
1689
1689
; GFX90A-NEXT: ;;#ASMEND
1690
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
1690
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[2:3] op_sel:[1,0]
1691
1691
; GFX90A-NEXT: global_store_dwordx2 v8, v[0:1], s[16:17]
1692
1692
; GFX90A-NEXT: s_waitcnt vmcnt(0)
1693
1693
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -1703,7 +1703,7 @@ define void @v_shuffle_v2f32_v4f32__5_2(ptr addrspace(1) inreg %ptr) {
1703
1703
; GFX940-NEXT: ; def v[4:7]
1704
1704
; GFX940-NEXT: ;;#ASMEND
1705
1705
; GFX940-NEXT: s_nop 0
1706
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[2:3] op_sel:[1,0] op_sel_hi:[0,0]
1706
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[4:5], v[2:3] op_sel:[1,0]
1707
1707
; GFX940-NEXT: global_store_dwordx2 v8, v[0:1], s[0:1] sc0 sc1
1708
1708
; GFX940-NEXT: s_waitcnt vmcnt(0)
1709
1709
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -2319,7 +2319,7 @@ define void @v_shuffle_v2f32_v4f32__5_4(ptr addrspace(1) inreg %ptr) {
2319
2319
; GFX90A-NEXT: ; def v[0:3]
2320
2320
; GFX90A-NEXT: ;;#ASMEND
2321
2321
; GFX90A-NEXT: v_mov_b32_e32 v4, 0
2322
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
2322
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0]
2323
2323
; GFX90A-NEXT: global_store_dwordx2 v4, v[0:1], s[16:17]
2324
2324
; GFX90A-NEXT: s_waitcnt vmcnt(0)
2325
2325
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -2331,7 +2331,7 @@ define void @v_shuffle_v2f32_v4f32__5_4(ptr addrspace(1) inreg %ptr) {
2331
2331
; GFX940-NEXT: ; def v[0:3]
2332
2332
; GFX940-NEXT: ;;#ASMEND
2333
2333
; GFX940-NEXT: v_mov_b32_e32 v4, 0
2334
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0] op_sel_hi:[0,0]
2334
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[0:1] op_sel:[1,0]
2335
2335
; GFX940-NEXT: global_store_dwordx2 v4, v[0:1], s[0:1] sc0 sc1
2336
2336
; GFX940-NEXT: s_waitcnt vmcnt(0)
2337
2337
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -2884,7 +2884,7 @@ define void @v_shuffle_v2f32_v4f32__1_6(ptr addrspace(1) inreg %ptr) {
2884
2884
; GFX90A-NEXT: ;;#ASMSTART
2885
2885
; GFX90A-NEXT: ; def v[2:5]
2886
2886
; GFX90A-NEXT: ;;#ASMEND
2887
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[4:5] op_sel:[1,0] op_sel_hi:[0,0]
2887
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[4:5] op_sel:[1,0]
2888
2888
; GFX90A-NEXT: global_store_dwordx2 v6, v[0:1], s[16:17]
2889
2889
; GFX90A-NEXT: s_waitcnt vmcnt(0)
2890
2890
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -2900,7 +2900,7 @@ define void @v_shuffle_v2f32_v4f32__1_6(ptr addrspace(1) inreg %ptr) {
2900
2900
; GFX940-NEXT: ; def v[2:5]
2901
2901
; GFX940-NEXT: ;;#ASMEND
2902
2902
; GFX940-NEXT: s_nop 0
2903
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[4:5] op_sel:[1,0] op_sel_hi:[0,0]
2903
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[0:1], v[4:5] op_sel:[1,0]
2904
2904
; GFX940-NEXT: global_store_dwordx2 v6, v[0:1], s[0:1] sc0 sc1
2905
2905
; GFX940-NEXT: s_waitcnt vmcnt(0)
2906
2906
; GFX940-NEXT: s_setpc_b64 s[30:31]
@@ -2990,7 +2990,7 @@ define void @v_shuffle_v2f32_v4f32__3_6(ptr addrspace(1) inreg %ptr) {
2990
2990
; GFX90A-NEXT: ;;#ASMSTART
2991
2991
; GFX90A-NEXT: ; def v[4:7]
2992
2992
; GFX90A-NEXT: ;;#ASMEND
2993
- ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[6:7] op_sel:[1,0] op_sel_hi:[0,0]
2993
+ ; GFX90A-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[6:7] op_sel:[1,0]
2994
2994
; GFX90A-NEXT: global_store_dwordx2 v8, v[0:1], s[16:17]
2995
2995
; GFX90A-NEXT: s_waitcnt vmcnt(0)
2996
2996
; GFX90A-NEXT: s_setpc_b64 s[30:31]
@@ -3006,7 +3006,7 @@ define void @v_shuffle_v2f32_v4f32__3_6(ptr addrspace(1) inreg %ptr) {
3006
3006
; GFX940-NEXT: ; def v[4:7]
3007
3007
; GFX940-NEXT: ;;#ASMEND
3008
3008
; GFX940-NEXT: s_nop 0
3009
- ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[6:7] op_sel:[1,0] op_sel_hi:[0,0]
3009
+ ; GFX940-NEXT: v_pk_mov_b32 v[0:1], v[2:3], v[6:7] op_sel:[1,0]
3010
3010
; GFX940-NEXT: global_store_dwordx2 v8, v[0:1], s[0:1] sc0 sc1
3011
3011
; GFX940-NEXT: s_waitcnt vmcnt(0)
3012
3012
; GFX940-NEXT: s_setpc_b64 s[30:31]
0 commit comments