@@ -66,39 +66,38 @@ define amdgpu_vs void @test_3(i32 inreg %arg1, i32 inreg %arg2, ptr addrspace(8)
66
66
; CHECK-NEXT: s_mov_b32 s6, s4
67
67
; CHECK-NEXT: s_mov_b32 s5, s3
68
68
; CHECK-NEXT: s_mov_b32 s4, s2
69
- ; CHECK-NEXT: v_add_i32_e32 v0, vcc, 20 , v1
70
- ; CHECK-NEXT: v_add_i32_e32 v3, vcc, 16 , v1
71
- ; CHECK-NEXT: v_add_i32_e32 v4, vcc, 12 , v1
72
- ; CHECK-NEXT: v_add_i32_e32 v5 , vcc, 8 , v1
73
- ; CHECK-NEXT: v_add_i32_e32 v8 , vcc, 4 , v1
69
+ ; CHECK-NEXT: v_add_i32_e32 v0, vcc, 12 , v1
70
+ ; CHECK-NEXT: v_add_i32_e32 v3, vcc, 8 , v1
71
+ ; CHECK-NEXT: v_add_i32_e32 v4, vcc, 4 , v1
72
+ ; CHECK-NEXT: v_add_i32_e32 v6 , vcc, 20 , v1
73
+ ; CHECK-NEXT: v_add_i32_e32 v7 , vcc, 16 , v1
74
74
; CHECK-NEXT: v_mov_b32_e32 v9, s0
75
- ; CHECK-NEXT: v_add_i32_e32 v10, vcc, 20 , v2
76
- ; CHECK-NEXT: v_add_i32_e32 v11, vcc, 16 , v2
75
+ ; CHECK-NEXT: v_add_i32_e32 v10, vcc, 12 , v2
76
+ ; CHECK-NEXT: v_add_i32_e32 v11, vcc, 8 , v2
77
77
; CHECK-NEXT: s_mov_b32 m0, -1
78
- ; CHECK-NEXT: ds_read_b32 v7 , v3
79
- ; CHECK-NEXT: ds_read_b32 v6 , v4
80
- ; CHECK-NEXT: ds_read_b32 v5, v5
81
- ; CHECK-NEXT: ds_read_b32 v4, v8
82
- ; CHECK-NEXT: ds_read_b32 v8 , v0
78
+ ; CHECK-NEXT: ds_read_b32 v5 , v3
79
+ ; CHECK-NEXT: ds_read_b32 v4 , v4
80
+ ; CHECK-NEXT: ds_read_b32 v8, v6
81
+ ; CHECK-NEXT: ds_read_b32 v7, v7
82
+ ; CHECK-NEXT: ds_read_b32 v6 , v0
83
83
; CHECK-NEXT: ds_read_b32 v3, v1
84
- ; CHECK-NEXT: v_add_i32_e32 v1 , vcc, 12 , v2
85
- ; CHECK-NEXT: v_add_i32_e32 v12 , vcc, 8 , v2
86
- ; CHECK-NEXT: v_add_i32_e32 v13 , vcc, 4 , v2
84
+ ; CHECK-NEXT: v_add_i32_e32 v0 , vcc, 4 , v2
85
+ ; CHECK-NEXT: v_add_i32_e32 v1 , vcc, 20 , v2
86
+ ; CHECK-NEXT: v_add_i32_e32 v12 , vcc, 16 , v2
87
87
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
88
88
; CHECK-NEXT: tbuffer_store_format_xyzw v[3:6], v9, s[4:7], s1 format:[BUF_DATA_FORMAT_32_32_32,BUF_NUM_FORMAT_UINT] idxen offset:264 glc slc
89
89
; CHECK-NEXT: tbuffer_store_format_xy v[7:8], v9, s[4:7], s1 format:[BUF_DATA_FORMAT_INVALID,BUF_NUM_FORMAT_UINT] idxen offset:280 glc slc
90
- ; CHECK-NEXT: ds_read_b32 v0, v11
91
90
; CHECK-NEXT: s_waitcnt expcnt(1)
92
- ; CHECK-NEXT: ds_read_b32 v5, v1
93
- ; CHECK-NEXT: ds_read_b32 v4, v12
94
- ; CHECK-NEXT: ds_read_b32 v3, v13
91
+ ; CHECK-NEXT: ds_read_b32 v4, v11
92
+ ; CHECK-NEXT: ds_read_b32 v3, v0
93
+ ; CHECK-NEXT: ds_read_b32 v1, v1
94
+ ; CHECK-NEXT: ds_read_b32 v0, v12
95
+ ; CHECK-NEXT: ds_read_b32 v5, v10
95
96
; CHECK-NEXT: ds_read_b32 v2, v2
96
- ; CHECK-NEXT: ds_read_b32 v1, v10
97
- ; CHECK-NEXT: s_waitcnt lgkmcnt(5)
97
+ ; CHECK-NEXT: s_waitcnt lgkmcnt(2)
98
98
; CHECK-NEXT: exp mrt0 off, off, off, off
99
- ; CHECK-NEXT: s_waitcnt lgkmcnt(1)
100
- ; CHECK-NEXT: tbuffer_store_format_xyzw v[2:5], v9, s[4:7], s1 format:[BUF_DATA_FORMAT_32_32_32,BUF_NUM_FORMAT_UINT] idxen offset:240 glc slc
101
99
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
100
+ ; CHECK-NEXT: tbuffer_store_format_xyzw v[2:5], v9, s[4:7], s1 format:[BUF_DATA_FORMAT_32_32_32,BUF_NUM_FORMAT_UINT] idxen offset:240 glc slc
102
101
; CHECK-NEXT: tbuffer_store_format_xy v[0:1], v9, s[4:7], s1 format:[BUF_DATA_FORMAT_INVALID,BUF_NUM_FORMAT_UINT] idxen offset:256 glc slc
103
102
; CHECK-NEXT: s_endpgm
104
103
%load1 = load <6 x float >, ptr addrspace (3 ) %arg5 , align 4
0 commit comments