@@ -9,7 +9,7 @@ define void @gep_noflags_alloca(i32 %idx, i32 %val) #0 {
9
9
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
10
10
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 2, v0
11
11
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
12
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
12
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
13
13
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
14
14
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
15
15
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -36,7 +36,7 @@ define void @gep_inbounds_alloca(i32 %idx, i32 %val) #0 {
36
36
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
37
37
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 2, v0
38
38
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
39
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
39
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
40
40
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
41
41
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
42
42
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -63,7 +63,7 @@ define void @gep_nuw_alloca(i32 %idx, i32 %val) #0 {
63
63
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
64
64
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 2, v0
65
65
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
66
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
66
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
67
67
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
68
68
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
69
69
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -90,7 +90,7 @@ define void @gep_nusw_alloca(i32 %idx, i32 %val) #0 {
90
90
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
91
91
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 2, v0
92
92
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
93
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
93
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
94
94
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
95
95
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
96
96
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -117,7 +117,7 @@ define void @gep_inbounds_nuw_alloca(i32 %idx, i32 %val) #0 {
117
117
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
118
118
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 2, v0
119
119
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
120
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
120
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
121
121
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
122
122
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
123
123
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -144,7 +144,7 @@ define void @gep_nusw_nuw_alloca(i32 %idx, i32 %val) #0 {
144
144
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
145
145
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 2, v0
146
146
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
147
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
147
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
148
148
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
149
149
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
150
150
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -172,7 +172,7 @@ define void @gep_inbounds_nuw_alloca_nonpow2_scale(i32 %idx, i32 %val) #0 {
172
172
; GFX8-NEXT: s_movk_i32 s4, 0x84
173
173
; GFX8-NEXT: v_mul_lo_u32 v0, v0, s4
174
174
; GFX8-NEXT: v_lshrrev_b32_e64 v2, 6, s32
175
- ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v2, v0
175
+ ; GFX8-NEXT: v_add_u32_e32 v0, vcc, v0, v2
176
176
; GFX8-NEXT: v_add_u32_e32 v0, vcc, 16, v0
177
177
; GFX8-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen
178
178
; GFX8-NEXT: s_waitcnt vmcnt(0)
@@ -184,7 +184,7 @@ define void @gep_inbounds_nuw_alloca_nonpow2_scale(i32 %idx, i32 %val) #0 {
184
184
; GFX9-NEXT: s_movk_i32 s4, 0x84
185
185
; GFX9-NEXT: v_mul_lo_u32 v0, v0, s4
186
186
; GFX9-NEXT: v_lshrrev_b32_e64 v2, 6, s32
187
- ; GFX9-NEXT: v_add_u32_e32 v0, v2, v0
187
+ ; GFX9-NEXT: v_add_u32_e32 v0, v0, v2
188
188
; GFX9-NEXT: buffer_store_dword v1, v0, s[0:3], 0 offen offset:16
189
189
; GFX9-NEXT: s_waitcnt vmcnt(0)
190
190
; GFX9-NEXT: s_setpc_b64 s[30:31]
0 commit comments