@@ -778,8 +778,8 @@ define amdgpu_kernel void @nested_if_else_if(ptr addrspace(1) nocapture %arg) {
778
778
; GCN-O0-NEXT: s_mov_b64 exec, s[0:1]
779
779
; GCN-O0-NEXT: s_cbranch_execz .LBB3_7
780
780
; GCN-O0-NEXT: ; %bb.3: ; %bb.inner.then
781
- ; GCN-O0-NEXT: s_waitcnt expcnt(1)
782
781
; GCN-O0-NEXT: buffer_load_dword v1, off, s[12:15], 0 offset:4 ; 4-byte Folded Reload
782
+ ; GCN-O0-NEXT: s_waitcnt expcnt(1)
783
783
; GCN-O0-NEXT: buffer_load_dword v2, off, s[12:15], 0 offset:8 ; 4-byte Folded Reload
784
784
; GCN-O0-NEXT: s_mov_b32 s0, 0xf000
785
785
; GCN-O0-NEXT: s_mov_b32 s2, 0
@@ -824,8 +824,8 @@ define amdgpu_kernel void @nested_if_else_if(ptr addrspace(1) nocapture %arg) {
824
824
; GCN-O0-NEXT: s_mov_b64 exec, s[0:1]
825
825
; GCN-O0-NEXT: s_cbranch_execz .LBB3_6
826
826
; GCN-O0-NEXT: ; %bb.5: ; %bb.inner.then2
827
- ; GCN-O0-NEXT: s_waitcnt expcnt(1)
828
827
; GCN-O0-NEXT: buffer_load_dword v1, off, s[12:15], 0 offset:4 ; 4-byte Folded Reload
828
+ ; GCN-O0-NEXT: s_waitcnt expcnt(1)
829
829
; GCN-O0-NEXT: buffer_load_dword v2, off, s[12:15], 0 offset:8 ; 4-byte Folded Reload
830
830
; GCN-O0-NEXT: s_mov_b32 s0, 0xf000
831
831
; GCN-O0-NEXT: s_mov_b32 s2, 0
@@ -1242,10 +1242,13 @@ define void @scc_liveness(i32 %arg) local_unnamed_addr #0 {
1242
1242
; GCN-O0-NEXT: buffer_load_dword v1, off, s[0:3], s32 offset:12 ; 4-byte Folded Reload
1243
1243
; GCN-O0-NEXT: buffer_load_dword v2, off, s[0:3], s32 offset:16 ; 4-byte Folded Reload
1244
1244
; GCN-O0-NEXT: buffer_load_dword v3, off, s[0:3], s32 offset:20 ; 4-byte Folded Reload
1245
- ; GCN-O0-NEXT: s_waitcnt vmcnt(0)
1245
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1246
1246
; GCN-O0-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:40 ; 4-byte Folded Spill
1247
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1247
1248
; GCN-O0-NEXT: buffer_store_dword v1, off, s[0:3], s32 offset:44 ; 4-byte Folded Spill
1249
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1248
1250
; GCN-O0-NEXT: buffer_store_dword v2, off, s[0:3], s32 offset:48 ; 4-byte Folded Spill
1251
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1249
1252
; GCN-O0-NEXT: buffer_store_dword v3, off, s[0:3], s32 offset:52 ; 4-byte Folded Spill
1250
1253
; GCN-O0-NEXT: s_branch .LBB5_7
1251
1254
; GCN-O0-NEXT: .LBB5_6: ; %Flow
@@ -1263,10 +1266,13 @@ define void @scc_liveness(i32 %arg) local_unnamed_addr #0 {
1263
1266
; GCN-O0-NEXT: buffer_load_dword v1, off, s[0:3], s32 offset:28 ; 4-byte Folded Reload
1264
1267
; GCN-O0-NEXT: buffer_load_dword v2, off, s[0:3], s32 offset:32 ; 4-byte Folded Reload
1265
1268
; GCN-O0-NEXT: buffer_load_dword v3, off, s[0:3], s32 offset:36 ; 4-byte Folded Reload
1266
- ; GCN-O0-NEXT: s_waitcnt vmcnt(0)
1269
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1267
1270
; GCN-O0-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:8 ; 4-byte Folded Spill
1271
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1268
1272
; GCN-O0-NEXT: buffer_store_dword v1, off, s[0:3], s32 offset:12 ; 4-byte Folded Spill
1273
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1269
1274
; GCN-O0-NEXT: buffer_store_dword v2, off, s[0:3], s32 offset:16 ; 4-byte Folded Spill
1275
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(3)
1270
1276
; GCN-O0-NEXT: buffer_store_dword v3, off, s[0:3], s32 offset:20 ; 4-byte Folded Spill
1271
1277
; GCN-O0-NEXT: s_branch .LBB5_5
1272
1278
; GCN-O0-NEXT: .LBB5_7: ; %bb10
@@ -1336,10 +1342,13 @@ define void @scc_liveness(i32 %arg) local_unnamed_addr #0 {
1336
1342
; GCN-O0-NEXT: s_or_saveexec_b64 s[14:15], -1
1337
1343
; GCN-O0-NEXT: buffer_store_dword v4, off, s[0:3], s32 ; 4-byte Folded Spill
1338
1344
; GCN-O0-NEXT: s_mov_b64 exec, s[14:15]
1339
- ; GCN-O0-NEXT: s_waitcnt vmcnt(1)
1345
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(4)
1340
1346
; GCN-O0-NEXT: buffer_store_dword v0, off, s[0:3], s32 offset:56 ; 4-byte Folded Spill
1347
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(4)
1341
1348
; GCN-O0-NEXT: buffer_store_dword v1, off, s[0:3], s32 offset:60 ; 4-byte Folded Spill
1349
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(4)
1342
1350
; GCN-O0-NEXT: buffer_store_dword v2, off, s[0:3], s32 offset:64 ; 4-byte Folded Spill
1351
+ ; GCN-O0-NEXT: s_waitcnt vmcnt(4)
1343
1352
; GCN-O0-NEXT: buffer_store_dword v3, off, s[0:3], s32 offset:68 ; 4-byte Folded Spill
1344
1353
; GCN-O0-NEXT: s_andn2_b64 exec, exec, s[4:5]
1345
1354
; GCN-O0-NEXT: s_cbranch_execnz .LBB5_1
@@ -1356,9 +1365,11 @@ define void @scc_liveness(i32 %arg) local_unnamed_addr #0 {
1356
1365
; GCN-O0-NEXT: s_or_saveexec_b64 s[14:15], -1
1357
1366
; GCN-O0-NEXT: buffer_load_dword v0, off, s[0:3], s32 ; 4-byte Folded Reload
1358
1367
; GCN-O0-NEXT: s_mov_b64 exec, s[14:15]
1359
- ; GCN-O0-NEXT: s_waitcnt expcnt(0)
1368
+ ; GCN-O0-NEXT: s_waitcnt expcnt(2)
1360
1369
; GCN-O0-NEXT: buffer_load_dword v1, off, s[0:3], s32 offset:56 ; 4-byte Folded Reload
1370
+ ; GCN-O0-NEXT: s_waitcnt expcnt(1)
1361
1371
; GCN-O0-NEXT: buffer_load_dword v2, off, s[0:3], s32 offset:60 ; 4-byte Folded Reload
1372
+ ; GCN-O0-NEXT: s_waitcnt expcnt(0)
1362
1373
; GCN-O0-NEXT: buffer_load_dword v3, off, s[0:3], s32 offset:64 ; 4-byte Folded Reload
1363
1374
; GCN-O0-NEXT: buffer_load_dword v4, off, s[0:3], s32 offset:68 ; 4-byte Folded Reload
1364
1375
; GCN-O0-NEXT: s_waitcnt vmcnt(0)
0 commit comments