@@ -1323,9 +1323,9 @@ define amdgpu_kernel void @add_i32_varying(ptr addrspace(1) %out, ptr addrspace(
1323
1323
; GFX1032_DPP-NEXT: s_or_saveexec_b32 s0, -1
1324
1324
; GFX1032_DPP-NEXT: v_writelane_b32 v3, s1, 16
1325
1325
; GFX1032_DPP-NEXT: s_mov_b32 exec_lo, s0
1326
- ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
1327
1326
; GFX1032_DPP-NEXT: s_mov_b32 s0, s2
1328
1327
; GFX1032_DPP-NEXT: s_mov_b32 s2, -1
1328
+ ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
1329
1329
; GFX1032_DPP-NEXT: ; implicit-def: $vgpr0
1330
1330
; GFX1032_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
1331
1331
; GFX1032_DPP-NEXT: s_cbranch_execz .LBB2_2
@@ -1451,10 +1451,9 @@ define amdgpu_kernel void @add_i32_varying(ptr addrspace(1) %out, ptr addrspace(
1451
1451
; GFX1132_DPP-NEXT: s_or_saveexec_b32 s4, -1
1452
1452
; GFX1132_DPP-NEXT: v_writelane_b32 v3, s5, 16
1453
1453
; GFX1132_DPP-NEXT: s_mov_b32 exec_lo, s4
1454
- ; GFX1132_DPP-NEXT: s_delay_alu instid0(VALU_DEP_2)
1455
- ; GFX1132_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
1456
1454
; GFX1132_DPP-NEXT: s_mov_b32 s4, s6
1457
1455
; GFX1132_DPP-NEXT: s_mov_b32 s6, -1
1456
+ ; GFX1132_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
1458
1457
; GFX1132_DPP-NEXT: ; implicit-def: $vgpr0
1459
1458
; GFX1132_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
1460
1459
; GFX1132_DPP-NEXT: s_cbranch_execz .LBB2_2
@@ -1587,9 +1586,9 @@ define amdgpu_kernel void @add_i32_varying(ptr addrspace(1) %out, ptr addrspace(
1587
1586
; GFX1232_DPP-NEXT: v_writelane_b32 v3, s5, 16
1588
1587
; GFX1232_DPP-NEXT: s_wait_alu 0xfffe
1589
1588
; GFX1232_DPP-NEXT: s_mov_b32 exec_lo, s4
1590
- ; GFX1232_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
1591
1589
; GFX1232_DPP-NEXT: s_mov_b32 s4, s6
1592
1590
; GFX1232_DPP-NEXT: s_mov_b32 s6, -1
1591
+ ; GFX1232_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
1593
1592
; GFX1232_DPP-NEXT: ; implicit-def: $vgpr0
1594
1593
; GFX1232_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
1595
1594
; GFX1232_DPP-NEXT: s_cbranch_execz .LBB2_2
@@ -3228,8 +3227,8 @@ define amdgpu_kernel void @add_i64_varying(ptr addrspace(1) %out, ptr addrspace(
3228
3227
; GFX1032_DPP-NEXT: v_writelane_b32 v2, s8, 16
3229
3228
; GFX1032_DPP-NEXT: v_writelane_b32 v1, s3, 16
3230
3229
; GFX1032_DPP-NEXT: s_mov_b32 exec_lo, s2
3231
- ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
3232
3230
; GFX1032_DPP-NEXT: s_mov_b32 s2, -1
3231
+ ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
3233
3232
; GFX1032_DPP-NEXT: ; implicit-def: $vgpr9_vgpr10
3234
3233
; GFX1032_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
3235
3234
; GFX1032_DPP-NEXT: s_cbranch_execz .LBB5_2
@@ -4991,9 +4990,9 @@ define amdgpu_kernel void @sub_i32_varying(ptr addrspace(1) %out, ptr addrspace(
4991
4990
; GFX1032_DPP-NEXT: s_or_saveexec_b32 s0, -1
4992
4991
; GFX1032_DPP-NEXT: v_writelane_b32 v3, s1, 16
4993
4992
; GFX1032_DPP-NEXT: s_mov_b32 exec_lo, s0
4994
- ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
4995
4993
; GFX1032_DPP-NEXT: s_mov_b32 s0, s2
4996
4994
; GFX1032_DPP-NEXT: s_mov_b32 s2, -1
4995
+ ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
4997
4996
; GFX1032_DPP-NEXT: ; implicit-def: $vgpr0
4998
4997
; GFX1032_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
4999
4998
; GFX1032_DPP-NEXT: s_cbranch_execz .LBB8_2
@@ -5119,10 +5118,9 @@ define amdgpu_kernel void @sub_i32_varying(ptr addrspace(1) %out, ptr addrspace(
5119
5118
; GFX1132_DPP-NEXT: s_or_saveexec_b32 s4, -1
5120
5119
; GFX1132_DPP-NEXT: v_writelane_b32 v3, s5, 16
5121
5120
; GFX1132_DPP-NEXT: s_mov_b32 exec_lo, s4
5122
- ; GFX1132_DPP-NEXT: s_delay_alu instid0(VALU_DEP_2)
5123
- ; GFX1132_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
5124
5121
; GFX1132_DPP-NEXT: s_mov_b32 s4, s6
5125
5122
; GFX1132_DPP-NEXT: s_mov_b32 s6, -1
5123
+ ; GFX1132_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
5126
5124
; GFX1132_DPP-NEXT: ; implicit-def: $vgpr0
5127
5125
; GFX1132_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
5128
5126
; GFX1132_DPP-NEXT: s_cbranch_execz .LBB8_2
@@ -5255,9 +5253,9 @@ define amdgpu_kernel void @sub_i32_varying(ptr addrspace(1) %out, ptr addrspace(
5255
5253
; GFX1232_DPP-NEXT: v_writelane_b32 v3, s5, 16
5256
5254
; GFX1232_DPP-NEXT: s_wait_alu 0xfffe
5257
5255
; GFX1232_DPP-NEXT: s_mov_b32 exec_lo, s4
5258
- ; GFX1232_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
5259
5256
; GFX1232_DPP-NEXT: s_mov_b32 s4, s6
5260
5257
; GFX1232_DPP-NEXT: s_mov_b32 s6, -1
5258
+ ; GFX1232_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
5261
5259
; GFX1232_DPP-NEXT: ; implicit-def: $vgpr0
5262
5260
; GFX1232_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
5263
5261
; GFX1232_DPP-NEXT: s_cbranch_execz .LBB8_2
@@ -6938,8 +6936,8 @@ define amdgpu_kernel void @sub_i64_varying(ptr addrspace(1) %out, ptr addrspace(
6938
6936
; GFX1032_DPP-NEXT: v_writelane_b32 v2, s8, 16
6939
6937
; GFX1032_DPP-NEXT: v_writelane_b32 v1, s3, 16
6940
6938
; GFX1032_DPP-NEXT: s_mov_b32 exec_lo, s2
6941
- ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
6942
6939
; GFX1032_DPP-NEXT: s_mov_b32 s2, -1
6940
+ ; GFX1032_DPP-NEXT: v_cmp_eq_u32_e32 vcc_lo, 0, v0
6943
6941
; GFX1032_DPP-NEXT: ; implicit-def: $vgpr9_vgpr10
6944
6942
; GFX1032_DPP-NEXT: s_and_saveexec_b32 s8, vcc_lo
6945
6943
; GFX1032_DPP-NEXT: s_cbranch_execz .LBB11_2
0 commit comments