Skip to content

Commit 72246b4

Browse files
committed
rebase to main
1 parent 6dee075 commit 72246b4

File tree

255 files changed

+61098
-49795
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

255 files changed

+61098
-49795
lines changed

llvm/test/CodeGen/AMDGPU/GlobalISel/addsubu64.ll

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,8 @@ define amdgpu_kernel void @s_add_u64(ptr addrspace(1) %out, i64 %a, i64 %b) {
66
; GFX11-LABEL: s_add_u64:
77
; GFX11: ; %bb.0: ; %entry
88
; GFX11-NEXT: s_clause 0x1
9-
; GFX11-NEXT: s_load_b128 s[4:7], s[0:1], 0x24
10-
; GFX11-NEXT: s_load_b64 s[0:1], s[0:1], 0x34
9+
; GFX11-NEXT: s_load_b128 s[4:7], s[2:3], 0x24
10+
; GFX11-NEXT: s_load_b64 s[0:1], s[2:3], 0x34
1111
; GFX11-NEXT: v_mov_b32_e32 v2, 0
1212
; GFX11-NEXT: s_waitcnt lgkmcnt(0)
1313
; GFX11-NEXT: s_add_u32 s0, s6, s0
@@ -22,8 +22,8 @@ define amdgpu_kernel void @s_add_u64(ptr addrspace(1) %out, i64 %a, i64 %b) {
2222
; GFX12-LABEL: s_add_u64:
2323
; GFX12: ; %bb.0: ; %entry
2424
; GFX12-NEXT: s_clause 0x1
25-
; GFX12-NEXT: s_load_b128 s[4:7], s[0:1], 0x24
26-
; GFX12-NEXT: s_load_b64 s[0:1], s[0:1], 0x34
25+
; GFX12-NEXT: s_load_b128 s[4:7], s[2:3], 0x24
26+
; GFX12-NEXT: s_load_b64 s[0:1], s[2:3], 0x34
2727
; GFX12-NEXT: v_mov_b32_e32 v2, 0
2828
; GFX12-NEXT: s_wait_kmcnt 0x0
2929
; GFX12-NEXT: s_add_nc_u64 s[0:1], s[6:7], s[0:1]
@@ -58,8 +58,8 @@ define amdgpu_kernel void @s_sub_u64(ptr addrspace(1) %out, i64 %a, i64 %b) {
5858
; GFX11-LABEL: s_sub_u64:
5959
; GFX11: ; %bb.0: ; %entry
6060
; GFX11-NEXT: s_clause 0x1
61-
; GFX11-NEXT: s_load_b128 s[4:7], s[0:1], 0x24
62-
; GFX11-NEXT: s_load_b64 s[0:1], s[0:1], 0x34
61+
; GFX11-NEXT: s_load_b128 s[4:7], s[2:3], 0x24
62+
; GFX11-NEXT: s_load_b64 s[0:1], s[2:3], 0x34
6363
; GFX11-NEXT: v_mov_b32_e32 v2, 0
6464
; GFX11-NEXT: s_waitcnt lgkmcnt(0)
6565
; GFX11-NEXT: s_sub_u32 s0, s6, s0
@@ -74,8 +74,8 @@ define amdgpu_kernel void @s_sub_u64(ptr addrspace(1) %out, i64 %a, i64 %b) {
7474
; GFX12-LABEL: s_sub_u64:
7575
; GFX12: ; %bb.0: ; %entry
7676
; GFX12-NEXT: s_clause 0x1
77-
; GFX12-NEXT: s_load_b128 s[4:7], s[0:1], 0x24
78-
; GFX12-NEXT: s_load_b64 s[0:1], s[0:1], 0x34
77+
; GFX12-NEXT: s_load_b128 s[4:7], s[2:3], 0x24
78+
; GFX12-NEXT: s_load_b64 s[0:1], s[2:3], 0x34
7979
; GFX12-NEXT: v_mov_b32_e32 v2, 0
8080
; GFX12-NEXT: s_wait_kmcnt 0x0
8181
; GFX12-NEXT: s_sub_nc_u64 s[0:1], s[6:7], s[0:1]

llvm/test/CodeGen/AMDGPU/GlobalISel/bool-legalization.ll

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -66,7 +66,7 @@ define amdgpu_ps i32 @select_sgpr_trunc_and_cond(i32 inreg %a.0, i32 inreg %a.1,
6666
define amdgpu_kernel void @sgpr_trunc_brcond(i32 %cond) {
6767
; WAVE64-LABEL: sgpr_trunc_brcond:
6868
; WAVE64: ; %bb.0: ; %entry
69-
; WAVE64-NEXT: s_load_dword s0, s[0:1], 0x24
69+
; WAVE64-NEXT: s_load_dword s0, s[2:3], 0x24
7070
; WAVE64-NEXT: s_waitcnt lgkmcnt(0)
7171
; WAVE64-NEXT: s_xor_b32 s0, s0, 1
7272
; WAVE64-NEXT: s_and_b32 s0, s0, 1
@@ -83,7 +83,7 @@ define amdgpu_kernel void @sgpr_trunc_brcond(i32 %cond) {
8383
;
8484
; WAVE32-LABEL: sgpr_trunc_brcond:
8585
; WAVE32: ; %bb.0: ; %entry
86-
; WAVE32-NEXT: s_load_dword s0, s[0:1], 0x24
86+
; WAVE32-NEXT: s_load_dword s0, s[2:3], 0x24
8787
; WAVE32-NEXT: s_waitcnt lgkmcnt(0)
8888
; WAVE32-NEXT: s_xor_b32 s0, s0, 1
8989
; WAVE32-NEXT: s_and_b32 s0, s0, 1
@@ -113,9 +113,9 @@ bb1:
113113
define amdgpu_kernel void @brcond_sgpr_trunc_and(i32 %cond0, i32 %cond1) {
114114
; WAVE64-LABEL: brcond_sgpr_trunc_and:
115115
; WAVE64: ; %bb.0: ; %entry
116-
; WAVE64-NEXT: s_load_dwordx2 s[2:3], s[0:1], 0x24
116+
; WAVE64-NEXT: s_load_dwordx2 s[0:1], s[2:3], 0x24
117117
; WAVE64-NEXT: s_waitcnt lgkmcnt(0)
118-
; WAVE64-NEXT: s_and_b32 s0, s2, s3
118+
; WAVE64-NEXT: s_and_b32 s0, s0, s1
119119
; WAVE64-NEXT: s_xor_b32 s0, s0, 1
120120
; WAVE64-NEXT: s_and_b32 s0, s0, 1
121121
; WAVE64-NEXT: s_cmp_lg_u32 s0, 0
@@ -131,7 +131,7 @@ define amdgpu_kernel void @brcond_sgpr_trunc_and(i32 %cond0, i32 %cond1) {
131131
;
132132
; WAVE32-LABEL: brcond_sgpr_trunc_and:
133133
; WAVE32: ; %bb.0: ; %entry
134-
; WAVE32-NEXT: s_load_dwordx2 s[0:1], s[0:1], 0x24
134+
; WAVE32-NEXT: s_load_dwordx2 s[0:1], s[2:3], 0x24
135135
; WAVE32-NEXT: s_waitcnt lgkmcnt(0)
136136
; WAVE32-NEXT: s_and_b32 s0, s0, s1
137137
; WAVE32-NEXT: s_xor_b32 s0, s0, 1

0 commit comments

Comments
 (0)