Skip to content

Commit 6ca7b67

Browse files
author
git apple-llvm automerger
committed
Merge commit '2c37833931ee' from llvm.org/master into apple/master
2 parents fa3d14a + 2c37833 commit 6ca7b67

File tree

5 files changed

+9
-12
lines changed

5 files changed

+9
-12
lines changed

llvm/test/CodeGen/AMDGPU/fexp.ll

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,3 @@
1-
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
21
;RUN: llc -mtriple=amdgcn-- < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=SI %s
32
;RUN: llc -mtriple=amdgcn-- -mcpu=fiji < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=VI %s
43
;RUN: llc -mtriple=amdgcn-- -mcpu=gfx900 < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=GFX9 %s

llvm/test/CodeGen/AMDGPU/load-lo16.ll

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -994,13 +994,14 @@ define void @load_flat_lo_v2f16_reghi_vreg(half* %in, i32 %reg) #0 {
994994
; GFX803: ; %bb.0: ; %entry
995995
; GFX803-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
996996
; GFX803-NEXT: flat_load_ushort v0, v[0:1]
997-
; FIXME: and should be removable
998997
; GFX803-NEXT: v_and_b32_e32 v1, 0xffff0000, v2
999998
; GFX803-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1000999
; GFX803-NEXT: v_or_b32_e32 v0, v0, v1
10011000
; GFX803-NEXT: flat_store_dword v[0:1], v0
10021001
; GFX803-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
10031002
; GFX803-NEXT: s_setpc_b64 s[30:31]
1003+
1004+
; FIXME: the and above should be removable
10041005
entry:
10051006
%reg.bc = bitcast i32 %reg to <2 x half>
10061007
%load = load half, half* %in

llvm/test/CodeGen/AMDGPU/split-arg-dbg-value.ll

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
define hidden <4 x float> @split_v4f32_arg(<4 x float> returned %arg) local_unnamed_addr #0 !dbg !7 {
66
; GCN-LABEL: split_v4f32_arg:
77
; GCN: .Lfunc_begin0:
8-
; GCN-NEXT: .file 0
8+
; GCN-NEXT: .file 0 "/tmp/dbg.cl" md5 0x0f834f91e91489a5ff6308040ddbd175
99
; GCN-NEXT: .loc 0 3 0 ; /tmp/dbg.cl:3:0
1010
; GCN-NEXT: ; %bb.0:
1111
; GCN-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)

llvm/test/CodeGen/AMDGPU/stack-realign-kernel.ll

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,3 @@
1-
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
21
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=fiji < %s | FileCheck -check-prefix=VI %s
32
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 < %s | FileCheck -check-prefix=GFX9 %s
43

llvm/test/CodeGen/AMDGPU/subreg-coalescer-undef-use.ll

Lines changed: 6 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -13,18 +13,10 @@ define amdgpu_kernel void @foobar(float %a0, float %a1, float addrspace(1)* %out
1313
; CHECK-NEXT: v_cmp_eq_u32_e32 vcc, 0, v0
1414
; CHECK-NEXT: s_mov_b32 s2, -1
1515
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
16-
17-
; FIXME: The change related to the fact that
18-
; DetectDeadLanes pass hit "Copy across incompatible class" SGPR -> VGPR in analysis
19-
; and hence it cannot derive the fact that the vector element is unused.
20-
; Such a copies appear because the float4 vectors and their elements in the test are uniform
21-
; but the PHI node in "ife" block is divergent because of the CF dependency (divergent branch in bb0)
22-
2316
; CHECK-NEXT: v_mov_b32_e32 v0, s4
2417
; CHECK-NEXT: v_mov_b32_e32 v1, s5
2518
; CHECK-NEXT: v_mov_b32_e32 v2, s6
2619
; CHECK-NEXT: v_mov_b32_e32 v3, s7
27-
2820
; CHECK-NEXT: s_and_saveexec_b64 s[6:7], vcc
2921
; CHECK-NEXT: ; mask branch BB0_2
3022
; CHECK-NEXT: BB0_1: ; %ift
@@ -38,6 +30,12 @@ define amdgpu_kernel void @foobar(float %a0, float %a1, float addrspace(1)* %out
3830
; CHECK-NEXT: s_mov_b32 s3, 0xf000
3931
; CHECK-NEXT: buffer_store_dword v1, off, s[0:3], 0
4032
; CHECK-NEXT: s_endpgm
33+
34+
; FIXME: The change related to the fact that
35+
; DetectDeadLanes pass hit "Copy across incompatible class" SGPR -> VGPR in analysis
36+
; and hence it cannot derive the fact that the vector element in the "ift" block is unused.
37+
; Such a copies appear because the float4 vectors and their elements in the test are uniform
38+
; but the PHI node in "ife" block is divergent because of the CF dependency (divergent branch in bb0)
4139
entry:
4240
%v0 = insertelement <4 x float> undef, float %a0, i32 0
4341
%tid = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0) #0

0 commit comments

Comments
 (0)