@@ -13,9 +13,8 @@ define amdgpu_kernel void @global_load_tr_b64(ptr addrspace(1) %addr, ptr addrsp
13
13
; GFX12-SDAG-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
14
14
; GFX12-SDAG-W32-NEXT: v_mov_b32_e32 v2, 0
15
15
; GFX12-SDAG-W32-NEXT: s_wait_kmcnt 0x0
16
- ; GFX12-SDAG-W32-NEXT: global_load_tr_b64 v[0:1], v2, s[0:1] offset:32 th:TH_LOAD_NT
16
+ ; GFX12-SDAG-W32-NEXT: global_load_tr_b64 v[0:1], v2, s[0:1] offset:32
17
17
; GFX12-SDAG-W32-NEXT: s_wait_loadcnt 0x0
18
- ; GFX12-SDAG-W32-NEXT: global_inv scope:SCOPE_SYS
19
18
; GFX12-SDAG-W32-NEXT: global_store_b64 v2, v[0:1], s[2:3]
20
19
; GFX12-SDAG-W32-NEXT: s_nop 0
21
20
; GFX12-SDAG-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -26,9 +25,8 @@ define amdgpu_kernel void @global_load_tr_b64(ptr addrspace(1) %addr, ptr addrsp
26
25
; GFX12-GISEL-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
27
26
; GFX12-GISEL-W32-NEXT: v_mov_b32_e32 v2, 0
28
27
; GFX12-GISEL-W32-NEXT: s_wait_kmcnt 0x0
29
- ; GFX12-GISEL-W32-NEXT: global_load_tr_b64 v[0:1], v2, s[0:1] offset:32 th:TH_LOAD_NT
28
+ ; GFX12-GISEL-W32-NEXT: global_load_tr_b64 v[0:1], v2, s[0:1] offset:32
30
29
; GFX12-GISEL-W32-NEXT: s_wait_loadcnt 0x0
31
- ; GFX12-GISEL-W32-NEXT: global_inv scope:SCOPE_SYS
32
30
; GFX12-GISEL-W32-NEXT: global_store_b64 v2, v[0:1], s[2:3]
33
31
; GFX12-GISEL-W32-NEXT: s_nop 0
34
32
; GFX12-GISEL-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -46,9 +44,8 @@ define amdgpu_kernel void @global_load_tr_b128_i16(ptr addrspace(1) %addr, ptr a
46
44
; GFX12-SDAG-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
47
45
; GFX12-SDAG-W32-NEXT: v_mov_b32_e32 v4, 0
48
46
; GFX12-SDAG-W32-NEXT: s_wait_kmcnt 0x0
49
- ; GFX12-SDAG-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32 th:TH_LOAD_NT
47
+ ; GFX12-SDAG-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32
50
48
; GFX12-SDAG-W32-NEXT: s_wait_loadcnt 0x0
51
- ; GFX12-SDAG-W32-NEXT: global_inv scope:SCOPE_SYS
52
49
; GFX12-SDAG-W32-NEXT: global_store_b128 v4, v[0:3], s[2:3]
53
50
; GFX12-SDAG-W32-NEXT: s_nop 0
54
51
; GFX12-SDAG-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -59,9 +56,8 @@ define amdgpu_kernel void @global_load_tr_b128_i16(ptr addrspace(1) %addr, ptr a
59
56
; GFX12-GISEL-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
60
57
; GFX12-GISEL-W32-NEXT: v_mov_b32_e32 v4, 0
61
58
; GFX12-GISEL-W32-NEXT: s_wait_kmcnt 0x0
62
- ; GFX12-GISEL-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32 th:TH_LOAD_NT
59
+ ; GFX12-GISEL-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32
63
60
; GFX12-GISEL-W32-NEXT: s_wait_loadcnt 0x0
64
- ; GFX12-GISEL-W32-NEXT: global_inv scope:SCOPE_SYS
65
61
; GFX12-GISEL-W32-NEXT: global_store_b128 v4, v[0:3], s[2:3]
66
62
; GFX12-GISEL-W32-NEXT: s_nop 0
67
63
; GFX12-GISEL-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -79,9 +75,8 @@ define amdgpu_kernel void @global_load_tr_b128_half(ptr addrspace(1) %addr, ptr
79
75
; GFX12-SDAG-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
80
76
; GFX12-SDAG-W32-NEXT: v_mov_b32_e32 v4, 0
81
77
; GFX12-SDAG-W32-NEXT: s_wait_kmcnt 0x0
82
- ; GFX12-SDAG-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32 th:TH_LOAD_NT
78
+ ; GFX12-SDAG-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32
83
79
; GFX12-SDAG-W32-NEXT: s_wait_loadcnt 0x0
84
- ; GFX12-SDAG-W32-NEXT: global_inv scope:SCOPE_SYS
85
80
; GFX12-SDAG-W32-NEXT: global_store_b128 v4, v[0:3], s[2:3]
86
81
; GFX12-SDAG-W32-NEXT: s_nop 0
87
82
; GFX12-SDAG-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -92,9 +87,8 @@ define amdgpu_kernel void @global_load_tr_b128_half(ptr addrspace(1) %addr, ptr
92
87
; GFX12-GISEL-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
93
88
; GFX12-GISEL-W32-NEXT: v_mov_b32_e32 v4, 0
94
89
; GFX12-GISEL-W32-NEXT: s_wait_kmcnt 0x0
95
- ; GFX12-GISEL-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32 th:TH_LOAD_NT
90
+ ; GFX12-GISEL-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32
96
91
; GFX12-GISEL-W32-NEXT: s_wait_loadcnt 0x0
97
- ; GFX12-GISEL-W32-NEXT: global_inv scope:SCOPE_SYS
98
92
; GFX12-GISEL-W32-NEXT: global_store_b128 v4, v[0:3], s[2:3]
99
93
; GFX12-GISEL-W32-NEXT: s_nop 0
100
94
; GFX12-GISEL-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -112,9 +106,8 @@ define amdgpu_kernel void @global_load_tr_b128_bfloat(ptr addrspace(1) %addr, pt
112
106
; GFX12-SDAG-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
113
107
; GFX12-SDAG-W32-NEXT: v_mov_b32_e32 v4, 0
114
108
; GFX12-SDAG-W32-NEXT: s_wait_kmcnt 0x0
115
- ; GFX12-SDAG-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32 th:TH_LOAD_NT
109
+ ; GFX12-SDAG-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32
116
110
; GFX12-SDAG-W32-NEXT: s_wait_loadcnt 0x0
117
- ; GFX12-SDAG-W32-NEXT: global_inv scope:SCOPE_SYS
118
111
; GFX12-SDAG-W32-NEXT: global_store_b128 v4, v[0:3], s[2:3]
119
112
; GFX12-SDAG-W32-NEXT: s_nop 0
120
113
; GFX12-SDAG-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
@@ -125,9 +118,8 @@ define amdgpu_kernel void @global_load_tr_b128_bfloat(ptr addrspace(1) %addr, pt
125
118
; GFX12-GISEL-W32-NEXT: s_load_b128 s[0:3], s[0:1], 0x24
126
119
; GFX12-GISEL-W32-NEXT: v_mov_b32_e32 v4, 0
127
120
; GFX12-GISEL-W32-NEXT: s_wait_kmcnt 0x0
128
- ; GFX12-GISEL-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32 th:TH_LOAD_NT
121
+ ; GFX12-GISEL-W32-NEXT: global_load_tr_b128 v[0:3], v4, s[0:1] offset:32
129
122
; GFX12-GISEL-W32-NEXT: s_wait_loadcnt 0x0
130
- ; GFX12-GISEL-W32-NEXT: global_inv scope:SCOPE_SYS
131
123
; GFX12-GISEL-W32-NEXT: global_store_b128 v4, v[0:3], s[2:3]
132
124
; GFX12-GISEL-W32-NEXT: s_nop 0
133
125
; GFX12-GISEL-W32-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
0 commit comments