@@ -221,15 +221,15 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
221
221
; GFX906-NEXT: ; def s29
222
222
; GFX906-NEXT: ;;#ASMEND
223
223
; GFX906-NEXT: buffer_load_dword v31, off, s[0:3], s33 offset:4 ; 4-byte Folded Reload
224
- ; GFX906-NEXT: v_writelane_b32 v40, s21, 24
225
- ; GFX906-NEXT: v_writelane_b32 v40, s22, 25
226
- ; GFX906-NEXT: v_writelane_b32 v40, s23, 26
227
- ; GFX906-NEXT: v_writelane_b32 v40, s24, 27
228
- ; GFX906-NEXT: v_writelane_b32 v40, s25, 28
229
- ; GFX906-NEXT: v_writelane_b32 v40, s26, 29
230
- ; GFX906-NEXT: v_writelane_b32 v40, s27, 30
231
- ; GFX906-NEXT: v_writelane_b32 v40, s28, 31
232
- ; GFX906-NEXT: v_writelane_b32 v40, s29, 32
224
+ ; GFX906-NEXT: v_writelane_b32 v40, s21, 12
225
+ ; GFX906-NEXT: v_writelane_b32 v40, s22, 13
226
+ ; GFX906-NEXT: v_writelane_b32 v40, s23, 14
227
+ ; GFX906-NEXT: v_writelane_b32 v40, s24, 15
228
+ ; GFX906-NEXT: v_writelane_b32 v40, s25, 16
229
+ ; GFX906-NEXT: v_writelane_b32 v40, s26, 17
230
+ ; GFX906-NEXT: v_writelane_b32 v40, s27, 18
231
+ ; GFX906-NEXT: v_writelane_b32 v40, s28, 19
232
+ ; GFX906-NEXT: v_writelane_b32 v40, s29, 20
233
233
; GFX906-NEXT: v_readlane_b32 s4, v40, 10
234
234
; GFX906-NEXT: v_readlane_b32 s6, v40, 0
235
235
; GFX906-NEXT: v_readlane_b32 s8, v40, 8
@@ -249,39 +249,39 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
249
249
; GFX906-NEXT: s_swappc_b64 s[30:31], s[16:17]
250
250
; GFX906-NEXT: s_or_saveexec_b64 s[34:35], -1
251
251
; GFX906-NEXT: s_mov_b64 exec, s[34:35]
252
- ; GFX906-NEXT: v_readlane_b32 s21, v40, 24
252
+ ; GFX906-NEXT: v_readlane_b32 s21, v40, 12
253
253
; GFX906-NEXT: ;;#ASMSTART
254
254
; GFX906-NEXT: ; use s21
255
255
; GFX906-NEXT: ;;#ASMEND
256
- ; GFX906-NEXT: v_readlane_b32 s22, v40, 25
256
+ ; GFX906-NEXT: v_readlane_b32 s22, v40, 13
257
257
; GFX906-NEXT: ;;#ASMSTART
258
258
; GFX906-NEXT: ; use s22
259
259
; GFX906-NEXT: ;;#ASMEND
260
- ; GFX906-NEXT: v_readlane_b32 s23, v40, 26
260
+ ; GFX906-NEXT: v_readlane_b32 s23, v40, 14
261
261
; GFX906-NEXT: ;;#ASMSTART
262
262
; GFX906-NEXT: ; use s23
263
263
; GFX906-NEXT: ;;#ASMEND
264
- ; GFX906-NEXT: v_readlane_b32 s24, v40, 27
264
+ ; GFX906-NEXT: v_readlane_b32 s24, v40, 15
265
265
; GFX906-NEXT: ;;#ASMSTART
266
266
; GFX906-NEXT: ; use s24
267
267
; GFX906-NEXT: ;;#ASMEND
268
- ; GFX906-NEXT: v_readlane_b32 s25, v40, 28
268
+ ; GFX906-NEXT: v_readlane_b32 s25, v40, 16
269
269
; GFX906-NEXT: ;;#ASMSTART
270
270
; GFX906-NEXT: ; use s25
271
271
; GFX906-NEXT: ;;#ASMEND
272
- ; GFX906-NEXT: v_readlane_b32 s26, v40, 29
272
+ ; GFX906-NEXT: v_readlane_b32 s26, v40, 17
273
273
; GFX906-NEXT: ;;#ASMSTART
274
274
; GFX906-NEXT: ; use s26
275
275
; GFX906-NEXT: ;;#ASMEND
276
- ; GFX906-NEXT: v_readlane_b32 s27, v40, 30
276
+ ; GFX906-NEXT: v_readlane_b32 s27, v40, 18
277
277
; GFX906-NEXT: ;;#ASMSTART
278
278
; GFX906-NEXT: ; use s27
279
279
; GFX906-NEXT: ;;#ASMEND
280
- ; GFX906-NEXT: v_readlane_b32 s28, v40, 31
280
+ ; GFX906-NEXT: v_readlane_b32 s28, v40, 19
281
281
; GFX906-NEXT: ;;#ASMSTART
282
282
; GFX906-NEXT: ; use s28
283
283
; GFX906-NEXT: ;;#ASMEND
284
- ; GFX906-NEXT: v_readlane_b32 s29, v40, 32
284
+ ; GFX906-NEXT: v_readlane_b32 s29, v40, 20
285
285
; GFX906-NEXT: ;;#ASMSTART
286
286
; GFX906-NEXT: ; use s29
287
287
; GFX906-NEXT: ;;#ASMEND
@@ -602,15 +602,15 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
602
602
; GFX908-NEXT: ; def s29
603
603
; GFX908-NEXT: ;;#ASMEND
604
604
; GFX908-NEXT: buffer_load_dword v31, off, s[0:3], s33 offset:8 ; 4-byte Folded Reload
605
- ; GFX908-NEXT: v_writelane_b32 v40, s21, 24
606
- ; GFX908-NEXT: v_writelane_b32 v40, s22, 25
607
- ; GFX908-NEXT: v_writelane_b32 v40, s23, 26
608
- ; GFX908-NEXT: v_writelane_b32 v40, s24, 27
609
- ; GFX908-NEXT: v_writelane_b32 v40, s25, 28
610
- ; GFX908-NEXT: v_writelane_b32 v40, s26, 29
611
- ; GFX908-NEXT: v_writelane_b32 v40, s27, 30
612
- ; GFX908-NEXT: v_writelane_b32 v40, s28, 31
613
- ; GFX908-NEXT: v_writelane_b32 v40, s29, 32
605
+ ; GFX908-NEXT: v_writelane_b32 v40, s21, 12
606
+ ; GFX908-NEXT: v_writelane_b32 v40, s22, 13
607
+ ; GFX908-NEXT: v_writelane_b32 v40, s23, 14
608
+ ; GFX908-NEXT: v_writelane_b32 v40, s24, 15
609
+ ; GFX908-NEXT: v_writelane_b32 v40, s25, 16
610
+ ; GFX908-NEXT: v_writelane_b32 v40, s26, 17
611
+ ; GFX908-NEXT: v_writelane_b32 v40, s27, 18
612
+ ; GFX908-NEXT: v_writelane_b32 v40, s28, 19
613
+ ; GFX908-NEXT: v_writelane_b32 v40, s29, 20
614
614
; GFX908-NEXT: v_readlane_b32 s4, v40, 10
615
615
; GFX908-NEXT: v_readlane_b32 s6, v40, 0
616
616
; GFX908-NEXT: v_readlane_b32 s8, v40, 8
@@ -630,39 +630,39 @@ define void @preserve_wwm_copy_dstreg(ptr %parg0, ptr %parg1, ptr %parg2) #0 {
630
630
; GFX908-NEXT: s_swappc_b64 s[30:31], s[16:17]
631
631
; GFX908-NEXT: s_or_saveexec_b64 s[34:35], -1
632
632
; GFX908-NEXT: s_mov_b64 exec, s[34:35]
633
- ; GFX908-NEXT: v_readlane_b32 s21, v40, 24
633
+ ; GFX908-NEXT: v_readlane_b32 s21, v40, 12
634
634
; GFX908-NEXT: ;;#ASMSTART
635
635
; GFX908-NEXT: ; use s21
636
636
; GFX908-NEXT: ;;#ASMEND
637
- ; GFX908-NEXT: v_readlane_b32 s22, v40, 25
637
+ ; GFX908-NEXT: v_readlane_b32 s22, v40, 13
638
638
; GFX908-NEXT: ;;#ASMSTART
639
639
; GFX908-NEXT: ; use s22
640
640
; GFX908-NEXT: ;;#ASMEND
641
- ; GFX908-NEXT: v_readlane_b32 s23, v40, 26
641
+ ; GFX908-NEXT: v_readlane_b32 s23, v40, 14
642
642
; GFX908-NEXT: ;;#ASMSTART
643
643
; GFX908-NEXT: ; use s23
644
644
; GFX908-NEXT: ;;#ASMEND
645
- ; GFX908-NEXT: v_readlane_b32 s24, v40, 27
645
+ ; GFX908-NEXT: v_readlane_b32 s24, v40, 15
646
646
; GFX908-NEXT: ;;#ASMSTART
647
647
; GFX908-NEXT: ; use s24
648
648
; GFX908-NEXT: ;;#ASMEND
649
- ; GFX908-NEXT: v_readlane_b32 s25, v40, 28
649
+ ; GFX908-NEXT: v_readlane_b32 s25, v40, 16
650
650
; GFX908-NEXT: ;;#ASMSTART
651
651
; GFX908-NEXT: ; use s25
652
652
; GFX908-NEXT: ;;#ASMEND
653
- ; GFX908-NEXT: v_readlane_b32 s26, v40, 29
653
+ ; GFX908-NEXT: v_readlane_b32 s26, v40, 17
654
654
; GFX908-NEXT: ;;#ASMSTART
655
655
; GFX908-NEXT: ; use s26
656
656
; GFX908-NEXT: ;;#ASMEND
657
- ; GFX908-NEXT: v_readlane_b32 s27, v40, 30
657
+ ; GFX908-NEXT: v_readlane_b32 s27, v40, 18
658
658
; GFX908-NEXT: ;;#ASMSTART
659
659
; GFX908-NEXT: ; use s27
660
660
; GFX908-NEXT: ;;#ASMEND
661
- ; GFX908-NEXT: v_readlane_b32 s28, v40, 31
661
+ ; GFX908-NEXT: v_readlane_b32 s28, v40, 19
662
662
; GFX908-NEXT: ;;#ASMSTART
663
663
; GFX908-NEXT: ; use s28
664
664
; GFX908-NEXT: ;;#ASMEND
665
- ; GFX908-NEXT: v_readlane_b32 s29, v40, 32
665
+ ; GFX908-NEXT: v_readlane_b32 s29, v40, 20
666
666
; GFX908-NEXT: ;;#ASMSTART
667
667
; GFX908-NEXT: ; use s29
668
668
; GFX908-NEXT: ;;#ASMEND
0 commit comments