@@ -248,24 +248,25 @@ body: |
248
248
249
249
; GFX7-LABEL: name: load_global_s64
250
250
; GFX7: liveins: $vgpr0_vgpr1
251
- ; GFX7: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
252
- ; GFX7: [[LOAD:%[0-9]+]]:vreg_64(s64) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
253
- ; GFX7: $vgpr0_vgpr1 = COPY [[LOAD]](s64)
251
+ ; GFX7: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
252
+ ; GFX7: [[FLAT_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = FLAT_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 8, addrspace 1)
253
+ ; GFX7: $vgpr0_vgpr1 = COPY [[FLAT_LOAD_DWORDX2_]]
254
254
; GFX8-LABEL: name: load_global_s64
255
255
; GFX8: liveins: $vgpr0_vgpr1
256
- ; GFX8: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
257
- ; GFX8: [[LOAD:%[0-9]+]]:vreg_64(s64) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
258
- ; GFX8: $vgpr0_vgpr1 = COPY [[LOAD]](s64)
256
+ ; GFX8: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
257
+ ; GFX8: [[FLAT_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = FLAT_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 8, addrspace 1)
258
+ ; GFX8: $vgpr0_vgpr1 = COPY [[FLAT_LOAD_DWORDX2_]]
259
259
; GFX9-LABEL: name: load_global_s64
260
260
; GFX9: liveins: $vgpr0_vgpr1
261
- ; GFX9: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
262
- ; GFX9: [[LOAD:%[0-9]+]]:vreg_64(s64) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
263
- ; GFX9: $vgpr0_vgpr1 = COPY [[LOAD]](s64)
261
+ ; GFX9: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
262
+ ; GFX9: [[GLOBAL_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = GLOBAL_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec :: (load 8, addrspace 1)
263
+ ; GFX9: $vgpr0_vgpr1 = COPY [[GLOBAL_LOAD_DWORDX2_]]
264
264
; GFX10-LABEL: name: load_global_s64
265
265
; GFX10: liveins: $vgpr0_vgpr1
266
- ; GFX10: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
267
- ; GFX10: [[LOAD:%[0-9]+]]:vreg_64(s64) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
268
- ; GFX10: $vgpr0_vgpr1 = COPY [[LOAD]](s64)
266
+ ; GFX10: $vcc_hi = IMPLICIT_DEF
267
+ ; GFX10: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
268
+ ; GFX10: [[GLOBAL_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = GLOBAL_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec :: (load 8, addrspace 1)
269
+ ; GFX10: $vgpr0_vgpr1 = COPY [[GLOBAL_LOAD_DWORDX2_]]
269
270
%0:vgpr(p1) = COPY $vgpr0_vgpr1
270
271
%1:vgpr(s64) = G_LOAD %0 :: (load 8, align 8, addrspace 1)
271
272
$vgpr0_vgpr1 = COPY %1
@@ -581,24 +582,25 @@ body: |
581
582
582
583
; GFX7-LABEL: name: load_global_v2s16
583
584
; GFX7: liveins: $vgpr0_vgpr1
584
- ; GFX7: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
585
- ; GFX7: [[LOAD:%[0-9]+]]:vgpr_32(<2 x s16>) = G_LOAD [[COPY]](p1) :: (load 4, addrspace 1)
586
- ; GFX7: $vgpr0 = COPY [[LOAD]](<2 x s16>)
585
+ ; GFX7: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
586
+ ; GFX7: [[FLAT_LOAD_DWORD:%[0-9]+]]:vgpr_32 = FLAT_LOAD_DWORD [[COPY]], 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 4, addrspace 1)
587
+ ; GFX7: $vgpr0 = COPY [[FLAT_LOAD_DWORD]]
587
588
; GFX8-LABEL: name: load_global_v2s16
588
589
; GFX8: liveins: $vgpr0_vgpr1
589
- ; GFX8: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
590
- ; GFX8: [[LOAD:%[0-9]+]]:vgpr_32(<2 x s16>) = G_LOAD [[COPY]](p1) :: (load 4, addrspace 1)
591
- ; GFX8: $vgpr0 = COPY [[LOAD]](<2 x s16>)
590
+ ; GFX8: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
591
+ ; GFX8: [[FLAT_LOAD_DWORD:%[0-9]+]]:vgpr_32 = FLAT_LOAD_DWORD [[COPY]], 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 4, addrspace 1)
592
+ ; GFX8: $vgpr0 = COPY [[FLAT_LOAD_DWORD]]
592
593
; GFX9-LABEL: name: load_global_v2s16
593
594
; GFX9: liveins: $vgpr0_vgpr1
594
- ; GFX9: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
595
- ; GFX9: [[LOAD:%[0-9]+]]:vgpr_32(<2 x s16>) = G_LOAD [[COPY]](p1) :: (load 4, addrspace 1)
596
- ; GFX9: $vgpr0 = COPY [[LOAD]](<2 x s16>)
595
+ ; GFX9: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
596
+ ; GFX9: [[GLOBAL_LOAD_DWORD:%[0-9]+]]:vgpr_32 = GLOBAL_LOAD_DWORD [[COPY]], 0, 0, 0, 0, implicit $exec :: (load 4, addrspace 1)
597
+ ; GFX9: $vgpr0 = COPY [[GLOBAL_LOAD_DWORD]]
597
598
; GFX10-LABEL: name: load_global_v2s16
598
599
; GFX10: liveins: $vgpr0_vgpr1
599
- ; GFX10: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
600
- ; GFX10: [[LOAD:%[0-9]+]]:vgpr_32(<2 x s16>) = G_LOAD [[COPY]](p1) :: (load 4, addrspace 1)
601
- ; GFX10: $vgpr0 = COPY [[LOAD]](<2 x s16>)
600
+ ; GFX10: $vcc_hi = IMPLICIT_DEF
601
+ ; GFX10: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
602
+ ; GFX10: [[GLOBAL_LOAD_DWORD:%[0-9]+]]:vgpr_32 = GLOBAL_LOAD_DWORD [[COPY]], 0, 0, 0, 0, implicit $exec :: (load 4, addrspace 1)
603
+ ; GFX10: $vgpr0 = COPY [[GLOBAL_LOAD_DWORD]]
602
604
%0:vgpr(p1) = COPY $vgpr0_vgpr1
603
605
%1:vgpr(<2 x s16>) = G_LOAD %0 :: (load 4, align 4, addrspace 1)
604
606
$vgpr0 = COPY %1
@@ -618,24 +620,25 @@ body: |
618
620
619
621
; GFX7-LABEL: name: load_global_v4s16
620
622
; GFX7: liveins: $vgpr0_vgpr1
621
- ; GFX7: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
622
- ; GFX7: [[LOAD:%[0-9]+]]:vreg_64(<4 x s16>) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
623
- ; GFX7: $vgpr0_vgpr1 = COPY [[LOAD]](<4 x s16>)
623
+ ; GFX7: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
624
+ ; GFX7: [[FLAT_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = FLAT_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 8, addrspace 1)
625
+ ; GFX7: $vgpr0_vgpr1 = COPY [[FLAT_LOAD_DWORDX2_]]
624
626
; GFX8-LABEL: name: load_global_v4s16
625
627
; GFX8: liveins: $vgpr0_vgpr1
626
- ; GFX8: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
627
- ; GFX8: [[LOAD:%[0-9]+]]:vreg_64(<4 x s16>) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
628
- ; GFX8: $vgpr0_vgpr1 = COPY [[LOAD]](<4 x s16>)
628
+ ; GFX8: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
629
+ ; GFX8: [[FLAT_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = FLAT_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 8, addrspace 1)
630
+ ; GFX8: $vgpr0_vgpr1 = COPY [[FLAT_LOAD_DWORDX2_]]
629
631
; GFX9-LABEL: name: load_global_v4s16
630
632
; GFX9: liveins: $vgpr0_vgpr1
631
- ; GFX9: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
632
- ; GFX9: [[LOAD:%[0-9]+]]:vreg_64(<4 x s16>) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
633
- ; GFX9: $vgpr0_vgpr1 = COPY [[LOAD]](<4 x s16>)
633
+ ; GFX9: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
634
+ ; GFX9: [[GLOBAL_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = GLOBAL_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec :: (load 8, addrspace 1)
635
+ ; GFX9: $vgpr0_vgpr1 = COPY [[GLOBAL_LOAD_DWORDX2_]]
634
636
; GFX10-LABEL: name: load_global_v4s16
635
637
; GFX10: liveins: $vgpr0_vgpr1
636
- ; GFX10: [[COPY:%[0-9]+]]:vgpr(p1) = COPY $vgpr0_vgpr1
637
- ; GFX10: [[LOAD:%[0-9]+]]:vreg_64(<4 x s16>) = G_LOAD [[COPY]](p1) :: (load 8, addrspace 1)
638
- ; GFX10: $vgpr0_vgpr1 = COPY [[LOAD]](<4 x s16>)
638
+ ; GFX10: $vcc_hi = IMPLICIT_DEF
639
+ ; GFX10: [[COPY:%[0-9]+]]:vreg_64 = COPY $vgpr0_vgpr1
640
+ ; GFX10: [[GLOBAL_LOAD_DWORDX2_:%[0-9]+]]:vreg_64 = GLOBAL_LOAD_DWORDX2 [[COPY]], 0, 0, 0, 0, implicit $exec :: (load 8, addrspace 1)
641
+ ; GFX10: $vgpr0_vgpr1 = COPY [[GLOBAL_LOAD_DWORDX2_]]
639
642
%0:vgpr(p1) = COPY $vgpr0_vgpr1
640
643
%1:vgpr(<4 x s16>) = G_LOAD %0 :: (load 8, align 8, addrspace 1)
641
644
$vgpr0_vgpr1 = COPY %1
0 commit comments