This commit fixes a missed opportunity in merging consecutive stores.
The code that searches for stores skipped the case of stores that
directly connect to the root. The comment above the implementation lists
this case but the code did not handle it. I found this pattern when
looking into the shared_ptr destructor. GCC generates the right
sequence. Here is a small repo:
int foo(int* buff) {
buff[0] = 0;
int x = buff[1];
buff[1] = 0;
return x;
}
Differential Revision: https://reviews.llvm.org/D116895
629 lines
22 KiB
LLVM
629 lines
22 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
|
|
; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | \
|
|
; RUN: FileCheck %s --check-prefix=LE-PAIRED
|
|
; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-linux-gnu \
|
|
; RUN: -mcpu=pwr10 -ppc-asm-full-reg-names \
|
|
; RUN: -ppc-vsr-nums-as-vr < %s | FileCheck %s --check-prefix=BE-PAIRED
|
|
; RUN: llc -verify-machineinstrs -mcpu=pwr9 -ppc-vsr-nums-as-vr \
|
|
; RUN: -ppc-asm-full-reg-names -mtriple=powerpc64le-unknown-linux-gnu < %s \
|
|
; RUN: | FileCheck %s --check-prefix=LE-PWR9
|
|
; RUN: llc -verify-machineinstrs -mcpu=pwr8 -ppc-vsr-nums-as-vr \
|
|
; RUN: -ppc-asm-full-reg-names -mtriple=powerpc64le-unknown-linux-gnu < %s \
|
|
; RUN: | FileCheck %s --check-prefix=LE-PWR8
|
|
; RUN: llc -verify-machineinstrs -mcpu=pwr9 -ppc-vsr-nums-as-vr \
|
|
; RUN: -ppc-asm-full-reg-names -mtriple=powerpc64-unknown-linux-gnu < %s \
|
|
; RUN: | FileCheck %s --check-prefix=BE-PWR9
|
|
; RUN: llc -verify-machineinstrs -mcpu=pwr8 -ppc-vsr-nums-as-vr \
|
|
; RUN: -ppc-asm-full-reg-names -mtriple=powerpc64-unknown-linux-gnu < %s \
|
|
; RUN: | FileCheck %s --check-prefix=BE-PWR8
|
|
|
|
@f = common dso_local local_unnamed_addr global <512 x i1> zeroinitializer, align 16
|
|
@g = common dso_local local_unnamed_addr global <256 x i1> zeroinitializer, align 16
|
|
|
|
define dso_local void @testLdSt(i64 %SrcIdx, i64 %DstIdx) {
|
|
; LE-PAIRED-LABEL: testLdSt:
|
|
; LE-PAIRED: # %bb.0: # %entry
|
|
; LE-PAIRED-NEXT: plxv vs1, f@PCREL+96(0), 1
|
|
; LE-PAIRED-NEXT: plxv vs0, f@PCREL+112(0), 1
|
|
; LE-PAIRED-NEXT: plxv vs3, f@PCREL+64(0), 1
|
|
; LE-PAIRED-NEXT: plxv vs2, f@PCREL+80(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs0, f@PCREL+176(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs1, f@PCREL+160(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs2, f@PCREL+144(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs3, f@PCREL+128(0), 1
|
|
; LE-PAIRED-NEXT: blr
|
|
;
|
|
; BE-PAIRED-LABEL: testLdSt:
|
|
; BE-PAIRED: # %bb.0: # %entry
|
|
; BE-PAIRED-NEXT: addis r3, r2, f@toc@ha
|
|
; BE-PAIRED-NEXT: addi r3, r3, f@toc@l
|
|
; BE-PAIRED-NEXT: lxv vs1, 80(r3)
|
|
; BE-PAIRED-NEXT: lxv vs0, 64(r3)
|
|
; BE-PAIRED-NEXT: lxv vs3, 112(r3)
|
|
; BE-PAIRED-NEXT: lxv vs2, 96(r3)
|
|
; BE-PAIRED-NEXT: stxv vs1, 144(r3)
|
|
; BE-PAIRED-NEXT: stxv vs0, 128(r3)
|
|
; BE-PAIRED-NEXT: stxv vs3, 176(r3)
|
|
; BE-PAIRED-NEXT: stxv vs2, 160(r3)
|
|
; BE-PAIRED-NEXT: blr
|
|
;
|
|
; LE-PWR9-LABEL: testLdSt:
|
|
; LE-PWR9: # %bb.0: # %entry
|
|
; LE-PWR9-NEXT: addis r3, r2, f@toc@ha
|
|
; LE-PWR9-NEXT: addi r3, r3, f@toc@l
|
|
; LE-PWR9-NEXT: lxv vs1, 96(r3)
|
|
; LE-PWR9-NEXT: lxv vs0, 64(r3)
|
|
; LE-PWR9-NEXT: lxv vs2, 112(r3)
|
|
; LE-PWR9-NEXT: stxv vs1, 160(r3)
|
|
; LE-PWR9-NEXT: lxv vs1, 80(r3)
|
|
; LE-PWR9-NEXT: stxv vs2, 176(r3)
|
|
; LE-PWR9-NEXT: stxv vs0, 128(r3)
|
|
; LE-PWR9-NEXT: stxv vs1, 144(r3)
|
|
; LE-PWR9-NEXT: blr
|
|
;
|
|
; LE-PWR8-LABEL: testLdSt:
|
|
; LE-PWR8: # %bb.0: # %entry
|
|
; LE-PWR8-NEXT: addis r3, r2, f@toc@ha
|
|
; LE-PWR8-NEXT: li r4, 96
|
|
; LE-PWR8-NEXT: li r5, 112
|
|
; LE-PWR8-NEXT: addi r3, r3, f@toc@l
|
|
; LE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; LE-PWR8-NEXT: li r4, 64
|
|
; LE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; LE-PWR8-NEXT: li r5, 80
|
|
; LE-PWR8-NEXT: lxvd2x vs2, r3, r4
|
|
; LE-PWR8-NEXT: lxvd2x vs3, r3, r5
|
|
; LE-PWR8-NEXT: li r4, 176
|
|
; LE-PWR8-NEXT: li r5, 160
|
|
; LE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; LE-PWR8-NEXT: li r4, 144
|
|
; LE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; LE-PWR8-NEXT: li r5, 128
|
|
; LE-PWR8-NEXT: stxvd2x vs3, r3, r4
|
|
; LE-PWR8-NEXT: stxvd2x vs2, r3, r5
|
|
; LE-PWR8-NEXT: blr
|
|
;
|
|
; BE-PWR9-LABEL: testLdSt:
|
|
; BE-PWR9: # %bb.0: # %entry
|
|
; BE-PWR9-NEXT: addis r3, r2, f@toc@ha
|
|
; BE-PWR9-NEXT: addi r3, r3, f@toc@l
|
|
; BE-PWR9-NEXT: lxv vs1, 96(r3)
|
|
; BE-PWR9-NEXT: lxv vs0, 64(r3)
|
|
; BE-PWR9-NEXT: lxv vs2, 112(r3)
|
|
; BE-PWR9-NEXT: stxv vs1, 160(r3)
|
|
; BE-PWR9-NEXT: lxv vs1, 80(r3)
|
|
; BE-PWR9-NEXT: stxv vs2, 176(r3)
|
|
; BE-PWR9-NEXT: stxv vs0, 128(r3)
|
|
; BE-PWR9-NEXT: stxv vs1, 144(r3)
|
|
; BE-PWR9-NEXT: blr
|
|
;
|
|
; BE-PWR8-LABEL: testLdSt:
|
|
; BE-PWR8: # %bb.0: # %entry
|
|
; BE-PWR8-NEXT: addis r3, r2, f@toc@ha
|
|
; BE-PWR8-NEXT: li r4, 96
|
|
; BE-PWR8-NEXT: li r5, 112
|
|
; BE-PWR8-NEXT: addi r3, r3, f@toc@l
|
|
; BE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; BE-PWR8-NEXT: li r4, 64
|
|
; BE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; BE-PWR8-NEXT: li r5, 80
|
|
; BE-PWR8-NEXT: lxvd2x vs2, r3, r4
|
|
; BE-PWR8-NEXT: lxvd2x vs3, r3, r5
|
|
; BE-PWR8-NEXT: li r4, 176
|
|
; BE-PWR8-NEXT: li r5, 160
|
|
; BE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; BE-PWR8-NEXT: li r4, 144
|
|
; BE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; BE-PWR8-NEXT: li r5, 128
|
|
; BE-PWR8-NEXT: stxvd2x vs3, r3, r4
|
|
; BE-PWR8-NEXT: stxvd2x vs2, r3, r5
|
|
; BE-PWR8-NEXT: blr
|
|
entry:
|
|
%arrayidx = getelementptr inbounds <512 x i1>, <512 x i1>* @f, i64 1
|
|
%0 = load <512 x i1>, <512 x i1>* %arrayidx, align 64
|
|
%arrayidx1 = getelementptr inbounds <512 x i1>, <512 x i1>* @f, i64 2
|
|
store <512 x i1> %0, <512 x i1>* %arrayidx1, align 64
|
|
ret void
|
|
}
|
|
|
|
define dso_local void @testXLdSt(i64 %SrcIdx, i64 %DstIdx) {
|
|
; LE-PAIRED-LABEL: testXLdSt:
|
|
; LE-PAIRED: # %bb.0: # %entry
|
|
; LE-PAIRED-NEXT: paddi r5, 0, f@PCREL, 1
|
|
; LE-PAIRED-NEXT: sldi r3, r3, 6
|
|
; LE-PAIRED-NEXT: add r6, r5, r3
|
|
; LE-PAIRED-NEXT: lxv vs1, 32(r6)
|
|
; LE-PAIRED-NEXT: lxv vs0, 48(r6)
|
|
; LE-PAIRED-NEXT: lxvx vs3, r5, r3
|
|
; LE-PAIRED-NEXT: lxv vs2, 16(r6)
|
|
; LE-PAIRED-NEXT: sldi r3, r4, 6
|
|
; LE-PAIRED-NEXT: add r4, r5, r3
|
|
; LE-PAIRED-NEXT: stxvx vs3, r5, r3
|
|
; LE-PAIRED-NEXT: stxv vs0, 48(r4)
|
|
; LE-PAIRED-NEXT: stxv vs1, 32(r4)
|
|
; LE-PAIRED-NEXT: stxv vs2, 16(r4)
|
|
; LE-PAIRED-NEXT: blr
|
|
;
|
|
; BE-PAIRED-LABEL: testXLdSt:
|
|
; BE-PAIRED: # %bb.0: # %entry
|
|
; BE-PAIRED-NEXT: addis r5, r2, f@toc@ha
|
|
; BE-PAIRED-NEXT: addi r5, r5, f@toc@l
|
|
; BE-PAIRED-NEXT: sldi r3, r3, 6
|
|
; BE-PAIRED-NEXT: add r6, r5, r3
|
|
; BE-PAIRED-NEXT: lxvx vs0, r5, r3
|
|
; BE-PAIRED-NEXT: sldi r3, r4, 6
|
|
; BE-PAIRED-NEXT: add r4, r5, r3
|
|
; BE-PAIRED-NEXT: lxv vs1, 16(r6)
|
|
; BE-PAIRED-NEXT: lxv vs3, 48(r6)
|
|
; BE-PAIRED-NEXT: lxv vs2, 32(r6)
|
|
; BE-PAIRED-NEXT: stxvx vs0, r5, r3
|
|
; BE-PAIRED-NEXT: stxv vs1, 16(r4)
|
|
; BE-PAIRED-NEXT: stxv vs3, 48(r4)
|
|
; BE-PAIRED-NEXT: stxv vs2, 32(r4)
|
|
; BE-PAIRED-NEXT: blr
|
|
;
|
|
; LE-PWR9-LABEL: testXLdSt:
|
|
; LE-PWR9: # %bb.0: # %entry
|
|
; LE-PWR9-NEXT: addis r5, r2, f@toc@ha
|
|
; LE-PWR9-NEXT: sldi r3, r3, 6
|
|
; LE-PWR9-NEXT: addi r5, r5, f@toc@l
|
|
; LE-PWR9-NEXT: add r6, r5, r3
|
|
; LE-PWR9-NEXT: lxvx vs3, r5, r3
|
|
; LE-PWR9-NEXT: sldi r3, r4, 6
|
|
; LE-PWR9-NEXT: lxv vs0, 16(r6)
|
|
; LE-PWR9-NEXT: lxv vs1, 32(r6)
|
|
; LE-PWR9-NEXT: lxv vs2, 48(r6)
|
|
; LE-PWR9-NEXT: stxvx vs3, r5, r3
|
|
; LE-PWR9-NEXT: add r3, r5, r3
|
|
; LE-PWR9-NEXT: stxv vs2, 48(r3)
|
|
; LE-PWR9-NEXT: stxv vs1, 32(r3)
|
|
; LE-PWR9-NEXT: stxv vs0, 16(r3)
|
|
; LE-PWR9-NEXT: blr
|
|
;
|
|
; LE-PWR8-LABEL: testXLdSt:
|
|
; LE-PWR8: # %bb.0: # %entry
|
|
; LE-PWR8-NEXT: addis r5, r2, f@toc@ha
|
|
; LE-PWR8-NEXT: sldi r3, r3, 6
|
|
; LE-PWR8-NEXT: li r6, 48
|
|
; LE-PWR8-NEXT: li r8, 16
|
|
; LE-PWR8-NEXT: li r9, 32
|
|
; LE-PWR8-NEXT: addi r5, r5, f@toc@l
|
|
; LE-PWR8-NEXT: add r7, r5, r3
|
|
; LE-PWR8-NEXT: lxvd2x vs0, r5, r3
|
|
; LE-PWR8-NEXT: sldi r3, r4, 6
|
|
; LE-PWR8-NEXT: lxvd2x vs1, r7, r6
|
|
; LE-PWR8-NEXT: lxvd2x vs2, r7, r8
|
|
; LE-PWR8-NEXT: add r4, r5, r3
|
|
; LE-PWR8-NEXT: lxvd2x vs3, r7, r9
|
|
; LE-PWR8-NEXT: stxvd2x vs0, r5, r3
|
|
; LE-PWR8-NEXT: stxvd2x vs1, r4, r6
|
|
; LE-PWR8-NEXT: stxvd2x vs3, r4, r9
|
|
; LE-PWR8-NEXT: stxvd2x vs2, r4, r8
|
|
; LE-PWR8-NEXT: blr
|
|
;
|
|
; BE-PWR9-LABEL: testXLdSt:
|
|
; BE-PWR9: # %bb.0: # %entry
|
|
; BE-PWR9-NEXT: addis r5, r2, f@toc@ha
|
|
; BE-PWR9-NEXT: sldi r3, r3, 6
|
|
; BE-PWR9-NEXT: addi r5, r5, f@toc@l
|
|
; BE-PWR9-NEXT: add r6, r5, r3
|
|
; BE-PWR9-NEXT: lxvx vs3, r5, r3
|
|
; BE-PWR9-NEXT: sldi r3, r4, 6
|
|
; BE-PWR9-NEXT: lxv vs0, 16(r6)
|
|
; BE-PWR9-NEXT: lxv vs1, 32(r6)
|
|
; BE-PWR9-NEXT: lxv vs2, 48(r6)
|
|
; BE-PWR9-NEXT: stxvx vs3, r5, r3
|
|
; BE-PWR9-NEXT: add r3, r5, r3
|
|
; BE-PWR9-NEXT: stxv vs2, 48(r3)
|
|
; BE-PWR9-NEXT: stxv vs1, 32(r3)
|
|
; BE-PWR9-NEXT: stxv vs0, 16(r3)
|
|
; BE-PWR9-NEXT: blr
|
|
;
|
|
; BE-PWR8-LABEL: testXLdSt:
|
|
; BE-PWR8: # %bb.0: # %entry
|
|
; BE-PWR8-NEXT: addis r5, r2, f@toc@ha
|
|
; BE-PWR8-NEXT: sldi r3, r3, 6
|
|
; BE-PWR8-NEXT: li r6, 32
|
|
; BE-PWR8-NEXT: li r7, 48
|
|
; BE-PWR8-NEXT: li r9, 16
|
|
; BE-PWR8-NEXT: addi r5, r5, f@toc@l
|
|
; BE-PWR8-NEXT: add r8, r5, r3
|
|
; BE-PWR8-NEXT: lxvd2x vs2, r5, r3
|
|
; BE-PWR8-NEXT: sldi r3, r4, 6
|
|
; BE-PWR8-NEXT: lxvd2x vs0, r8, r6
|
|
; BE-PWR8-NEXT: lxvd2x vs1, r8, r7
|
|
; BE-PWR8-NEXT: add r4, r5, r3
|
|
; BE-PWR8-NEXT: lxvd2x vs3, r8, r9
|
|
; BE-PWR8-NEXT: stxvd2x vs2, r5, r3
|
|
; BE-PWR8-NEXT: stxvd2x vs1, r4, r7
|
|
; BE-PWR8-NEXT: stxvd2x vs0, r4, r6
|
|
; BE-PWR8-NEXT: stxvd2x vs3, r4, r9
|
|
; BE-PWR8-NEXT: blr
|
|
entry:
|
|
%arrayidx = getelementptr inbounds <512 x i1>, <512 x i1>* @f, i64 %SrcIdx
|
|
%0 = load <512 x i1>, <512 x i1>* %arrayidx, align 64
|
|
%arrayidx1 = getelementptr inbounds <512 x i1>, <512 x i1>* @f, i64 %DstIdx
|
|
store <512 x i1> %0, <512 x i1>* %arrayidx1, align 64
|
|
ret void
|
|
}
|
|
|
|
define dso_local void @testUnalignedLdSt() {
|
|
; LE-PAIRED-LABEL: testUnalignedLdSt:
|
|
; LE-PAIRED: # %bb.0: # %entry
|
|
; LE-PAIRED-NEXT: plxv vs1, f@PCREL+43(0), 1
|
|
; LE-PAIRED-NEXT: plxv vs0, f@PCREL+59(0), 1
|
|
; LE-PAIRED-NEXT: plxv vs3, f@PCREL+11(0), 1
|
|
; LE-PAIRED-NEXT: plxv vs2, f@PCREL+27(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs0, f@PCREL+67(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs1, f@PCREL+51(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs2, f@PCREL+35(0), 1
|
|
; LE-PAIRED-NEXT: pstxv vs3, f@PCREL+19(0), 1
|
|
; LE-PAIRED-NEXT: blr
|
|
;
|
|
; BE-PAIRED-LABEL: testUnalignedLdSt:
|
|
; BE-PAIRED: # %bb.0: # %entry
|
|
; BE-PAIRED-NEXT: addis r3, r2, f@toc@ha
|
|
; BE-PAIRED-NEXT: addi r3, r3, f@toc@l
|
|
; BE-PAIRED-NEXT: plxv vs1, 27(r3), 0
|
|
; BE-PAIRED-NEXT: plxv vs0, 11(r3), 0
|
|
; BE-PAIRED-NEXT: plxv vs3, 59(r3), 0
|
|
; BE-PAIRED-NEXT: plxv vs2, 43(r3), 0
|
|
; BE-PAIRED-NEXT: pstxv vs1, 35(r3), 0
|
|
; BE-PAIRED-NEXT: pstxv vs0, 19(r3), 0
|
|
; BE-PAIRED-NEXT: pstxv vs3, 67(r3), 0
|
|
; BE-PAIRED-NEXT: pstxv vs2, 51(r3), 0
|
|
; BE-PAIRED-NEXT: blr
|
|
;
|
|
; LE-PWR9-LABEL: testUnalignedLdSt:
|
|
; LE-PWR9: # %bb.0: # %entry
|
|
; LE-PWR9-NEXT: addis r3, r2, f@toc@ha
|
|
; LE-PWR9-NEXT: li r4, 11
|
|
; LE-PWR9-NEXT: addi r3, r3, f@toc@l
|
|
; LE-PWR9-NEXT: lxvx vs0, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 27
|
|
; LE-PWR9-NEXT: lxvx vs1, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 43
|
|
; LE-PWR9-NEXT: lxvx vs2, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 59
|
|
; LE-PWR9-NEXT: lxvx vs3, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 67
|
|
; LE-PWR9-NEXT: stxvx vs3, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 51
|
|
; LE-PWR9-NEXT: stxvx vs2, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 35
|
|
; LE-PWR9-NEXT: stxvx vs1, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 19
|
|
; LE-PWR9-NEXT: stxvx vs0, r3, r4
|
|
; LE-PWR9-NEXT: blr
|
|
;
|
|
; LE-PWR8-LABEL: testUnalignedLdSt:
|
|
; LE-PWR8: # %bb.0: # %entry
|
|
; LE-PWR8-NEXT: addis r3, r2, f@toc@ha
|
|
; LE-PWR8-NEXT: li r4, 59
|
|
; LE-PWR8-NEXT: li r5, 43
|
|
; LE-PWR8-NEXT: addi r3, r3, f@toc@l
|
|
; LE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; LE-PWR8-NEXT: li r4, 11
|
|
; LE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; LE-PWR8-NEXT: li r5, 27
|
|
; LE-PWR8-NEXT: lxvd2x vs2, r3, r4
|
|
; LE-PWR8-NEXT: lxvd2x vs3, r3, r5
|
|
; LE-PWR8-NEXT: li r4, 51
|
|
; LE-PWR8-NEXT: li r5, 67
|
|
; LE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; LE-PWR8-NEXT: li r4, 35
|
|
; LE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; LE-PWR8-NEXT: li r5, 19
|
|
; LE-PWR8-NEXT: stxvd2x vs3, r3, r4
|
|
; LE-PWR8-NEXT: stxvd2x vs2, r3, r5
|
|
; LE-PWR8-NEXT: blr
|
|
;
|
|
; BE-PWR9-LABEL: testUnalignedLdSt:
|
|
; BE-PWR9: # %bb.0: # %entry
|
|
; BE-PWR9-NEXT: addis r3, r2, f@toc@ha
|
|
; BE-PWR9-NEXT: li r4, 11
|
|
; BE-PWR9-NEXT: addi r3, r3, f@toc@l
|
|
; BE-PWR9-NEXT: lxvx vs0, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 27
|
|
; BE-PWR9-NEXT: lxvx vs1, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 43
|
|
; BE-PWR9-NEXT: lxvx vs2, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 59
|
|
; BE-PWR9-NEXT: lxvx vs3, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 67
|
|
; BE-PWR9-NEXT: stxvx vs3, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 51
|
|
; BE-PWR9-NEXT: stxvx vs2, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 35
|
|
; BE-PWR9-NEXT: stxvx vs1, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 19
|
|
; BE-PWR9-NEXT: stxvx vs0, r3, r4
|
|
; BE-PWR9-NEXT: blr
|
|
;
|
|
; BE-PWR8-LABEL: testUnalignedLdSt:
|
|
; BE-PWR8: # %bb.0: # %entry
|
|
; BE-PWR8-NEXT: addis r3, r2, f@toc@ha
|
|
; BE-PWR8-NEXT: li r4, 43
|
|
; BE-PWR8-NEXT: li r5, 59
|
|
; BE-PWR8-NEXT: addi r3, r3, f@toc@l
|
|
; BE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; BE-PWR8-NEXT: li r4, 11
|
|
; BE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; BE-PWR8-NEXT: li r5, 27
|
|
; BE-PWR8-NEXT: lxvd2x vs2, r3, r4
|
|
; BE-PWR8-NEXT: lxvd2x vs3, r3, r5
|
|
; BE-PWR8-NEXT: li r4, 67
|
|
; BE-PWR8-NEXT: li r5, 51
|
|
; BE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; BE-PWR8-NEXT: li r4, 35
|
|
; BE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; BE-PWR8-NEXT: li r5, 19
|
|
; BE-PWR8-NEXT: stxvd2x vs3, r3, r4
|
|
; BE-PWR8-NEXT: stxvd2x vs2, r3, r5
|
|
; BE-PWR8-NEXT: blr
|
|
entry:
|
|
%0 = bitcast <512 x i1>* @f to i8*
|
|
%add.ptr = getelementptr inbounds i8, i8* %0, i64 11
|
|
%add.ptr1 = getelementptr inbounds i8, i8* %0, i64 19
|
|
%1 = bitcast i8* %add.ptr to <512 x i1>*
|
|
%2 = bitcast i8* %add.ptr1 to <512 x i1>*
|
|
%3 = load <512 x i1>, <512 x i1>* %1, align 64
|
|
store <512 x i1> %3, <512 x i1>* %2, align 64
|
|
ret void
|
|
}
|
|
|
|
define dso_local void @testLdStPair(i64 %SrcIdx, i64 %DstIdx) {
|
|
; LE-PAIRED-LABEL: testLdStPair:
|
|
; LE-PAIRED: # %bb.0: # %entry
|
|
; LE-PAIRED-NEXT: plxv v3, g@PCREL+32(0), 1
|
|
; LE-PAIRED-NEXT: plxv v2, g@PCREL+48(0), 1
|
|
; LE-PAIRED-NEXT: pstxv v3, g@PCREL+64(0), 1
|
|
; LE-PAIRED-NEXT: pstxv v2, g@PCREL+80(0), 1
|
|
; LE-PAIRED-NEXT: blr
|
|
;
|
|
; BE-PAIRED-LABEL: testLdStPair:
|
|
; BE-PAIRED: # %bb.0: # %entry
|
|
; BE-PAIRED-NEXT: addis r3, r2, g@toc@ha
|
|
; BE-PAIRED-NEXT: addi r3, r3, g@toc@l
|
|
; BE-PAIRED-NEXT: lxv v3, 48(r3)
|
|
; BE-PAIRED-NEXT: lxv v2, 32(r3)
|
|
; BE-PAIRED-NEXT: stxv v3, 80(r3)
|
|
; BE-PAIRED-NEXT: stxv v2, 64(r3)
|
|
; BE-PAIRED-NEXT: blr
|
|
;
|
|
; LE-PWR9-LABEL: testLdStPair:
|
|
; LE-PWR9: # %bb.0: # %entry
|
|
; LE-PWR9-NEXT: addis r3, r2, g@toc@ha
|
|
; LE-PWR9-NEXT: addi r3, r3, g@toc@l
|
|
; LE-PWR9-NEXT: lxv vs0, 32(r3)
|
|
; LE-PWR9-NEXT: lxv vs1, 48(r3)
|
|
; LE-PWR9-NEXT: stxv vs1, 80(r3)
|
|
; LE-PWR9-NEXT: stxv vs0, 64(r3)
|
|
; LE-PWR9-NEXT: blr
|
|
;
|
|
; LE-PWR8-LABEL: testLdStPair:
|
|
; LE-PWR8: # %bb.0: # %entry
|
|
; LE-PWR8-NEXT: addis r3, r2, g@toc@ha
|
|
; LE-PWR8-NEXT: li r4, 32
|
|
; LE-PWR8-NEXT: li r5, 48
|
|
; LE-PWR8-NEXT: addi r3, r3, g@toc@l
|
|
; LE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; LE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; LE-PWR8-NEXT: li r4, 80
|
|
; LE-PWR8-NEXT: li r5, 64
|
|
; LE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; LE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; LE-PWR8-NEXT: blr
|
|
;
|
|
; BE-PWR9-LABEL: testLdStPair:
|
|
; BE-PWR9: # %bb.0: # %entry
|
|
; BE-PWR9-NEXT: addis r3, r2, g@toc@ha
|
|
; BE-PWR9-NEXT: addi r3, r3, g@toc@l
|
|
; BE-PWR9-NEXT: lxv vs0, 32(r3)
|
|
; BE-PWR9-NEXT: lxv vs1, 48(r3)
|
|
; BE-PWR9-NEXT: stxv vs1, 80(r3)
|
|
; BE-PWR9-NEXT: stxv vs0, 64(r3)
|
|
; BE-PWR9-NEXT: blr
|
|
;
|
|
; BE-PWR8-LABEL: testLdStPair:
|
|
; BE-PWR8: # %bb.0: # %entry
|
|
; BE-PWR8-NEXT: addis r3, r2, g@toc@ha
|
|
; BE-PWR8-NEXT: li r4, 32
|
|
; BE-PWR8-NEXT: li r5, 48
|
|
; BE-PWR8-NEXT: addi r3, r3, g@toc@l
|
|
; BE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; BE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; BE-PWR8-NEXT: li r4, 80
|
|
; BE-PWR8-NEXT: li r5, 64
|
|
; BE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; BE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; BE-PWR8-NEXT: blr
|
|
entry:
|
|
%arrayidx = getelementptr inbounds <256 x i1>, <256 x i1>* @g, i64 1
|
|
%0 = load <256 x i1>, <256 x i1>* %arrayidx, align 64
|
|
%arrayidx1 = getelementptr inbounds <256 x i1>, <256 x i1>* @g, i64 2
|
|
store <256 x i1> %0, <256 x i1>* %arrayidx1, align 64
|
|
ret void
|
|
}
|
|
|
|
define dso_local void @testXLdStPair(i64 %SrcIdx, i64 %DstIdx) {
|
|
; LE-PAIRED-LABEL: testXLdStPair:
|
|
; LE-PAIRED: # %bb.0: # %entry
|
|
; LE-PAIRED-NEXT: sldi r3, r3, 5
|
|
; LE-PAIRED-NEXT: paddi r5, 0, g@PCREL, 1
|
|
; LE-PAIRED-NEXT: add r6, r5, r3
|
|
; LE-PAIRED-NEXT: lxvx v3, r5, r3
|
|
; LE-PAIRED-NEXT: sldi r3, r4, 5
|
|
; LE-PAIRED-NEXT: lxv v2, 16(r6)
|
|
; LE-PAIRED-NEXT: add r4, r5, r3
|
|
; LE-PAIRED-NEXT: stxvx v3, r5, r3
|
|
; LE-PAIRED-NEXT: stxv v2, 16(r4)
|
|
; LE-PAIRED-NEXT: blr
|
|
;
|
|
; BE-PAIRED-LABEL: testXLdStPair:
|
|
; BE-PAIRED: # %bb.0: # %entry
|
|
; BE-PAIRED-NEXT: addis r5, r2, g@toc@ha
|
|
; BE-PAIRED-NEXT: sldi r3, r3, 5
|
|
; BE-PAIRED-NEXT: addi r5, r5, g@toc@l
|
|
; BE-PAIRED-NEXT: add r6, r5, r3
|
|
; BE-PAIRED-NEXT: lxvx v2, r5, r3
|
|
; BE-PAIRED-NEXT: sldi r3, r4, 5
|
|
; BE-PAIRED-NEXT: lxv v3, 16(r6)
|
|
; BE-PAIRED-NEXT: add r4, r5, r3
|
|
; BE-PAIRED-NEXT: stxvx v2, r5, r3
|
|
; BE-PAIRED-NEXT: stxv v3, 16(r4)
|
|
; BE-PAIRED-NEXT: blr
|
|
;
|
|
; LE-PWR9-LABEL: testXLdStPair:
|
|
; LE-PWR9: # %bb.0: # %entry
|
|
; LE-PWR9-NEXT: addis r5, r2, g@toc@ha
|
|
; LE-PWR9-NEXT: sldi r3, r3, 5
|
|
; LE-PWR9-NEXT: sldi r4, r4, 5
|
|
; LE-PWR9-NEXT: addi r5, r5, g@toc@l
|
|
; LE-PWR9-NEXT: add r6, r5, r3
|
|
; LE-PWR9-NEXT: lxvx vs1, r5, r3
|
|
; LE-PWR9-NEXT: lxv vs0, 16(r6)
|
|
; LE-PWR9-NEXT: add r6, r5, r4
|
|
; LE-PWR9-NEXT: stxvx vs1, r5, r4
|
|
; LE-PWR9-NEXT: stxv vs0, 16(r6)
|
|
; LE-PWR9-NEXT: blr
|
|
;
|
|
; LE-PWR8-LABEL: testXLdStPair:
|
|
; LE-PWR8: # %bb.0: # %entry
|
|
; LE-PWR8-NEXT: addis r5, r2, g@toc@ha
|
|
; LE-PWR8-NEXT: sldi r3, r3, 5
|
|
; LE-PWR8-NEXT: li r7, 16
|
|
; LE-PWR8-NEXT: addi r5, r5, g@toc@l
|
|
; LE-PWR8-NEXT: add r6, r5, r3
|
|
; LE-PWR8-NEXT: lxvd2x vs1, r5, r3
|
|
; LE-PWR8-NEXT: sldi r3, r4, 5
|
|
; LE-PWR8-NEXT: lxvd2x vs0, r6, r7
|
|
; LE-PWR8-NEXT: add r4, r5, r3
|
|
; LE-PWR8-NEXT: stxvd2x vs1, r5, r3
|
|
; LE-PWR8-NEXT: stxvd2x vs0, r4, r7
|
|
; LE-PWR8-NEXT: blr
|
|
;
|
|
; BE-PWR9-LABEL: testXLdStPair:
|
|
; BE-PWR9: # %bb.0: # %entry
|
|
; BE-PWR9-NEXT: addis r5, r2, g@toc@ha
|
|
; BE-PWR9-NEXT: sldi r3, r3, 5
|
|
; BE-PWR9-NEXT: sldi r4, r4, 5
|
|
; BE-PWR9-NEXT: addi r5, r5, g@toc@l
|
|
; BE-PWR9-NEXT: add r6, r5, r3
|
|
; BE-PWR9-NEXT: lxvx vs1, r5, r3
|
|
; BE-PWR9-NEXT: lxv vs0, 16(r6)
|
|
; BE-PWR9-NEXT: add r6, r5, r4
|
|
; BE-PWR9-NEXT: stxvx vs1, r5, r4
|
|
; BE-PWR9-NEXT: stxv vs0, 16(r6)
|
|
; BE-PWR9-NEXT: blr
|
|
;
|
|
; BE-PWR8-LABEL: testXLdStPair:
|
|
; BE-PWR8: # %bb.0: # %entry
|
|
; BE-PWR8-NEXT: addis r5, r2, g@toc@ha
|
|
; BE-PWR8-NEXT: sldi r3, r3, 5
|
|
; BE-PWR8-NEXT: li r7, 16
|
|
; BE-PWR8-NEXT: addi r5, r5, g@toc@l
|
|
; BE-PWR8-NEXT: add r6, r5, r3
|
|
; BE-PWR8-NEXT: lxvd2x vs0, r5, r3
|
|
; BE-PWR8-NEXT: sldi r3, r4, 5
|
|
; BE-PWR8-NEXT: lxvd2x vs1, r6, r7
|
|
; BE-PWR8-NEXT: add r4, r5, r3
|
|
; BE-PWR8-NEXT: stxvd2x vs0, r5, r3
|
|
; BE-PWR8-NEXT: stxvd2x vs1, r4, r7
|
|
; BE-PWR8-NEXT: blr
|
|
entry:
|
|
%arrayidx = getelementptr inbounds <256 x i1>, <256 x i1>* @g, i64 %SrcIdx
|
|
%0 = load <256 x i1>, <256 x i1>* %arrayidx, align 64
|
|
%arrayidx1 = getelementptr inbounds <256 x i1>, <256 x i1>* @g, i64 %DstIdx
|
|
store <256 x i1> %0, <256 x i1>* %arrayidx1, align 64
|
|
ret void
|
|
}
|
|
|
|
define dso_local void @testUnalignedLdStPair() {
|
|
; LE-PAIRED-LABEL: testUnalignedLdStPair:
|
|
; LE-PAIRED: # %bb.0: # %entry
|
|
; LE-PAIRED-NEXT: plxv v3, g@PCREL+11(0), 1
|
|
; LE-PAIRED-NEXT: plxv v2, g@PCREL+27(0), 1
|
|
; LE-PAIRED-NEXT: pstxv v3, g@PCREL+19(0), 1
|
|
; LE-PAIRED-NEXT: pstxv v2, g@PCREL+35(0), 1
|
|
; LE-PAIRED-NEXT: blr
|
|
;
|
|
; BE-PAIRED-LABEL: testUnalignedLdStPair:
|
|
; BE-PAIRED: # %bb.0: # %entry
|
|
; BE-PAIRED-NEXT: addis r3, r2, g@toc@ha
|
|
; BE-PAIRED-NEXT: addi r3, r3, g@toc@l
|
|
; BE-PAIRED-NEXT: plxv v3, 27(r3), 0
|
|
; BE-PAIRED-NEXT: plxv v2, 11(r3), 0
|
|
; BE-PAIRED-NEXT: pstxv v3, 35(r3), 0
|
|
; BE-PAIRED-NEXT: pstxv v2, 19(r3), 0
|
|
; BE-PAIRED-NEXT: blr
|
|
;
|
|
; LE-PWR9-LABEL: testUnalignedLdStPair:
|
|
; LE-PWR9: # %bb.0: # %entry
|
|
; LE-PWR9-NEXT: addis r3, r2, g@toc@ha
|
|
; LE-PWR9-NEXT: li r4, 11
|
|
; LE-PWR9-NEXT: addi r3, r3, g@toc@l
|
|
; LE-PWR9-NEXT: lxvx vs0, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 27
|
|
; LE-PWR9-NEXT: lxvx vs1, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 35
|
|
; LE-PWR9-NEXT: stxvx vs1, r3, r4
|
|
; LE-PWR9-NEXT: li r4, 19
|
|
; LE-PWR9-NEXT: stxvx vs0, r3, r4
|
|
; LE-PWR9-NEXT: blr
|
|
;
|
|
; LE-PWR8-LABEL: testUnalignedLdStPair:
|
|
; LE-PWR8: # %bb.0: # %entry
|
|
; LE-PWR8-NEXT: addis r3, r2, g@toc@ha
|
|
; LE-PWR8-NEXT: li r4, 27
|
|
; LE-PWR8-NEXT: li r5, 11
|
|
; LE-PWR8-NEXT: li r6, 19
|
|
; LE-PWR8-NEXT: li r8, 35
|
|
; LE-PWR8-NEXT: addi r3, r3, g@toc@l
|
|
; LE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; LE-PWR8-NEXT: ldx r5, r3, r5
|
|
; LE-PWR8-NEXT: ldx r7, r3, r6
|
|
; LE-PWR8-NEXT: stdx r7, r3, r4
|
|
; LE-PWR8-NEXT: stdx r5, r3, r6
|
|
; LE-PWR8-NEXT: stxvd2x vs0, r3, r8
|
|
; LE-PWR8-NEXT: blr
|
|
;
|
|
; BE-PWR9-LABEL: testUnalignedLdStPair:
|
|
; BE-PWR9: # %bb.0: # %entry
|
|
; BE-PWR9-NEXT: addis r3, r2, g@toc@ha
|
|
; BE-PWR9-NEXT: li r4, 11
|
|
; BE-PWR9-NEXT: addi r3, r3, g@toc@l
|
|
; BE-PWR9-NEXT: lxvx vs0, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 27
|
|
; BE-PWR9-NEXT: lxvx vs1, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 35
|
|
; BE-PWR9-NEXT: stxvx vs1, r3, r4
|
|
; BE-PWR9-NEXT: li r4, 19
|
|
; BE-PWR9-NEXT: stxvx vs0, r3, r4
|
|
; BE-PWR9-NEXT: blr
|
|
;
|
|
; BE-PWR8-LABEL: testUnalignedLdStPair:
|
|
; BE-PWR8: # %bb.0: # %entry
|
|
; BE-PWR8-NEXT: addis r3, r2, g@toc@ha
|
|
; BE-PWR8-NEXT: li r4, 11
|
|
; BE-PWR8-NEXT: li r5, 27
|
|
; BE-PWR8-NEXT: addi r3, r3, g@toc@l
|
|
; BE-PWR8-NEXT: lxvd2x vs0, r3, r4
|
|
; BE-PWR8-NEXT: lxvd2x vs1, r3, r5
|
|
; BE-PWR8-NEXT: li r4, 35
|
|
; BE-PWR8-NEXT: li r5, 19
|
|
; BE-PWR8-NEXT: stxvd2x vs1, r3, r4
|
|
; BE-PWR8-NEXT: stxvd2x vs0, r3, r5
|
|
; BE-PWR8-NEXT: blr
|
|
entry:
|
|
%0 = bitcast <256 x i1>* @g to i8*
|
|
%add.ptr = getelementptr inbounds i8, i8* %0, i64 11
|
|
%add.ptr1 = getelementptr inbounds i8, i8* %0, i64 19
|
|
%1 = bitcast i8* %add.ptr to <256 x i1>*
|
|
%2 = bitcast i8* %add.ptr1 to <256 x i1>*
|
|
%3 = load <256 x i1>, <256 x i1>* %1, align 64
|
|
store <256 x i1> %3, <256 x i1>* %2, align 64
|
|
ret void
|
|
}
|