Before this patch (and D135844) - Given DAG node shl(op, N), isBitfieldPositioningOp uses (optionally shifted [1] ) op as the Src (least significant bits of Src are inserted into DstLSB of Dst node). After this patch - If op is and(val, mask), isBitfieldPositioningOp tries to see through and and find if val is a simpler source than op. It helps in a similar (probably symmetric) way how isSeveralBitsExtractOpFromShr [2] optimizes isBitfieldExtractOpFromShr Existing test cases are improved without regressions. [1]cbd8464595/llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp (L2546)[2]cbd8464595/llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp (L2057)Differential Revision: https://reviews.llvm.org/D135850
31 lines
1.0 KiB
LLVM
31 lines
1.0 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -mtriple=aarch64-none-linux-gnu | FileCheck %s
|
|
|
|
; This used to hit an assertion caused by dagcombine merge store.
|
|
; When the store memVT is v1f32 and the other store to be merged
|
|
; is f32, we need to build vector for the f32 store.
|
|
|
|
define void @f(<1 x float> %a, i64 %b) {
|
|
; CHECK-LABEL: f:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: sub sp, sp, #16
|
|
; CHECK-NEXT: .cfi_def_cfa_offset 16
|
|
; CHECK-NEXT: adrp x8, .LCPI0_0
|
|
; CHECK-NEXT: mov x9, sp
|
|
; CHECK-NEXT: bfi x9, x0, #2, #1
|
|
; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0
|
|
; CHECK-NEXT: ldr d1, [x8, :lo12:.LCPI0_0]
|
|
; CHECK-NEXT: str d1, [sp]
|
|
; CHECK-NEXT: ldr s1, [x9]
|
|
; CHECK-NEXT: mov v1.s[1], v0.s[0]
|
|
; CHECK-NEXT: str d1, [sp, #8]
|
|
; CHECK-NEXT: add sp, sp, #16
|
|
; CHECK-NEXT: ret
|
|
%P = alloca i64
|
|
%E = extractelement <2 x float> <float 0.5, float 1.0>, i64 %b
|
|
%G = getelementptr <1 x float>, ptr %P, i64 1
|
|
store float %E, ptr %P
|
|
store <1 x float> %a, ptr %G
|
|
ret void
|
|
}
|