
This issue starts in the selection DAG and causes the backend to emit the following for a trivial tail call:
```
ldr w8, [sp]
str w8, [sp]
b func
```
I'm not sure that checking for immutability of a specific stack object is a good enough guarantee, because as soon as a tail call is done lowering, `setHasTailCall()` is called, and in that case perhaps a pass is allowed to change the value of the object in memory? This can be extended to the ARM backend as well. Removed the `tailcall` keyword from a few other test assets; I'm assuming their original intent was left intact.
84 lines
4.0 KiB
LLVM
84 lines
4.0 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s | FileCheck %s
|
|
|
|
target triple = "aarch64-unknown-linux-gnu"
|
|
|
|
; Ensure we don't crash by trying to fold fixed length frame indexes into
|
|
; loads/stores that don't support an appropriate addressing mode, hence creating
|
|
; too many extra vregs during frame lowering, when we don't have an emergency
|
|
; spill slot.
|
|
|
|
; func1 takes 48 pointer arguments followed by one i64 and passes them on to
; func2 with an ordinary (non-tail) call. Several of the forwarded operands are
; replaced by undef: the slots of %v13, %v31-%v36, %v46 and the trailing i64.
;
; The autogenerated assertions interleaved with the signature below pin the
; expected AArch64 output: incoming values are read relative to x29 and written
; to the outgoing area relative to sp, using SVE z-register loads/stores and
; predicated st1d stores for the wider runs, followed by `bl func2`.
define dso_local void @func1(ptr %v1, ptr %v2, ptr %v3, ptr %v4, ptr %v5, ptr %v6, ptr %v7, ptr %v8,
|
|
; CHECK-LABEL: func1:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: sub sp, sp, #368
|
|
; CHECK-NEXT: stp x29, x30, [sp, #336] // 16-byte Folded Spill
|
|
; CHECK-NEXT: str x28, [sp, #352] // 8-byte Folded Spill
|
|
; CHECK-NEXT: add x29, sp, #336
|
|
; CHECK-NEXT: .cfi_def_cfa w29, 32
|
|
; CHECK-NEXT: .cfi_offset w28, -16
|
|
; CHECK-NEXT: .cfi_offset w30, -24
|
|
; CHECK-NEXT: .cfi_offset w29, -32
|
|
; CHECK-NEXT: add x8, x29, #32
|
|
; CHECK-NEXT: add x9, x29, #72
|
|
; CHECK-NEXT: ptrue p0.d
|
|
; CHECK-NEXT: ldr z0, [x8]
|
|
; CHECK-NEXT: add x8, x29, #256
|
|
; CHECK-NEXT: ldr z3, [x9]
|
|
; CHECK-NEXT: ldr z1, [x8]
|
|
; CHECK-NEXT: add x8, x29, #288
|
|
; CHECK-NEXT: add x9, x29, #168
|
|
; CHECK-NEXT: ldr z2, [x8]
|
|
; CHECK-NEXT: add x8, x29, #104
|
|
; CHECK-NEXT: ldr z6, [x9]
|
|
; CHECK-NEXT: ldr z4, [x8]
|
|
; CHECK-NEXT: add x8, x29, #136
|
|
; CHECK-NEXT: mov x12, #17 // =0x11
|
|
; CHECK-NEXT: ldr z5, [x8]
|
|
; CHECK-NEXT: ldp x10, x11, [x29, #336]
|
|
; CHECK-NEXT: st1d { z6.d }, p0, [sp, x12, lsl #3]
|
|
; CHECK-NEXT: mov x12, #13 // =0xd
|
|
; CHECK-NEXT: ldr x8, [x29, #200]
|
|
; CHECK-NEXT: ldr x9, [x29, #320]
|
|
; CHECK-NEXT: st1d { z5.d }, p0, [sp, x12, lsl #3]
|
|
; CHECK-NEXT: mov x12, #9 // =0x9
|
|
; CHECK-NEXT: st1d { z4.d }, p0, [sp, x12, lsl #3]
|
|
; CHECK-NEXT: mov x12, #5 // =0x5
|
|
; CHECK-NEXT: st1d { z3.d }, p0, [sp, x12, lsl #3]
|
|
; CHECK-NEXT: stp x10, x11, [sp, #304]
|
|
; CHECK-NEXT: str x9, [sp, #288]
|
|
; CHECK-NEXT: str z2, [sp, #8, mul vl]
|
|
; CHECK-NEXT: str z1, [sp, #7, mul vl]
|
|
; CHECK-NEXT: str x8, [sp, #168]
|
|
; CHECK-NEXT: str z0, [sp]
|
|
; CHECK-NEXT: bl func2
|
|
; CHECK-NEXT: ldp x29, x30, [sp, #336] // 16-byte Folded Reload
|
|
; CHECK-NEXT: ldr x28, [sp, #352] // 8-byte Folded Reload
|
|
; CHECK-NEXT: add sp, sp, #368
|
|
; CHECK-NEXT: ret
|
|
ptr %v9, ptr %v10, ptr %v11, ptr %v12, ptr %v13, ptr %v14, ptr %v15, ptr %v16,
|
|
ptr %v17, ptr %v18, ptr %v19, ptr %v20, ptr %v21, ptr %v22, ptr %v23, ptr %v24,
|
|
ptr %v25, ptr %v26, ptr %v27, ptr %v28, ptr %v29, ptr %v30, ptr %v31, ptr %v32,
|
|
ptr %v33, ptr %v34, ptr %v35, ptr %v36, ptr %v37, ptr %v38, ptr %v39, ptr %v40,
|
|
ptr %v41, ptr %v42, ptr %v43, ptr %v44, ptr %v45, ptr %v46, ptr %v47, ptr %v48,
|
|
i64 %v49) #0 {
|
|
; Plain `call` (no `tail` marker): forward the arguments, substituting undef
; for the operands this test does not need to carry across.
call void @func2(ptr %v1, ptr %v2, ptr %v3, ptr %v4, ptr %v5, ptr %v6, ptr %v7, ptr %v8,
|
|
ptr %v9, ptr %v10, ptr %v11, ptr %v12, ptr undef, ptr %v14, ptr %v15, ptr %v16,
|
|
ptr %v17, ptr %v18, ptr %v19, ptr %v20, ptr %v21, ptr %v22, ptr %v23, ptr %v24,
|
|
ptr %v25, ptr %v26, ptr %v27, ptr %v28, ptr %v29, ptr %v30, ptr undef, ptr undef,
|
|
ptr undef, ptr undef, ptr undef, ptr undef, ptr %v37, ptr %v38, ptr %v39, ptr %v40,
|
|
ptr %v41, ptr %v42, ptr %v43, ptr %v44, ptr %v45, ptr undef, ptr %v47, ptr %v48,
|
|
i64 undef)
|
|
ret void
|
|
}
|
|
|
|
; External callee used by func1: returns void and takes 48 pointer parameters
; followed by a single i64. Only the declaration is needed; the test never
; defines a body for it.
declare dso_local void @func2(ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr,
|
|
ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr,
|
|
ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr,
|
|
ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr,
|
|
ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr,
|
|
ptr, ptr, ptr, ptr, ptr, ptr, ptr, ptr,
|
|
i64)
|
|
|
|
; Attribute group applied to func1: enables the SVE target feature and sets
; both the minimum and maximum vscale to 2, so scalable vector sizes are known
; at compile time.
attributes #0 = { "target-features"="+sve" vscale_range(2,2) }
|