Ryan Cowan ad1a45b903
[AArch64] Use GISel for optnone functions (#174746)
Currently, when SDAG is run on AArch64 and an `optnone` function is
encountered, the selector is chosen as FastISel. AArch64 makes use of
GlobalISel at O0 and this patch aims to align `optnone` with this
functionality.

A flag is exposed to enable this functionality for a given backend but,
as AArch64 is currently the only backend I could find using GlobalISel
at O0 this is the only one with it implemented. This flag is set when
the target supports GlobalISel & GlobalISel hasn't been forced by the
user, the target machine or by being at an optimisation level lower than
`EnableGlobalISelAtO`.

If this happens, the GlobalISel passes are included as shown in
`llvm/test/CodeGen/AArch64/O3-pipeline.ll` and skipped by IRTranslator
for functions not marked as `optnone`.

In updating the tests based on this functionality, I found some unused
check lines or run lines that mixed SDAG with GlobalISel pass names
which have been fixed.

---------

Co-authored-by: Matt Arsenault <arsenm2@gmail.com>
2026-01-29 16:30:22 +00:00

55 lines
2.5 KiB
LLVM

; RUN: llc < %s -mtriple=aarch64-none-linux-gnu | FileCheck %s
@.str = private unnamed_addr constant [11 x i8] c"val = %ld\0A\00", align 1
; Function Attrs: noinline optnone
define dso_local void @set_large(i64 %val) #0 {
entry:
%val.addr = alloca i64, align 8
%large = alloca [268435456 x i64], align 8
%i = alloca i32, align 4
store i64 %val, ptr %val.addr, align 8
%0 = load i64, ptr %val.addr, align 8
%arrayidx = getelementptr inbounds [268435456 x i64], ptr %large, i64 0, i64 %0
store i64 1, ptr %arrayidx, align 8
%1 = load i64, ptr %val.addr, align 8
%arrayidx1 = getelementptr inbounds [268435456 x i64], ptr %large, i64 0, i64 %1
%2 = load i64, ptr %arrayidx1, align 8
%call = call i32 (ptr, ...) @printf(ptr @.str, i64 %2)
ret void
}
declare dso_local i32 @printf(ptr, ...)
attributes #0 = { noinline optnone "frame-pointer"="all" uwtable }
; CHECK: stp x[[SPILL_REG1:[0-9]+]], x[[SPILL_REG2:[0-9]+]], [sp, #-[[SPILL_OFFSET1:[0-9]+]]]
; CHECK-NEXT: .cfi_def_cfa_offset [[SPILL_OFFSET1]]
; CHECK-NEXT: str x[[SPILL_REG3:[0-9]+]], [sp, #[[SPILL_OFFSET2:[0-9]+]]]
; CHECK-NEXT: mov x[[FRAME:[0-9]+]], sp
; CHECK-NEXT: .cfi_def_cfa w[[FRAME]], [[SPILL_OFFSET1]]
; CHECK-COUNT-128: sub sp, sp, #[[STACK1:[0-9]+]], lsl #12
; CHECK-NEXT: sub sp, sp, #[[STACK2:[0-9]+]], lsl #12
; CHECK-NEXT: sub sp, sp, #[[STACK3:[0-9]+]]
; CHECK: sub x[[INDEX:[0-9]+]], x[[FRAME]], #8
; CHECK-NEXT: str x0, [x[[INDEX]]]
; CHECK-NEXT: ldr x[[VAL1:[0-9]+]], [x[[INDEX]]]
; CHECK-NEXT: add x10, sp, #8
; CHECK-NEXT: mov x11, #1 // =0x1
; CHECK-NEXT: str x11, [x10, x9, lsl #3]
; CHECK-NEXT: ldr x8, [x8]
; CHECK-NEXT: ldr x1, [x10, x8, lsl #3]
; CHECK-NEXT: adrp x0, .L.str
; CHECK-NEXT: add x0, x0, :lo12:.L.str
; CHECK: bl printf
; CHECK-COUNT-128: add sp, sp, #[[STACK1]], lsl #12
; CHECK-NEXT: add sp, sp, #[[STACK2]], lsl #12
; CHECK-NEXT: add sp, sp, #[[STACK3]]
; CHECK-NEXT: .cfi_def_cfa wsp, [[SPILL_OFFSET1]]
; CHECK-NEXT: ldr x[[SPILL_REG3]], [sp, #[[SPILL_OFFSET2]]]
; CHECK-NEXT: ldp x[[SPILL_REG1]], x[[SPILL_REG2]], [sp], #[[SPILL_OFFSET1]]
; CHECK-NEXT: .cfi_def_cfa_offset 0
; CHECK-NEXT: .cfi_restore w[[SPILL_REG3]]
; CHECK-NEXT: .cfi_restore w[[SPILL_REG2]]
; CHECK-NEXT: .cfi_restore w[[SPILL_REG1]]