[AArch64] Add global isel coverage for fp16 tests and strict-fp. NFC

This commit is contained in:
David Green 2025-09-29 16:54:49 +01:00
parent edca510555
commit 2e3f2523e6
3 changed files with 1620 additions and 708 deletions

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -1,31 +1,40 @@
; RUN: llc -mtriple=aarch64 %s -o - | FileCheck %s
; RUN: llc -mtriple=aarch64 -global-isel=true -global-isel-abort=2 %s -o - | FileCheck %s
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc -mtriple=aarch64 %s -o - | FileCheck %s --check-prefixes=CHECK,CHECK-SD
; RUN: llc -mtriple=aarch64 -global-isel=true -global-isel-abort=2 %s -o - 2>&1 | FileCheck %s --check-prefixes=CHECK,CHECK-GI
; CHECK-GI: warning: Instruction selection used fallback path for unused_div_fpexcept_strict
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for unused_div_round_dynamic
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for add_twice_fpexcept_strict
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for add_twice_round_dynamic
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for set_rounding
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for set_rounding_fpexcept_strict
; CHECK-GI-NEXT: warning: Instruction selection used fallback path for set_rounding_round_dynamic
; Div whose result is unused should be removed unless we have strict exceptions
; CHECK-LABEL: unused_div:
; CHECK-NOT: fdiv
; CHECK: ret
define void @unused_div(float %x, float %y) {
; CHECK-LABEL: unused_div:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: ret
entry:
  ; The quotient is never used and this is an ordinary (non-constrained) fdiv,
  ; so the checks above expect the function to reduce to a bare return.
  ; The block label must stay "entry": the generated checks match "// %entry".
  %quot = fdiv float %x, %y
  ret void
}
; CHECK-LABEL: unused_div_fpexcept_strict:
; CHECK: fdiv s0, s0, s1
; CHECK-NEXT: ret
define void @unused_div_fpexcept_strict(float %x, float %y) #0 {
; CHECK-LABEL: unused_div_fpexcept_strict:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: fdiv s0, s0, s1
; CHECK-NEXT: ret
entry:
  ; The quotient is unused, but the division is requested with fpexcept.strict,
  ; so the checks above expect the fdiv instruction to survive in the output.
  ; The block label must stay "entry": the generated checks match "// %entry".
  %quot = call float @llvm.experimental.constrained.fdiv.f32(
              float %x, float %y,
              metadata !"round.tonearest", metadata !"fpexcept.strict") #0
  ret void
}
; CHECK-LABEL: unused_div_round_dynamic:
; CHECK-NOT: fdiv
; CHECK: ret
define void @unused_div_round_dynamic(float %x, float %y) #0 {
; CHECK-LABEL: unused_div_round_dynamic:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: ret
entry:
%add = call float @llvm.experimental.constrained.fdiv.f32(float %x, float %y, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
ret void
@ -33,14 +42,14 @@ entry:
; Machine CSE should eliminate the second add unless we have strict exceptions
; CHECK-LABEL: add_twice:
; CHECK: fadd [[ADD:s[0-9]+]], s0, s1
; CHECK-NEXT: cmp w0, #0
; CHECK-NEXT: fmul [[MUL:s[0-9]+]], [[ADD]], [[ADD]]
; CHECK-NEXT: fcsel s0, [[ADD]], [[MUL]], eq
; CHECK-NEXT: ret
define float @add_twice(float %x, float %y, i32 %n) {
; CHECK-LABEL: add_twice:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: cmp w0, #0
; CHECK-NEXT: fmul s1, s0, s0
; CHECK-NEXT: fcsel s0, s0, s1, eq
; CHECK-NEXT: ret
entry:
%add = fadd float %x, %y
%tobool.not = icmp eq i32 %n, 0
@ -56,15 +65,17 @@ if.end:
ret float %a.0
}
; CHECK-LABEL: add_twice_fpexcept_strict:
; CHECK: fmov [[X:s[0-9]+]], s0
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: cbz w0, [[LABEL:.LBB[0-9_]+]]
; CHECK: fadd [[ADD:s[0-9]+]], [[X]], s1
; CHECK-NEXT: fmul s0, s0, [[ADD]]
; CHECK: [[LABEL]]:
; CHECK-NEXT: ret
define float @add_twice_fpexcept_strict(float %x, float %y, i32 %n) #0 {
; CHECK-LABEL: add_twice_fpexcept_strict:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: fmov s2, s0
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: cbz w0, .LBB4_2
; CHECK-NEXT: // %bb.1: // %if.then
; CHECK-NEXT: fadd s1, s2, s1
; CHECK-NEXT: fmul s0, s0, s1
; CHECK-NEXT: .LBB4_2: // %if.end
; CHECK-NEXT: ret
entry:
%add = call float @llvm.experimental.constrained.fadd.f32(float %x, float %y, metadata !"round.tonearest", metadata !"fpexcept.strict") #0
%tobool.not = icmp eq i32 %n, 0
@ -80,14 +91,15 @@ if.end:
ret float %a.0
}
; CHECK-LABEL: add_twice_round_dynamic:
; CHECK: fadd s0, s0, s1
; CHECK-NEXT: cbz w0, [[LABEL:.LBB[0-9_]+]]
; CHECK-NOT: fadd
; CHECK: fmul s0, s0, s0
; CHECK: [[LABEL]]:
; CHECK-NEXT: ret
define float @add_twice_round_dynamic(float %x, float %y, i32 %n) #0 {
; CHECK-LABEL: add_twice_round_dynamic:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: cbz w0, .LBB5_2
; CHECK-NEXT: // %bb.1: // %if.then
; CHECK-NEXT: fmul s0, s0, s0
; CHECK-NEXT: .LBB5_2: // %if.end
; CHECK-NEXT: ret
entry:
%add = call float @llvm.experimental.constrained.fadd.f32(float %x, float %y, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
%tobool.not = icmp eq i32 %n, 0
@ -108,17 +120,18 @@ if.end:
; dynamic (as they may give different results) or when we have strict exceptions
; (the llvm.set.rounding is irrelevant, but both could trap).
; CHECK-LABEL: set_rounding:
; CHECK-DAG: fadd [[SREG:s[0-9]+]], s0, s1
; CHECK-DAG: mrs [[XREG1:x[0-9]+]], FPCR
; CHECK-DAG: orr [[XREG2:x[0-9]+]], [[XREG1]], #0xc00000
; CHECK: msr FPCR, [[XREG2]]
; CHECK-NEXT: mrs [[XREG3:x[0-9]+]], FPCR
; CHECK-NEXT: and [[XREG4:x[0-9]+]], [[XREG3]], #0xffffffffff3fffff
; CHECK-NEXT: msr FPCR, [[XREG4]]
; CHECK-NEXT: fsub s0, [[SREG]], [[SREG]]
; CHECK-NEXT: ret
define float @set_rounding(float %x, float %y) {
; CHECK-LABEL: set_rounding:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: mrs x8, FPCR
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: orr x8, x8, #0xc00000
; CHECK-NEXT: msr FPCR, x8
; CHECK-NEXT: mrs x8, FPCR
; CHECK-NEXT: and x8, x8, #0xffffffffff3fffff
; CHECK-NEXT: msr FPCR, x8
; CHECK-NEXT: fsub s0, s0, s0
; CHECK-NEXT: ret
entry:
%add1 = fadd float %x, %y
call void @llvm.set.rounding(i32 0)
@ -128,18 +141,19 @@ entry:
ret float %sub
}
; CHECK-LABEL: set_rounding_fpexcept_strict:
; CHECK-DAG: fadd [[SREG1:s[0-9]+]], s0, s1
; CHECK-DAG: mrs [[XREG1:x[0-9]+]], FPCR
; CHECK-DAG: orr [[XREG2:x[0-9]+]], [[XREG1]], #0xc00000
; CHECK: msr FPCR, [[XREG2]]
; CHECK-DAG: fadd [[SREG2:s[0-9]+]], s0, s1
; CHECK-DAG: mrs [[XREG3:x[0-9]+]], FPCR
; CHECK-DAG: and [[XREG4:x[0-9]+]], [[XREG3]], #0xffffffffff3fffff
; CHECK-NEXT: msr FPCR, [[XREG4]]
; CHECK-NEXT: fsub s0, [[SREG1]], [[SREG2]]
; CHECK-NEXT: ret
define float @set_rounding_fpexcept_strict(float %x, float %y) #0 {
; CHECK-LABEL: set_rounding_fpexcept_strict:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: fadd s2, s0, s1
; CHECK-NEXT: mrs x8, FPCR
; CHECK-NEXT: orr x8, x8, #0xc00000
; CHECK-NEXT: msr FPCR, x8
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: mrs x8, FPCR
; CHECK-NEXT: and x8, x8, #0xffffffffff3fffff
; CHECK-NEXT: msr FPCR, x8
; CHECK-NEXT: fsub s0, s2, s0
; CHECK-NEXT: ret
entry:
%add1 = call float @llvm.experimental.constrained.fadd.f32(float %x, float %y, metadata !"round.tonearest", metadata !"fpexcept.strict") #0
call void @llvm.set.rounding(i32 0) #0
@ -149,18 +163,19 @@ entry:
ret float %sub
}
; CHECK-LABEL: set_rounding_round_dynamic:
; CHECK-DAG: fadd [[SREG1:s[0-9]+]], s0, s1
; CHECK-DAG: mrs [[XREG1:x[0-9]+]], FPCR
; CHECK-DAG: orr [[XREG2:x[0-9]+]], [[XREG1]], #0xc00000
; CHECK: msr FPCR, [[XREG2]]
; CHECK-DAG: fadd [[SREG2:s[0-9]+]], s0, s1
; CHECK-DAG: mrs [[XREG3:x[0-9]+]], FPCR
; CHECK-DAG: and [[XREG4:x[0-9]+]], [[XREG3]], #0xffffffffff3fffff
; CHECK-NEXT: msr FPCR, [[XREG4]]
; CHECK-NEXT: fsub s0, [[SREG1]], [[SREG2]]
; CHECK-NEXT: ret
define float @set_rounding_round_dynamic(float %x, float %y) #0 {
; CHECK-LABEL: set_rounding_round_dynamic:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: mrs x8, FPCR
; CHECK-NEXT: fadd s2, s0, s1
; CHECK-NEXT: orr x8, x8, #0xc00000
; CHECK-NEXT: msr FPCR, x8
; CHECK-NEXT: fadd s0, s0, s1
; CHECK-NEXT: mrs x8, FPCR
; CHECK-NEXT: and x8, x8, #0xffffffffff3fffff
; CHECK-NEXT: msr FPCR, x8
; CHECK-NEXT: fsub s0, s2, s0
; CHECK-NEXT: ret
entry:
%add1 = call float @llvm.experimental.constrained.fadd.f32(float %x, float %y, metadata !"round.dynamic", metadata !"fpexcept.ignore") #0
call void @llvm.set.rounding(i32 0) #0
@ -178,3 +193,6 @@ declare i32 @llvm.get.rounding()
declare void @llvm.set.rounding(i32)
attributes #0 = { strictfp }
;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
; CHECK-GI: {{.*}}
; CHECK-SD: {{.*}}