154 lines
6.9 KiB
LLVM
154 lines
6.9 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
|
; RUN: llc --mtriple=loongarch64 --mattr=+lasx < %s | FileCheck %s
|
|
|
|
declare <8 x float> @llvm.powi.v8f32.i32(<8 x float>, i32)
|
|
|
|
define <8 x float> @powi_v8f32(<8 x float> %va, i32 %b) nounwind {
|
|
; CHECK-LABEL: powi_v8f32:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: addi.d $sp, $sp, -128
|
|
; CHECK-NEXT: st.d $ra, $sp, 120 # 8-byte Folded Spill
|
|
; CHECK-NEXT: st.d $fp, $sp, 112 # 8-byte Folded Spill
|
|
; CHECK-NEXT: xvst $xr0, $sp, 80 # 32-byte Folded Spill
|
|
; CHECK-NEXT: addi.w $fp, $a0, 0
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 5
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $vr0
|
|
; CHECK-NEXT: vst $vr0, $sp, 48 # 16-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 4
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $xr0
|
|
; CHECK-NEXT: vld $vr1, $sp, 48 # 16-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.w $vr0, $vr1, 16
|
|
; CHECK-NEXT: xvst $xr0, $sp, 48 # 32-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 6
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $vr0
|
|
; CHECK-NEXT: xvld $xr1, $sp, 48 # 32-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.w $vr1, $vr0, 32
|
|
; CHECK-NEXT: xvst $xr1, $sp, 48 # 32-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 7
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $vr0
|
|
; CHECK-NEXT: xvld $xr1, $sp, 48 # 32-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.w $vr1, $vr0, 48
|
|
; CHECK-NEXT: xvst $xr1, $sp, 48 # 32-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 1
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $vr0
|
|
; CHECK-NEXT: vst $vr0, $sp, 16 # 16-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $xr0
|
|
; CHECK-NEXT: vld $vr1, $sp, 16 # 16-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.w $vr0, $vr1, 16
|
|
; CHECK-NEXT: xvst $xr0, $sp, 16 # 32-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 2
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $vr0
|
|
; CHECK-NEXT: xvld $xr1, $sp, 16 # 32-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.w $vr1, $vr0, 32
|
|
; CHECK-NEXT: xvst $xr1, $sp, 16 # 32-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 80 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.w $xr0, $xr0, 3
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powisf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0 killed $f0 def $vr0
|
|
; CHECK-NEXT: xvld $xr1, $sp, 16 # 32-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.w $vr1, $vr0, 48
|
|
; CHECK-NEXT: xvld $xr0, $sp, 48 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpermi.q $xr1, $xr0, 2
|
|
; CHECK-NEXT: xvori.b $xr0, $xr1, 0
|
|
; CHECK-NEXT: ld.d $fp, $sp, 112 # 8-byte Folded Reload
|
|
; CHECK-NEXT: ld.d $ra, $sp, 120 # 8-byte Folded Reload
|
|
; CHECK-NEXT: addi.d $sp, $sp, 128
|
|
; CHECK-NEXT: ret
|
|
entry:
|
|
%res = call <8 x float> @llvm.powi.v8f32.i32(<8 x float> %va, i32 %b)
|
|
ret <8 x float> %res
|
|
}
|
|
|
|
declare <4 x double> @llvm.powi.v4f64.i32(<4 x double>, i32)
|
|
|
|
define <4 x double> @powi_v4f64(<4 x double> %va, i32 %b) nounwind {
|
|
; CHECK-LABEL: powi_v4f64:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: addi.d $sp, $sp, -112
|
|
; CHECK-NEXT: st.d $ra, $sp, 104 # 8-byte Folded Spill
|
|
; CHECK-NEXT: st.d $fp, $sp, 96 # 8-byte Folded Spill
|
|
; CHECK-NEXT: xvst $xr0, $sp, 64 # 32-byte Folded Spill
|
|
; CHECK-NEXT: addi.w $fp, $a0, 0
|
|
; CHECK-NEXT: xvpickve.d $xr0, $xr0, 3
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powidf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 def $vr0
|
|
; CHECK-NEXT: vst $vr0, $sp, 32 # 16-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 64 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.d $xr0, $xr0, 2
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powidf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 def $xr0
|
|
; CHECK-NEXT: vld $vr1, $sp, 32 # 16-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.d $vr0, $vr1, 16
|
|
; CHECK-NEXT: xvst $xr0, $sp, 32 # 32-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 64 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.d $xr0, $xr0, 1
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powidf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 def $vr0
|
|
; CHECK-NEXT: vst $vr0, $sp, 16 # 16-byte Folded Spill
|
|
; CHECK-NEXT: xvld $xr0, $sp, 64 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpickve.d $xr0, $xr0, 0
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 killed $xr0
|
|
; CHECK-NEXT: move $a0, $fp
|
|
; CHECK-NEXT: pcaddu18i $ra, %call36(__powidf2)
|
|
; CHECK-NEXT: jirl $ra, $ra, 0
|
|
; CHECK-NEXT: # kill: def $f0_64 killed $f0_64 def $xr0
|
|
; CHECK-NEXT: vld $vr1, $sp, 16 # 16-byte Folded Reload
|
|
; CHECK-NEXT: vextrins.d $vr0, $vr1, 16
|
|
; CHECK-NEXT: xvld $xr1, $sp, 32 # 32-byte Folded Reload
|
|
; CHECK-NEXT: xvpermi.q $xr0, $xr1, 2
|
|
; CHECK-NEXT: ld.d $fp, $sp, 96 # 8-byte Folded Reload
|
|
; CHECK-NEXT: ld.d $ra, $sp, 104 # 8-byte Folded Reload
|
|
; CHECK-NEXT: addi.d $sp, $sp, 112
|
|
; CHECK-NEXT: ret
|
|
entry:
|
|
%res = call <4 x double> @llvm.powi.v4f64.i32(<4 x double> %va, i32 %b)
|
|
ret <4 x double> %res
|
|
}
|