Type legalization can promote constant operands. The MULHU optimization `mulhu x, (1 << c) -> x >> (bitwidth - c)` was failing when constants were promoted because: 1. `isConstantOrConstantVector` check rejected promoted constants 2. `BuildLogBase2` -> `takeInexpensiveLog2` -> `matchUnaryPredicate` rejected promoted constants This fixes both by adding `AllowTruncation=true`, following the pattern from the recent UDIV fix (#169491).
243 lines
9.9 KiB
LLVM
243 lines
9.9 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mtriple=riscv32 -mattr=+v -verify-machineinstrs < %s | FileCheck %s --check-prefixes=CHECK,RV32
|
|
; RUN: llc -mtriple=riscv64 -mattr=+v -verify-machineinstrs < %s | FileCheck %s --check-prefixes=CHECK,RV64
|
|
|
|
define <vscale x 1 x i32> @vmulhu_vv_nxv1i32(<vscale x 1 x i32> %va, <vscale x 1 x i32> %vb) {
|
|
; CHECK-LABEL: vmulhu_vv_nxv1i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, mf2, ta, ma
|
|
; CHECK-NEXT: vmulhu.vv v8, v9, v8
|
|
; CHECK-NEXT: ret
|
|
%vc = zext <vscale x 1 x i32> %vb to <vscale x 1 x i64>
|
|
%vd = zext <vscale x 1 x i32> %va to <vscale x 1 x i64>
|
|
%ve = mul <vscale x 1 x i64> %vc, %vd
|
|
%vf = lshr <vscale x 1 x i64> %ve, splat (i64 32)
|
|
%vg = trunc <vscale x 1 x i64> %vf to <vscale x 1 x i32>
|
|
ret <vscale x 1 x i32> %vg
|
|
}
|
|
|
|
define <vscale x 1 x i32> @vmulhu_vx_nxv1i32(<vscale x 1 x i32> %va, i32 %x) {
|
|
; CHECK-LABEL: vmulhu_vx_nxv1i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, mf2, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%head1 = insertelement <vscale x 1 x i32> poison, i32 %x, i32 0
|
|
%splat1 = shufflevector <vscale x 1 x i32> %head1, <vscale x 1 x i32> poison, <vscale x 1 x i32> zeroinitializer
|
|
%vb = zext <vscale x 1 x i32> %splat1 to <vscale x 1 x i64>
|
|
%vc = zext <vscale x 1 x i32> %va to <vscale x 1 x i64>
|
|
%vd = mul <vscale x 1 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 1 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 1 x i64> %ve to <vscale x 1 x i32>
|
|
ret <vscale x 1 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 1 x i32> @vmulhu_vi_nxv1i32_0(<vscale x 1 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv1i32_0:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: li a0, -7
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, mf2, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 1 x i32> splat (i32 -7) to <vscale x 1 x i64>
|
|
%vc = zext <vscale x 1 x i32> %va to <vscale x 1 x i64>
|
|
%vd = mul <vscale x 1 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 1 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 1 x i64> %ve to <vscale x 1 x i32>
|
|
ret <vscale x 1 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 1 x i32> @vmulhu_vi_nxv1i32_1(<vscale x 1 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv1i32_1:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, mf2, ta, ma
|
|
; CHECK-NEXT: vsrl.vi v8, v8, 28
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 1 x i32> splat (i32 16) to <vscale x 1 x i64>
|
|
%vc = zext <vscale x 1 x i32> %va to <vscale x 1 x i64>
|
|
%vd = mul <vscale x 1 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 1 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 1 x i64> %ve to <vscale x 1 x i32>
|
|
ret <vscale x 1 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 2 x i32> @vmulhu_vv_nxv2i32(<vscale x 2 x i32> %va, <vscale x 2 x i32> %vb) {
|
|
; CHECK-LABEL: vmulhu_vv_nxv2i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, m1, ta, ma
|
|
; CHECK-NEXT: vmulhu.vv v8, v9, v8
|
|
; CHECK-NEXT: ret
|
|
%vc = zext <vscale x 2 x i32> %vb to <vscale x 2 x i64>
|
|
%vd = zext <vscale x 2 x i32> %va to <vscale x 2 x i64>
|
|
%ve = mul <vscale x 2 x i64> %vc, %vd
|
|
%vf = lshr <vscale x 2 x i64> %ve, splat (i64 32)
|
|
%vg = trunc <vscale x 2 x i64> %vf to <vscale x 2 x i32>
|
|
ret <vscale x 2 x i32> %vg
|
|
}
|
|
|
|
define <vscale x 2 x i32> @vmulhu_vx_nxv2i32(<vscale x 2 x i32> %va, i32 %x) {
|
|
; CHECK-LABEL: vmulhu_vx_nxv2i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, m1, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%head1 = insertelement <vscale x 2 x i32> poison, i32 %x, i32 0
|
|
%splat1 = shufflevector <vscale x 2 x i32> %head1, <vscale x 2 x i32> poison, <vscale x 2 x i32> zeroinitializer
|
|
%vb = zext <vscale x 2 x i32> %splat1 to <vscale x 2 x i64>
|
|
%vc = zext <vscale x 2 x i32> %va to <vscale x 2 x i64>
|
|
%vd = mul <vscale x 2 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 2 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 2 x i64> %ve to <vscale x 2 x i32>
|
|
ret <vscale x 2 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 2 x i32> @vmulhu_vi_nxv2i32_0(<vscale x 2 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv2i32_0:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: li a0, -7
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, m1, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 2 x i32> splat (i32 -7) to <vscale x 2 x i64>
|
|
%vc = zext <vscale x 2 x i32> %va to <vscale x 2 x i64>
|
|
%vd = mul <vscale x 2 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 2 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 2 x i64> %ve to <vscale x 2 x i32>
|
|
ret <vscale x 2 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 2 x i32> @vmulhu_vi_nxv2i32_1(<vscale x 2 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv2i32_1:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, m1, ta, ma
|
|
; CHECK-NEXT: vsrl.vi v8, v8, 28
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 2 x i32> splat (i32 16) to <vscale x 2 x i64>
|
|
%vc = zext <vscale x 2 x i32> %va to <vscale x 2 x i64>
|
|
%vd = mul <vscale x 2 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 2 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 2 x i64> %ve to <vscale x 2 x i32>
|
|
ret <vscale x 2 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 4 x i32> @vmulhu_vv_nxv4i32(<vscale x 4 x i32> %va, <vscale x 4 x i32> %vb) {
|
|
; CHECK-LABEL: vmulhu_vv_nxv4i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, m2, ta, ma
|
|
; CHECK-NEXT: vmulhu.vv v8, v10, v8
|
|
; CHECK-NEXT: ret
|
|
%vc = zext <vscale x 4 x i32> %vb to <vscale x 4 x i64>
|
|
%vd = zext <vscale x 4 x i32> %va to <vscale x 4 x i64>
|
|
%ve = mul <vscale x 4 x i64> %vc, %vd
|
|
%vf = lshr <vscale x 4 x i64> %ve, splat (i64 32)
|
|
%vg = trunc <vscale x 4 x i64> %vf to <vscale x 4 x i32>
|
|
ret <vscale x 4 x i32> %vg
|
|
}
|
|
|
|
define <vscale x 4 x i32> @vmulhu_vx_nxv4i32(<vscale x 4 x i32> %va, i32 %x) {
|
|
; CHECK-LABEL: vmulhu_vx_nxv4i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, m2, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%head1 = insertelement <vscale x 4 x i32> poison, i32 %x, i32 0
|
|
%splat1 = shufflevector <vscale x 4 x i32> %head1, <vscale x 4 x i32> poison, <vscale x 4 x i32> zeroinitializer
|
|
%vb = zext <vscale x 4 x i32> %splat1 to <vscale x 4 x i64>
|
|
%vc = zext <vscale x 4 x i32> %va to <vscale x 4 x i64>
|
|
%vd = mul <vscale x 4 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 4 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 4 x i64> %ve to <vscale x 4 x i32>
|
|
ret <vscale x 4 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 4 x i32> @vmulhu_vi_nxv4i32_0(<vscale x 4 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv4i32_0:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: li a0, -7
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, m2, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 4 x i32> splat (i32 -7) to <vscale x 4 x i64>
|
|
%vc = zext <vscale x 4 x i32> %va to <vscale x 4 x i64>
|
|
%vd = mul <vscale x 4 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 4 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 4 x i64> %ve to <vscale x 4 x i32>
|
|
ret <vscale x 4 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 4 x i32> @vmulhu_vi_nxv4i32_1(<vscale x 4 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv4i32_1:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, m2, ta, ma
|
|
; CHECK-NEXT: vsrl.vi v8, v8, 28
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 4 x i32> splat (i32 16) to <vscale x 4 x i64>
|
|
%vc = zext <vscale x 4 x i32> %va to <vscale x 4 x i64>
|
|
%vd = mul <vscale x 4 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 4 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 4 x i64> %ve to <vscale x 4 x i32>
|
|
ret <vscale x 4 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 8 x i32> @vmulhu_vv_nxv8i32(<vscale x 8 x i32> %va, <vscale x 8 x i32> %vb) {
|
|
; CHECK-LABEL: vmulhu_vv_nxv8i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, m4, ta, ma
|
|
; CHECK-NEXT: vmulhu.vv v8, v12, v8
|
|
; CHECK-NEXT: ret
|
|
%vc = zext <vscale x 8 x i32> %vb to <vscale x 8 x i64>
|
|
%vd = zext <vscale x 8 x i32> %va to <vscale x 8 x i64>
|
|
%ve = mul <vscale x 8 x i64> %vc, %vd
|
|
%vf = lshr <vscale x 8 x i64> %ve, splat (i64 32)
|
|
%vg = trunc <vscale x 8 x i64> %vf to <vscale x 8 x i32>
|
|
ret <vscale x 8 x i32> %vg
|
|
}
|
|
|
|
define <vscale x 8 x i32> @vmulhu_vx_nxv8i32(<vscale x 8 x i32> %va, i32 %x) {
|
|
; CHECK-LABEL: vmulhu_vx_nxv8i32:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, m4, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%head1 = insertelement <vscale x 8 x i32> poison, i32 %x, i32 0
|
|
%splat1 = shufflevector <vscale x 8 x i32> %head1, <vscale x 8 x i32> poison, <vscale x 8 x i32> zeroinitializer
|
|
%vb = zext <vscale x 8 x i32> %splat1 to <vscale x 8 x i64>
|
|
%vc = zext <vscale x 8 x i32> %va to <vscale x 8 x i64>
|
|
%vd = mul <vscale x 8 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 8 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 8 x i64> %ve to <vscale x 8 x i32>
|
|
ret <vscale x 8 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 8 x i32> @vmulhu_vi_nxv8i32_0(<vscale x 8 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv8i32_0:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: li a0, -7
|
|
; CHECK-NEXT: vsetvli a1, zero, e32, m4, ta, ma
|
|
; CHECK-NEXT: vmulhu.vx v8, v8, a0
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 8 x i32> splat (i32 -7) to <vscale x 8 x i64>
|
|
%vc = zext <vscale x 8 x i32> %va to <vscale x 8 x i64>
|
|
%vd = mul <vscale x 8 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 8 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 8 x i64> %ve to <vscale x 8 x i32>
|
|
ret <vscale x 8 x i32> %vf
|
|
}
|
|
|
|
define <vscale x 8 x i32> @vmulhu_vi_nxv8i32_1(<vscale x 8 x i32> %va) {
|
|
; CHECK-LABEL: vmulhu_vi_nxv8i32_1:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vsetvli a0, zero, e32, m4, ta, ma
|
|
; CHECK-NEXT: vsrl.vi v8, v8, 28
|
|
; CHECK-NEXT: ret
|
|
%vb = zext <vscale x 8 x i32> splat (i32 16) to <vscale x 8 x i64>
|
|
%vc = zext <vscale x 8 x i32> %va to <vscale x 8 x i64>
|
|
%vd = mul <vscale x 8 x i64> %vb, %vc
|
|
%ve = lshr <vscale x 8 x i64> %vd, splat (i64 32)
|
|
%vf = trunc <vscale x 8 x i64> %ve to <vscale x 8 x i32>
|
|
ret <vscale x 8 x i32> %vf
|
|
}
|
|
;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line:
|
|
; RV32: {{.*}}
|
|
; RV64: {{.*}}
|