829 lines
58 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+sse2 | FileCheck %s -check-prefixes=X86,SSE2
; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+sse4.2 | FileCheck %s -check-prefixes=X86,SSE42
; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx | FileCheck %s -check-prefixes=X86,AVX1
; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx2 | FileCheck %s -check-prefixes=X86,AVX2
; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx512f | FileCheck %s -check-prefixes=X86,AVX512F
; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx512vl,avx512bw,avx512dq | FileCheck %s -check-prefixes=X86,AVX512BW
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+sse2 | FileCheck %s -check-prefixes=X64,SSE2
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+sse4.2 | FileCheck %s -check-prefixes=X64,SSE42
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx | FileCheck %s -check-prefixes=X64,AVX1
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx2 | FileCheck %s -check-prefixes=X64,AVX2
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx512f | FileCheck %s -check-prefixes=X64,AVX512F
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+avx512vl,+avx512bw,+avx512dq | FileCheck %s -check-prefixes=X64,AVX512BW
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+xop | FileCheck %s -check-prefixes=XOP
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+xop,+avx2 | FileCheck %s -check-prefixes=XOP
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+gfni,+ssse3 | FileCheck %s -check-prefixes=GFNISSE
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+gfni,+avx | FileCheck %s -check-prefixes=GFNIAVX
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+gfni,+avx2 | FileCheck %s -check-prefixes=GFNIAVX2
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+gfni,+avx512f | FileCheck %s -check-prefixes=GFNIAVX512F
; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -passes="print<cost-model>" 2>&1 -disable-output -cost-kind=all -mattr=+gfni,+avx512bw | FileCheck %s -check-prefixes=GFNIAVX512BW
; Verify the cost of scalar bitreverse instructions.
declare i64 @llvm.bitreverse.i64(i64)
declare i32 @llvm.bitreverse.i32(i32)
declare i16 @llvm.bitreverse.i16(i16)
declare i8 @llvm.bitreverse.i8(i8)
define i64 @var_bitreverse_i64(i64 %a) {
; X86-LABEL: 'var_bitreverse_i64'
; X86-NEXT: Cost Model: Found costs of RThru:18 CodeSize:34 Lat:24 SizeLat:38 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; X86-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; X64-LABEL: 'var_bitreverse_i64'
; X64-NEXT: Cost Model: Found costs of RThru:10 CodeSize:20 Lat:12 SizeLat:22 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; X64-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; XOP-LABEL: 'var_bitreverse_i64'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:3 Lat:2 SizeLat:4 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_i64'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_i64'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_i64'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_i64'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_i64'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i64 %bitreverse
;
%bitreverse = call i64 @llvm.bitreverse.i64(i64 %a)
ret i64 %bitreverse
}
define i32 @var_bitreverse_i32(i32 %a) {
; X86-LABEL: 'var_bitreverse_i32'
; X86-NEXT: Cost Model: Found costs of RThru:9 CodeSize:17 Lat:12 SizeLat:19 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; X86-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; X64-LABEL: 'var_bitreverse_i32'
; X64-NEXT: Cost Model: Found costs of RThru:9 CodeSize:17 Lat:12 SizeLat:19 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; X64-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; XOP-LABEL: 'var_bitreverse_i32'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:3 Lat:2 SizeLat:4 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_i32'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:5 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_i32'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:5 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_i32'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:5 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_i32'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:5 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_i32'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:5 for: %bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i32 %bitreverse
;
%bitreverse = call i32 @llvm.bitreverse.i32(i32 %a)
ret i32 %bitreverse
}
define i16 @var_bitreverse_i16(i16 %a) {
; X86-LABEL: 'var_bitreverse_i16'
; X86-NEXT: Cost Model: Found costs of RThru:9 CodeSize:17 Lat:12 SizeLat:19 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; X86-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; X64-LABEL: 'var_bitreverse_i16'
; X64-NEXT: Cost Model: Found costs of RThru:9 CodeSize:17 Lat:12 SizeLat:19 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; X64-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; XOP-LABEL: 'var_bitreverse_i16'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:3 Lat:2 SizeLat:4 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_i16'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_i16'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_i16'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_i16'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_i16'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:4 Lat:3 SizeLat:6 for: %bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i16 %bitreverse
;
%bitreverse = call i16 @llvm.bitreverse.i16(i16 %a)
ret i16 %bitreverse
}
define i8 @var_bitreverse_i8(i8 %a) {
; X86-LABEL: 'var_bitreverse_i8'
; X86-NEXT: Cost Model: Found costs of RThru:7 CodeSize:13 Lat:9 SizeLat:14 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; X86-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; X64-LABEL: 'var_bitreverse_i8'
; X64-NEXT: Cost Model: Found costs of RThru:7 CodeSize:13 Lat:9 SizeLat:14 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; X64-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; XOP-LABEL: 'var_bitreverse_i8'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:3 Lat:2 SizeLat:4 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_i8'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:3 CodeSize:3 Lat:3 SizeLat:4 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_i8'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:3 CodeSize:3 Lat:3 SizeLat:4 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_i8'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:3 Lat:3 SizeLat:4 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_i8'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:3 Lat:3 SizeLat:4 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_i8'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:3 Lat:3 SizeLat:4 for: %bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret i8 %bitreverse
;
%bitreverse = call i8 @llvm.bitreverse.i8(i8 %a)
ret i8 %bitreverse
}
; Verify the cost of vector bitreverse instructions.
declare <2 x i64> @llvm.bitreverse.v2i64(<2 x i64>)
declare <4 x i32> @llvm.bitreverse.v4i32(<4 x i32>)
declare <8 x i16> @llvm.bitreverse.v8i16(<8 x i16>)
declare <16 x i8> @llvm.bitreverse.v16i8(<16 x i8>)
declare <4 x i64> @llvm.bitreverse.v4i64(<4 x i64>)
declare <8 x i32> @llvm.bitreverse.v8i32(<8 x i32>)
declare <16 x i16> @llvm.bitreverse.v16i16(<16 x i16>)
declare <32 x i8> @llvm.bitreverse.v32i8(<32 x i8>)
declare <8 x i64> @llvm.bitreverse.v8i64(<8 x i64>)
declare <16 x i32> @llvm.bitreverse.v16i32(<16 x i32>)
declare <32 x i16> @llvm.bitreverse.v32i16(<32 x i16>)
declare <64 x i8> @llvm.bitreverse.v64i8(<64 x i8>)
define <2 x i64> @var_bitreverse_v2i64(<2 x i64> %a) {
; SSE2-LABEL: 'var_bitreverse_v2i64'
; SSE2-NEXT: Cost Model: Found costs of RThru:16 CodeSize:32 Lat:20 SizeLat:32 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v2i64'
; SSE42-NEXT: Cost Model: Found costs of RThru:16 CodeSize:11 Lat:20 SizeLat:21 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v2i64'
; AVX1-NEXT: Cost Model: Found costs of RThru:8 CodeSize:10 Lat:13 SizeLat:16 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v2i64'
; AVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v2i64'
; AVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v2i64'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:10 SizeLat:11 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v2i64'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:1 Lat:7 SizeLat:1 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v2i64'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v2i64'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v2i64'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v2i64'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v2i64'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <2 x i64> %bitreverse
;
%bitreverse = call <2 x i64> @llvm.bitreverse.v2i64(<2 x i64> %a)
ret <2 x i64> %bitreverse
}
define <4 x i64> @var_bitreverse_v4i64(<4 x i64> %a) {
; SSE2-LABEL: 'var_bitreverse_v4i64'
; SSE2-NEXT: Cost Model: Found costs of RThru:32 CodeSize:64 Lat:40 SizeLat:64 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v4i64'
; SSE42-NEXT: Cost Model: Found costs of RThru:32 CodeSize:22 Lat:40 SizeLat:42 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v4i64'
; AVX1-NEXT: Cost Model: Found costs of RThru:17 CodeSize:20 Lat:20 SizeLat:33 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v4i64'
; AVX2-NEXT: Cost Model: Found costs of RThru:5 CodeSize:10 Lat:11 SizeLat:17 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v4i64'
; AVX512F-NEXT: Cost Model: Found costs of RThru:5 CodeSize:10 Lat:11 SizeLat:17 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v4i64'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v4i64'
; XOP-NEXT: Cost Model: Found costs of RThru:3 CodeSize:5 Lat:6 SizeLat:6 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v4i64'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:16 SizeLat:8 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v4i64'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v4i64'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v4i64'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v4i64'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i64> %bitreverse
;
%bitreverse = call <4 x i64> @llvm.bitreverse.v4i64(<4 x i64> %a)
ret <4 x i64> %bitreverse
}
define <8 x i64> @var_bitreverse_v8i64(<8 x i64> %a) {
; SSE2-LABEL: 'var_bitreverse_v8i64'
; SSE2-NEXT: Cost Model: Found costs of RThru:64 CodeSize:128 Lat:80 SizeLat:128 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v8i64'
; SSE42-NEXT: Cost Model: Found costs of RThru:64 CodeSize:44 Lat:80 SizeLat:84 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v8i64'
; AVX1-NEXT: Cost Model: Found costs of RThru:34 CodeSize:40 Lat:40 SizeLat:66 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v8i64'
; AVX2-NEXT: Cost Model: Found costs of RThru:10 CodeSize:20 Lat:22 SizeLat:34 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v8i64'
; AVX512F-NEXT: Cost Model: Found costs of RThru:9 CodeSize:20 Lat:13 SizeLat:20 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v8i64'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:12 SizeLat:14 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v8i64'
; XOP-NEXT: Cost Model: Found costs of RThru:6 CodeSize:10 Lat:12 SizeLat:12 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v8i64'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:4 CodeSize:8 Lat:32 SizeLat:16 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v8i64'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:18 SizeLat:8 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v8i64'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:18 SizeLat:8 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v8i64'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v8i64'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i64> %bitreverse
;
%bitreverse = call <8 x i64> @llvm.bitreverse.v8i64(<8 x i64> %a)
ret <8 x i64> %bitreverse
}
define <4 x i32> @var_bitreverse_v4i32(<4 x i32> %a) {
; SSE2-LABEL: 'var_bitreverse_v4i32'
; SSE2-NEXT: Cost Model: Found costs of RThru:16 CodeSize:30 Lat:20 SizeLat:30 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v4i32'
; SSE42-NEXT: Cost Model: Found costs of RThru:16 CodeSize:11 Lat:20 SizeLat:21 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v4i32'
; AVX1-NEXT: Cost Model: Found costs of RThru:8 CodeSize:10 Lat:13 SizeLat:16 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v4i32'
; AVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v4i32'
; AVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v4i32'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:10 SizeLat:11 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v4i32'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:1 Lat:7 SizeLat:1 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v4i32'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v4i32'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v4i32'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v4i32'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v4i32'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i32> %bitreverse
;
%bitreverse = call <4 x i32> @llvm.bitreverse.v4i32(<4 x i32> %a)
ret <4 x i32> %bitreverse
}
define <8 x i32> @var_bitreverse_v8i32(<8 x i32> %a) {
; SSE2-LABEL: 'var_bitreverse_v8i32'
; SSE2-NEXT: Cost Model: Found costs of RThru:32 CodeSize:60 Lat:40 SizeLat:60 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v8i32'
; SSE42-NEXT: Cost Model: Found costs of RThru:32 CodeSize:22 Lat:40 SizeLat:42 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v8i32'
; AVX1-NEXT: Cost Model: Found costs of RThru:17 CodeSize:20 Lat:20 SizeLat:33 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v8i32'
; AVX2-NEXT: Cost Model: Found costs of RThru:5 CodeSize:10 Lat:11 SizeLat:17 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v8i32'
; AVX512F-NEXT: Cost Model: Found costs of RThru:5 CodeSize:10 Lat:11 SizeLat:17 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v8i32'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v8i32'
; XOP-NEXT: Cost Model: Found costs of RThru:3 CodeSize:5 Lat:6 SizeLat:6 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v8i32'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:16 SizeLat:8 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v8i32'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v8i32'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v8i32'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v8i32'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i32> %bitreverse
;
%bitreverse = call <8 x i32> @llvm.bitreverse.v8i32(<8 x i32> %a)
ret <8 x i32> %bitreverse
}
define <16 x i32> @var_bitreverse_v16i32(<16 x i32> %a) {
; SSE2-LABEL: 'var_bitreverse_v16i32'
; SSE2-NEXT: Cost Model: Found costs of RThru:64 CodeSize:120 Lat:80 SizeLat:120 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v16i32'
; SSE42-NEXT: Cost Model: Found costs of RThru:64 CodeSize:44 Lat:80 SizeLat:84 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v16i32'
; AVX1-NEXT: Cost Model: Found costs of RThru:34 CodeSize:40 Lat:40 SizeLat:66 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v16i32'
; AVX2-NEXT: Cost Model: Found costs of RThru:10 CodeSize:20 Lat:22 SizeLat:34 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v16i32'
; AVX512F-NEXT: Cost Model: Found costs of RThru:9 CodeSize:20 Lat:13 SizeLat:20 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v16i32'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:12 SizeLat:14 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v16i32'
; XOP-NEXT: Cost Model: Found costs of RThru:6 CodeSize:10 Lat:12 SizeLat:12 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v16i32'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:4 CodeSize:8 Lat:32 SizeLat:16 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v16i32'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:18 SizeLat:8 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v16i32'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:18 SizeLat:8 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v16i32'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v16i32'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i32> %bitreverse
;
%bitreverse = call <16 x i32> @llvm.bitreverse.v16i32(<16 x i32> %a)
ret <16 x i32> %bitreverse
}
define <8 x i16> @var_bitreverse_v8i16(<8 x i16> %a) {
; SSE2-LABEL: 'var_bitreverse_v8i16'
; SSE2-NEXT: Cost Model: Found costs of RThru:16 CodeSize:25 Lat:20 SizeLat:25 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v8i16'
; SSE42-NEXT: Cost Model: Found costs of RThru:16 CodeSize:11 Lat:20 SizeLat:21 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v8i16'
; AVX1-NEXT: Cost Model: Found costs of RThru:8 CodeSize:10 Lat:13 SizeLat:16 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v8i16'
; AVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v8i16'
; AVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v8i16'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:10 SizeLat:11 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v8i16'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:1 Lat:7 SizeLat:1 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v8i16'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v8i16'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v8i16'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v8i16'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v8i16'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:8 SizeLat:4 for: %bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i16> %bitreverse
;
%bitreverse = call <8 x i16> @llvm.bitreverse.v8i16(<8 x i16> %a)
ret <8 x i16> %bitreverse
}
define <16 x i16> @var_bitreverse_v16i16(<16 x i16> %a) {
; SSE2-LABEL: 'var_bitreverse_v16i16'
; SSE2-NEXT: Cost Model: Found costs of RThru:32 CodeSize:50 Lat:40 SizeLat:50 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v16i16'
; SSE42-NEXT: Cost Model: Found costs of RThru:32 CodeSize:22 Lat:40 SizeLat:42 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v16i16'
; AVX1-NEXT: Cost Model: Found costs of RThru:17 CodeSize:20 Lat:20 SizeLat:33 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v16i16'
; AVX2-NEXT: Cost Model: Found costs of RThru:5 CodeSize:10 Lat:11 SizeLat:17 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v16i16'
; AVX512F-NEXT: Cost Model: Found costs of RThru:5 CodeSize:10 Lat:11 SizeLat:17 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v16i16'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:11 SizeLat:11 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v16i16'
; XOP-NEXT: Cost Model: Found costs of RThru:3 CodeSize:5 Lat:6 SizeLat:6 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v16i16'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:16 SizeLat:8 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v16i16'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v16i16'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v16i16'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v16i16'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i16> %bitreverse
;
%bitreverse = call <16 x i16> @llvm.bitreverse.v16i16(<16 x i16> %a)
ret <16 x i16> %bitreverse
}
define <32 x i16> @var_bitreverse_v32i16(<32 x i16> %a) {
; SSE2-LABEL: 'var_bitreverse_v32i16'
; SSE2-NEXT: Cost Model: Found costs of RThru:64 CodeSize:100 Lat:80 SizeLat:100 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v32i16'
; SSE42-NEXT: Cost Model: Found costs of RThru:64 CodeSize:44 Lat:80 SizeLat:84 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v32i16'
; AVX1-NEXT: Cost Model: Found costs of RThru:34 CodeSize:40 Lat:40 SizeLat:66 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v32i16'
; AVX2-NEXT: Cost Model: Found costs of RThru:10 CodeSize:20 Lat:22 SizeLat:34 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v32i16'
; AVX512F-NEXT: Cost Model: Found costs of RThru:9 CodeSize:20 Lat:13 SizeLat:20 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v32i16'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:3 CodeSize:10 Lat:12 SizeLat:14 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v32i16'
; XOP-NEXT: Cost Model: Found costs of RThru:6 CodeSize:10 Lat:12 SizeLat:12 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v32i16'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:4 CodeSize:8 Lat:32 SizeLat:16 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v32i16'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:18 SizeLat:8 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v32i16'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:2 CodeSize:4 Lat:18 SizeLat:8 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v32i16'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v32i16'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:2 Lat:9 SizeLat:4 for: %bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i16> %bitreverse
;
%bitreverse = call <32 x i16> @llvm.bitreverse.v32i16(<32 x i16> %a)
ret <32 x i16> %bitreverse
}
define <16 x i8> @var_bitreverse_v16i8(<16 x i8> %a) {
; SSE2-LABEL: 'var_bitreverse_v16i8'
; SSE2-NEXT: Cost Model: Found costs of RThru:11 CodeSize:21 Lat:12 SizeLat:21 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v16i8'
; SSE42-NEXT: Cost Model: Found costs of RThru:11 CodeSize:10 Lat:12 SizeLat:16 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v16i8'
; AVX1-NEXT: Cost Model: Found costs of RThru:7 CodeSize:9 Lat:7 SizeLat:13 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v16i8'
; AVX2-NEXT: Cost Model: Found costs of RThru:3 CodeSize:9 Lat:6 SizeLat:9 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v16i8'
; AVX512F-NEXT: Cost Model: Found costs of RThru:3 CodeSize:9 Lat:6 SizeLat:9 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v16i8'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:2 CodeSize:9 Lat:5 SizeLat:9 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v16i8'
; XOP-NEXT: Cost Model: Found costs of RThru:2 CodeSize:1 Lat:7 SizeLat:1 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v16i8'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v16i8'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v16i8'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v16i8'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v16i8'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <16 x i8> %bitreverse
;
%bitreverse = call <16 x i8> @llvm.bitreverse.v16i8(<16 x i8> %a)
ret <16 x i8> %bitreverse
}
define <32 x i8> @var_bitreverse_v32i8(<32 x i8> %a) {
; SSE2-LABEL: 'var_bitreverse_v32i8'
; SSE2-NEXT: Cost Model: Found costs of RThru:22 CodeSize:42 Lat:24 SizeLat:42 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v32i8'
; SSE42-NEXT: Cost Model: Found costs of RThru:22 CodeSize:20 Lat:24 SizeLat:32 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v32i8'
; AVX1-NEXT: Cost Model: Found costs of RThru:13 CodeSize:17 Lat:15 SizeLat:26 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v32i8'
; AVX2-NEXT: Cost Model: Found costs of RThru:4 CodeSize:9 Lat:5 SizeLat:15 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v32i8'
; AVX512F-NEXT: Cost Model: Found costs of RThru:4 CodeSize:9 Lat:5 SizeLat:15 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v32i8'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:2 CodeSize:9 Lat:5 SizeLat:9 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v32i8'
; XOP-NEXT: Cost Model: Found costs of RThru:3 CodeSize:5 Lat:6 SizeLat:6 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v32i8'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:2 CodeSize:2 Lat:12 SizeLat:4 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v32i8'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v32i8'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v32i8'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v32i8'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <32 x i8> %bitreverse
;
%bitreverse = call <32 x i8> @llvm.bitreverse.v32i8(<32 x i8> %a)
ret <32 x i8> %bitreverse
}
define <64 x i8> @var_bitreverse_v64i8(<64 x i8> %a) {
; SSE2-LABEL: 'var_bitreverse_v64i8'
; SSE2-NEXT: Cost Model: Found costs of RThru:44 CodeSize:84 Lat:48 SizeLat:84 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; SSE2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; SSE42-LABEL: 'var_bitreverse_v64i8'
; SSE42-NEXT: Cost Model: Found costs of RThru:44 CodeSize:40 Lat:48 SizeLat:64 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; SSE42-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; AVX1-LABEL: 'var_bitreverse_v64i8'
; AVX1-NEXT: Cost Model: Found costs of RThru:26 CodeSize:34 Lat:30 SizeLat:52 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; AVX1-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; AVX2-LABEL: 'var_bitreverse_v64i8'
; AVX2-NEXT: Cost Model: Found costs of RThru:8 CodeSize:18 Lat:10 SizeLat:30 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; AVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; AVX512F-LABEL: 'var_bitreverse_v64i8'
; AVX512F-NEXT: Cost Model: Found costs of RThru:6 CodeSize:17 Lat:11 SizeLat:17 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; AVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; AVX512BW-LABEL: 'var_bitreverse_v64i8'
; AVX512BW-NEXT: Cost Model: Found costs of RThru:2 CodeSize:9 Lat:5 SizeLat:12 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; AVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; XOP-LABEL: 'var_bitreverse_v64i8'
; XOP-NEXT: Cost Model: Found costs of RThru:6 CodeSize:10 Lat:12 SizeLat:12 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; XOP-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; GFNISSE-LABEL: 'var_bitreverse_v64i8'
; GFNISSE-NEXT: Cost Model: Found costs of RThru:4 CodeSize:4 Lat:24 SizeLat:8 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; GFNISSE-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; GFNIAVX-LABEL: 'var_bitreverse_v64i8'
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:2 CodeSize:2 Lat:12 SizeLat:4 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; GFNIAVX-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; GFNIAVX2-LABEL: 'var_bitreverse_v64i8'
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:2 CodeSize:2 Lat:12 SizeLat:4 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; GFNIAVX2-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; GFNIAVX512F-LABEL: 'var_bitreverse_v64i8'
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; GFNIAVX512F-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
; GFNIAVX512BW-LABEL: 'var_bitreverse_v64i8'
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:1 CodeSize:1 Lat:6 SizeLat:2 for: %bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
; GFNIAVX512BW-NEXT: Cost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <64 x i8> %bitreverse
;
%bitreverse = call <64 x i8> @llvm.bitreverse.v64i8(<64 x i8> %a)
ret <64 x i8> %bitreverse
}