
Running the `vector-combine` pass on this test now produces a single shuffle on a loaded `<1 x float>` instead of an insert into a `<2 x float>` followed by a shuffle. This test change matches changes in other tests in PR #144690, which introduced the optimization.
21 lines
911 B
LLVM
21 lines
911 B
LLVM
; RUN: opt -S -passes=vector-combine < %s | FileCheck %s
|
|
|
|
target datalayout = "e-m:e-p:32:32-i1:32-i8:8-i16:16-i32:32-i64:64-f16:16-f32:32-f64:64-n8:16:32:64"
|
|
target triple = "dxil-unknown-shadermodel6.7-library"
|
|
|
|
; Make sure vec combine min vec size is 1 instead of 4 for float.
|
|
; CHECK:@foo()
|
|
; CHECK-NEXT:%[[LD:[0-9]+]] = load <1 x float>, ptr @a, align 8
|
|
; CHECK-NEXT:%shuffle = shufflevector <1 x float> %[[LD]], <1 x float> poison, <2 x i32> zeroinitializer
|
|
; CHECK-NEXT:ret <2 x float> %shuffle
|
|
|
|
@a = external local_unnamed_addr constant float
|
|
|
|
; Function Attrs: mustprogress nofree norecurse nosync nounwind readnone willreturn
|
|
define noundef <2 x float> @foo() local_unnamed_addr {
|
|
%1 = load float, ptr @a, align 8
|
|
%insert = insertelement <2 x float> poison, float %1, i64 0
|
|
%shuffle = shufflevector <2 x float> %insert, <2 x float> poison, <2 x i32> zeroinitializer
|
|
ret <2 x float> %shuffle
|
|
}
|