[LV] Regenerate some more tests.
This commit is contained in:
parent
6b316ecb5f
commit
8a0c7e9b32
@ -1,3 +1,4 @@
|
|||||||
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --filter-out-after "scalar.ph\:" --version 5
|
||||||
; REQUIRES: asserts
|
; REQUIRES: asserts
|
||||||
; RUN: opt < %s -aa-pipeline=basic-aa -passes=loop-vectorize,instcombine -S -debug-only=loop-vectorize -disable-output -print-after=instcombine 2>&1 | FileCheck %s
|
; RUN: opt < %s -aa-pipeline=basic-aa -passes=loop-vectorize,instcombine -S -debug-only=loop-vectorize -disable-output -print-after=instcombine 2>&1 | FileCheck %s
|
||||||
; RUN: opt < %s -passes=loop-vectorize -force-vector-width=2 -S | FileCheck %s -check-prefix=FORCE
|
; RUN: opt < %s -passes=loop-vectorize -force-vector-width=2 -S | FileCheck %s -check-prefix=FORCE
|
||||||
@ -18,32 +19,119 @@ target triple = "x86_64-unknown-linux-gnu"
|
|||||||
; CHECK-NOT: LV: Found uniform instruction: %tmp3 = getelementptr inbounds %data, ptr %d, i64 0, i32 0, i64 %i
|
; CHECK-NOT: LV: Found uniform instruction: %tmp3 = getelementptr inbounds %data, ptr %d, i64 0, i32 0, i64 %i
|
||||||
; CHECK-NOT: LV: Found uniform instruction: %i = phi i64 [ %i.next, %for.body ], [ 0, %entry ]
|
; CHECK-NOT: LV: Found uniform instruction: %i = phi i64 [ %i.next, %for.body ], [ 0, %entry ]
|
||||||
; CHECK-NOT: LV: Found uniform instruction: %i.next = add nuw nsw i64 %i, 5
|
; CHECK-NOT: LV: Found uniform instruction: %i.next = add nuw nsw i64 %i, 5
|
||||||
; CHECK: define void @PR31671(
|
|
||||||
; CHECK: vector.ph:
|
|
||||||
; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <16 x float> poison, float %x, i64 0
|
|
||||||
; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <16 x float> [[BROADCAST_SPLATINSERT]], <16 x float> poison, <16 x i32> zeroinitializer
|
|
||||||
; CHECK-NEXT: br label %vector.body
|
|
||||||
; CHECK: vector.body:
|
|
||||||
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %vector.ph ], [ [[INDEX_NEXT:%.*]], %vector.body ]
|
|
||||||
; CHECK-NEXT: [[VEC_IND:%.*]] = phi <16 x i64> [ <i64 0, i64 5, i64 10, i64 15, i64 20, i64 25, i64 30, i64 35, i64 40, i64 45, i64 50, i64 55, i64 60, i64 65, i64 70, i64 75>, %vector.ph ], [ [[VEC_IND_NEXT:%.*]], %vector.body ]
|
|
||||||
; CHECK-NEXT: [[OFFSET_IDX:%.*]] = mul i64 [[INDEX]], 5
|
|
||||||
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds %data, ptr %d, i64 0, i32 3, i64 [[OFFSET_IDX]]
|
|
||||||
; CHECK-NEXT: [[WIDE_VEC:%.*]] = load <80 x float>, ptr [[TMP0]], align 4
|
|
||||||
; CHECK-NEXT: [[STRIDED_VEC:%.*]] = shufflevector <80 x float> [[WIDE_VEC]], <80 x float> poison, <16 x i32> <i32 0, i32 5, i32 10, i32 15, i32 20, i32 25, i32 30, i32 35, i32 40, i32 45, i32 50, i32 55, i32 60, i32 65, i32 70, i32 75>
|
|
||||||
; CHECK-NEXT: [[TMP2:%.*]] = fmul <16 x float> [[BROADCAST_SPLAT]], [[STRIDED_VEC]]
|
|
||||||
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds %data, ptr %d, i64 0, i32 0, <16 x i64> [[VEC_IND]]
|
|
||||||
; CHECK-NEXT: [[TMP4:%.*]] = extractelement <16 x ptr> [[TMP3]], i64 0
|
|
||||||
; CHECK-NEXT: [[WIDE_VEC1:%.*]] = load <80 x float>, ptr [[TMP4]], align 4
|
|
||||||
; CHECK-NEXT: [[STRIDED_VEC2:%.*]] = shufflevector <80 x float> [[WIDE_VEC1]], <80 x float> poison, <16 x i32> <i32 0, i32 5, i32 10, i32 15, i32 20, i32 25, i32 30, i32 35, i32 40, i32 45, i32 50, i32 55, i32 60, i32 65, i32 70, i32 75>
|
|
||||||
; CHECK-NEXT: [[TMP5:%.*]] = fadd <16 x float> [[STRIDED_VEC2]], [[TMP2]]
|
|
||||||
; CHECK-NEXT: call void @llvm.masked.scatter.v16f32.v16p0(<16 x float> [[TMP5]], <16 x ptr> [[TMP3]], i32 4, <16 x i1> splat (i1 true))
|
|
||||||
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 16
|
|
||||||
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <16 x i64> [[VEC_IND]], splat (i64 80)
|
|
||||||
; CHECK: br i1 {{.*}}, label %middle.block, label %vector.body
|
|
||||||
|
|
||||||
%data = type { [32000 x float], [3 x i32], [4 x i8], [32000 x float] }
|
%data = type { [32000 x float], [3 x i32], [4 x i8], [32000 x float] }
|
||||||
|
|
||||||
define void @PR31671(float %x, ptr %d) #0 {
|
define void @PR31671(float %x, ptr %d) #0 {
|
||||||
|
; CHECK-LABEL: define void @PR31671(
|
||||||
|
; CHECK-SAME: float [[X:%.*]], ptr [[D:%.*]]) #[[ATTR0:[0-9]+]] {
|
||||||
|
; CHECK-NEXT: [[ENTRY:.*:]]
|
||||||
|
; CHECK-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
|
||||||
|
; CHECK: [[VECTOR_PH]]:
|
||||||
|
; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <16 x float> poison, float [[X]], i64 0
|
||||||
|
; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <16 x float> [[BROADCAST_SPLATINSERT]], <16 x float> poison, <16 x i32> zeroinitializer
|
||||||
|
; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
|
||||||
|
; CHECK: [[VECTOR_BODY]]:
|
||||||
|
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
|
||||||
|
; CHECK-NEXT: [[VEC_IND:%.*]] = phi <16 x i64> [ <i64 0, i64 5, i64 10, i64 15, i64 20, i64 25, i64 30, i64 35, i64 40, i64 45, i64 50, i64 55, i64 60, i64 65, i64 70, i64 75>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ]
|
||||||
|
; CHECK-NEXT: [[OFFSET_IDX:%.*]] = mul i64 [[INDEX]], 5
|
||||||
|
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[DATA:%.*]], ptr [[D]], i64 0, i32 3, i64 [[OFFSET_IDX]]
|
||||||
|
; CHECK-NEXT: [[WIDE_VEC:%.*]] = load <80 x float>, ptr [[TMP0]], align 4
|
||||||
|
; CHECK-NEXT: [[STRIDED_VEC:%.*]] = shufflevector <80 x float> [[WIDE_VEC]], <80 x float> poison, <16 x i32> <i32 0, i32 5, i32 10, i32 15, i32 20, i32 25, i32 30, i32 35, i32 40, i32 45, i32 50, i32 55, i32 60, i32 65, i32 70, i32 75>
|
||||||
|
; CHECK-NEXT: [[TMP1:%.*]] = fmul <16 x float> [[BROADCAST_SPLAT]], [[STRIDED_VEC]]
|
||||||
|
; CHECK-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, <16 x i64> [[VEC_IND]]
|
||||||
|
; CHECK-NEXT: [[TMP3:%.*]] = extractelement <16 x ptr> [[TMP2]], i64 0
|
||||||
|
; CHECK-NEXT: [[WIDE_VEC1:%.*]] = load <80 x float>, ptr [[TMP3]], align 4
|
||||||
|
; CHECK-NEXT: [[STRIDED_VEC2:%.*]] = shufflevector <80 x float> [[WIDE_VEC1]], <80 x float> poison, <16 x i32> <i32 0, i32 5, i32 10, i32 15, i32 20, i32 25, i32 30, i32 35, i32 40, i32 45, i32 50, i32 55, i32 60, i32 65, i32 70, i32 75>
|
||||||
|
; CHECK-NEXT: [[TMP4:%.*]] = fadd <16 x float> [[STRIDED_VEC2]], [[TMP1]]
|
||||||
|
; CHECK-NEXT: call void @llvm.masked.scatter.v16f32.v16p0(<16 x float> [[TMP4]], <16 x ptr> [[TMP2]], i32 4, <16 x i1> splat (i1 true))
|
||||||
|
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 16
|
||||||
|
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <16 x i64> [[VEC_IND]], splat (i64 80)
|
||||||
|
; CHECK-NEXT: [[TMP5:%.*]] = icmp eq i64 [[INDEX_NEXT]], 6384
|
||||||
|
; CHECK-NEXT: br i1 [[TMP5]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
|
||||||
|
; CHECK: [[MIDDLE_BLOCK]]:
|
||||||
|
; CHECK-NEXT: br label %[[SCALAR_PH]]
|
||||||
|
; CHECK: [[SCALAR_PH]]:
|
||||||
|
;
|
||||||
|
; FORCE-LABEL: define void @PR31671(
|
||||||
|
; FORCE-SAME: float [[X:%.*]], ptr [[D:%.*]]) #[[ATTR0:[0-9]+]] {
|
||||||
|
; FORCE-NEXT: [[ENTRY:.*:]]
|
||||||
|
; FORCE-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
|
||||||
|
; FORCE: [[VECTOR_PH]]:
|
||||||
|
; FORCE-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <2 x float> poison, float [[X]], i64 0
|
||||||
|
; FORCE-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <2 x float> [[BROADCAST_SPLATINSERT]], <2 x float> poison, <2 x i32> zeroinitializer
|
||||||
|
; FORCE-NEXT: br label %[[VECTOR_BODY:.*]]
|
||||||
|
; FORCE: [[VECTOR_BODY]]:
|
||||||
|
; FORCE-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
|
||||||
|
; FORCE-NEXT: [[OFFSET_IDX:%.*]] = mul i64 [[INDEX]], 5
|
||||||
|
; FORCE-NEXT: [[TMP0:%.*]] = add i64 [[OFFSET_IDX]], 0
|
||||||
|
; FORCE-NEXT: [[TMP1:%.*]] = add i64 [[OFFSET_IDX]], 5
|
||||||
|
; FORCE-NEXT: [[TMP2:%.*]] = add i64 [[OFFSET_IDX]], 10
|
||||||
|
; FORCE-NEXT: [[TMP3:%.*]] = add i64 [[OFFSET_IDX]], 15
|
||||||
|
; FORCE-NEXT: [[TMP4:%.*]] = add i64 [[OFFSET_IDX]], 20
|
||||||
|
; FORCE-NEXT: [[TMP5:%.*]] = add i64 [[OFFSET_IDX]], 25
|
||||||
|
; FORCE-NEXT: [[TMP6:%.*]] = add i64 [[OFFSET_IDX]], 30
|
||||||
|
; FORCE-NEXT: [[TMP7:%.*]] = add i64 [[OFFSET_IDX]], 35
|
||||||
|
; FORCE-NEXT: [[TMP8:%.*]] = getelementptr inbounds [[DATA:%.*]], ptr [[D]], i64 0, i32 3, i64 [[TMP0]]
|
||||||
|
; FORCE-NEXT: [[TMP9:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 3, i64 [[TMP2]]
|
||||||
|
; FORCE-NEXT: [[TMP10:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 3, i64 [[TMP4]]
|
||||||
|
; FORCE-NEXT: [[TMP11:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 3, i64 [[TMP6]]
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC:%.*]] = load <10 x float>, ptr [[TMP8]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC:%.*]] = shufflevector <10 x float> [[WIDE_VEC]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC1:%.*]] = load <10 x float>, ptr [[TMP9]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC2:%.*]] = shufflevector <10 x float> [[WIDE_VEC1]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC3:%.*]] = load <10 x float>, ptr [[TMP10]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC4:%.*]] = shufflevector <10 x float> [[WIDE_VEC3]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC5:%.*]] = load <10 x float>, ptr [[TMP11]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC6:%.*]] = shufflevector <10 x float> [[WIDE_VEC5]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[TMP12:%.*]] = fmul <2 x float> [[BROADCAST_SPLAT]], [[STRIDED_VEC]]
|
||||||
|
; FORCE-NEXT: [[TMP13:%.*]] = fmul <2 x float> [[BROADCAST_SPLAT]], [[STRIDED_VEC2]]
|
||||||
|
; FORCE-NEXT: [[TMP14:%.*]] = fmul <2 x float> [[BROADCAST_SPLAT]], [[STRIDED_VEC4]]
|
||||||
|
; FORCE-NEXT: [[TMP15:%.*]] = fmul <2 x float> [[BROADCAST_SPLAT]], [[STRIDED_VEC6]]
|
||||||
|
; FORCE-NEXT: [[TMP16:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP0]]
|
||||||
|
; FORCE-NEXT: [[TMP17:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP1]]
|
||||||
|
; FORCE-NEXT: [[TMP18:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP2]]
|
||||||
|
; FORCE-NEXT: [[TMP19:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP3]]
|
||||||
|
; FORCE-NEXT: [[TMP20:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP4]]
|
||||||
|
; FORCE-NEXT: [[TMP21:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP5]]
|
||||||
|
; FORCE-NEXT: [[TMP22:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP6]]
|
||||||
|
; FORCE-NEXT: [[TMP23:%.*]] = getelementptr inbounds [[DATA]], ptr [[D]], i64 0, i32 0, i64 [[TMP7]]
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC7:%.*]] = load <10 x float>, ptr [[TMP16]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC8:%.*]] = shufflevector <10 x float> [[WIDE_VEC7]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC9:%.*]] = load <10 x float>, ptr [[TMP18]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC10:%.*]] = shufflevector <10 x float> [[WIDE_VEC9]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC11:%.*]] = load <10 x float>, ptr [[TMP20]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC12:%.*]] = shufflevector <10 x float> [[WIDE_VEC11]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[WIDE_VEC13:%.*]] = load <10 x float>, ptr [[TMP22]], align 4
|
||||||
|
; FORCE-NEXT: [[STRIDED_VEC14:%.*]] = shufflevector <10 x float> [[WIDE_VEC13]], <10 x float> poison, <2 x i32> <i32 0, i32 5>
|
||||||
|
; FORCE-NEXT: [[TMP24:%.*]] = fadd <2 x float> [[STRIDED_VEC8]], [[TMP12]]
|
||||||
|
; FORCE-NEXT: [[TMP25:%.*]] = fadd <2 x float> [[STRIDED_VEC10]], [[TMP13]]
|
||||||
|
; FORCE-NEXT: [[TMP26:%.*]] = fadd <2 x float> [[STRIDED_VEC12]], [[TMP14]]
|
||||||
|
; FORCE-NEXT: [[TMP27:%.*]] = fadd <2 x float> [[STRIDED_VEC14]], [[TMP15]]
|
||||||
|
; FORCE-NEXT: [[TMP28:%.*]] = extractelement <2 x float> [[TMP24]], i32 0
|
||||||
|
; FORCE-NEXT: store float [[TMP28]], ptr [[TMP16]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP29:%.*]] = extractelement <2 x float> [[TMP24]], i32 1
|
||||||
|
; FORCE-NEXT: store float [[TMP29]], ptr [[TMP17]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP30:%.*]] = extractelement <2 x float> [[TMP25]], i32 0
|
||||||
|
; FORCE-NEXT: store float [[TMP30]], ptr [[TMP18]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP31:%.*]] = extractelement <2 x float> [[TMP25]], i32 1
|
||||||
|
; FORCE-NEXT: store float [[TMP31]], ptr [[TMP19]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP32:%.*]] = extractelement <2 x float> [[TMP26]], i32 0
|
||||||
|
; FORCE-NEXT: store float [[TMP32]], ptr [[TMP20]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP33:%.*]] = extractelement <2 x float> [[TMP26]], i32 1
|
||||||
|
; FORCE-NEXT: store float [[TMP33]], ptr [[TMP21]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP34:%.*]] = extractelement <2 x float> [[TMP27]], i32 0
|
||||||
|
; FORCE-NEXT: store float [[TMP34]], ptr [[TMP22]], align 4
|
||||||
|
; FORCE-NEXT: [[TMP35:%.*]] = extractelement <2 x float> [[TMP27]], i32 1
|
||||||
|
; FORCE-NEXT: store float [[TMP35]], ptr [[TMP23]], align 4
|
||||||
|
; FORCE-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 8
|
||||||
|
; FORCE-NEXT: [[TMP36:%.*]] = icmp eq i64 [[INDEX_NEXT]], 6392
|
||||||
|
; FORCE-NEXT: br i1 [[TMP36]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
|
||||||
|
; FORCE: [[MIDDLE_BLOCK]]:
|
||||||
|
; FORCE-NEXT: br label %[[SCALAR_PH]]
|
||||||
|
; FORCE: [[SCALAR_PH]]:
|
||||||
|
;
|
||||||
entry:
|
entry:
|
||||||
br label %for.body
|
br label %for.body
|
||||||
|
|
||||||
@ -79,39 +167,56 @@ attributes #0 = { "target-cpu"="knl" }
|
|||||||
; CHECK: LV: Found not uniform due to requiring predication: {{%.*}} = load i32, ptr {{%.*}}, align 1
|
; CHECK: LV: Found not uniform due to requiring predication: {{%.*}} = load i32, ptr {{%.*}}, align 1
|
||||||
; CHECK: LV: Found scalar instruction: {{%.*}} = getelementptr inbounds [3 x i32], ptr @a, i32 0, i32 {{%.*}}
|
; CHECK: LV: Found scalar instruction: {{%.*}} = getelementptr inbounds [3 x i32], ptr @a, i32 0, i32 {{%.*}}
|
||||||
;
|
;
|
||||||
; FORCE-LABEL: @PR40816(
|
|
||||||
; FORCE-NEXT: entry:
|
|
||||||
; FORCE-NEXT: br i1 false, label {{%.*}}, label [[VECTOR_PH:%.*]]
|
|
||||||
; FORCE: vector.ph:
|
|
||||||
; FORCE-NEXT: br label [[VECTOR_BODY:%.*]]
|
|
||||||
; FORCE: vector.body:
|
|
||||||
; FORCE-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[PRED_STORE_CONTINUE4:%.*]] ]
|
|
||||||
; FORCE-NEXT: [[VEC_IND:%.*]] = phi <2 x i8> [ <i8 0, i8 1>, [[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], [[PRED_STORE_CONTINUE4]] ]
|
|
||||||
; FORCE-NEXT: [[TMP2:%.*]] = icmp ule <2 x i8> [[VEC_IND]], splat (i8 2)
|
|
||||||
; FORCE-NEXT: [[TMP3:%.*]] = extractelement <2 x i1> [[TMP2]], i32 0
|
|
||||||
; FORCE-NEXT: br i1 [[TMP3]], label [[PRED_STORE_IF:%.*]], label [[PRED_STORE_CONTINUE:%.*]]
|
|
||||||
; FORCE: pred.store.if:
|
|
||||||
; FORCE-NEXT: [[TMP0:%.*]] = add i32 [[INDEX]], 0
|
|
||||||
; FORCE-NEXT: store i32 [[TMP0]], ptr @b, align 1
|
|
||||||
; FORCE-NEXT: br label [[PRED_STORE_CONTINUE]]
|
|
||||||
; FORCE: pred.store.continue:
|
|
||||||
; FORCE-NEXT: [[TMP10:%.*]] = extractelement <2 x i1> [[TMP2]], i32 1
|
|
||||||
; FORCE-NEXT: br i1 [[TMP10]], label [[PRED_STORE_IF3:%.*]], label [[PRED_STORE_CONTINUE4]]
|
|
||||||
; FORCE: pred.store.if1:
|
|
||||||
; FORCE-NEXT: [[TMP1:%.*]] = add i32 [[INDEX]], 1
|
|
||||||
; FORCE-NEXT: store i32 [[TMP1]], ptr @b, align 1
|
|
||||||
; FORCE-NEXT: br label [[PRED_STORE_CONTINUE4]]
|
|
||||||
; FORCE: pred.store.continue2:
|
|
||||||
; FORCE-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 2
|
|
||||||
; FORCE-NEXT: [[VEC_IND_NEXT]] = add <2 x i8> [[VEC_IND]], splat (i8 2)
|
|
||||||
; FORCE-NEXT: [[TMP15:%.*]] = icmp eq i32 [[INDEX_NEXT]], 4
|
|
||||||
; FORCE-NEXT: br i1 [[TMP15]], label {{%.*}}, label [[VECTOR_BODY]]
|
|
||||||
;
|
;
|
||||||
@a = internal constant [3 x i32] [i32 7, i32 7, i32 0], align 1
|
@a = internal constant [3 x i32] [i32 7, i32 7, i32 0], align 1
|
||||||
@b = external global i32, align 1
|
@b = external global i32, align 1
|
||||||
|
|
||||||
define void @PR40816() #1 {
|
define void @PR40816() #1 {
|
||||||
|
; CHECK-LABEL: define void @PR40816(
|
||||||
|
; CHECK-SAME: ) #[[ATTR1:[0-9]+]] {
|
||||||
|
; CHECK-NEXT: [[ENTRY:.*]]:
|
||||||
|
; CHECK-NEXT: br label %[[FOR_BODY:.*]]
|
||||||
|
; CHECK: [[FOR_BODY]]:
|
||||||
|
; CHECK-NEXT: [[TMP0:%.*]] = phi i32 [ 0, %[[ENTRY]] ], [ [[INC:%.*]], %[[FOR_BODY]] ]
|
||||||
|
; CHECK-NEXT: store i32 [[TMP0]], ptr @b, align 1
|
||||||
|
; CHECK-NEXT: [[CMP2:%.*]] = icmp eq i32 [[TMP0]], 2
|
||||||
|
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[TMP0]], 1
|
||||||
|
; CHECK-NEXT: br i1 [[CMP2]], label %[[RETURN:.*]], label %[[FOR_BODY]]
|
||||||
|
; CHECK: [[RETURN]]:
|
||||||
|
; CHECK-NEXT: ret void
|
||||||
|
;
|
||||||
|
; FORCE-LABEL: define void @PR40816(
|
||||||
|
; FORCE-SAME: ) #[[ATTR1:[0-9]+]] {
|
||||||
|
; FORCE-NEXT: [[ENTRY:.*:]]
|
||||||
|
; FORCE-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
|
||||||
|
; FORCE: [[VECTOR_PH]]:
|
||||||
|
; FORCE-NEXT: br label %[[VECTOR_BODY:.*]]
|
||||||
|
; FORCE: [[VECTOR_BODY]]:
|
||||||
|
; FORCE-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_STORE_CONTINUE4:.*]] ]
|
||||||
|
; FORCE-NEXT: [[VEC_IND:%.*]] = phi <2 x i8> [ <i8 0, i8 1>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_STORE_CONTINUE4]] ]
|
||||||
|
; FORCE-NEXT: [[TMP2:%.*]] = icmp ule <2 x i8> [[VEC_IND]], splat (i8 2)
|
||||||
|
; FORCE-NEXT: [[TMP3:%.*]] = extractelement <2 x i1> [[TMP2]], i32 0
|
||||||
|
; FORCE-NEXT: br i1 [[TMP3]], label %[[PRED_STORE_IF:.*]], label %[[PRED_STORE_CONTINUE:.*]]
|
||||||
|
; FORCE: [[PRED_STORE_IF]]:
|
||||||
|
; FORCE-NEXT: [[TMP0:%.*]] = add i32 [[INDEX]], 0
|
||||||
|
; FORCE-NEXT: store i32 [[TMP0]], ptr @b, align 1
|
||||||
|
; FORCE-NEXT: br label %[[PRED_STORE_CONTINUE]]
|
||||||
|
; FORCE: [[PRED_STORE_CONTINUE]]:
|
||||||
|
; FORCE-NEXT: [[TMP10:%.*]] = extractelement <2 x i1> [[TMP2]], i32 1
|
||||||
|
; FORCE-NEXT: br i1 [[TMP10]], label %[[PRED_STORE_IF1:.*]], label %[[PRED_STORE_CONTINUE4]]
|
||||||
|
; FORCE: [[PRED_STORE_IF1]]:
|
||||||
|
; FORCE-NEXT: [[TMP1:%.*]] = add i32 [[INDEX]], 1
|
||||||
|
; FORCE-NEXT: store i32 [[TMP1]], ptr @b, align 1
|
||||||
|
; FORCE-NEXT: br label %[[PRED_STORE_CONTINUE4]]
|
||||||
|
; FORCE: [[PRED_STORE_CONTINUE4]]:
|
||||||
|
; FORCE-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 2
|
||||||
|
; FORCE-NEXT: [[VEC_IND_NEXT]] = add <2 x i8> [[VEC_IND]], splat (i8 2)
|
||||||
|
; FORCE-NEXT: [[TMP15:%.*]] = icmp eq i32 [[INDEX_NEXT]], 4
|
||||||
|
; FORCE-NEXT: br i1 [[TMP15]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]]
|
||||||
|
; FORCE: [[MIDDLE_BLOCK]]:
|
||||||
|
; FORCE-NEXT: br [[RETURN:label %.*]]
|
||||||
|
; FORCE: [[SCALAR_PH]]:
|
||||||
|
;
|
||||||
entry:
|
entry:
|
||||||
br label %for.body
|
br label %for.body
|
||||||
|
|
||||||
|
@ -1,4 +1,4 @@
|
|||||||
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
|
||||||
; RUN: opt < %s -S -passes=loop-vectorize -enable-vplan-native-path -force-vector-interleave=1 -force-vector-width=4 | FileCheck %s
|
; RUN: opt < %s -S -passes=loop-vectorize -enable-vplan-native-path -force-vector-interleave=1 -force-vector-width=4 | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-m:e-p:64:64-i64:64-i128:128-n32:64-S128"
|
target datalayout = "e-m:e-p:64:64-i64:64-i128:128-n32:64-S128"
|
||||||
@ -6,60 +6,60 @@ target datalayout = "e-m:e-p:64:64-i64:64-i128:128-n32:64-S128"
|
|||||||
define void @foo(ptr %h) !dbg !4 {
|
define void @foo(ptr %h) !dbg !4 {
|
||||||
; CHECK-LABEL: define void @foo(
|
; CHECK-LABEL: define void @foo(
|
||||||
; CHECK-SAME: ptr [[H:%.*]]) !dbg [[DBG4:![0-9]+]] {
|
; CHECK-SAME: ptr [[H:%.*]]) !dbg [[DBG4:![0-9]+]] {
|
||||||
; CHECK-NEXT: entry:
|
; CHECK-NEXT: [[ENTRY:.*]]:
|
||||||
; CHECK-NEXT: #dbg_value(i64 0, [[META11:![0-9]+]], !DIExpression(), [[META20:![0-9]+]])
|
; CHECK-NEXT: #dbg_value(i64 0, [[META11:![0-9]+]], !DIExpression(), [[META20:![0-9]+]])
|
||||||
; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]], !dbg [[DBG21:![0-9]+]]
|
; CHECK-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]], !dbg [[DBG21:![0-9]+]]
|
||||||
; CHECK: vector.ph:
|
; CHECK: [[VECTOR_PH]]:
|
||||||
; CHECK-NEXT: br label [[VECTOR_BODY:%.*]], !dbg [[DBG21]]
|
; CHECK-NEXT: br label %[[VECTOR_BODY:.*]], !dbg [[DBG21]]
|
||||||
; CHECK: vector.body:
|
; CHECK: [[VECTOR_BODY]]:
|
||||||
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[FOR_COND_CLEANUP32:%.*]] ], !dbg [[DBG222:![0-9]+]]
|
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_LATCH:.*]] ], !dbg [[DBG22:![0-9]+]]
|
||||||
; CHECK-NEXT: br label [[FOR_COND5_PREHEADER1:%.*]]
|
; CHECK-NEXT: br label %[[FOR_COND5_PREHEADER1:.*]]
|
||||||
; CHECK: for.cond5.preheader1:
|
; CHECK: [[FOR_COND5_PREHEADER1]]:
|
||||||
; CHECK-NEXT: [[VEC_PHI:%.*]] = phi <4 x i64> [ zeroinitializer, [[VECTOR_BODY]] ], [ [[TMP4:%.*]], [[FOR_COND5_PREHEADER1]] ], !dbg [[DBG22:![0-9]+]]
|
; CHECK-NEXT: [[VEC_PHI:%.*]] = phi <4 x i64> [ zeroinitializer, %[[VECTOR_BODY]] ], [ [[TMP5:%.*]], %[[FOR_COND5_PREHEADER1]] ], !dbg [[DBG23:![0-9]+]]
|
||||||
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr i32, ptr [[H]], <4 x i64> [[VEC_PHI]]
|
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr i32, ptr [[H]], <4 x i64> [[VEC_PHI]]
|
||||||
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> zeroinitializer, <4 x ptr> [[TMP0]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG23:![0-9]+]]
|
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> zeroinitializer, <4 x ptr> [[TMP0]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG24:![0-9]+]]
|
||||||
; CHECK-NEXT: [[TMP1:%.*]] = getelementptr i32, <4 x ptr> [[TMP0]], i64 1, !dbg [[DBG25:![0-9]+]]
|
; CHECK-NEXT: [[TMP2:%.*]] = getelementptr i32, <4 x ptr> [[TMP0]], i64 1, !dbg [[DBG26:![0-9]+]]
|
||||||
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> splat (i32 1), <4 x ptr> [[TMP1]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG23]]
|
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> splat (i32 1), <4 x ptr> [[TMP2]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[TMP2:%.*]] = getelementptr i32, <4 x ptr> [[TMP0]], i64 2, !dbg [[DBG25]]
|
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr i32, <4 x ptr> [[TMP0]], i64 2, !dbg [[DBG26]]
|
||||||
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> splat (i32 2), <4 x ptr> [[TMP2]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG23]]
|
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> splat (i32 2), <4 x ptr> [[TMP3]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr i32, <4 x ptr> [[TMP0]], i64 3, !dbg [[DBG25]]
|
; CHECK-NEXT: [[TMP4:%.*]] = getelementptr i32, <4 x ptr> [[TMP0]], i64 3, !dbg [[DBG26]]
|
||||||
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> splat (i32 3), <4 x ptr> [[TMP3]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG23]]
|
; CHECK-NEXT: call void @llvm.masked.scatter.v4i32.v4p0(<4 x i32> splat (i32 3), <4 x ptr> [[TMP4]], i32 4, <4 x i1> splat (i1 true)), !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[TMP4]] = add nuw nsw <4 x i64> [[VEC_PHI]], splat (i64 1), !dbg [[DBG26:![0-9]+]]
|
; CHECK-NEXT: [[TMP5]] = add nuw nsw <4 x i64> [[VEC_PHI]], splat (i64 1), !dbg [[DBG27:![0-9]+]]
|
||||||
; CHECK-NEXT: [[TMP5:%.*]] = icmp eq <4 x i64> [[TMP4]], splat (i64 5), !dbg [[DBG27:![0-9]+]]
|
; CHECK-NEXT: [[TMP6:%.*]] = icmp eq <4 x i64> [[TMP5]], splat (i64 5), !dbg [[DBG28:![0-9]+]]
|
||||||
; CHECK-NEXT: [[TMP6:%.*]] = extractelement <4 x i1> [[TMP5]], i32 0, !dbg [[DBG28:![0-9]+]]
|
; CHECK-NEXT: [[TMP7:%.*]] = extractelement <4 x i1> [[TMP6]], i32 0, !dbg [[DBG29:![0-9]+]]
|
||||||
; CHECK-NEXT: br i1 [[TMP6]], label [[FOR_COND_CLEANUP32]], label [[FOR_COND5_PREHEADER1]], !dbg [[DBG28]]
|
; CHECK-NEXT: br i1 [[TMP7]], label %[[VECTOR_LATCH]], label %[[FOR_COND5_PREHEADER1]], !dbg [[DBG29]]
|
||||||
; CHECK: vector.latch:
|
; CHECK: [[VECTOR_LATCH]]:
|
||||||
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 4, !dbg [[DBG222]]
|
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 4, !dbg [[DBG22]]
|
||||||
; CHECK-NEXT: [[TMP9:%.*]] = icmp eq i64 [[INDEX_NEXT]], 20, !dbg [[DBG21]]
|
; CHECK-NEXT: [[TMP8:%.*]] = icmp eq i64 [[INDEX_NEXT]], 20, !dbg [[DBG21]]
|
||||||
; CHECK-NEXT: br i1 [[TMP9]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !dbg [[DBG21]], !llvm.loop [[LOOP29:![0-9]+]]
|
; CHECK-NEXT: br i1 [[TMP8]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !dbg [[DBG21]], !llvm.loop [[LOOP30:![0-9]+]]
|
||||||
; CHECK: middle.block:
|
; CHECK: [[MIDDLE_BLOCK]]:
|
||||||
; CHECK-NEXT: br i1 false, label [[EXIT:%.*]], label [[SCALAR_PH]], !dbg [[DBG21]]
|
; CHECK-NEXT: br i1 false, label %[[EXIT:.*]], label %[[SCALAR_PH]], !dbg [[DBG21]]
|
||||||
; CHECK: scalar.ph:
|
; CHECK: [[SCALAR_PH]]:
|
||||||
; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ 20, [[MIDDLE_BLOCK]] ], [ 0, [[ENTRY:%.*]] ]
|
; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ 20, %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ]
|
||||||
; CHECK-NEXT: br label [[FOR_COND1_PREHEADER:%.*]], !dbg [[DBG21]]
|
; CHECK-NEXT: br label %[[FOR_COND1_PREHEADER:.*]], !dbg [[DBG21]]
|
||||||
; CHECK: for.cond1.preheader:
|
; CHECK: [[FOR_COND1_PREHEADER]]:
|
||||||
; CHECK-NEXT: [[I_023:%.*]] = phi i64 [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ], [ [[INC13:%.*]], [[FOR_COND_CLEANUP3:%.*]] ]
|
; CHECK-NEXT: [[I_023:%.*]] = phi i64 [ [[BC_RESUME_VAL]], %[[SCALAR_PH]] ], [ [[INC13:%.*]], %[[FOR_COND_CLEANUP3:.*]] ]
|
||||||
; CHECK-NEXT: #dbg_value(i64 [[I_023]], [[META11]], !DIExpression(), [[META20]])
|
; CHECK-NEXT: #dbg_value(i64 [[I_023]], [[META11]], !DIExpression(), [[META20]])
|
||||||
; CHECK-NEXT: br label [[FOR_COND5_PREHEADER:%.*]], !dbg [[DBG28]]
|
; CHECK-NEXT: br label %[[FOR_COND5_PREHEADER:.*]], !dbg [[DBG29]]
|
||||||
; CHECK: for.cond5.preheader:
|
; CHECK: [[FOR_COND5_PREHEADER]]:
|
||||||
; CHECK-NEXT: [[L_022:%.*]] = phi i64 [ 0, [[FOR_COND1_PREHEADER]] ], [ [[INC10:%.*]], [[FOR_COND5_PREHEADER]] ], !dbg [[DBG22]]
|
; CHECK-NEXT: [[L_022:%.*]] = phi i64 [ 0, %[[FOR_COND1_PREHEADER]] ], [ [[INC10:%.*]], %[[FOR_COND5_PREHEADER]] ], !dbg [[DBG23]]
|
||||||
; CHECK-NEXT: [[TMP10:%.*]] = getelementptr i32, ptr [[H]], i64 [[L_022]]
|
; CHECK-NEXT: [[TMP9:%.*]] = getelementptr i32, ptr [[H]], i64 [[L_022]]
|
||||||
; CHECK-NEXT: store i32 0, ptr [[TMP10]], align 4, !dbg [[DBG23]]
|
; CHECK-NEXT: store i32 0, ptr [[TMP9]], align 4, !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[ARRAYIDX_1:%.*]] = getelementptr i32, ptr [[TMP10]], i64 1, !dbg [[DBG25]]
|
; CHECK-NEXT: [[ARRAYIDX_1:%.*]] = getelementptr i32, ptr [[TMP9]], i64 1, !dbg [[DBG26]]
|
||||||
; CHECK-NEXT: store i32 1, ptr [[ARRAYIDX_1]], align 4, !dbg [[DBG23]]
|
; CHECK-NEXT: store i32 1, ptr [[ARRAYIDX_1]], align 4, !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[ARRAYIDX_2:%.*]] = getelementptr i32, ptr [[TMP10]], i64 2, !dbg [[DBG25]]
|
; CHECK-NEXT: [[ARRAYIDX_2:%.*]] = getelementptr i32, ptr [[TMP9]], i64 2, !dbg [[DBG26]]
|
||||||
; CHECK-NEXT: store i32 2, ptr [[ARRAYIDX_2]], align 4, !dbg [[DBG23]]
|
; CHECK-NEXT: store i32 2, ptr [[ARRAYIDX_2]], align 4, !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[ARRAYIDX_3:%.*]] = getelementptr i32, ptr [[TMP10]], i64 3, !dbg [[DBG25]]
|
; CHECK-NEXT: [[ARRAYIDX_3:%.*]] = getelementptr i32, ptr [[TMP9]], i64 3, !dbg [[DBG26]]
|
||||||
; CHECK-NEXT: store i32 3, ptr [[ARRAYIDX_3]], align 4, !dbg [[DBG23]]
|
; CHECK-NEXT: store i32 3, ptr [[ARRAYIDX_3]], align 4, !dbg [[DBG24]]
|
||||||
; CHECK-NEXT: [[INC10]] = add nuw nsw i64 [[L_022]], 1, !dbg [[DBG26]]
|
; CHECK-NEXT: [[INC10]] = add nuw nsw i64 [[L_022]], 1, !dbg [[DBG27]]
|
||||||
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[INC10]], 5, !dbg [[DBG27]]
|
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[INC10]], 5, !dbg [[DBG28]]
|
||||||
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP3]], label [[FOR_COND5_PREHEADER]], !dbg [[DBG28]]
|
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[FOR_COND_CLEANUP3]], label %[[FOR_COND5_PREHEADER]], !dbg [[DBG29]]
|
||||||
; CHECK: for.cond.cleanup3:
|
; CHECK: [[FOR_COND_CLEANUP3]]:
|
||||||
; CHECK-NEXT: [[INC13]] = add nuw nsw i64 [[I_023]], 1, !dbg [[DBG33:![0-9]+]]
|
; CHECK-NEXT: [[INC13]] = add nuw nsw i64 [[I_023]], 1, !dbg [[DBG22]]
|
||||||
; CHECK-NEXT: #dbg_value(i64 [[INC13]], [[META11]], !DIExpression(), [[META20]])
|
; CHECK-NEXT: #dbg_value(i64 [[INC13]], [[META11]], !DIExpression(), [[META20]])
|
||||||
; CHECK-NEXT: [[EXITCOND24_NOT:%.*]] = icmp eq i64 [[INC13]], 23, !dbg [[DBG34:![0-9]+]]
|
; CHECK-NEXT: [[EXITCOND24_NOT:%.*]] = icmp eq i64 [[INC13]], 23, !dbg [[DBG34:![0-9]+]]
|
||||||
; CHECK-NEXT: br i1 [[EXITCOND24_NOT]], label [[EXIT]], label [[FOR_COND1_PREHEADER]], !dbg [[DBG21]], !llvm.loop [[LOOP35:![0-9]+]]
|
; CHECK-NEXT: br i1 [[EXITCOND24_NOT]], label %[[EXIT]], label %[[FOR_COND1_PREHEADER]], !dbg [[DBG21]], !llvm.loop [[LOOP35:![0-9]+]]
|
||||||
; CHECK: exit:
|
; CHECK: [[EXIT]]:
|
||||||
; CHECK-NEXT: ret void, !dbg [[DBG36:![0-9]+]]
|
; CHECK-NEXT: ret void, !dbg [[DBG36:![0-9]+]]
|
||||||
;
|
;
|
||||||
entry:
|
entry:
|
||||||
@ -137,7 +137,7 @@ declare void @llvm.dbg.value(metadata, metadata, metadata)
|
|||||||
!34 = !DILocation(line: 10, column: 5, scope: !12)
|
!34 = !DILocation(line: 10, column: 5, scope: !12)
|
||||||
;.
|
;.
|
||||||
; CHECK: [[META0:![0-9]+]] = distinct !DICompileUnit(language: DW_LANG_C11, file: [[META1:![0-9]+]], producer: "clang", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, splitDebugInlining: false, nameTableKind: None)
|
; CHECK: [[META0:![0-9]+]] = distinct !DICompileUnit(language: DW_LANG_C11, file: [[META1:![0-9]+]], producer: "clang", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, splitDebugInlining: false, nameTableKind: None)
|
||||||
; CHECK: [[META1]] = !DIFile(filename: "outer-loop-vect.c", directory: {{.*}})
|
; CHECK: [[META1]] = !DIFile(filename: "{{.*}}outer-loop-vect.c", directory: {{.*}})
|
||||||
; CHECK: [[DBG4]] = distinct !DISubprogram(name: "foo", scope: [[META1]], file: [[META1]], line: 8, type: [[META5:![0-9]+]], scopeLine: 8, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: [[META0]], retainedNodes: [[META9:![0-9]+]])
|
; CHECK: [[DBG4]] = distinct !DISubprogram(name: "foo", scope: [[META1]], file: [[META1]], line: 8, type: [[META5:![0-9]+]], scopeLine: 8, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: [[META0]], retainedNodes: [[META9:![0-9]+]])
|
||||||
; CHECK: [[META5]] = !DISubroutineType(types: [[META6:![0-9]+]])
|
; CHECK: [[META5]] = !DISubroutineType(types: [[META6:![0-9]+]])
|
||||||
; CHECK: [[META6]] = !{null, [[META7:![0-9]+]]}
|
; CHECK: [[META6]] = !{null, [[META7:![0-9]+]]}
|
||||||
@ -156,19 +156,19 @@ declare void @llvm.dbg.value(metadata, metadata, metadata)
|
|||||||
; CHECK: [[META19]] = distinct !DILexicalBlock(scope: [[META15]], file: [[META1]], line: 11, column: 5)
|
; CHECK: [[META19]] = distinct !DILexicalBlock(scope: [[META15]], file: [[META1]], line: 11, column: 5)
|
||||||
; CHECK: [[META20]] = !DILocation(line: 0, scope: [[META12]])
|
; CHECK: [[META20]] = !DILocation(line: 0, scope: [[META12]])
|
||||||
; CHECK: [[DBG21]] = !DILocation(line: 10, column: 3, scope: [[META12]])
|
; CHECK: [[DBG21]] = !DILocation(line: 10, column: 3, scope: [[META12]])
|
||||||
; CHECK: [[DBG222]] = !DILocation(line: 10, column: 30, scope: [[META16]])
|
; CHECK: [[DBG22]] = !DILocation(line: 10, column: 30, scope: [[META16]])
|
||||||
; CHECK: [[DBG22]] = !DILocation(line: 10, column: 5, scope: [[META12]])
|
; CHECK: [[DBG23]] = !DILocation(line: 10, column: 5, scope: [[META12]])
|
||||||
; CHECK: [[DBG23]] = !DILocation(line: 13, column: 11, scope: [[META24:![0-9]+]])
|
; CHECK: [[DBG24]] = !DILocation(line: 13, column: 11, scope: [[META25:![0-9]+]])
|
||||||
; CHECK: [[META24]] = distinct !DILexicalBlock(scope: [[META18]], file: [[META1]], line: 12, column: 7)
|
; CHECK: [[META25]] = distinct !DILexicalBlock(scope: [[META18]], file: [[META1]], line: 12, column: 7)
|
||||||
; CHECK: [[DBG25]] = !DILocation(line: 13, column: 2, scope: [[META24]])
|
; CHECK: [[DBG26]] = !DILocation(line: 13, column: 2, scope: [[META25]])
|
||||||
; CHECK: [[DBG26]] = !DILocation(line: 11, column: 32, scope: [[META19]])
|
; CHECK: [[DBG27]] = !DILocation(line: 11, column: 32, scope: [[META19]])
|
||||||
; CHECK: [[DBG27]] = !DILocation(line: 11, column: 26, scope: [[META19]])
|
; CHECK: [[DBG28]] = !DILocation(line: 11, column: 26, scope: [[META19]])
|
||||||
; CHECK: [[DBG28]] = !DILocation(line: 11, column: 5, scope: [[META15]])
|
; CHECK: [[DBG29]] = !DILocation(line: 11, column: 5, scope: [[META15]])
|
||||||
; CHECK: [[LOOP29]] = distinct !{[[LOOP29]], [[DBG21]], [[META30:![0-9]+]], [[META31:![0-9]+]], [[META32:![0-9]+]]}
|
; CHECK: [[LOOP30]] = distinct !{[[LOOP30]], [[DBG21]], [[META31:![0-9]+]], [[META32:![0-9]+]], [[META33:![0-9]+]]}
|
||||||
; CHECK: [[META30]] = !DILocation(line: 13, column: 13, scope: [[META12]])
|
; CHECK: [[META31]] = !DILocation(line: 13, column: 13, scope: [[META12]])
|
||||||
; CHECK: [[META31]] = !{!"llvm.loop.isvectorized", i32 1}
|
; CHECK: [[META32]] = !{!"llvm.loop.isvectorized", i32 1}
|
||||||
; CHECK: [[META32]] = !{!"llvm.loop.unroll.runtime.disable"}
|
; CHECK: [[META33]] = !{!"llvm.loop.unroll.runtime.disable"}
|
||||||
; CHECK: [[DBG34]] = !DILocation(line: 10, column: 24, scope: [[META16]])
|
; CHECK: [[DBG34]] = !DILocation(line: 10, column: 24, scope: [[META16]])
|
||||||
; CHECK: [[LOOP35]] = distinct !{[[LOOP35]], [[DBG21]], [[META30]], [[META31]]}
|
; CHECK: [[LOOP35]] = distinct !{[[LOOP35]], [[DBG21]], [[META31]], [[META32]]}
|
||||||
; CHECK: [[DBG36]] = !DILocation(line: 14, column: 1, scope: [[DBG4]])
|
; CHECK: [[DBG36]] = !DILocation(line: 14, column: 1, scope: [[DBG4]])
|
||||||
;.
|
;.
|
||||||
|
@ -1,16 +1,31 @@
|
|||||||
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --filter-out-after "scalar.ph\:" --version 5
|
||||||
; RUN: opt < %s -passes=loop-vectorize -force-vector-width=4 -S | FileCheck %s
|
; RUN: opt < %s -passes=loop-vectorize -force-vector-width=4 -S | FileCheck %s
|
||||||
|
|
||||||
; Test case for PR45525. Checks that phi's with a single predecessor and a mask are supported.
|
; Test case for PR45525. Checks that phi's with a single predecessor and a mask are supported.
|
||||||
|
|
||||||
define void @main(i1 %cond, ptr %arr) {
|
define void @main(i1 %cond, ptr %arr) {
|
||||||
; CHECK-LABEL: @main(
|
; CHECK-LABEL: define void @main(
|
||||||
; CHECK-NEXT: bb.0:
|
; CHECK-SAME: i1 [[COND:%.*]], ptr [[ARR:%.*]]) {
|
||||||
; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]]
|
; CHECK-NEXT: [[BB_0:.*:]]
|
||||||
; CHECK: vector.ph:
|
; CHECK-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
|
||||||
; CHECK: br label [[VECTOR_BODY:%.*]]
|
; CHECK: [[VECTOR_PH]]:
|
||||||
; CHECK: vector.body:
|
; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i1> poison, i1 [[COND]], i64 0
|
||||||
; CHECK: [[VEC_IND:%.*]] = phi <4 x i32> [ <i32 0, i32 1, i32 2, i32 3>, [[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], [[VECTOR_BODY]] ]
|
; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i1> [[BROADCAST_SPLATINSERT]], <4 x i1> poison, <4 x i32> zeroinitializer
|
||||||
; CHECK: [[TMP5:%.*]] = mul <4 x i32> [[VEC_IND]], splat (i32 3)
|
; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
|
||||||
|
; CHECK: [[VECTOR_BODY]]:
|
||||||
|
; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
|
||||||
|
; CHECK-NEXT: [[VEC_IND:%.*]] = phi <4 x i32> [ <i32 0, i32 1, i32 2, i32 3>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ]
|
||||||
|
; CHECK-NEXT: [[TMP5:%.*]] = mul <4 x i32> [[VEC_IND]], splat (i32 3)
|
||||||
|
; CHECK-NEXT: [[PREDPHI:%.*]] = select <4 x i1> [[BROADCAST_SPLAT]], <4 x i32> splat (i32 7), <4 x i32> [[TMP5]]
|
||||||
|
; CHECK-NEXT: [[TMP1:%.*]] = getelementptr inbounds i32, ptr [[ARR]], i32 [[INDEX]]
|
||||||
|
; CHECK-NEXT: store <4 x i32> [[PREDPHI]], ptr [[TMP1]], align 4
|
||||||
|
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4
|
||||||
|
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i32> [[VEC_IND]], splat (i32 4)
|
||||||
|
; CHECK-NEXT: [[TMP2:%.*]] = icmp eq i32 [[INDEX_NEXT]], 32
|
||||||
|
; CHECK-NEXT: br i1 [[TMP2]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
|
||||||
|
; CHECK: [[MIDDLE_BLOCK]]:
|
||||||
|
; CHECK-NEXT: br [[BB_4:label %.*]]
|
||||||
|
; CHECK: [[SCALAR_PH]]:
|
||||||
;
|
;
|
||||||
bb.0:
|
bb.0:
|
||||||
br label %bb.1
|
br label %bb.1
|
||||||
|
@ -1,42 +1,42 @@
|
|||||||
|
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --filter-out-after "vector.ph\:" --version 5
|
||||||
; RUN: opt < %s -passes=loop-vectorize,dce,instcombine -force-vector-interleave=1 -force-vector-width=4 -S | FileCheck %s
|
; RUN: opt < %s -passes=loop-vectorize,dce,instcombine -force-vector-interleave=1 -force-vector-width=4 -S | FileCheck %s
|
||||||
|
|
||||||
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
|
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
|
||||||
|
|
||||||
define void @add_ints(ptr nocapture %A, ptr nocapture %B, ptr nocapture %C) {
|
define void @add_ints(ptr nocapture %A, ptr nocapture %B, ptr nocapture %C) {
|
||||||
; CHECK-LABEL: @add_ints(
|
; CHECK-LABEL: define void @add_ints(
|
||||||
; CHECK-NEXT: entry:
|
; CHECK-SAME: ptr captures(none) [[A:%.*]], ptr captures(none) [[B:%.*]], ptr captures(none) [[C:%.*]]) {
|
||||||
; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[VECTOR_MEMCHECK:%.*]]
|
; CHECK-NEXT: [[ENTRY:.*:]]
|
||||||
; CHECK-LABEL: vector.memcheck:
|
; CHECK-NEXT: br i1 false, [[SCALAR_PH:label %.*]], label %[[VECTOR_MEMCHECK:.*]]
|
||||||
; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A:%.*]] to i64
|
; CHECK: [[VECTOR_MEMCHECK]]:
|
||||||
; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B:%.*]] to i64
|
; CHECK-NEXT: [[A1:%.*]] = ptrtoint ptr [[A]] to i64
|
||||||
; CHECK-NEXT: [[C3:%.*]] = ptrtoint ptr [[C:%.*]] to i64
|
; CHECK-NEXT: [[B2:%.*]] = ptrtoint ptr [[B]] to i64
|
||||||
|
; CHECK-NEXT: [[C3:%.*]] = ptrtoint ptr [[C]] to i64
|
||||||
; CHECK-NEXT: [[TMP0:%.*]] = sub i64 [[A1]], [[B2]]
|
; CHECK-NEXT: [[TMP0:%.*]] = sub i64 [[A1]], [[B2]]
|
||||||
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 16
|
; CHECK-NEXT: [[DIFF_CHECK:%.*]] = icmp ult i64 [[TMP0]], 16
|
||||||
; CHECK-NEXT: [[TMP1:%.*]] = sub i64 [[A1]], [[C3]]
|
; CHECK-NEXT: [[TMP1:%.*]] = sub i64 [[A1]], [[C3]]
|
||||||
; CHECK-NEXT: [[DIFF_CHECK4:%.*]] = icmp ult i64 [[TMP1]], 16
|
; CHECK-NEXT: [[DIFF_CHECK4:%.*]] = icmp ult i64 [[TMP1]], 16
|
||||||
; CHECK-NEXT: [[CONFLICT_RDX:%.*]] = or i1 [[DIFF_CHECK]], [[DIFF_CHECK4]]
|
; CHECK-NEXT: [[CONFLICT_RDX:%.*]] = or i1 [[DIFF_CHECK]], [[DIFF_CHECK4]]
|
||||||
; CHECK-NEXT: br i1 [[CONFLICT_RDX]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
|
; CHECK-NEXT: br i1 [[CONFLICT_RDX]], [[SCALAR_PH]], label %[[VECTOR_PH:.*]]
|
||||||
; CHECK: vector.ph:
|
; CHECK: [[VECTOR_PH]]:
|
||||||
; CHECK-NEXT: br label %vector.body
|
|
||||||
; CHECK: vector.body:
|
|
||||||
;
|
;
|
||||||
entry:
|
entry:
|
||||||
br label %for.body
|
br label %loop
|
||||||
|
|
||||||
for.body:
|
loop:
|
||||||
%indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ]
|
%iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
|
||||||
%arrayidx = getelementptr inbounds i32, ptr %B, i64 %indvars.iv
|
%arrayidx = getelementptr inbounds i32, ptr %B, i64 %iv
|
||||||
%0 = load i32, ptr %arrayidx, align 4
|
%0 = load i32, ptr %arrayidx, align 4
|
||||||
%arrayidx2 = getelementptr inbounds i32, ptr %C, i64 %indvars.iv
|
%arrayidx2 = getelementptr inbounds i32, ptr %C, i64 %iv
|
||||||
%1 = load i32, ptr %arrayidx2, align 4
|
%1 = load i32, ptr %arrayidx2, align 4
|
||||||
%add = add nsw i32 %1, %0
|
%add = add nsw i32 %1, %0
|
||||||
%arrayidx4 = getelementptr inbounds i32, ptr %A, i64 %indvars.iv
|
%arrayidx4 = getelementptr inbounds i32, ptr %A, i64 %iv
|
||||||
store i32 %add, ptr %arrayidx4, align 4
|
store i32 %add, ptr %arrayidx4, align 4
|
||||||
%indvars.iv.next = add i64 %indvars.iv, 1
|
%iv.next = add i64 %iv, 1
|
||||||
%lftr.wideiv = trunc i64 %indvars.iv.next to i32
|
%iv.trunc = trunc i64 %iv.next to i32
|
||||||
%exitcond = icmp eq i32 %lftr.wideiv, 200
|
%exitcond = icmp eq i32 %iv.trunc, 200
|
||||||
br i1 %exitcond, label %for.end, label %for.body
|
br i1 %exitcond, label %exit, label %loop
|
||||||
|
|
||||||
for.end:
|
exit:
|
||||||
ret void
|
ret void
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user