; Extend existing tests to cover both finding first/last argmin/argmax for floating point reductions.
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --version 6
; RUN: opt -passes=loop-vectorize -force-vector-width=4 -force-vector-interleave=1 -S %s | FileCheck %s

; Basic fmin with strict predicate (ogt: min.val > l means l is strictly
; smaller, so update -- finds first minimum). Uses llvm.minnum intrinsic.
;
; The loop carries a running minimum (%min.val) and the index at which it was
; seen (%min.idx). The index is only replaced when the strict compare is true,
; so on ties the earlier index is kept. The start value 0x47EFFFFFE0000000 is
; the largest finite float.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmin_first_idx(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmin_first_idx(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt float [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call nnan float @llvm.minnum.f32(float [[L]], float [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  ; Strict compare: true only when the loaded value is below the running minimum.
  %cmp = fcmp nnan ogt float %min.val, %l
  %min.val.next = call nnan float @llvm.minnum.f32(float %l, float %min.val)
  ; Record the current index only on a strict improvement.
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; First-index fmin with a strict predicate (ogt: min.val > l), but the running
; minimum is formed with a select on the same compare instead of the
; llvm.minnum intrinsic.
;
; Both the value select and the index select are driven by %cmp, so value and
; index are updated together and only on a strict improvement.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmin_first_idx_select_min(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmin_first_idx_select_min(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt float [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = select nnan i1 [[CMP]], float [[L]], float [[MIN_VAL]]
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  %cmp = fcmp nnan ogt float %min.val, %l
  ; Select-based minimum: take the loaded value when it is strictly smaller.
  %min.val.next = select nnan i1 %cmp, float %l, float %min.val
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; fmin with flipped comparison operands (olt: l < min.val).
;
; The compare has the loaded value on the left and the running minimum on the
; right, with predicate olt; it is true when the loaded value is strictly
; smaller, so the index is still only replaced on a strict improvement. The
; running minimum itself is computed with llvm.minnum.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmin_first_idx_cond_flipped(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmin_first_idx_cond_flipped(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan olt float [[L]], [[MIN_VAL]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call nnan float @llvm.minnum.f32(float [[L]], float [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  ; Operands swapped relative to the ogt form: loaded value first, olt predicate.
  %cmp = fcmp nnan olt float %l, %min.val
  %min.val.next = call nnan float @llvm.minnum.f32(float %l, float %min.val)
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; fmax with strict predicate (olt: max.val < l means l is strictly larger).
;
; Mirror image of the fmin case: the loop carries a running maximum (%max.val,
; computed with llvm.maxnum) and its index (%max.idx). The index is only
; replaced when the strict compare is true, so on ties the earlier index is
; kept. The start value 0xC7EFFFFFE0000000 is the negated largest finite float.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmax_first_idx(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmax_first_idx(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MAX_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_VAL:%.*]] = phi float [ 0xC7EFFFFFE0000000, %[[ENTRY]] ], [ [[MAX_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan olt float [[MAX_VAL]], [[L]]
; CHECK-NEXT: [[MAX_VAL_NEXT]] = call nnan float @llvm.maxnum.f32(float [[L]], float [[MAX_VAL]])
; CHECK-NEXT: [[MAX_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MAX_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MAX_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %max.idx = phi i64 [ 0, %entry ], [ %max.idx.next, %loop ]
  %max.val = phi float [ 0xC7EFFFFFE0000000, %entry ], [ %max.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  ; Strict compare: true only when the loaded value exceeds the running maximum.
  %cmp = fcmp nnan olt float %max.val, %l
  %max.val.next = call nnan float @llvm.maxnum.f32(float %l, float %max.val)
  ; Record the current index only on a strict improvement.
  %max.idx.next = select i1 %cmp, i64 %iv, i64 %max.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %max.idx.next, %loop ]
  ret i64 %res
}

; fmax with flipped comparison (ogt: l > max.val).
;
; The compare has the loaded value on the left and the running maximum on the
; right, with predicate ogt; it is true when the loaded value is strictly
; larger, so the index is still only replaced on a strict improvement. The
; running maximum itself is computed with llvm.maxnum.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmax_first_idx_cond_flipped(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmax_first_idx_cond_flipped(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MAX_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_VAL:%.*]] = phi float [ 0xC7EFFFFFE0000000, %[[ENTRY]] ], [ [[MAX_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt float [[L]], [[MAX_VAL]]
; CHECK-NEXT: [[MAX_VAL_NEXT]] = call nnan float @llvm.maxnum.f32(float [[L]], float [[MAX_VAL]])
; CHECK-NEXT: [[MAX_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MAX_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MAX_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %max.idx = phi i64 [ 0, %entry ], [ %max.idx.next, %loop ]
  %max.val = phi float [ 0xC7EFFFFFE0000000, %entry ], [ %max.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  ; Operands swapped relative to the olt form: loaded value first, ogt predicate.
  %cmp = fcmp nnan ogt float %l, %max.val
  %max.val.next = call nnan float @llvm.maxnum.f32(float %l, float %max.val)
  %max.idx.next = select i1 %cmp, i64 %iv, i64 %max.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %max.idx.next, %loop ]
  ret i64 %res
}

; fmin with non-canonical IV (start=5, step=3) -- exercises DerivedIV path.
;
; Two induction variables are live: %iv (start 0, step 1) addresses the array
; and drives the exit test against the constant trip count 100, while %wide.iv
; (start 5, step 3) is the value recorded as the index of the minimum. The
; index phi also starts at 5.
; The autogenerated assertions below match the scalar loop (no vector body is
; expected).
; NOTE(review): the input returns %min.idx.next directly from the exit block,
; while the assertions expect a phi in the exit block -- presumably inserted
; when the pass puts the loop into LCSSA form; confirm.
define i64 @test_fmin_first_idx_non_canonical_iv(ptr %src) {
; CHECK-LABEL: define i64 @test_fmin_first_idx_non_canonical_iv(
; CHECK-SAME: ptr [[SRC:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[INDEX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[WIDE_IV:%.*]] = phi i64 [ 5, %[[ENTRY]] ], [ [[WIDE_IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 5, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr float, ptr [[SRC]], i64 [[INDEX]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[TMP0]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt float [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call nnan float @llvm.minnum.f32(float [[L]], float [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[WIDE_IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw nsw i64 [[INDEX]], 1
; CHECK-NEXT: [[WIDE_IV_NEXT]] = add nuw nsw i64 [[WIDE_IV]], 3
; CHECK-NEXT: [[TMP4:%.*]] = icmp eq i64 [[INDEX_NEXT]], 100
; CHECK-NEXT: br i1 [[TMP4]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[TMP11:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[TMP11]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  ; Second induction variable: starts at 5 and advances by 3 per iteration.
  %wide.iv = phi i64 [ 5, %entry ], [ %wide.iv.next, %loop ]
  %min.idx = phi i64 [ 5, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  %cmp = fcmp nnan ogt float %min.val, %l
  %min.val.next = call nnan float @llvm.minnum.f32(float %l, float %min.val)
  ; The recorded index is %wide.iv, not the addressing counter %iv.
  %min.idx.next = select i1 %cmp, i64 %wide.iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %wide.iv.next = add nuw nsw i64 %wide.iv, 3
  %exitcond.not = icmp eq i64 %iv.next, 100
  br i1 %exitcond.not, label %exit, label %loop

exit:
  ret i64 %min.idx.next
}

; fmin without the nnan flag: neither the fcmp nor the llvm.minnum call
; carries nnan here. Should NOT vectorize via the argmin path (falls back to
; scalar or last-index vectorization).
;
; Apart from the missing fast-math flags the loop has the same shape as the
; basic strict-predicate fmin test (ogt: min.val > l).
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmin_first_idx_no_nnan(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmin_first_idx_no_nnan(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp ogt float [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call float @llvm.minnum.f32(float [[L]], float [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  ; No nnan on the compare: an ordered predicate is false if either input is NaN.
  %cmp = fcmp ogt float %min.val, %l
  ; No nnan on the intrinsic call either.
  %min.val.next = call float @llvm.minnum.f32(float %l, float %min.val)
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; fmin with double precision.
;
; Same shape as the basic strict-predicate fmin test (ogt: min.val > l, index
; replaced only on a strict improvement), but the elements, the running
; minimum and the intrinsic (llvm.minnum.f64) all use double.
; NOTE(review): the start value 0x47EFFFFFE0000000 is the largest finite
; *float* value expressed as a double, not the largest finite double
; (0x7FEFFFFFFFFFFFFF) -- confirm this is intentional.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmin_first_idx_double(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmin_first_idx_double(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi double [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr double, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load double, ptr [[GEP]], align 8
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt double [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call nnan double @llvm.minnum.f64(double [[L]], double [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi double [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  ; Elements are addressed and loaded as double.
  %gep = getelementptr double, ptr %src, i64 %iv
  %l = load double, ptr %gep
  %cmp = fcmp nnan ogt double %min.val, %l
  %min.val.next = call nnan double @llvm.minnum.f64(double %l, double %min.val)
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; fmin first-index using llvm.minimum intrinsic (FMinimum recurrence kind).
;
; Same loop shape as the llvm.minnum-based test: strict predicate
; (ogt: min.val > l), index replaced only on a strict improvement. Only the
; intrinsic used for the running minimum differs.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fminimum_first_idx(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fminimum_first_idx(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt float [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call nnan float @llvm.minimum.f32(float [[L]], float [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  %cmp = fcmp nnan ogt float %min.val, %l
  ; Running minimum via llvm.minimum rather than llvm.minnum.
  %min.val.next = call nnan float @llvm.minimum.f32(float %l, float %min.val)
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; fmax first-index using llvm.maximumnum intrinsic (FMaximumNum recurrence kind).
;
; Same loop shape as the llvm.maxnum-based test: strict predicate
; (olt: max.val < l), index replaced only on a strict improvement. Only the
; intrinsic used for the running maximum differs.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmaximumnum_first_idx(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmaximumnum_first_idx(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MAX_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_VAL:%.*]] = phi float [ 0xC7EFFFFFE0000000, %[[ENTRY]] ], [ [[MAX_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan olt float [[MAX_VAL]], [[L]]
; CHECK-NEXT: [[MAX_VAL_NEXT]] = call nnan float @llvm.maximumnum.f32(float [[L]], float [[MAX_VAL]])
; CHECK-NEXT: [[MAX_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MAX_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MAX_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %max.idx = phi i64 [ 0, %entry ], [ %max.idx.next, %loop ]
  %max.val = phi float [ 0xC7EFFFFFE0000000, %entry ], [ %max.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  %cmp = fcmp nnan olt float %max.val, %l
  ; Running maximum via llvm.maximumnum rather than llvm.maxnum.
  %max.val.next = call nnan float @llvm.maximumnum.f32(float %l, float %max.val)
  %max.idx.next = select i1 %cmp, i64 %iv, i64 %max.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %max.idx.next, %loop ]
  ret i64 %res
}

; fmin first-index using llvm.minimumnum intrinsic (FMinimumNum recurrence kind).
;
; Same loop shape as the llvm.minnum-based test: strict predicate
; (ogt: min.val > l), index replaced only on a strict improvement. Only the
; intrinsic used for the running minimum differs.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fminimumnum_first_idx(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fminimumnum_first_idx(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MIN_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MIN_VAL:%.*]] = phi float [ 0x47EFFFFFE0000000, %[[ENTRY]] ], [ [[MIN_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan ogt float [[MIN_VAL]], [[L]]
; CHECK-NEXT: [[MIN_VAL_NEXT]] = call nnan float @llvm.minimumnum.f32(float [[L]], float [[MIN_VAL]])
; CHECK-NEXT: [[MIN_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MIN_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MIN_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %min.idx = phi i64 [ 0, %entry ], [ %min.idx.next, %loop ]
  %min.val = phi float [ 0x47EFFFFFE0000000, %entry ], [ %min.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  %cmp = fcmp nnan ogt float %min.val, %l
  ; Running minimum via llvm.minimumnum rather than llvm.minnum.
  %min.val.next = call nnan float @llvm.minimumnum.f32(float %l, float %min.val)
  %min.idx.next = select i1 %cmp, i64 %iv, i64 %min.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %min.idx.next, %loop ]
  ret i64 %res
}

; fmax first-index using llvm.maximum intrinsic (FMaximum recurrence kind).
;
; Same loop shape as the llvm.maxnum-based test: strict predicate
; (olt: max.val < l), index replaced only on a strict improvement. Only the
; intrinsic used for the running maximum differs.
; The autogenerated assertions below match the input loop as-is (no vector
; body is expected).
define i64 @test_fmaximum_first_idx(ptr %src, i64 %n) {
; CHECK-LABEL: define i64 @test_fmaximum_first_idx(
; CHECK-SAME: ptr [[SRC:%.*]], i64 [[N:%.*]]) {
; CHECK-NEXT: [[ENTRY:.*]]:
; CHECK-NEXT: br label %[[LOOP:.*]]
; CHECK: [[LOOP]]:
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_IDX:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[MAX_IDX_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[MAX_VAL:%.*]] = phi float [ 0xC7EFFFFFE0000000, %[[ENTRY]] ], [ [[MAX_VAL_NEXT:%.*]], %[[LOOP]] ]
; CHECK-NEXT: [[GEP:%.*]] = getelementptr float, ptr [[SRC]], i64 [[IV]]
; CHECK-NEXT: [[L:%.*]] = load float, ptr [[GEP]], align 4
; CHECK-NEXT: [[CMP:%.*]] = fcmp nnan olt float [[MAX_VAL]], [[L]]
; CHECK-NEXT: [[MAX_VAL_NEXT]] = call nnan float @llvm.maximum.f32(float [[L]], float [[MAX_VAL]])
; CHECK-NEXT: [[MAX_IDX_NEXT]] = select i1 [[CMP]], i64 [[IV]], i64 [[MAX_IDX]]
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label %[[EXIT:.*]], label %[[LOOP]]
; CHECK: [[EXIT]]:
; CHECK-NEXT: [[RES:%.*]] = phi i64 [ [[MAX_IDX_NEXT]], %[[LOOP]] ]
; CHECK-NEXT: ret i64 [[RES]]
;
entry:
  br label %loop

loop:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ]
  %max.idx = phi i64 [ 0, %entry ], [ %max.idx.next, %loop ]
  %max.val = phi float [ 0xC7EFFFFFE0000000, %entry ], [ %max.val.next, %loop ]
  %gep = getelementptr float, ptr %src, i64 %iv
  %l = load float, ptr %gep
  %cmp = fcmp nnan olt float %max.val, %l
  ; Running maximum via llvm.maximum rather than llvm.maxnum.
  %max.val.next = call nnan float @llvm.maximum.f32(float %l, float %max.val)
  %max.idx.next = select i1 %cmp, i64 %iv, i64 %max.idx
  %iv.next = add nuw nsw i64 %iv, 1
  %exitcond.not = icmp eq i64 %iv.next, %n
  br i1 %exitcond.not, label %exit, label %loop

exit:
  %res = phi i64 [ %max.idx.next, %loop ]
  ret i64 %res
}

; Declarations for the floating-point min/max intrinsics called by the test
; functions in this file: six float variants and the double variant of minnum.
declare float @llvm.minnum.f32(float, float)
declare float @llvm.maxnum.f32(float, float)
declare float @llvm.minimum.f32(float, float)
declare float @llvm.maximum.f32(float, float)
declare float @llvm.minimumnum.f32(float, float)
declare float @llvm.maximumnum.f32(float, float)
declare double @llvm.minnum.f64(double, double)