The original loop (OL) that serves as input to LoopUnroll has basic
blocks that are arranged as follows:
```
OLPreHeader
OLHeader <-.
... |
OLLatch ---'
OLExit
```
In this depiction, every block has an implicit edge to the next block
below, so any explicit edge indicates a conditional branch.
Given OL and unroll count N, LoopUnroll sometimes creates an unrolled
loop (UL) with a remainder loop (RL) epilogue arranged like this:
```
,-- ULGuard
| ULPreHeader
| ULHeader <-.
| ... |
| ULLatch ---'
| ULExit
`-> RLGuard -----.
RLPreHeader |
,-> RLHeader |
| ... |
`-- RLLatch |
RLExit |
OLExit <-----'
```
Each UL iteration executes N OL iterations, but each RL iteration
executes 1 OL iteration. ULGuard or RLGuard checks whether the first
iteration of UL or RL should execute, respectively. If so, ULLatch or
RLLatch checks whether to execute each subsequent iteration.
Once reached, OL always executes its first iteration but not necessarily
the next N-1 iterations. Thus, ULGuard is always required before the
first UL iteration. However, when control flows from ULGuard directly to
RLGuard, the first OL iteration has yet to execute, so RLGuard is then
redundant before the first RL iteration.
Thus, this patch makes the following changes:
- Adjust ULGuard to branch to RLPreHeader instead of RLGuard, thus
eliminating RLGuard's unnecessary branch instruction for that path.
- Eliminate the creation of RLGuard phi node poison values. Without this
patch, RLGuard has such a phi node for each value that is defined by any
OL iteration and used in OLExit. The poison value is required where
ULGuard is the predecessor. The poison value indicates that control flow
from ULGuard to RLGuard to Exit has no counterpart in OL because the
first OL iteration must execute either in UL or RL.
- Simplify the CFG by not splitting ULExit and RLGuard because, without
the ULGuard predecessor, the single block can now be a dedicated UL
exit.
- To RLPreHeader, add an `llvm.assume` call that asserts the RL trip
count is non-zero. Without this patch, RLPreHeader is reachable only
when RLGuard guarantees that assertion is true. With this patch, RLGuard
guarantees it only when RLGuard is the predecessor, and the OL structure
guarantees it when ULGuard is the predecessor. If RL itself is unrolled
later, this guarantee somehow prevents ScalarEvolution from giving up
when trying to compute a maximum trip count for RL. That maximum trip
count enables the branch instruction in the final unrolled instance of
RLLatch to be eliminated. Without the `llvm.assume` call, some existing
unroll tests start to fail because that instruction is not eliminated.
The original motivation for this patch is to facilitate later patches
that fix LoopUnroll's computation of branch weights so that they
maintain the block frequency of OL's body (see #135812). Specifically,
this patch ensures RLGuard's branch weights do not affect RL's
contribution to the block frequency of OL's body in the case that
ULGuard skips UL.
6682 lines
359 KiB
LLVM
6682 lines
359 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: -p
|
|
; RUN: opt < %s -passes=loop-unroll -unroll-runtime=true -unroll-runtime-epilog=true -unroll-runtime-multi-exit=true -verify-loop-lcssa -verify-dom-info -verify-loop-info -S | FileCheck %s -check-prefixes=CHECK,EPILOG
|
|
; RUN: opt < %s -passes=loop-unroll -unroll-runtime -unroll-count=2 -unroll-runtime-epilog=true -unroll-runtime-multi-exit=true -verify-loop-lcssa -verify-dom-info -verify-loop-info -S | FileCheck %s -check-prefixes=CHECK,EPILOG-BLOCK
|
|
; RUN: opt < %s -passes=loop-unroll -unroll-runtime=true -unroll-runtime-epilog=false -unroll-runtime-multi-exit=true -verify-loop-lcssa -verify-dom-info -verify-loop-info -S | FileCheck %s -check-prefixes=CHECK,PROLOG
|
|
; RUN: opt < %s -passes=loop-unroll -unroll-runtime -unroll-runtime-epilog=false -unroll-count=2 -unroll-runtime-multi-exit=true -verify-loop-lcssa -verify-dom-info -verify-loop-info -S | FileCheck %s -check-prefixes=CHECK,PROLOG-BLOCK
|
|
|
|
; REQUIRES: asserts
|
|
|
|
; test with three exiting and three exit blocks.
|
|
; none of the exit blocks have successors
|
|
define void @test1(i64 %trip, i1 %cond) {
|
|
; EPILOG-LABEL: @test1(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting_bb1
|
|
; EPILOG: loop_exiting_bb1:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch, label %exit3.loopexit
|
|
; EPILOG: exit3.loopexit:
|
|
; EPILOG-NEXT: br label %exit3
|
|
; EPILOG: exit3.loopexit3:
|
|
; EPILOG-NEXT: br label %exit3
|
|
; EPILOG: exit3:
|
|
; EPILOG-NEXT: ret void
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; EPILOG: loop_exiting_bb1.1:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.1, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.1:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.1, label %exit3.loopexit
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.2, label %loop_exiting_bb1.2
|
|
; EPILOG: loop_exiting_bb1.2:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.2, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.2:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.2, label %exit3.loopexit
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.3, label %loop_exiting_bb1.3
|
|
; EPILOG: loop_exiting_bb1.3:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.3, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.3:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.3, label %exit3.loopexit
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.4, label %loop_exiting_bb1.4
|
|
; EPILOG: loop_exiting_bb1.4:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.4, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.4:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.4, label %exit3.loopexit
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.5, label %loop_exiting_bb1.5
|
|
; EPILOG: loop_exiting_bb1.5:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.5, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.5:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.5, label %exit3.loopexit
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.6, label %loop_exiting_bb1.6
|
|
; EPILOG: loop_exiting_bb1.6:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.6, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.6:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.6, label %exit3.loopexit
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.7, label %loop_exiting_bb1.7
|
|
; EPILOG: loop_exiting_bb1.7:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.7, label %exit1.loopexit
|
|
; EPILOG: loop_exiting_bb2.7:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.7, label %exit3.loopexit
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit2.loopexit.unr-lcssa
|
|
; EPILOG: exit1.loopexit:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
; EPILOG: exit2.loopexit.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2.loopexit
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit2.loopexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.epil, label %loop_exiting_bb1.epil
|
|
; EPILOG: loop_exiting_bb1.epil:
|
|
; EPILOG-NEXT: br i1 false, label %loop_exiting_bb2.epil, label %exit1.loopexit2
|
|
; EPILOG: loop_exiting_bb2.epil:
|
|
; EPILOG-NEXT: br i1 false, label %loop_latch.epil, label %exit3.loopexit3
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit2.loopexit.epilog-lcssa, !llvm.loop !0
|
|
; EPILOG: exit2.loopexit.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit2.loopexit
|
|
; EPILOG: exit2.loopexit:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test1(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting_bb1
|
|
; EPILOG-BLOCK: loop_exiting_bb1:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loop_exiting_bb2, label %exit1.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loop_latch, label %exit3.loopexit
|
|
; EPILOG-BLOCK: exit3.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit3
|
|
; EPILOG-BLOCK: exit3:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; EPILOG-BLOCK: loop_exiting_bb1.1:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loop_exiting_bb2.1, label %exit1.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2.1:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loop_latch.1, label %exit3.loopexit
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit2.loopexit.unr-lcssa, !llvm.loop !0
|
|
; EPILOG-BLOCK: exit1.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
; EPILOG-BLOCK: exit2.loopexit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2.loopexit
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.epil, label %loop_exiting_bb1.epil
|
|
; EPILOG-BLOCK: loop_exiting_bb1.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loop_exiting_bb2.epil, label %exit1
|
|
; EPILOG-BLOCK: loop_exiting_bb2.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loop_latch.epil, label %exit3
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit2.loopexit
|
|
; EPILOG-BLOCK: exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test1(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.prol, label %loop_exiting_bb1.prol
|
|
; PROLOG: loop_exiting_bb1.prol:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.prol, label %exit1.loopexit1
|
|
; PROLOG: loop_exiting_bb2.prol:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.prol, label %exit3.loopexit2
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !0
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit2.loopexit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting_bb1
|
|
; PROLOG: loop_exiting_bb1:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch, label %exit3.loopexit
|
|
; PROLOG: exit3.loopexit:
|
|
; PROLOG-NEXT: br label %exit3
|
|
; PROLOG: exit3.loopexit2:
|
|
; PROLOG-NEXT: br label %exit3
|
|
; PROLOG: exit3:
|
|
; PROLOG-NEXT: ret void
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; PROLOG: loop_exiting_bb1.1:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.1, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.1:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.1, label %exit3.loopexit
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.2, label %loop_exiting_bb1.2
|
|
; PROLOG: loop_exiting_bb1.2:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.2, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.2:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.2, label %exit3.loopexit
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.3, label %loop_exiting_bb1.3
|
|
; PROLOG: loop_exiting_bb1.3:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.3, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.3:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.3, label %exit3.loopexit
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.4, label %loop_exiting_bb1.4
|
|
; PROLOG: loop_exiting_bb1.4:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.4, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.4:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.4, label %exit3.loopexit
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.5, label %loop_exiting_bb1.5
|
|
; PROLOG: loop_exiting_bb1.5:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.5, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.5:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.5, label %exit3.loopexit
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.6, label %loop_exiting_bb1.6
|
|
; PROLOG: loop_exiting_bb1.6:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.6, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.6:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.6, label %exit3.loopexit
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.7, label %loop_exiting_bb1.7
|
|
; PROLOG: loop_exiting_bb1.7:
|
|
; PROLOG-NEXT: br i1 false, label %loop_exiting_bb2.7, label %exit1.loopexit
|
|
; PROLOG: loop_exiting_bb2.7:
|
|
; PROLOG-NEXT: br i1 false, label %loop_latch.7, label %exit3.loopexit
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit2.loopexit.unr-lcssa
|
|
; PROLOG: exit1.loopexit:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
; PROLOG: exit2.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit2.loopexit
|
|
; PROLOG: exit2.loopexit:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test1(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.prol, label %loop_exiting_bb1.prol
|
|
; PROLOG-BLOCK: loop_exiting_bb1.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loop_exiting_bb2.prol, label %exit1
|
|
; PROLOG-BLOCK: loop_exiting_bb2.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loop_latch.prol, label %exit3
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit2.loopexit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting_bb1
|
|
; PROLOG-BLOCK: loop_exiting_bb1:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loop_exiting_bb2, label %exit1.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loop_latch, label %exit3.loopexit
|
|
; PROLOG-BLOCK: exit3.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit3
|
|
; PROLOG-BLOCK: exit3:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; PROLOG-BLOCK: loop_exiting_bb1.1:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loop_exiting_bb2.1, label %exit1.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2.1:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loop_latch.1, label %exit3.loopexit
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit2.loopexit.unr-lcssa, !llvm.loop !0
|
|
; PROLOG-BLOCK: exit1.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
; PROLOG-BLOCK: exit2.loopexit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit2.loopexit
|
|
; PROLOG-BLOCK: exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
br i1 %cond, label %loop_latch, label %loop_exiting_bb1
|
|
|
|
loop_exiting_bb1:
|
|
br i1 false, label %loop_exiting_bb2, label %exit1
|
|
|
|
loop_exiting_bb2:
|
|
br i1 false, label %loop_latch, label %exit3
|
|
|
|
exit3:
|
|
ret void
|
|
|
|
loop_latch:
|
|
%iv_next = add i64 %iv, 1
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit2.loopexit
|
|
|
|
exit1:
|
|
ret void
|
|
|
|
exit2.loopexit:
|
|
ret void
|
|
}
|
|
|
|
|
|
; test with three exiting and two exit blocks.
|
|
; The non-latch exit block has 2 unique predecessors.
|
|
; There are 2 values passed to the exit blocks that are calculated at every iteration.
|
|
; %sum.02 and %add. Both of these are incoming values for phi from every exiting
|
|
; unrolled block.
|
|
define i32 @test2(ptr nocapture %a, i64 %n) {
|
|
; EPILOG-LABEL: @test2(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.7, %for.body.7 ]
|
|
; EPILOG-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.7, %for.body.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %for.body.7 ]
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG: for.exiting_block:
|
|
; EPILOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %for.body
|
|
; EPILOG: for.body:
|
|
; EPILOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG: for.exiting_block.1:
|
|
; EPILOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %for.body.1
|
|
; EPILOG: for.body.1:
|
|
; EPILOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-NEXT: %indvars.iv.next.1 = add nuw nsw i64 %indvars.iv, 2
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; EPILOG: for.exiting_block.2:
|
|
; EPILOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.2, label %for.exit2.loopexit, label %for.body.2
|
|
; EPILOG: for.body.2:
|
|
; EPILOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; EPILOG-NEXT: %5 = load i32, ptr %arrayidx.2, align 4
|
|
; EPILOG-NEXT: %add.2 = add nsw i32 %5, %add.1
|
|
; EPILOG-NEXT: %indvars.iv.next.2 = add nuw nsw i64 %indvars.iv, 3
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; EPILOG: for.exiting_block.3:
|
|
; EPILOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.3, label %for.exit2.loopexit, label %for.body.3
|
|
; EPILOG: for.body.3:
|
|
; EPILOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; EPILOG-NEXT: %6 = load i32, ptr %arrayidx.3, align 4
|
|
; EPILOG-NEXT: %add.3 = add nsw i32 %6, %add.2
|
|
; EPILOG-NEXT: %indvars.iv.next.3 = add nuw nsw i64 %indvars.iv, 4
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; EPILOG: for.exiting_block.4:
|
|
; EPILOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.4, label %for.exit2.loopexit, label %for.body.4
|
|
; EPILOG: for.body.4:
|
|
; EPILOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; EPILOG-NEXT: %7 = load i32, ptr %arrayidx.4, align 4
|
|
; EPILOG-NEXT: %add.4 = add nsw i32 %7, %add.3
|
|
; EPILOG-NEXT: %indvars.iv.next.4 = add nuw nsw i64 %indvars.iv, 5
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; EPILOG: for.exiting_block.5:
|
|
; EPILOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.5, label %for.exit2.loopexit, label %for.body.5
|
|
; EPILOG: for.body.5:
|
|
; EPILOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; EPILOG-NEXT: %8 = load i32, ptr %arrayidx.5, align 4
|
|
; EPILOG-NEXT: %add.5 = add nsw i32 %8, %add.4
|
|
; EPILOG-NEXT: %indvars.iv.next.5 = add nuw nsw i64 %indvars.iv, 6
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; EPILOG: for.exiting_block.6:
|
|
; EPILOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.6, label %for.exit2.loopexit, label %for.body.6
|
|
; EPILOG: for.body.6:
|
|
; EPILOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; EPILOG-NEXT: %9 = load i32, ptr %arrayidx.6, align 4
|
|
; EPILOG-NEXT: %add.6 = add nsw i32 %9, %add.5
|
|
; EPILOG-NEXT: %indvars.iv.next.6 = add nuw nsw i64 %indvars.iv, 7
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; EPILOG: for.exiting_block.7:
|
|
; EPILOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.7, label %for.exit2.loopexit, label %for.body.7
|
|
; EPILOG: for.body.7:
|
|
; EPILOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; EPILOG-NEXT: %10 = load i32, ptr %arrayidx.7, align 4
|
|
; EPILOG-NEXT: %add.7 = add nsw i32 %10, %add.6
|
|
; EPILOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp eq i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %for.end.unr-lcssa, label %header
|
|
; EPILOG: for.end.unr-lcssa:
|
|
; EPILOG-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.7, %for.body.7 ]
|
|
; EPILOG-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.7, %for.body.7 ]
|
|
; EPILOG-NEXT: %sum.02.unr = phi i32 [ %add.7, %for.body.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %for.end
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %for.end.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %for.end.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %indvars.iv.epil = phi i64 [ %indvars.iv.next.epil, %for.body.epil ], [ %indvars.iv.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %sum.02.epil = phi i32 [ %add.epil, %for.body.epil ], [ %sum.02.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %for.body.epil ]
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit3, label %for.exiting_block.epil
|
|
; EPILOG: for.exiting_block.epil:
|
|
; EPILOG-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.epil, label %for.exit2.loopexit3, label %for.body.epil
|
|
; EPILOG: for.body.epil:
|
|
; EPILOG-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil
|
|
; EPILOG-NEXT: %11 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-NEXT: %add.epil = add nsw i32 %11, %sum.02.epil
|
|
; EPILOG-NEXT: %indvars.iv.next.epil = add i64 %indvars.iv.epil, 1
|
|
; EPILOG-NEXT: %exitcond.epil = icmp eq i64 %indvars.iv.next.epil, %n
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %for.end.epilog-lcssa, !llvm.loop !2
|
|
; EPILOG: for.end.epilog-lcssa:
|
|
; EPILOG-NEXT: %sum.0.lcssa.ph1 = phi i32 [ %add.epil, %for.body.epil ]
|
|
; EPILOG-NEXT: br label %for.end
|
|
; EPILOG: for.end:
|
|
; EPILOG-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.ph, %for.end.unr-lcssa ], [ %sum.0.lcssa.ph1, %for.end.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i32 %sum.0.lcssa
|
|
; EPILOG: for.exit2.loopexit:
|
|
; EPILOG-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %for.body ], [ 42, %for.exiting_block.1 ], [ %add.1, %for.body.1 ], [ 42, %for.exiting_block.2 ], [ %add.2, %for.body.2 ], [ 42, %for.exiting_block.3 ], [ %add.3, %for.body.3 ], [ 42, %for.exiting_block.4 ], [ %add.4, %for.body.4 ], [ 42, %for.exiting_block.5 ], [ %add.5, %for.body.5 ], [ 42, %for.exiting_block.6 ], [ %add.6, %for.body.6 ], [ 42, %for.exiting_block.7 ]
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2.loopexit3:
|
|
; EPILOG-NEXT: %retval.ph4 = phi i32 [ 42, %for.exiting_block.epil ], [ %sum.02.epil, %header.epil ]
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2:
|
|
; EPILOG-NEXT: %retval = phi i32 [ %retval.ph, %for.exit2.loopexit ], [ %retval.ph4, %for.exit2.loopexit3 ]
|
|
; EPILOG-NEXT: ret i32 %retval
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test2(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.1, %for.body.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.1, %for.body.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %for.body.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG-BLOCK: for.exiting_block:
|
|
; EPILOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %for.body
|
|
; EPILOG-BLOCK: for.body:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-BLOCK-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-BLOCK-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG-BLOCK: for.exiting_block.1:
|
|
; EPILOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %for.body.1
|
|
; EPILOG-BLOCK: for.body.1:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp eq i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %for.end.unr-lcssa, label %header, !llvm.loop !2
|
|
; EPILOG-BLOCK: for.end.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.1, %for.body.1 ]
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.1, %for.body.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ %add.1, %for.body.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %for.end
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %for.end.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %for.end.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %for.exit2, label %for.exiting_block.epil
|
|
; EPILOG-BLOCK: for.exiting_block.epil:
|
|
; EPILOG-BLOCK-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.epil, label %for.exit2, label %for.body.epil
|
|
; EPILOG-BLOCK: for.body.epil:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil.init
|
|
; EPILOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.epil = add nsw i32 %5, %sum.02.epil.init
|
|
; EPILOG-BLOCK-NEXT: br label %for.end
|
|
; EPILOG-BLOCK: for.end:
|
|
; EPILOG-BLOCK-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.ph, %for.end.unr-lcssa ], [ %add.epil, %for.body.epil ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %sum.0.lcssa
|
|
; EPILOG-BLOCK: for.exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %for.body ], [ 42, %for.exiting_block.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %for.exit2
|
|
; EPILOG-BLOCK: for.exit2:
|
|
; EPILOG-BLOCK-NEXT: %retval = phi i32 [ %sum.02.epil.init, %header.epil ], [ 42, %for.exiting_block.epil ], [ %retval.ph, %for.exit2.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %retval
|
|
;
|
|
; PROLOG-LABEL: @test2(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %indvars.iv.prol = phi i64 [ %indvars.iv.next.prol, %for.body.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %sum.02.prol = phi i32 [ %add.prol, %for.body.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %for.body.prol ]
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit1, label %for.exiting_block.prol
|
|
; PROLOG: for.exiting_block.prol:
|
|
; PROLOG-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.prol, label %for.exit2.loopexit1, label %for.body.prol
|
|
; PROLOG: for.body.prol:
|
|
; PROLOG-NEXT: %arrayidx.prol = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.prol
|
|
; PROLOG-NEXT: %2 = load i32, ptr %arrayidx.prol, align 4
|
|
; PROLOG-NEXT: %add.prol = add nsw i32 %2, %sum.02.prol
|
|
; PROLOG-NEXT: %indvars.iv.next.prol = add i64 %indvars.iv.prol, 1
|
|
; PROLOG-NEXT: %exitcond.prol = icmp eq i64 %indvars.iv.next.prol, %n
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !2
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %sum.0.lcssa.unr.ph = phi i32 [ %add.prol, %for.body.prol ]
|
|
; PROLOG-NEXT: %indvars.iv.unr.ph = phi i64 [ %indvars.iv.next.prol, %for.body.prol ]
|
|
; PROLOG-NEXT: %sum.02.unr.ph = phi i32 [ %add.prol, %for.body.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %sum.0.lcssa.unr = phi i32 [ poison, %entry ], [ %sum.0.lcssa.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ %indvars.iv.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %sum.02.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %3, label %for.end, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.7, %for.body.7 ]
|
|
; PROLOG-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.7, %for.body.7 ]
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG: for.exiting_block:
|
|
; PROLOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %for.body
|
|
; PROLOG: for.body:
|
|
; PROLOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG: for.exiting_block.1:
|
|
; PROLOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %for.body.1
|
|
; PROLOG: for.body.1:
|
|
; PROLOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; PROLOG: for.exiting_block.2:
|
|
; PROLOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.2, label %for.exit2.loopexit, label %for.body.2
|
|
; PROLOG: for.body.2:
|
|
; PROLOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; PROLOG-NEXT: %6 = load i32, ptr %arrayidx.2, align 4
|
|
; PROLOG-NEXT: %add.2 = add nsw i32 %6, %add.1
|
|
; PROLOG-NEXT: %indvars.iv.next.2 = add i64 %indvars.iv, 3
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; PROLOG: for.exiting_block.3:
|
|
; PROLOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.3, label %for.exit2.loopexit, label %for.body.3
|
|
; PROLOG: for.body.3:
|
|
; PROLOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; PROLOG-NEXT: %7 = load i32, ptr %arrayidx.3, align 4
|
|
; PROLOG-NEXT: %add.3 = add nsw i32 %7, %add.2
|
|
; PROLOG-NEXT: %indvars.iv.next.3 = add i64 %indvars.iv, 4
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; PROLOG: for.exiting_block.4:
|
|
; PROLOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.4, label %for.exit2.loopexit, label %for.body.4
|
|
; PROLOG: for.body.4:
|
|
; PROLOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; PROLOG-NEXT: %8 = load i32, ptr %arrayidx.4, align 4
|
|
; PROLOG-NEXT: %add.4 = add nsw i32 %8, %add.3
|
|
; PROLOG-NEXT: %indvars.iv.next.4 = add i64 %indvars.iv, 5
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; PROLOG: for.exiting_block.5:
|
|
; PROLOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.5, label %for.exit2.loopexit, label %for.body.5
|
|
; PROLOG: for.body.5:
|
|
; PROLOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; PROLOG-NEXT: %9 = load i32, ptr %arrayidx.5, align 4
|
|
; PROLOG-NEXT: %add.5 = add nsw i32 %9, %add.4
|
|
; PROLOG-NEXT: %indvars.iv.next.5 = add i64 %indvars.iv, 6
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; PROLOG: for.exiting_block.6:
|
|
; PROLOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.6, label %for.exit2.loopexit, label %for.body.6
|
|
; PROLOG: for.body.6:
|
|
; PROLOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; PROLOG-NEXT: %10 = load i32, ptr %arrayidx.6, align 4
|
|
; PROLOG-NEXT: %add.6 = add nsw i32 %10, %add.5
|
|
; PROLOG-NEXT: %indvars.iv.next.6 = add i64 %indvars.iv, 7
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; PROLOG: for.exiting_block.7:
|
|
; PROLOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %for.exit2.loopexit, label %for.body.7
|
|
; PROLOG: for.body.7:
|
|
; PROLOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; PROLOG-NEXT: %11 = load i32, ptr %arrayidx.7, align 4
|
|
; PROLOG-NEXT: %add.7 = add nsw i32 %11, %add.6
|
|
; PROLOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; PROLOG-NEXT: %exitcond.7 = icmp eq i64 %indvars.iv.next.7, %n
|
|
; PROLOG-NEXT: br i1 %exitcond.7, label %for.end.unr-lcssa, label %header
|
|
; PROLOG: for.end.unr-lcssa:
|
|
; PROLOG-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.7, %for.body.7 ]
|
|
; PROLOG-NEXT: br label %for.end
|
|
; PROLOG: for.end:
|
|
; PROLOG-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.unr, %header.prol.loopexit ], [ %sum.0.lcssa.ph, %for.end.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i32 %sum.0.lcssa
|
|
; PROLOG: for.exit2.loopexit:
|
|
; PROLOG-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %for.body ], [ 42, %for.exiting_block.1 ], [ %add.1, %for.body.1 ], [ 42, %for.exiting_block.2 ], [ %add.2, %for.body.2 ], [ 42, %for.exiting_block.3 ], [ %add.3, %for.body.3 ], [ 42, %for.exiting_block.4 ], [ %add.4, %for.body.4 ], [ 42, %for.exiting_block.5 ], [ %add.5, %for.body.5 ], [ 42, %for.exiting_block.6 ], [ %add.6, %for.body.6 ], [ 42, %for.exiting_block.7 ]
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2.loopexit1:
|
|
; PROLOG-NEXT: %retval.ph2 = phi i32 [ 42, %for.exiting_block.prol ], [ %sum.02.prol, %header.prol ]
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2:
|
|
; PROLOG-NEXT: %retval = phi i32 [ %retval.ph, %for.exit2.loopexit ], [ %retval.ph2, %for.exit2.loopexit1 ]
|
|
; PROLOG-NEXT: ret i32 %retval
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test2(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %for.exit2, label %for.exiting_block.prol
|
|
; PROLOG-BLOCK: for.exiting_block.prol:
|
|
; PROLOG-BLOCK-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.prol, label %for.exit2, label %for.body.prol
|
|
; PROLOG-BLOCK: for.body.prol:
|
|
; PROLOG-BLOCK-NEXT: %2 = load i32, ptr %a, align 4
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %sum.0.lcssa.unr = phi i32 [ poison, %entry ], [ %2, %for.body.prol ]
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ 1, %for.body.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %2, %for.body.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %for.end, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.1, %for.body.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.1, %for.body.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG-BLOCK: for.exiting_block:
|
|
; PROLOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %for.body
|
|
; PROLOG-BLOCK: for.body:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-BLOCK-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG-BLOCK: for.exiting_block.1:
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %for.body.1
|
|
; PROLOG-BLOCK: for.body.1:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-BLOCK-NEXT: %exitcond.1 = icmp eq i64 %indvars.iv.next.1, %n
|
|
; PROLOG-BLOCK-NEXT: br i1 %exitcond.1, label %for.end.unr-lcssa, label %header, !llvm.loop !2
|
|
; PROLOG-BLOCK: for.end.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.1, %for.body.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %for.end
|
|
; PROLOG-BLOCK: for.end:
|
|
; PROLOG-BLOCK-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.unr, %header.prol.loopexit ], [ %sum.0.lcssa.ph, %for.end.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %sum.0.lcssa
|
|
; PROLOG-BLOCK: for.exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %for.body ], [ 42, %for.exiting_block.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %for.exit2
|
|
; PROLOG-BLOCK: for.exit2:
|
|
; PROLOG-BLOCK-NEXT: %retval = phi i32 [ 0, %header.prol ], [ 42, %for.exiting_block.prol ], [ %retval.ph, %for.exit2.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %retval
|
|
;
|
|
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
header:
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 0, %entry ]
|
|
%sum.02 = phi i32 [ %add, %for.body ], [ 0, %entry ]
|
|
br i1 false, label %for.exit2, label %for.exiting_block
|
|
|
|
for.exiting_block:
|
|
%cmp = icmp eq i64 %n, 42
|
|
br i1 %cmp, label %for.exit2, label %for.body
|
|
|
|
for.body:
|
|
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
%0 = load i32, ptr %arrayidx, align 4
|
|
%add = add nsw i32 %0, %sum.02
|
|
%indvars.iv.next = add i64 %indvars.iv, 1
|
|
%exitcond = icmp eq i64 %indvars.iv.next, %n
|
|
br i1 %exitcond, label %for.end, label %header
|
|
|
|
for.end: ; preds = %for.body
|
|
%sum.0.lcssa = phi i32 [ %add, %for.body ]
|
|
ret i32 %sum.0.lcssa
|
|
|
|
for.exit2:
|
|
%retval = phi i32 [ %sum.02, %header ], [ 42, %for.exiting_block ]
|
|
ret i32 %retval
|
|
}
|
|
|
|
; test with two exiting and three exit blocks.
|
|
; the non-latch exiting block has a switch.
|
|
define void @test3(i64 %trip, i64 %add, i1 %arg) {
|
|
; EPILOG-LABEL: @test3(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %sum = phi i64 [ 0, %entry.new ], [ %sum.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch, label %loop_exiting_bb1
|
|
; EPILOG: loop_exiting_bb1:
|
|
; EPILOG-NEXT: switch i64 %sum, label %loop_latch [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: exit3.loopexit:
|
|
; EPILOG-NEXT: br label %exit3
|
|
; EPILOG: exit3.loopexit3:
|
|
; EPILOG-NEXT: br label %exit3
|
|
; EPILOG: exit3:
|
|
; EPILOG-NEXT: ret void
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: %sum.next = add i64 %sum, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; EPILOG: loop_exiting_bb1.1:
|
|
; EPILOG-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.2, label %loop_exiting_bb1.2
|
|
; EPILOG: loop_exiting_bb1.2:
|
|
; EPILOG-NEXT: switch i64 %sum.next.1, label %loop_latch.2 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: %sum.next.2 = add i64 %sum.next.1, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.3, label %loop_exiting_bb1.3
|
|
; EPILOG: loop_exiting_bb1.3:
|
|
; EPILOG-NEXT: switch i64 %sum.next.2, label %loop_latch.3 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: %sum.next.3 = add i64 %sum.next.2, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.4, label %loop_exiting_bb1.4
|
|
; EPILOG: loop_exiting_bb1.4:
|
|
; EPILOG-NEXT: switch i64 %sum.next.3, label %loop_latch.4 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: %sum.next.4 = add i64 %sum.next.3, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.5, label %loop_exiting_bb1.5
|
|
; EPILOG: loop_exiting_bb1.5:
|
|
; EPILOG-NEXT: switch i64 %sum.next.4, label %loop_latch.5 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: %sum.next.5 = add i64 %sum.next.4, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.6, label %loop_exiting_bb1.6
|
|
; EPILOG: loop_exiting_bb1.6:
|
|
; EPILOG-NEXT: switch i64 %sum.next.5, label %loop_latch.6 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: %sum.next.6 = add i64 %sum.next.5, %add
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.7, label %loop_exiting_bb1.7
|
|
; EPILOG: loop_exiting_bb1.7:
|
|
; EPILOG-NEXT: switch i64 %sum.next.6, label %loop_latch.7 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add nuw nsw i64 %iv, 8
|
|
; EPILOG-NEXT: %sum.next.7 = add i64 %sum.next.6, %add
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit2.loopexit.unr-lcssa
|
|
; EPILOG: exit1.loopexit:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
; EPILOG: exit2.loopexit.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %sum.unr = phi i64 [ %sum.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2.loopexit
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit2.loopexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.epil.init = phi i64 [ 0, %entry ], [ %sum.unr, %exit2.loopexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %sum.epil = phi i64 [ %sum.epil.init, %loop_header.epil.preheader ], [ %sum.next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: br i1 %arg, label %loop_latch.epil, label %loop_exiting_bb1.epil
|
|
; EPILOG: loop_exiting_bb1.epil:
|
|
; EPILOG-NEXT: switch i64 %sum.epil, label %loop_latch.epil [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit2
|
|
; EPILOG-NEXT: i64 42, label %exit3.loopexit3
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add nuw nsw i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %sum.next.epil = add i64 %sum.epil, %add
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit2.loopexit.epilog-lcssa, !llvm.loop !3
|
|
; EPILOG: exit2.loopexit.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit2.loopexit
|
|
; EPILOG: exit2.loopexit:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test3(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum = phi i64 [ 0, %entry.new ], [ %sum.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %arg, label %loop_latch, label %loop_exiting_bb1
|
|
; EPILOG-BLOCK: loop_exiting_bb1:
|
|
; EPILOG-BLOCK-NEXT: switch i64 %sum, label %loop_latch [
|
|
; EPILOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-BLOCK-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-BLOCK-NEXT: ]
|
|
; EPILOG-BLOCK: exit3.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit3
|
|
; EPILOG-BLOCK: exit3:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: %sum.next = add i64 %sum, %add
|
|
; EPILOG-BLOCK-NEXT: br i1 %arg, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; EPILOG-BLOCK: loop_exiting_bb1.1:
|
|
; EPILOG-BLOCK-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; EPILOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-BLOCK-NEXT: i64 42, label %exit3.loopexit
|
|
; EPILOG-BLOCK-NEXT: ]
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit2.loopexit.unr-lcssa, !llvm.loop !3
|
|
; EPILOG-BLOCK: exit1.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
; EPILOG-BLOCK: exit2.loopexit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %sum.unr = phi i64 [ %sum.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2.loopexit
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %sum.epil.init = phi i64 [ 0, %entry ], [ %sum.unr, %exit2.loopexit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %arg, label %loop_latch.epil, label %loop_exiting_bb1.epil
|
|
; EPILOG-BLOCK: loop_exiting_bb1.epil:
|
|
; EPILOG-BLOCK-NEXT: switch i64 %sum.epil.init, label %loop_latch.epil [
|
|
; EPILOG-BLOCK-NEXT: i64 24, label %exit1
|
|
; EPILOG-BLOCK-NEXT: i64 42, label %exit3
|
|
; EPILOG-BLOCK-NEXT: ]
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit2.loopexit
|
|
; EPILOG-BLOCK: exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test3(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %sum.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %sum.next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.prol, label %loop_exiting_bb1.prol
|
|
; PROLOG: loop_exiting_bb1.prol:
|
|
; PROLOG-NEXT: switch i64 %sum.prol, label %loop_latch.prol [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit1
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit2
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add nuw nsw i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %sum.next.prol = add i64 %sum.prol, %add
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !3
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %sum.unr.ph = phi i64 [ %sum.next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.unr = phi i64 [ 0, %entry ], [ %sum.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit2.loopexit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: %sum = phi i64 [ %sum.unr, %entry.new ], [ %sum.next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch, label %loop_exiting_bb1
|
|
; PROLOG: loop_exiting_bb1:
|
|
; PROLOG-NEXT: switch i64 %sum, label %loop_latch [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: exit3.loopexit:
|
|
; PROLOG-NEXT: br label %exit3
|
|
; PROLOG: exit3.loopexit2:
|
|
; PROLOG-NEXT: br label %exit3
|
|
; PROLOG: exit3:
|
|
; PROLOG-NEXT: ret void
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: %sum.next = add i64 %sum, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; PROLOG: loop_exiting_bb1.1:
|
|
; PROLOG-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.2, label %loop_exiting_bb1.2
|
|
; PROLOG: loop_exiting_bb1.2:
|
|
; PROLOG-NEXT: switch i64 %sum.next.1, label %loop_latch.2 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: %sum.next.2 = add i64 %sum.next.1, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.3, label %loop_exiting_bb1.3
|
|
; PROLOG: loop_exiting_bb1.3:
|
|
; PROLOG-NEXT: switch i64 %sum.next.2, label %loop_latch.3 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: %sum.next.3 = add i64 %sum.next.2, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.4, label %loop_exiting_bb1.4
|
|
; PROLOG: loop_exiting_bb1.4:
|
|
; PROLOG-NEXT: switch i64 %sum.next.3, label %loop_latch.4 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: %sum.next.4 = add i64 %sum.next.3, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.5, label %loop_exiting_bb1.5
|
|
; PROLOG: loop_exiting_bb1.5:
|
|
; PROLOG-NEXT: switch i64 %sum.next.4, label %loop_latch.5 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: %sum.next.5 = add i64 %sum.next.4, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.6, label %loop_exiting_bb1.6
|
|
; PROLOG: loop_exiting_bb1.6:
|
|
; PROLOG-NEXT: switch i64 %sum.next.5, label %loop_latch.6 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: %sum.next.6 = add i64 %sum.next.5, %add
|
|
; PROLOG-NEXT: br i1 %arg, label %loop_latch.7, label %loop_exiting_bb1.7
|
|
; PROLOG: loop_exiting_bb1.7:
|
|
; PROLOG-NEXT: switch i64 %sum.next.6, label %loop_latch.7 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add nuw nsw i64 %iv, 8
|
|
; PROLOG-NEXT: %sum.next.7 = add i64 %sum.next.6, %add
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit2.loopexit.unr-lcssa
|
|
; PROLOG: exit1.loopexit:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
; PROLOG: exit2.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit2.loopexit
|
|
; PROLOG: exit2.loopexit:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test3(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %arg, label %loop_latch.prol, label %loop_exiting_bb1.prol
|
|
; PROLOG-BLOCK: loop_exiting_bb1.prol:
|
|
; PROLOG-BLOCK-NEXT: switch i64 0, label %loop_latch.prol [
|
|
; PROLOG-BLOCK-NEXT: i64 24, label %exit1
|
|
; PROLOG-BLOCK-NEXT: i64 42, label %exit3
|
|
; PROLOG-BLOCK-NEXT: ]
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.unr = phi i64 [ 0, %entry ], [ %add, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit2.loopexit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum = phi i64 [ %sum.unr, %entry.new ], [ %sum.next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %arg, label %loop_latch, label %loop_exiting_bb1
|
|
; PROLOG-BLOCK: loop_exiting_bb1:
|
|
; PROLOG-BLOCK-NEXT: switch i64 %sum, label %loop_latch [
|
|
; PROLOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-BLOCK-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-BLOCK-NEXT: ]
|
|
; PROLOG-BLOCK: exit3.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit3
|
|
; PROLOG-BLOCK: exit3:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: %sum.next = add i64 %sum, %add
|
|
; PROLOG-BLOCK-NEXT: br i1 %arg, label %loop_latch.1, label %loop_exiting_bb1.1
|
|
; PROLOG-BLOCK: loop_exiting_bb1.1:
|
|
; PROLOG-BLOCK-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; PROLOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-BLOCK-NEXT: i64 42, label %exit3.loopexit
|
|
; PROLOG-BLOCK-NEXT: ]
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit2.loopexit.unr-lcssa, !llvm.loop !3
|
|
; PROLOG-BLOCK: exit1.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
; PROLOG-BLOCK: exit2.loopexit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit2.loopexit
|
|
; PROLOG-BLOCK: exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
%sum = phi i64 [ 0, %entry ], [ %sum.next, %loop_latch ]
|
|
br i1 %arg, label %loop_latch, label %loop_exiting_bb1
|
|
|
|
loop_exiting_bb1:
|
|
switch i64 %sum, label %loop_latch [
|
|
i64 24, label %exit1
|
|
i64 42, label %exit3
|
|
]
|
|
|
|
exit3:
|
|
ret void
|
|
|
|
loop_latch:
|
|
%iv_next = add nuw nsw i64 %iv, 1
|
|
%sum.next = add i64 %sum, %add
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit2.loopexit
|
|
|
|
exit1:
|
|
ret void
|
|
|
|
exit2.loopexit:
|
|
ret void
|
|
}
|
|
|
|
; FIXME: Support multiple exiting blocks to the same latch exit block.
|
|
; Three exiting blocks where header and latch exit to same LatchExit.
|
|
define i32 @hdr_latch_same_exit(ptr nocapture %a, i64 %n, i1 %cond) {
|
|
; EPILOG-LABEL: @hdr_latch_same_exit(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block
|
|
; EPILOG: for.exiting_block:
|
|
; EPILOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.1
|
|
; EPILOG: for.exiting_block.1:
|
|
; EPILOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-NEXT: %indvars.iv.next.1 = add nuw nsw i64 %indvars.iv, 2
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.2
|
|
; EPILOG: for.exiting_block.2:
|
|
; EPILOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.2, label %for.exit2.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; EPILOG-NEXT: %5 = load i32, ptr %arrayidx.2, align 4
|
|
; EPILOG-NEXT: %add.2 = add nsw i32 %5, %add.1
|
|
; EPILOG-NEXT: %indvars.iv.next.2 = add nuw nsw i64 %indvars.iv, 3
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.3
|
|
; EPILOG: for.exiting_block.3:
|
|
; EPILOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.3, label %for.exit2.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; EPILOG-NEXT: %6 = load i32, ptr %arrayidx.3, align 4
|
|
; EPILOG-NEXT: %add.3 = add nsw i32 %6, %add.2
|
|
; EPILOG-NEXT: %indvars.iv.next.3 = add nuw nsw i64 %indvars.iv, 4
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.4
|
|
; EPILOG: for.exiting_block.4:
|
|
; EPILOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.4, label %for.exit2.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; EPILOG-NEXT: %7 = load i32, ptr %arrayidx.4, align 4
|
|
; EPILOG-NEXT: %add.4 = add nsw i32 %7, %add.3
|
|
; EPILOG-NEXT: %indvars.iv.next.4 = add nuw nsw i64 %indvars.iv, 5
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.5
|
|
; EPILOG: for.exiting_block.5:
|
|
; EPILOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.5, label %for.exit2.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; EPILOG-NEXT: %8 = load i32, ptr %arrayidx.5, align 4
|
|
; EPILOG-NEXT: %add.5 = add nsw i32 %8, %add.4
|
|
; EPILOG-NEXT: %indvars.iv.next.5 = add nuw nsw i64 %indvars.iv, 6
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.6
|
|
; EPILOG: for.exiting_block.6:
|
|
; EPILOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.6, label %for.exit2.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; EPILOG-NEXT: %9 = load i32, ptr %arrayidx.6, align 4
|
|
; EPILOG-NEXT: %add.6 = add nsw i32 %9, %add.5
|
|
; EPILOG-NEXT: %indvars.iv.next.6 = add nuw nsw i64 %indvars.iv, 7
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.7
|
|
; EPILOG: for.exiting_block.7:
|
|
; EPILOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.7, label %for.exit2.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; EPILOG-NEXT: %10 = load i32, ptr %arrayidx.7, align 4
|
|
; EPILOG-NEXT: %add.7 = add nsw i32 %10, %add.6
|
|
; EPILOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp eq i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %latchExit.unr-lcssa, label %header
|
|
; EPILOG: latchExit.unr-lcssa:
|
|
; EPILOG-NEXT: %result.ph = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02.unr = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %indvars.iv.epil = phi i64 [ %indvars.iv.next.epil, %latch.epil ], [ %indvars.iv.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %sum.02.epil = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit3, label %for.exiting_block.epil
|
|
; EPILOG: for.exiting_block.epil:
|
|
; EPILOG-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.epil, label %for.exit2.loopexit5, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil
|
|
; EPILOG-NEXT: %11 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-NEXT: %add.epil = add nsw i32 %11, %sum.02.epil
|
|
; EPILOG-NEXT: %indvars.iv.next.epil = add i64 %indvars.iv.epil, 1
|
|
; EPILOG-NEXT: %exitcond.epil = icmp eq i64 %indvars.iv.next.epil, %n
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latchExit.epilog-lcssa.loopexit3, !llvm.loop !4
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: %result.ph1.ph = phi i32 [ 0, %header ], [ 0, %latch ], [ 0, %latch.1 ], [ 0, %latch.2 ], [ 0, %latch.3 ], [ 0, %latch.4 ], [ 0, %latch.5 ], [ 0, %latch.6 ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit3:
|
|
; EPILOG-NEXT: %result.ph1.ph4 = phi i32 [ 0, %header.epil ], [ %add.epil, %latch.epil ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa:
|
|
; EPILOG-NEXT: %result.ph1 = phi i32 [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ], [ %result.ph1.ph4, %latchExit.epilog-lcssa.loopexit3 ]
|
|
; EPILOG-NEXT: br label %latchExit
|
|
; EPILOG: latchExit:
|
|
; EPILOG-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i32 %result
|
|
; EPILOG: for.exit2.loopexit:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2.loopexit5:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2:
|
|
; EPILOG-NEXT: ret i32 42
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @hdr_latch_same_exit(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block
|
|
; EPILOG-BLOCK: for.exiting_block:
|
|
; EPILOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-BLOCK-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-BLOCK-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %latchExit.epilog-lcssa.loopexit, label %for.exiting_block.1
|
|
; EPILOG-BLOCK: for.exiting_block.1:
|
|
; EPILOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp eq i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %latchExit.unr-lcssa, label %header, !llvm.loop !4
|
|
; EPILOG-BLOCK: latchExit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %latchExit.epilog-lcssa, label %for.exiting_block.epil
|
|
; EPILOG-BLOCK: for.exiting_block.epil:
|
|
; EPILOG-BLOCK-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.epil, label %for.exit2, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil.init
|
|
; EPILOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.epil = add nsw i32 %5, %sum.02.epil.init
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1.ph = phi i32 [ 0, %header ], [ 0, %latch ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1 = phi i32 [ %add.epil, %latch.epil ], [ 0, %header.epil ], [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit
|
|
; EPILOG-BLOCK: latchExit:
|
|
; EPILOG-BLOCK-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %result
|
|
; EPILOG-BLOCK: for.exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %for.exit2
|
|
; EPILOG-BLOCK: for.exit2:
|
|
; EPILOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-LABEL: @hdr_latch_same_exit(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %indvars.iv.prol = phi i64 [ %indvars.iv.next.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %sum.02.prol = phi i32 [ %add.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit1, label %for.exiting_block.prol
|
|
; PROLOG: for.exiting_block.prol:
|
|
; PROLOG-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.prol, label %for.exit2.loopexit3, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %arrayidx.prol = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.prol
|
|
; PROLOG-NEXT: %2 = load i32, ptr %arrayidx.prol, align 4
|
|
; PROLOG-NEXT: %add.prol = add nsw i32 %2, %sum.02.prol
|
|
; PROLOG-NEXT: %indvars.iv.next.prol = add i64 %indvars.iv.prol, 1
|
|
; PROLOG-NEXT: %exitcond.prol = icmp eq i64 %indvars.iv.next.prol, %n
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !4
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %indvars.iv.unr.ph = phi i64 [ %indvars.iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %sum.02.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %result.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ %indvars.iv.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %sum.02.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; PROLOG-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block
|
|
; PROLOG: for.exiting_block:
|
|
; PROLOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.1
|
|
; PROLOG: for.exiting_block.1:
|
|
; PROLOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.2
|
|
; PROLOG: for.exiting_block.2:
|
|
; PROLOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.2, label %for.exit2.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; PROLOG-NEXT: %6 = load i32, ptr %arrayidx.2, align 4
|
|
; PROLOG-NEXT: %add.2 = add nsw i32 %6, %add.1
|
|
; PROLOG-NEXT: %indvars.iv.next.2 = add i64 %indvars.iv, 3
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.3
|
|
; PROLOG: for.exiting_block.3:
|
|
; PROLOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.3, label %for.exit2.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; PROLOG-NEXT: %7 = load i32, ptr %arrayidx.3, align 4
|
|
; PROLOG-NEXT: %add.3 = add nsw i32 %7, %add.2
|
|
; PROLOG-NEXT: %indvars.iv.next.3 = add i64 %indvars.iv, 4
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.4
|
|
; PROLOG: for.exiting_block.4:
|
|
; PROLOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.4, label %for.exit2.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; PROLOG-NEXT: %8 = load i32, ptr %arrayidx.4, align 4
|
|
; PROLOG-NEXT: %add.4 = add nsw i32 %8, %add.3
|
|
; PROLOG-NEXT: %indvars.iv.next.4 = add i64 %indvars.iv, 5
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.5
|
|
; PROLOG: for.exiting_block.5:
|
|
; PROLOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.5, label %for.exit2.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; PROLOG-NEXT: %9 = load i32, ptr %arrayidx.5, align 4
|
|
; PROLOG-NEXT: %add.5 = add nsw i32 %9, %add.4
|
|
; PROLOG-NEXT: %indvars.iv.next.5 = add i64 %indvars.iv, 6
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.6
|
|
; PROLOG: for.exiting_block.6:
|
|
; PROLOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.6, label %for.exit2.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; PROLOG-NEXT: %10 = load i32, ptr %arrayidx.6, align 4
|
|
; PROLOG-NEXT: %add.6 = add nsw i32 %10, %add.5
|
|
; PROLOG-NEXT: %indvars.iv.next.6 = add i64 %indvars.iv, 7
|
|
; PROLOG-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.7
|
|
; PROLOG: for.exiting_block.7:
|
|
; PROLOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %for.exit2.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; PROLOG-NEXT: %11 = load i32, ptr %arrayidx.7, align 4
|
|
; PROLOG-NEXT: %add.7 = add nsw i32 %11, %add.6
|
|
; PROLOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; PROLOG-NEXT: %exitcond.7 = icmp eq i64 %indvars.iv.next.7, %n
|
|
; PROLOG-NEXT: br i1 %exitcond.7, label %latchExit.unr-lcssa.loopexit, label %header
|
|
; PROLOG: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: %result.ph.ph = phi i32 [ 0, %header ], [ 0, %latch ], [ 0, %latch.1 ], [ 0, %latch.2 ], [ 0, %latch.3 ], [ 0, %latch.4 ], [ 0, %latch.5 ], [ 0, %latch.6 ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa.loopexit1:
|
|
; PROLOG-NEXT: %result.ph.ph2 = phi i32 [ 0, %header.prol ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.ph = phi i32 [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ], [ %result.ph.ph2, %latchExit.unr-lcssa.loopexit1 ]
|
|
; PROLOG-NEXT: br label %latchExit
|
|
; PROLOG: latchExit:
|
|
; PROLOG-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i32 %result
|
|
; PROLOG: for.exit2.loopexit:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2.loopexit3:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2:
|
|
; PROLOG-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @hdr_latch_same_exit(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %latchExit.unr-lcssa, label %for.exiting_block.prol
|
|
; PROLOG-BLOCK: for.exiting_block.prol:
|
|
; PROLOG-BLOCK-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.prol, label %for.exit2, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: %2 = load i32, ptr %a, align 4
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block
|
|
; PROLOG-BLOCK: for.exiting_block:
|
|
; PROLOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-BLOCK-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %latchExit.unr-lcssa.loopexit, label %for.exiting_block.1
|
|
; PROLOG-BLOCK: for.exiting_block.1:
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-BLOCK-NEXT: %exitcond.1 = icmp eq i64 %indvars.iv.next.1, %n
|
|
; PROLOG-BLOCK-NEXT: br i1 %exitcond.1, label %latchExit.unr-lcssa.loopexit, label %header, !llvm.loop !4
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.ph.ph = phi i32 [ 0, %header ], [ 0, %latch ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %result.ph = phi i32 [ 0, %header.prol ], [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit
|
|
; PROLOG-BLOCK: latchExit:
|
|
; PROLOG-BLOCK-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %result
|
|
; PROLOG-BLOCK: for.exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %for.exit2
|
|
; PROLOG-BLOCK: for.exit2:
|
|
; PROLOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
header:
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %latch ], [ 0, %entry ]
|
|
%sum.02 = phi i32 [ %add, %latch ], [ 0, %entry ]
|
|
br i1 %cond, label %latchExit, label %for.exiting_block
|
|
|
|
for.exiting_block:
|
|
%cmp = icmp eq i64 %n, 42
|
|
br i1 %cmp, label %for.exit2, label %latch
|
|
|
|
latch: ; preds = %latch, %entry
|
|
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
%0 = load i32, ptr %arrayidx, align 4
|
|
%add = add nsw i32 %0, %sum.02
|
|
%indvars.iv.next = add i64 %indvars.iv, 1
|
|
%exitcond = icmp eq i64 %indvars.iv.next, %n
|
|
br i1 %exitcond, label %latchExit, label %header
|
|
|
|
latchExit: ; preds = %latch, %entry
|
|
%result = phi i32 [ 0, %header ], [ %add, %latch ]
|
|
ret i32 %result
|
|
|
|
for.exit2:
|
|
ret i32 42
|
|
}
|
|
|
|
; Two exiting blocks to latch where the exiting blocks are Latch and a
|
|
; non-header
|
|
; FIXME: We should unroll this loop.
|
|
define i32 @otherblock_latch_same_exit(ptr nocapture %a, i64 %n, i1 %cond) {
|
|
; EPILOG-LABEL: @otherblock_latch_same_exit(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG: for.exiting_block:
|
|
; EPILOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp, label %latchExit.epilog-lcssa.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG: for.exiting_block.1:
|
|
; EPILOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.1, label %latchExit.epilog-lcssa.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-NEXT: %indvars.iv.next.1 = add nuw nsw i64 %indvars.iv, 2
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; EPILOG: for.exiting_block.2:
|
|
; EPILOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.2, label %latchExit.epilog-lcssa.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; EPILOG-NEXT: %5 = load i32, ptr %arrayidx.2, align 4
|
|
; EPILOG-NEXT: %add.2 = add nsw i32 %5, %add.1
|
|
; EPILOG-NEXT: %indvars.iv.next.2 = add nuw nsw i64 %indvars.iv, 3
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; EPILOG: for.exiting_block.3:
|
|
; EPILOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.3, label %latchExit.epilog-lcssa.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; EPILOG-NEXT: %6 = load i32, ptr %arrayidx.3, align 4
|
|
; EPILOG-NEXT: %add.3 = add nsw i32 %6, %add.2
|
|
; EPILOG-NEXT: %indvars.iv.next.3 = add nuw nsw i64 %indvars.iv, 4
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; EPILOG: for.exiting_block.4:
|
|
; EPILOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.4, label %latchExit.epilog-lcssa.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; EPILOG-NEXT: %7 = load i32, ptr %arrayidx.4, align 4
|
|
; EPILOG-NEXT: %add.4 = add nsw i32 %7, %add.3
|
|
; EPILOG-NEXT: %indvars.iv.next.4 = add nuw nsw i64 %indvars.iv, 5
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; EPILOG: for.exiting_block.5:
|
|
; EPILOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.5, label %latchExit.epilog-lcssa.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; EPILOG-NEXT: %8 = load i32, ptr %arrayidx.5, align 4
|
|
; EPILOG-NEXT: %add.5 = add nsw i32 %8, %add.4
|
|
; EPILOG-NEXT: %indvars.iv.next.5 = add nuw nsw i64 %indvars.iv, 6
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; EPILOG: for.exiting_block.6:
|
|
; EPILOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.6, label %latchExit.epilog-lcssa.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; EPILOG-NEXT: %9 = load i32, ptr %arrayidx.6, align 4
|
|
; EPILOG-NEXT: %add.6 = add nsw i32 %9, %add.5
|
|
; EPILOG-NEXT: %indvars.iv.next.6 = add nuw nsw i64 %indvars.iv, 7
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; EPILOG: for.exiting_block.7:
|
|
; EPILOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.7, label %latchExit.epilog-lcssa.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; EPILOG-NEXT: %10 = load i32, ptr %arrayidx.7, align 4
|
|
; EPILOG-NEXT: %add.7 = add nsw i32 %10, %add.6
|
|
; EPILOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp eq i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %latchExit.unr-lcssa, label %header
|
|
; EPILOG: latchExit.unr-lcssa:
|
|
; EPILOG-NEXT: %result.ph = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02.unr = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %indvars.iv.epil = phi i64 [ %indvars.iv.next.epil, %latch.epil ], [ %indvars.iv.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %sum.02.epil = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit3, label %for.exiting_block.epil
|
|
; EPILOG: for.exiting_block.epil:
|
|
; EPILOG-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.epil, label %latchExit.epilog-lcssa.loopexit4, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil
|
|
; EPILOG-NEXT: %11 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-NEXT: %add.epil = add nsw i32 %11, %sum.02.epil
|
|
; EPILOG-NEXT: %indvars.iv.next.epil = add i64 %indvars.iv.epil, 1
|
|
; EPILOG-NEXT: %exitcond.epil = icmp eq i64 %indvars.iv.next.epil, %n
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latchExit.epilog-lcssa.loopexit4, !llvm.loop !5
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: %result.ph1.ph = phi i32 [ 2, %for.exiting_block ], [ 2, %for.exiting_block.1 ], [ 2, %for.exiting_block.2 ], [ 2, %for.exiting_block.3 ], [ 2, %for.exiting_block.4 ], [ 2, %for.exiting_block.5 ], [ 2, %for.exiting_block.6 ], [ 2, %for.exiting_block.7 ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit4:
|
|
; EPILOG-NEXT: %result.ph1.ph5 = phi i32 [ 2, %for.exiting_block.epil ], [ %add.epil, %latch.epil ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa:
|
|
; EPILOG-NEXT: %result.ph1 = phi i32 [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ], [ %result.ph1.ph5, %latchExit.epilog-lcssa.loopexit4 ]
|
|
; EPILOG-NEXT: br label %latchExit
|
|
; EPILOG: latchExit:
|
|
; EPILOG-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i32 %result
|
|
; EPILOG: for.exit2.loopexit:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2.loopexit3:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2:
|
|
; EPILOG-NEXT: ret i32 42
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @otherblock_latch_same_exit(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG-BLOCK: for.exiting_block:
|
|
; EPILOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp, label %latchExit.epilog-lcssa.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-BLOCK-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-BLOCK-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG-BLOCK: for.exiting_block.1:
|
|
; EPILOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.1, label %latchExit.epilog-lcssa.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp eq i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %latchExit.unr-lcssa, label %header, !llvm.loop !5
|
|
; EPILOG-BLOCK: latchExit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2, label %for.exiting_block.epil
|
|
; EPILOG-BLOCK: for.exiting_block.epil:
|
|
; EPILOG-BLOCK-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.epil, label %latchExit.epilog-lcssa, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil.init
|
|
; EPILOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.epil = add nsw i32 %5, %sum.02.epil.init
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1.ph = phi i32 [ 2, %for.exiting_block ], [ 2, %for.exiting_block.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1 = phi i32 [ %add.epil, %latch.epil ], [ 2, %for.exiting_block.epil ], [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit
|
|
; EPILOG-BLOCK: latchExit:
|
|
; EPILOG-BLOCK-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %result
|
|
; EPILOG-BLOCK: for.exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %for.exit2
|
|
; EPILOG-BLOCK: for.exit2:
|
|
; EPILOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-LABEL: @otherblock_latch_same_exit(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %indvars.iv.prol = phi i64 [ %indvars.iv.next.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %sum.02.prol = phi i32 [ %add.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit1, label %for.exiting_block.prol
|
|
; PROLOG: for.exiting_block.prol:
|
|
; PROLOG-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.prol, label %latchExit.unr-lcssa.loopexit2, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %arrayidx.prol = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.prol
|
|
; PROLOG-NEXT: %2 = load i32, ptr %arrayidx.prol, align 4
|
|
; PROLOG-NEXT: %add.prol = add nsw i32 %2, %sum.02.prol
|
|
; PROLOG-NEXT: %indvars.iv.next.prol = add i64 %indvars.iv.prol, 1
|
|
; PROLOG-NEXT: %exitcond.prol = icmp eq i64 %indvars.iv.next.prol, %n
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !5
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %indvars.iv.unr.ph = phi i64 [ %indvars.iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %sum.02.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %result.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ %indvars.iv.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %sum.02.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; PROLOG-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG: for.exiting_block:
|
|
; PROLOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp, label %latchExit.unr-lcssa.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG: for.exiting_block.1:
|
|
; PROLOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.1, label %latchExit.unr-lcssa.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; PROLOG: for.exiting_block.2:
|
|
; PROLOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.2, label %latchExit.unr-lcssa.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; PROLOG-NEXT: %6 = load i32, ptr %arrayidx.2, align 4
|
|
; PROLOG-NEXT: %add.2 = add nsw i32 %6, %add.1
|
|
; PROLOG-NEXT: %indvars.iv.next.2 = add i64 %indvars.iv, 3
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; PROLOG: for.exiting_block.3:
|
|
; PROLOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.3, label %latchExit.unr-lcssa.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; PROLOG-NEXT: %7 = load i32, ptr %arrayidx.3, align 4
|
|
; PROLOG-NEXT: %add.3 = add nsw i32 %7, %add.2
|
|
; PROLOG-NEXT: %indvars.iv.next.3 = add i64 %indvars.iv, 4
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; PROLOG: for.exiting_block.4:
|
|
; PROLOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.4, label %latchExit.unr-lcssa.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; PROLOG-NEXT: %8 = load i32, ptr %arrayidx.4, align 4
|
|
; PROLOG-NEXT: %add.4 = add nsw i32 %8, %add.3
|
|
; PROLOG-NEXT: %indvars.iv.next.4 = add i64 %indvars.iv, 5
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; PROLOG: for.exiting_block.5:
|
|
; PROLOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.5, label %latchExit.unr-lcssa.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; PROLOG-NEXT: %9 = load i32, ptr %arrayidx.5, align 4
|
|
; PROLOG-NEXT: %add.5 = add nsw i32 %9, %add.4
|
|
; PROLOG-NEXT: %indvars.iv.next.5 = add i64 %indvars.iv, 6
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; PROLOG: for.exiting_block.6:
|
|
; PROLOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.6, label %latchExit.unr-lcssa.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; PROLOG-NEXT: %10 = load i32, ptr %arrayidx.6, align 4
|
|
; PROLOG-NEXT: %add.6 = add nsw i32 %10, %add.5
|
|
; PROLOG-NEXT: %indvars.iv.next.6 = add i64 %indvars.iv, 7
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; PROLOG: for.exiting_block.7:
|
|
; PROLOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %latchExit.unr-lcssa.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; PROLOG-NEXT: %11 = load i32, ptr %arrayidx.7, align 4
|
|
; PROLOG-NEXT: %add.7 = add nsw i32 %11, %add.6
|
|
; PROLOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; PROLOG-NEXT: %exitcond.7 = icmp eq i64 %indvars.iv.next.7, %n
|
|
; PROLOG-NEXT: br i1 %exitcond.7, label %latchExit.unr-lcssa.loopexit, label %header
|
|
; PROLOG: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: %result.ph.ph = phi i32 [ 2, %for.exiting_block ], [ 2, %for.exiting_block.1 ], [ 2, %for.exiting_block.2 ], [ 2, %for.exiting_block.3 ], [ 2, %for.exiting_block.4 ], [ 2, %for.exiting_block.5 ], [ 2, %for.exiting_block.6 ], [ 2, %for.exiting_block.7 ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa.loopexit2:
|
|
; PROLOG-NEXT: %result.ph.ph3 = phi i32 [ 2, %for.exiting_block.prol ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.ph = phi i32 [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ], [ %result.ph.ph3, %latchExit.unr-lcssa.loopexit2 ]
|
|
; PROLOG-NEXT: br label %latchExit
|
|
; PROLOG: latchExit:
|
|
; PROLOG-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i32 %result
|
|
; PROLOG: for.exit2.loopexit:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2.loopexit1:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2:
|
|
; PROLOG-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @otherblock_latch_same_exit(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2, label %for.exiting_block.prol
|
|
; PROLOG-BLOCK: for.exiting_block.prol:
|
|
; PROLOG-BLOCK-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.prol, label %latchExit.unr-lcssa, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: %2 = load i32, ptr %a, align 4
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG-BLOCK: for.exiting_block:
|
|
; PROLOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp, label %latchExit.unr-lcssa.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-BLOCK-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG-BLOCK: for.exiting_block.1:
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %latchExit.unr-lcssa.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-BLOCK-NEXT: %exitcond.1 = icmp eq i64 %indvars.iv.next.1, %n
|
|
; PROLOG-BLOCK-NEXT: br i1 %exitcond.1, label %latchExit.unr-lcssa.loopexit, label %header, !llvm.loop !5
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.ph.ph = phi i32 [ 2, %for.exiting_block ], [ 2, %for.exiting_block.1 ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %result.ph = phi i32 [ 2, %for.exiting_block.prol ], [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit
|
|
; PROLOG-BLOCK: latchExit:
|
|
; PROLOG-BLOCK-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %result
|
|
; PROLOG-BLOCK: for.exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %for.exit2
|
|
; PROLOG-BLOCK: for.exit2:
|
|
; PROLOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
header:
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %latch ], [ 0, %entry ]
|
|
%sum.02 = phi i32 [ %add, %latch ], [ 0, %entry ]
|
|
br i1 %cond, label %for.exit2, label %for.exiting_block
|
|
|
|
for.exiting_block:
|
|
%cmp = icmp eq i64 %n, 42
|
|
br i1 %cmp, label %latchExit, label %latch
|
|
|
|
latch: ; preds = %latch, %entry
|
|
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
%0 = load i32, ptr %arrayidx, align 4
|
|
%add = add nsw i32 %0, %sum.02
|
|
%indvars.iv.next = add i64 %indvars.iv, 1
|
|
%exitcond = icmp eq i64 %indvars.iv.next, %n
|
|
br i1 %exitcond, label %latchExit, label %header
|
|
|
|
latchExit: ; preds = %latch, %entry
|
|
%result = phi i32 [ 2, %for.exiting_block ], [ %add, %latch ]
|
|
ret i32 %result
|
|
|
|
for.exit2:
|
|
ret i32 42
|
|
}
|
|
|
|
; Two exiting blocks to latch where the exiting blocks are Latch and a
|
|
; non-header
|
|
; Same as above test except the incoming value for latch Phi is from the header
|
|
; FIXME: We should be able to runtime unroll.
|
|
define i32 @otherblock_latch_same_exit2(ptr nocapture %a, i64 %n, i1 %cond) {
|
|
; EPILOG-LABEL: @otherblock_latch_same_exit2(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG: for.exiting_block:
|
|
; EPILOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp, label %latchExit.epilog-lcssa.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG: for.exiting_block.1:
|
|
; EPILOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.1, label %latchExit.epilog-lcssa.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-NEXT: %indvars.iv.next.1 = add nuw nsw i64 %indvars.iv, 2
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; EPILOG: for.exiting_block.2:
|
|
; EPILOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.2, label %latchExit.epilog-lcssa.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; EPILOG-NEXT: %5 = load i32, ptr %arrayidx.2, align 4
|
|
; EPILOG-NEXT: %add.2 = add nsw i32 %5, %add.1
|
|
; EPILOG-NEXT: %indvars.iv.next.2 = add nuw nsw i64 %indvars.iv, 3
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; EPILOG: for.exiting_block.3:
|
|
; EPILOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.3, label %latchExit.epilog-lcssa.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; EPILOG-NEXT: %6 = load i32, ptr %arrayidx.3, align 4
|
|
; EPILOG-NEXT: %add.3 = add nsw i32 %6, %add.2
|
|
; EPILOG-NEXT: %indvars.iv.next.3 = add nuw nsw i64 %indvars.iv, 4
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; EPILOG: for.exiting_block.4:
|
|
; EPILOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.4, label %latchExit.epilog-lcssa.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; EPILOG-NEXT: %7 = load i32, ptr %arrayidx.4, align 4
|
|
; EPILOG-NEXT: %add.4 = add nsw i32 %7, %add.3
|
|
; EPILOG-NEXT: %indvars.iv.next.4 = add nuw nsw i64 %indvars.iv, 5
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; EPILOG: for.exiting_block.5:
|
|
; EPILOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.5, label %latchExit.epilog-lcssa.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; EPILOG-NEXT: %8 = load i32, ptr %arrayidx.5, align 4
|
|
; EPILOG-NEXT: %add.5 = add nsw i32 %8, %add.4
|
|
; EPILOG-NEXT: %indvars.iv.next.5 = add nuw nsw i64 %indvars.iv, 6
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; EPILOG: for.exiting_block.6:
|
|
; EPILOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.6, label %latchExit.epilog-lcssa.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; EPILOG-NEXT: %9 = load i32, ptr %arrayidx.6, align 4
|
|
; EPILOG-NEXT: %add.6 = add nsw i32 %9, %add.5
|
|
; EPILOG-NEXT: %indvars.iv.next.6 = add nuw nsw i64 %indvars.iv, 7
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; EPILOG: for.exiting_block.7:
|
|
; EPILOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.7, label %latchExit.epilog-lcssa.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; EPILOG-NEXT: %10 = load i32, ptr %arrayidx.7, align 4
|
|
; EPILOG-NEXT: %add.7 = add nsw i32 %10, %add.6
|
|
; EPILOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp eq i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %latchExit.unr-lcssa, label %header
|
|
; EPILOG: latchExit.unr-lcssa:
|
|
; EPILOG-NEXT: %result.ph = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02.unr = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %indvars.iv.epil = phi i64 [ %indvars.iv.next.epil, %latch.epil ], [ %indvars.iv.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %sum.02.epil = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit3, label %for.exiting_block.epil
|
|
; EPILOG: for.exiting_block.epil:
|
|
; EPILOG-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.epil, label %latchExit.epilog-lcssa.loopexit4, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil
|
|
; EPILOG-NEXT: %11 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-NEXT: %add.epil = add nsw i32 %11, %sum.02.epil
|
|
; EPILOG-NEXT: %indvars.iv.next.epil = add i64 %indvars.iv.epil, 1
|
|
; EPILOG-NEXT: %exitcond.epil = icmp eq i64 %indvars.iv.next.epil, %n
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latchExit.epilog-lcssa.loopexit4, !llvm.loop !6
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: %result.ph1.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ], [ %add.1, %for.exiting_block.2 ], [ %add.2, %for.exiting_block.3 ], [ %add.3, %for.exiting_block.4 ], [ %add.4, %for.exiting_block.5 ], [ %add.5, %for.exiting_block.6 ], [ %add.6, %for.exiting_block.7 ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit4:
|
|
; EPILOG-NEXT: %result.ph1.ph5 = phi i32 [ %sum.02.epil, %for.exiting_block.epil ], [ %add.epil, %latch.epil ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa:
|
|
; EPILOG-NEXT: %result.ph1 = phi i32 [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ], [ %result.ph1.ph5, %latchExit.epilog-lcssa.loopexit4 ]
|
|
; EPILOG-NEXT: br label %latchExit
|
|
; EPILOG: latchExit:
|
|
; EPILOG-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i32 %result
|
|
; EPILOG: for.exit2.loopexit:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2.loopexit3:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2:
|
|
; EPILOG-NEXT: ret i32 42
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @otherblock_latch_same_exit2(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG-BLOCK: for.exiting_block:
|
|
; EPILOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp, label %latchExit.epilog-lcssa.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-BLOCK-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-BLOCK-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG-BLOCK: for.exiting_block.1:
|
|
; EPILOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.1, label %latchExit.epilog-lcssa.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp eq i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %latchExit.unr-lcssa, label %header, !llvm.loop !6
|
|
; EPILOG-BLOCK: latchExit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2, label %for.exiting_block.epil
|
|
; EPILOG-BLOCK: for.exiting_block.epil:
|
|
; EPILOG-BLOCK-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.epil, label %latchExit.epilog-lcssa, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil.init
|
|
; EPILOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.epil = add nsw i32 %5, %sum.02.epil.init
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1 = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %for.exiting_block.epil ], [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit
|
|
; EPILOG-BLOCK: latchExit:
|
|
; EPILOG-BLOCK-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %result
|
|
; EPILOG-BLOCK: for.exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %for.exit2
|
|
; EPILOG-BLOCK: for.exit2:
|
|
; EPILOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-LABEL: @otherblock_latch_same_exit2(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %indvars.iv.prol = phi i64 [ %indvars.iv.next.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %sum.02.prol = phi i32 [ %add.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit1, label %for.exiting_block.prol
|
|
; PROLOG: for.exiting_block.prol:
|
|
; PROLOG-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.prol, label %latchExit.unr-lcssa.loopexit2, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %arrayidx.prol = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.prol
|
|
; PROLOG-NEXT: %2 = load i32, ptr %arrayidx.prol, align 4
|
|
; PROLOG-NEXT: %add.prol = add nsw i32 %2, %sum.02.prol
|
|
; PROLOG-NEXT: %indvars.iv.next.prol = add i64 %indvars.iv.prol, 1
|
|
; PROLOG-NEXT: %exitcond.prol = icmp eq i64 %indvars.iv.next.prol, %n
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !6
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %indvars.iv.unr.ph = phi i64 [ %indvars.iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %sum.02.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %result.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ %indvars.iv.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %sum.02.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; PROLOG-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG: for.exiting_block:
|
|
; PROLOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp, label %latchExit.unr-lcssa.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG: for.exiting_block.1:
|
|
; PROLOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.1, label %latchExit.unr-lcssa.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; PROLOG: for.exiting_block.2:
|
|
; PROLOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.2, label %latchExit.unr-lcssa.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; PROLOG-NEXT: %6 = load i32, ptr %arrayidx.2, align 4
|
|
; PROLOG-NEXT: %add.2 = add nsw i32 %6, %add.1
|
|
; PROLOG-NEXT: %indvars.iv.next.2 = add i64 %indvars.iv, 3
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; PROLOG: for.exiting_block.3:
|
|
; PROLOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.3, label %latchExit.unr-lcssa.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; PROLOG-NEXT: %7 = load i32, ptr %arrayidx.3, align 4
|
|
; PROLOG-NEXT: %add.3 = add nsw i32 %7, %add.2
|
|
; PROLOG-NEXT: %indvars.iv.next.3 = add i64 %indvars.iv, 4
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; PROLOG: for.exiting_block.4:
|
|
; PROLOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.4, label %latchExit.unr-lcssa.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; PROLOG-NEXT: %8 = load i32, ptr %arrayidx.4, align 4
|
|
; PROLOG-NEXT: %add.4 = add nsw i32 %8, %add.3
|
|
; PROLOG-NEXT: %indvars.iv.next.4 = add i64 %indvars.iv, 5
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; PROLOG: for.exiting_block.5:
|
|
; PROLOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.5, label %latchExit.unr-lcssa.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; PROLOG-NEXT: %9 = load i32, ptr %arrayidx.5, align 4
|
|
; PROLOG-NEXT: %add.5 = add nsw i32 %9, %add.4
|
|
; PROLOG-NEXT: %indvars.iv.next.5 = add i64 %indvars.iv, 6
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; PROLOG: for.exiting_block.6:
|
|
; PROLOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.6, label %latchExit.unr-lcssa.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; PROLOG-NEXT: %10 = load i32, ptr %arrayidx.6, align 4
|
|
; PROLOG-NEXT: %add.6 = add nsw i32 %10, %add.5
|
|
; PROLOG-NEXT: %indvars.iv.next.6 = add i64 %indvars.iv, 7
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; PROLOG: for.exiting_block.7:
|
|
; PROLOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %latchExit.unr-lcssa.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; PROLOG-NEXT: %11 = load i32, ptr %arrayidx.7, align 4
|
|
; PROLOG-NEXT: %add.7 = add nsw i32 %11, %add.6
|
|
; PROLOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; PROLOG-NEXT: %exitcond.7 = icmp eq i64 %indvars.iv.next.7, %n
|
|
; PROLOG-NEXT: br i1 %exitcond.7, label %latchExit.unr-lcssa.loopexit, label %header
|
|
; PROLOG: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: %result.ph.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ], [ %add.1, %for.exiting_block.2 ], [ %add.2, %for.exiting_block.3 ], [ %add.3, %for.exiting_block.4 ], [ %add.4, %for.exiting_block.5 ], [ %add.5, %for.exiting_block.6 ], [ %add.6, %for.exiting_block.7 ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa.loopexit2:
|
|
; PROLOG-NEXT: %result.ph.ph3 = phi i32 [ %sum.02.prol, %for.exiting_block.prol ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.ph = phi i32 [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ], [ %result.ph.ph3, %latchExit.unr-lcssa.loopexit2 ]
|
|
; PROLOG-NEXT: br label %latchExit
|
|
; PROLOG: latchExit:
|
|
; PROLOG-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i32 %result
|
|
; PROLOG: for.exit2.loopexit:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2.loopexit1:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2:
|
|
; PROLOG-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @otherblock_latch_same_exit2(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2, label %for.exiting_block.prol
|
|
; PROLOG-BLOCK: for.exiting_block.prol:
|
|
; PROLOG-BLOCK-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.prol, label %latchExit.unr-lcssa, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: %2 = load i32, ptr %a, align 4
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG-BLOCK: for.exiting_block:
|
|
; PROLOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp, label %latchExit.unr-lcssa.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-BLOCK-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG-BLOCK: for.exiting_block.1:
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %latchExit.unr-lcssa.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-BLOCK-NEXT: %exitcond.1 = icmp eq i64 %indvars.iv.next.1, %n
|
|
; PROLOG-BLOCK-NEXT: br i1 %exitcond.1, label %latchExit.unr-lcssa.loopexit, label %header, !llvm.loop !6
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.ph.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %result.ph = phi i32 [ 0, %for.exiting_block.prol ], [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit
|
|
; PROLOG-BLOCK: latchExit:
|
|
; PROLOG-BLOCK-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %result
|
|
; PROLOG-BLOCK: for.exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %for.exit2
|
|
; PROLOG-BLOCK: for.exit2:
|
|
; PROLOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
header:
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %latch ], [ 0, %entry ]
|
|
%sum.02 = phi i32 [ %add, %latch ], [ 0, %entry ]
|
|
br i1 %cond, label %for.exit2, label %for.exiting_block
|
|
|
|
for.exiting_block:
|
|
%cmp = icmp eq i64 %n, 42
|
|
br i1 %cmp, label %latchExit, label %latch
|
|
|
|
latch: ; preds = %latch, %entry
|
|
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
%0 = load i32, ptr %arrayidx, align 4
|
|
%add = add nsw i32 %0, %sum.02
|
|
%indvars.iv.next = add i64 %indvars.iv, 1
|
|
%exitcond = icmp eq i64 %indvars.iv.next, %n
|
|
br i1 %exitcond, label %latchExit, label %header
|
|
|
|
latchExit: ; preds = %latch, %entry
|
|
%result = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %latch ]
|
|
ret i32 %result
|
|
|
|
for.exit2:
|
|
ret i32 42
|
|
}
|
|
|
|
; Two exiting blocks to latch where the exiting blocks are Latch and a
|
|
; non-header
|
|
; Same as above test except the incoming value for cloned latch Phi is from the
|
|
; for.exiting_block.
|
|
; FIXME: We should be able to runtime unroll.
|
|
define i32 @otherblock_latch_same_exit3(ptr nocapture %a, i64 %n, i1 %cond) {
|
|
; EPILOG-LABEL: @otherblock_latch_same_exit3(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG: for.exiting_block:
|
|
; EPILOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp, label %latchExit.epilog-lcssa.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG: for.exiting_block.1:
|
|
; EPILOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.1, label %latchExit.epilog-lcssa.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: %indvars.iv.next.1 = add nuw nsw i64 %indvars.iv, 2
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; EPILOG: for.exiting_block.2:
|
|
; EPILOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; EPILOG-NEXT: %5 = load i32, ptr %arrayidx.2, align 4
|
|
; EPILOG-NEXT: %add.2 = add nsw i32 %5, %add.1
|
|
; EPILOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.2, label %latchExit.epilog-lcssa.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: %indvars.iv.next.2 = add nuw nsw i64 %indvars.iv, 3
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; EPILOG: for.exiting_block.3:
|
|
; EPILOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; EPILOG-NEXT: %6 = load i32, ptr %arrayidx.3, align 4
|
|
; EPILOG-NEXT: %add.3 = add nsw i32 %6, %add.2
|
|
; EPILOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.3, label %latchExit.epilog-lcssa.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: %indvars.iv.next.3 = add nuw nsw i64 %indvars.iv, 4
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; EPILOG: for.exiting_block.4:
|
|
; EPILOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; EPILOG-NEXT: %7 = load i32, ptr %arrayidx.4, align 4
|
|
; EPILOG-NEXT: %add.4 = add nsw i32 %7, %add.3
|
|
; EPILOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.4, label %latchExit.epilog-lcssa.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: %indvars.iv.next.4 = add nuw nsw i64 %indvars.iv, 5
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; EPILOG: for.exiting_block.5:
|
|
; EPILOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; EPILOG-NEXT: %8 = load i32, ptr %arrayidx.5, align 4
|
|
; EPILOG-NEXT: %add.5 = add nsw i32 %8, %add.4
|
|
; EPILOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.5, label %latchExit.epilog-lcssa.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: %indvars.iv.next.5 = add nuw nsw i64 %indvars.iv, 6
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; EPILOG: for.exiting_block.6:
|
|
; EPILOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; EPILOG-NEXT: %9 = load i32, ptr %arrayidx.6, align 4
|
|
; EPILOG-NEXT: %add.6 = add nsw i32 %9, %add.5
|
|
; EPILOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.6, label %latchExit.epilog-lcssa.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %indvars.iv.next.6 = add nuw nsw i64 %indvars.iv, 7
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; EPILOG: for.exiting_block.7:
|
|
; EPILOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; EPILOG-NEXT: %10 = load i32, ptr %arrayidx.7, align 4
|
|
; EPILOG-NEXT: %add.7 = add nsw i32 %10, %add.6
|
|
; EPILOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.7, label %latchExit.epilog-lcssa.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp eq i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %latchExit.unr-lcssa, label %header
|
|
; EPILOG: latchExit.unr-lcssa:
|
|
; EPILOG-NEXT: %result.ph = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02.unr = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %indvars.iv.epil = phi i64 [ %indvars.iv.next.epil, %latch.epil ], [ %indvars.iv.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %sum.02.epil = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: br i1 %cond, label %for.exit2.loopexit3, label %for.exiting_block.epil
|
|
; EPILOG: for.exiting_block.epil:
|
|
; EPILOG-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil
|
|
; EPILOG-NEXT: %11 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-NEXT: %add.epil = add nsw i32 %11, %sum.02.epil
|
|
; EPILOG-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.epil, label %latchExit.epilog-lcssa.loopexit4, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %indvars.iv.next.epil = add i64 %indvars.iv.epil, 1
|
|
; EPILOG-NEXT: %exitcond.epil = icmp eq i64 %indvars.iv.next.epil, %n
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latchExit.epilog-lcssa.loopexit4, !llvm.loop !7
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: %result.ph1.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ], [ %add.1, %for.exiting_block.2 ], [ %add.2, %for.exiting_block.3 ], [ %add.3, %for.exiting_block.4 ], [ %add.4, %for.exiting_block.5 ], [ %add.5, %for.exiting_block.6 ], [ %add.6, %for.exiting_block.7 ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit4:
|
|
; EPILOG-NEXT: %result.ph1.ph5 = phi i32 [ %sum.02.epil, %for.exiting_block.epil ], [ %add.epil, %latch.epil ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa:
|
|
; EPILOG-NEXT: %result.ph1 = phi i32 [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ], [ %result.ph1.ph5, %latchExit.epilog-lcssa.loopexit4 ]
|
|
; EPILOG-NEXT: br label %latchExit
|
|
; EPILOG: latchExit:
|
|
; EPILOG-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i32 %result
|
|
; EPILOG: for.exit2.loopexit:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2.loopexit3:
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2:
|
|
; EPILOG-NEXT: ret i32 42
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @otherblock_latch_same_exit3(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG-BLOCK: for.exiting_block:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-BLOCK-NEXT: %3 = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-BLOCK-NEXT: %add = add nsw i32 %3, %sum.02
|
|
; EPILOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp, label %latchExit.epilog-lcssa.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG-BLOCK: for.exiting_block.1:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nsw i32 %4, %add
|
|
; EPILOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.1, label %latchExit.epilog-lcssa.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp eq i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %latchExit.unr-lcssa, label %header, !llvm.loop !7
|
|
; EPILOG-BLOCK: latchExit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %for.exit2, label %for.exiting_block.epil
|
|
; EPILOG-BLOCK: for.exiting_block.epil:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil.init
|
|
; EPILOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.epil = add nsw i32 %5, %sum.02.epil.init
|
|
; EPILOG-BLOCK-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.epil, label %latchExit.epilog-lcssa, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %result.ph1 = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %for.exiting_block.epil ], [ %result.ph1.ph, %latchExit.epilog-lcssa.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit
|
|
; EPILOG-BLOCK: latchExit:
|
|
; EPILOG-BLOCK-NEXT: %result = phi i32 [ %result.ph, %latchExit.unr-lcssa ], [ %result.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %result
|
|
; EPILOG-BLOCK: for.exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %for.exit2
|
|
; EPILOG-BLOCK: for.exit2:
|
|
; EPILOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-LABEL: @otherblock_latch_same_exit3(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %indvars.iv.prol = phi i64 [ %indvars.iv.next.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %sum.02.prol = phi i32 [ %add.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit1, label %for.exiting_block.prol
|
|
; PROLOG: for.exiting_block.prol:
|
|
; PROLOG-NEXT: %arrayidx.prol = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.prol
|
|
; PROLOG-NEXT: %2 = load i32, ptr %arrayidx.prol, align 4
|
|
; PROLOG-NEXT: %add.prol = add nsw i32 %2, %sum.02.prol
|
|
; PROLOG-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.prol, label %latchExit.unr-lcssa.loopexit2, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %indvars.iv.next.prol = add i64 %indvars.iv.prol, 1
|
|
; PROLOG-NEXT: %exitcond.prol = icmp eq i64 %indvars.iv.next.prol, %n
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !7
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %indvars.iv.unr.ph = phi i64 [ %indvars.iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %sum.02.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %result.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ %indvars.iv.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %sum.02.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; PROLOG-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG: for.exiting_block:
|
|
; PROLOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp, label %latchExit.unr-lcssa.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG: for.exiting_block.1:
|
|
; PROLOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.1, label %latchExit.unr-lcssa.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; PROLOG: for.exiting_block.2:
|
|
; PROLOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; PROLOG-NEXT: %6 = load i32, ptr %arrayidx.2, align 4
|
|
; PROLOG-NEXT: %add.2 = add nsw i32 %6, %add.1
|
|
; PROLOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.2, label %latchExit.unr-lcssa.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: %indvars.iv.next.2 = add i64 %indvars.iv, 3
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; PROLOG: for.exiting_block.3:
|
|
; PROLOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; PROLOG-NEXT: %7 = load i32, ptr %arrayidx.3, align 4
|
|
; PROLOG-NEXT: %add.3 = add nsw i32 %7, %add.2
|
|
; PROLOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.3, label %latchExit.unr-lcssa.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: %indvars.iv.next.3 = add i64 %indvars.iv, 4
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; PROLOG: for.exiting_block.4:
|
|
; PROLOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; PROLOG-NEXT: %8 = load i32, ptr %arrayidx.4, align 4
|
|
; PROLOG-NEXT: %add.4 = add nsw i32 %8, %add.3
|
|
; PROLOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.4, label %latchExit.unr-lcssa.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: %indvars.iv.next.4 = add i64 %indvars.iv, 5
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; PROLOG: for.exiting_block.5:
|
|
; PROLOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; PROLOG-NEXT: %9 = load i32, ptr %arrayidx.5, align 4
|
|
; PROLOG-NEXT: %add.5 = add nsw i32 %9, %add.4
|
|
; PROLOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.5, label %latchExit.unr-lcssa.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: %indvars.iv.next.5 = add i64 %indvars.iv, 6
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; PROLOG: for.exiting_block.6:
|
|
; PROLOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; PROLOG-NEXT: %10 = load i32, ptr %arrayidx.6, align 4
|
|
; PROLOG-NEXT: %add.6 = add nsw i32 %10, %add.5
|
|
; PROLOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.6, label %latchExit.unr-lcssa.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %indvars.iv.next.6 = add i64 %indvars.iv, 7
|
|
; PROLOG-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; PROLOG: for.exiting_block.7:
|
|
; PROLOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; PROLOG-NEXT: %11 = load i32, ptr %arrayidx.7, align 4
|
|
; PROLOG-NEXT: %add.7 = add nsw i32 %11, %add.6
|
|
; PROLOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %latchExit.unr-lcssa.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; PROLOG-NEXT: %exitcond.7 = icmp eq i64 %indvars.iv.next.7, %n
|
|
; PROLOG-NEXT: br i1 %exitcond.7, label %latchExit.unr-lcssa.loopexit, label %header
|
|
; PROLOG: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: %result.ph.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ], [ %add.1, %for.exiting_block.2 ], [ %add.2, %for.exiting_block.3 ], [ %add.3, %for.exiting_block.4 ], [ %add.4, %for.exiting_block.5 ], [ %add.5, %for.exiting_block.6 ], [ %add.6, %for.exiting_block.7 ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa.loopexit2:
|
|
; PROLOG-NEXT: %result.ph.ph3 = phi i32 [ %sum.02.prol, %for.exiting_block.prol ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa:
|
|
; PROLOG-NEXT: %result.ph = phi i32 [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ], [ %result.ph.ph3, %latchExit.unr-lcssa.loopexit2 ]
|
|
; PROLOG-NEXT: br label %latchExit
|
|
; PROLOG: latchExit:
|
|
; PROLOG-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i32 %result
|
|
; PROLOG: for.exit2.loopexit:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2.loopexit1:
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2:
|
|
; PROLOG-NEXT: ret i32 42
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @otherblock_latch_same_exit3(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2, label %for.exiting_block.prol
|
|
; PROLOG-BLOCK: for.exiting_block.prol:
|
|
; PROLOG-BLOCK-NEXT: %2 = load i32, ptr %a, align 4
|
|
; PROLOG-BLOCK-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.prol, label %latchExit.unr-lcssa, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.unr = phi i32 [ poison, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %latchExit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG-BLOCK: for.exiting_block:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-BLOCK-NEXT: %4 = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-BLOCK-NEXT: %add = add nsw i32 %4, %sum.02
|
|
; PROLOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp, label %latchExit.unr-lcssa.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG-BLOCK: for.exiting_block.1:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-BLOCK-NEXT: %5 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nsw i32 %5, %add
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %latchExit.unr-lcssa.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-BLOCK-NEXT: %exitcond.1 = icmp eq i64 %indvars.iv.next.1, %n
|
|
; PROLOG-BLOCK-NEXT: br i1 %exitcond.1, label %latchExit.unr-lcssa.loopexit, label %header, !llvm.loop !7
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.ph.ph = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %for.exiting_block.1 ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %result.ph = phi i32 [ 0, %for.exiting_block.prol ], [ %result.ph.ph, %latchExit.unr-lcssa.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit
|
|
; PROLOG-BLOCK: latchExit:
|
|
; PROLOG-BLOCK-NEXT: %result = phi i32 [ %result.unr, %header.prol.loopexit ], [ %result.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %result
|
|
; PROLOG-BLOCK: for.exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %for.exit2
|
|
; PROLOG-BLOCK: for.exit2:
|
|
; PROLOG-BLOCK-NEXT: ret i32 42
|
|
;
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
header:
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %latch ], [ 0, %entry ]
|
|
%sum.02 = phi i32 [ %add, %latch ], [ 0, %entry ]
|
|
br i1 %cond, label %for.exit2, label %for.exiting_block
|
|
|
|
for.exiting_block:
|
|
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
%0 = load i32, ptr %arrayidx, align 4
|
|
%add = add nsw i32 %0, %sum.02
|
|
%cmp = icmp eq i64 %n, 42
|
|
br i1 %cmp, label %latchExit, label %latch
|
|
|
|
latch: ; preds = %latch, %entry
|
|
%indvars.iv.next = add i64 %indvars.iv, 1
|
|
%exitcond = icmp eq i64 %indvars.iv.next, %n
|
|
br i1 %exitcond, label %latchExit, label %header
|
|
|
|
latchExit: ; preds = %latch, %entry
|
|
%result = phi i32 [ %sum.02, %for.exiting_block ], [ %add, %latch ]
|
|
ret i32 %result
|
|
|
|
for.exit2:
|
|
ret i32 42
|
|
}
|
|
|
|
; Show a case where we have multiple exits, but (provably) exit on the
|
|
; first iteration and thus have nothing to unroll
|
|
define void @non_loop(i32 %arg) {
|
|
; CHECK-LABEL: @non_loop(
|
|
; CHECK-NEXT: entry:
|
|
; CHECK-NEXT: %i = icmp sgt i32 undef, %arg
|
|
; CHECK-NEXT: br i1 %i, label %preheader, label %returnblock
|
|
; CHECK: preheader:
|
|
; CHECK-NEXT: br label %header
|
|
; CHECK: header:
|
|
; CHECK-NEXT: br i1 true, label %latchExit, label %latch
|
|
; CHECK: latch:
|
|
; CHECK-NEXT: br label %latchExit
|
|
; CHECK: latchExit:
|
|
; CHECK-NEXT: %i2.ph = phi i32 [ %arg, %header ], [ -1, %latch ]
|
|
; CHECK-NEXT: br label %returnblock
|
|
; CHECK: returnblock:
|
|
; CHECK-NEXT: %i2 = phi i32 [ -1, %entry ], [ %i2.ph, %latchExit ]
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
|
|
entry:
|
|
%i = icmp sgt i32 undef, %arg
|
|
br i1 %i, label %preheader, label %returnblock
|
|
|
|
preheader: ; preds = %entry
|
|
br label %header
|
|
|
|
header: ; preds = %preheader, %latch
|
|
%i4 = phi i32 [ %inc, %latch ], [ %arg, %preheader ]
|
|
%inc = add nsw i32 %i4, 1
|
|
br i1 true, label %latchExit, label %latch
|
|
|
|
latch: ; preds = %header
|
|
%cmp = icmp slt i32 %inc, undef
|
|
br i1 %cmp, label %header, label %latchExit
|
|
|
|
latchExit: ; preds = %header, %latch
|
|
%i2.ph = phi i32 [ %i4, %header ], [ -1, %latch ]
|
|
br label %returnblock
|
|
|
|
returnblock: ; preds = %latchExit, %entry
|
|
%i2 = phi i32 [ -1, %entry ], [ %i2.ph, %latchExit ]
|
|
ret void
|
|
}
|
|
|
|
; Latch exit is shared by all exiting blocks
|
|
define void @unique_exit(i32 %N, i32 %M) {
|
|
; EPILOG-LABEL: @unique_exit(
|
|
; EPILOG-NEXT: preheader:
|
|
; EPILOG-NEXT: %M.shifted = shl i32 %M, 3
|
|
; EPILOG-NEXT: %umax = call i32 @llvm.umax.i32(i32 %M.shifted, i32 1)
|
|
; EPILOG-NEXT: %0 = freeze i32 %umax
|
|
; EPILOG-NEXT: %1 = add i32 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i32 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i32 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %preheader.new
|
|
; EPILOG: preheader.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i32 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %i4 = phi i32 [ 0, %preheader.new ], [ %inc.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i32 [ 0, %preheader.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %inc = add nuw nsw i32 %i4, 1
|
|
; EPILOG-NEXT: %cmp1 = icmp ult i32 %inc, %N
|
|
; EPILOG-NEXT: br i1 %cmp1, label %latch, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: %inc.1 = add nuw nsw i32 %i4, 2
|
|
; EPILOG-NEXT: %cmp1.1 = icmp ult i32 %inc.1, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.1, label %latch.1, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: %inc.2 = add nuw nsw i32 %i4, 3
|
|
; EPILOG-NEXT: %cmp1.2 = icmp ult i32 %inc.2, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.2, label %latch.2, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: %inc.3 = add nuw nsw i32 %i4, 4
|
|
; EPILOG-NEXT: %cmp1.3 = icmp ult i32 %inc.3, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.3, label %latch.3, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: %inc.4 = add nuw nsw i32 %i4, 5
|
|
; EPILOG-NEXT: %cmp1.4 = icmp ult i32 %inc.4, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.4, label %latch.4, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: %inc.5 = add nuw nsw i32 %i4, 6
|
|
; EPILOG-NEXT: %cmp1.5 = icmp ult i32 %inc.5, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.5, label %latch.5, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: %inc.6 = add nuw nsw i32 %i4, 7
|
|
; EPILOG-NEXT: %cmp1.6 = icmp ult i32 %inc.6, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.6, label %latch.6, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %inc.7 = add nuw i32 %i4, 8
|
|
; EPILOG-NEXT: %cmp1.7 = icmp ult i32 %inc.7, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.7, label %latch.7, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %niter.next.7 = add nuw i32 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i32 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %header, label %latchExit.unr-lcssa
|
|
; EPILOG: latchExit.unr-lcssa:
|
|
; EPILOG-NEXT: %i2.ph.ph = phi i32 [ -1, %latch.7 ]
|
|
; EPILOG-NEXT: %i4.unr = phi i32 [ %inc.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %i4.epil.init = phi i32 [ 0, %preheader ], [ %i4.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %i4.epil = phi i32 [ %inc.epil, %latch.epil ], [ %i4.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i32 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: %inc.epil = add nuw i32 %i4.epil, 1
|
|
; EPILOG-NEXT: %cmp1.epil = icmp ult i32 %inc.epil, %N
|
|
; EPILOG-NEXT: br i1 %cmp1.epil, label %latch.epil, label %latchExit.epilog-lcssa.loopexit3
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %cmp.epil = icmp ult i32 %inc.epil, %M.shifted
|
|
; EPILOG-NEXT: %epil.iter.next = add i32 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i32 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latchExit.epilog-lcssa.loopexit3, !llvm.loop !8
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: %i2.ph.ph1.ph = phi i32 [ %i4, %header ], [ %inc, %latch ], [ %inc.1, %latch.1 ], [ %inc.2, %latch.2 ], [ %inc.3, %latch.3 ], [ %inc.4, %latch.4 ], [ %inc.5, %latch.5 ], [ %inc.6, %latch.6 ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa.loopexit3:
|
|
; EPILOG-NEXT: %i2.ph.ph1.ph4 = phi i32 [ %i4.epil, %header.epil ], [ -1, %latch.epil ]
|
|
; EPILOG-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG: latchExit.epilog-lcssa:
|
|
; EPILOG-NEXT: %i2.ph.ph1 = phi i32 [ %i2.ph.ph1.ph, %latchExit.epilog-lcssa.loopexit ], [ %i2.ph.ph1.ph4, %latchExit.epilog-lcssa.loopexit3 ]
|
|
; EPILOG-NEXT: br label %latchExit
|
|
; EPILOG: latchExit:
|
|
; EPILOG-NEXT: %i2.ph = phi i32 [ %i2.ph.ph, %latchExit.unr-lcssa ], [ %i2.ph.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @unique_exit(
|
|
; EPILOG-BLOCK-NEXT: preheader:
|
|
; EPILOG-BLOCK-NEXT: %M.shifted = shl i32 %M, 3
|
|
; EPILOG-BLOCK-NEXT: %umax = call i32 @llvm.umax.i32(i32 %M.shifted, i32 1)
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i32 %umax
|
|
; EPILOG-BLOCK-NEXT: %1 = add i32 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i32 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i32 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %preheader.new
|
|
; EPILOG-BLOCK: preheader.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i32 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %i4 = phi i32 [ 0, %preheader.new ], [ %inc.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i32 [ 0, %preheader.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %inc = add nuw nsw i32 %i4, 1
|
|
; EPILOG-BLOCK-NEXT: %cmp1 = icmp ult i32 %inc, %N
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp1, label %latch, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %inc.1 = add nuw i32 %i4, 2
|
|
; EPILOG-BLOCK-NEXT: %cmp1.1 = icmp ult i32 %inc.1, %N
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp1.1, label %latch.1, label %latchExit.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add nuw i32 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i32 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %header, label %latchExit.unr-lcssa, !llvm.loop !8
|
|
; EPILOG-BLOCK: latchExit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %i2.ph.ph = phi i32 [ -1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %i4.unr = phi i32 [ %inc.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchExit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %i4.epil.init = phi i32 [ 0, %preheader ], [ %i4.unr, %latchExit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: %inc.epil = add nuw i32 %i4.epil.init, 1
|
|
; EPILOG-BLOCK-NEXT: %cmp1.epil = icmp ult i32 %inc.epil, %N
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp1.epil, label %latch.epil, label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %i2.ph.ph1.ph = phi i32 [ %i4, %header ], [ %inc, %latch ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit.epilog-lcssa
|
|
; EPILOG-BLOCK: latchExit.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %i2.ph.ph1 = phi i32 [ -1, %latch.epil ], [ %i4.epil.init, %header.epil ], [ %i2.ph.ph1.ph, %latchExit.epilog-lcssa.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: br label %latchExit
|
|
; EPILOG-BLOCK: latchExit:
|
|
; EPILOG-BLOCK-NEXT: %i2.ph = phi i32 [ %i2.ph.ph, %latchExit.unr-lcssa ], [ %i2.ph.ph1, %latchExit.epilog-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @unique_exit(
|
|
; PROLOG-NEXT: preheader:
|
|
; PROLOG-NEXT: %M.shifted = shl i32 %M, 3
|
|
; PROLOG-NEXT: %umax = call i32 @llvm.umax.i32(i32 %M.shifted, i32 1)
|
|
; PROLOG-NEXT: %0 = freeze i32 %umax
|
|
; PROLOG-NEXT: %1 = add i32 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i32 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %i4.prol = phi i32 [ %inc.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i32 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: %inc.prol = add nuw i32 %i4.prol, 1
|
|
; PROLOG-NEXT: %cmp1.prol = icmp ult i32 %inc.prol, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.prol, label %latch.prol, label %latchExit.unr-lcssa.loopexit1
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %cmp.prol = icmp ult i32 %inc.prol, %M.shifted
|
|
; PROLOG-NEXT: %prol.iter.next = add i32 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i32 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !8
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %i4.unr.ph = phi i32 [ %inc.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %i2.ph.unr.ph = phi i32 [ -1, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %i4.unr = phi i32 [ 0, %preheader ], [ %i4.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %i2.ph.unr = phi i32 [ poison, %preheader ], [ %i2.ph.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i32 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %latchExit, label %preheader.new
|
|
; PROLOG: preheader.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %i4 = phi i32 [ %i4.unr, %preheader.new ], [ %inc.7, %latch.7 ]
|
|
; PROLOG-NEXT: %inc = add nuw i32 %i4, 1
|
|
; PROLOG-NEXT: %cmp1 = icmp ult i32 %inc, %N
|
|
; PROLOG-NEXT: br i1 %cmp1, label %latch, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: %inc.1 = add nuw i32 %i4, 2
|
|
; PROLOG-NEXT: %cmp1.1 = icmp ult i32 %inc.1, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.1, label %latch.1, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: %inc.2 = add nuw i32 %i4, 3
|
|
; PROLOG-NEXT: %cmp1.2 = icmp ult i32 %inc.2, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.2, label %latch.2, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: %inc.3 = add nuw i32 %i4, 4
|
|
; PROLOG-NEXT: %cmp1.3 = icmp ult i32 %inc.3, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.3, label %latch.3, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: %inc.4 = add nuw i32 %i4, 5
|
|
; PROLOG-NEXT: %cmp1.4 = icmp ult i32 %inc.4, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.4, label %latch.4, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: %inc.5 = add nuw i32 %i4, 6
|
|
; PROLOG-NEXT: %cmp1.5 = icmp ult i32 %inc.5, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.5, label %latch.5, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: %inc.6 = add nuw i32 %i4, 7
|
|
; PROLOG-NEXT: %cmp1.6 = icmp ult i32 %inc.6, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.6, label %latch.6, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %inc.7 = add nuw i32 %i4, 8
|
|
; PROLOG-NEXT: %cmp1.7 = icmp ult i32 %inc.7, %N
|
|
; PROLOG-NEXT: br i1 %cmp1.7, label %latch.7, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %cmp.7 = icmp ult i32 %inc.7, %M.shifted
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %header, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: %i2.ph.ph.ph = phi i32 [ %i4, %header ], [ %inc, %latch ], [ %inc.1, %latch.1 ], [ %inc.2, %latch.2 ], [ %inc.3, %latch.3 ], [ %inc.4, %latch.4 ], [ %inc.5, %latch.5 ], [ %inc.6, %latch.6 ], [ -1, %latch.7 ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa.loopexit1:
|
|
; PROLOG-NEXT: %i2.ph.ph.ph2 = phi i32 [ %i4.prol, %header.prol ]
|
|
; PROLOG-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG: latchExit.unr-lcssa:
|
|
; PROLOG-NEXT: %i2.ph.ph = phi i32 [ %i2.ph.ph.ph, %latchExit.unr-lcssa.loopexit ], [ %i2.ph.ph.ph2, %latchExit.unr-lcssa.loopexit1 ]
|
|
; PROLOG-NEXT: br label %latchExit
|
|
; PROLOG: latchExit:
|
|
; PROLOG-NEXT: %i2.ph = phi i32 [ %i2.ph.unr, %header.prol.loopexit ], [ %i2.ph.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @unique_exit(
|
|
; PROLOG-BLOCK-NEXT: preheader:
|
|
; PROLOG-BLOCK-NEXT: %M.shifted = shl i32 %M, 3
|
|
; PROLOG-BLOCK-NEXT: %umax = call i32 @llvm.umax.i32(i32 %M.shifted, i32 1)
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i32 %umax
|
|
; PROLOG-BLOCK-NEXT: %1 = add i32 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i32 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: %cmp1.prol = icmp ult i32 1, %N
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp1.prol, label %latch.prol, label %latchExit.unr-lcssa
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %i4.unr = phi i32 [ 0, %preheader ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %i2.ph.unr = phi i32 [ poison, %preheader ], [ -1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i32 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %latchExit, label %preheader.new
|
|
; PROLOG-BLOCK: preheader.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %i4 = phi i32 [ %i4.unr, %preheader.new ], [ %inc.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %inc = add nuw i32 %i4, 1
|
|
; PROLOG-BLOCK-NEXT: %cmp1 = icmp ult i32 %inc, %N
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp1, label %latch, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %inc.1 = add nuw i32 %i4, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp1.1 = icmp ult i32 %inc.1, %N
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp1.1, label %latch.1, label %latchExit.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ult i32 %inc.1, %M.shifted
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %header, label %latchExit.unr-lcssa.loopexit, !llvm.loop !8
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %i2.ph.ph.ph = phi i32 [ %i4, %header ], [ %inc, %latch ], [ -1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit.unr-lcssa
|
|
; PROLOG-BLOCK: latchExit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %i2.ph.ph = phi i32 [ 0, %header.prol ], [ %i2.ph.ph.ph, %latchExit.unr-lcssa.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchExit
|
|
; PROLOG-BLOCK: latchExit:
|
|
; PROLOG-BLOCK-NEXT: %i2.ph = phi i32 [ %i2.ph.unr, %header.prol.loopexit ], [ %i2.ph.ph, %latchExit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
|
|
preheader:
|
|
%M.shifted = shl nuw i32 %M, 3
|
|
br label %header
|
|
|
|
header: ; preds = %preheader, %latch
|
|
%i4 = phi i32 [ %inc, %latch ], [ 0, %preheader ]
|
|
%inc = add nuw i32 %i4, 1
|
|
%cmp1 = icmp ult i32 %inc, %N
|
|
br i1 %cmp1, label %latch, label %latchExit
|
|
|
|
latch: ; preds = %header
|
|
%cmp = icmp ult i32 %inc, %M.shifted
|
|
br i1 %cmp, label %header, label %latchExit
|
|
|
|
latchExit: ; preds = %header, %latch
|
|
%i2.ph = phi i32 [ %i4, %header ], [ -1, %latch ]
|
|
ret void
|
|
}
|
|
|
|
|
|
; two exiting and two exit blocks.
|
|
; the non-latch exiting block has duplicate edges to the non-latch exit block.
|
|
define i64 @test5(i64 %trip, i64 %add, i1 %cond) {
|
|
; EPILOG-LABEL: @test5(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %sum = phi i64 [ 0, %entry.new ], [ %sum.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting
|
|
; EPILOG: loop_exiting:
|
|
; EPILOG-NEXT: %ivy = add i64 %iv, %add
|
|
; EPILOG-NEXT: switch i64 %sum, label %loop_latch [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-NEXT: %sum.next = add i64 %sum, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting.1
|
|
; EPILOG: loop_exiting.1:
|
|
; EPILOG-NEXT: %ivy.1 = add i64 %iv_next, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; EPILOG-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.2, label %loop_exiting.2
|
|
; EPILOG: loop_exiting.2:
|
|
; EPILOG-NEXT: %ivy.2 = add i64 %iv_next.1, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next.1, label %loop_latch.2 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: %iv_next.2 = add nuw nsw i64 %iv, 3
|
|
; EPILOG-NEXT: %sum.next.2 = add i64 %sum.next.1, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.3, label %loop_exiting.3
|
|
; EPILOG: loop_exiting.3:
|
|
; EPILOG-NEXT: %ivy.3 = add i64 %iv_next.2, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next.2, label %loop_latch.3 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: %iv_next.3 = add nuw nsw i64 %iv, 4
|
|
; EPILOG-NEXT: %sum.next.3 = add i64 %sum.next.2, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.4, label %loop_exiting.4
|
|
; EPILOG: loop_exiting.4:
|
|
; EPILOG-NEXT: %ivy.4 = add i64 %iv_next.3, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next.3, label %loop_latch.4 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: %iv_next.4 = add nuw nsw i64 %iv, 5
|
|
; EPILOG-NEXT: %sum.next.4 = add i64 %sum.next.3, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.5, label %loop_exiting.5
|
|
; EPILOG: loop_exiting.5:
|
|
; EPILOG-NEXT: %ivy.5 = add i64 %iv_next.4, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next.4, label %loop_latch.5 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: %iv_next.5 = add nuw nsw i64 %iv, 6
|
|
; EPILOG-NEXT: %sum.next.5 = add i64 %sum.next.4, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.6, label %loop_exiting.6
|
|
; EPILOG: loop_exiting.6:
|
|
; EPILOG-NEXT: %ivy.6 = add i64 %iv_next.5, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next.5, label %loop_latch.6 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: %iv_next.6 = add nuw nsw i64 %iv, 7
|
|
; EPILOG-NEXT: %sum.next.6 = add i64 %sum.next.5, %add
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.7, label %loop_exiting.7
|
|
; EPILOG: loop_exiting.7:
|
|
; EPILOG-NEXT: %ivy.7 = add i64 %iv_next.6, %add
|
|
; EPILOG-NEXT: switch i64 %sum.next.6, label %loop_latch.7 [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add nuw nsw i64 %iv, 8
|
|
; EPILOG-NEXT: %sum.next.7 = add i64 %sum.next.6, %add
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %latchexit.unr-lcssa
|
|
; EPILOG: exit1.loopexit:
|
|
; EPILOG-NEXT: %result.ph = phi i64 [ %ivy, %loop_exiting ], [ %ivy, %loop_exiting ], [ %ivy.1, %loop_exiting.1 ], [ %ivy.1, %loop_exiting.1 ], [ %ivy.2, %loop_exiting.2 ], [ %ivy.2, %loop_exiting.2 ], [ %ivy.3, %loop_exiting.3 ], [ %ivy.3, %loop_exiting.3 ], [ %ivy.4, %loop_exiting.4 ], [ %ivy.4, %loop_exiting.4 ], [ %ivy.5, %loop_exiting.5 ], [ %ivy.5, %loop_exiting.5 ], [ %ivy.6, %loop_exiting.6 ], [ %ivy.6, %loop_exiting.6 ], [ %ivy.7, %loop_exiting.7 ], [ %ivy.7, %loop_exiting.7 ]
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1.loopexit3:
|
|
; EPILOG-NEXT: %result.ph4 = phi i64 [ %ivy.epil, %loop_exiting.epil ], [ %ivy.epil, %loop_exiting.epil ]
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: %result = phi i64 [ %result.ph, %exit1.loopexit ], [ %result.ph4, %exit1.loopexit3 ]
|
|
; EPILOG-NEXT: ret i64 %result
|
|
; EPILOG: latchexit.unr-lcssa:
|
|
; EPILOG-NEXT: %sum.next.lcssa.ph = phi i64 [ %sum.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %sum.unr = phi i64 [ %sum.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %latchexit
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %latchexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.epil.init = phi i64 [ 0, %entry ], [ %sum.unr, %latchexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %sum.epil = phi i64 [ %sum.epil.init, %loop_header.epil.preheader ], [ %sum.next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.epil, label %loop_exiting.epil
|
|
; EPILOG: loop_exiting.epil:
|
|
; EPILOG-NEXT: %ivy.epil = add i64 %iv.epil, %add
|
|
; EPILOG-NEXT: switch i64 %sum.epil, label %loop_latch.epil [
|
|
; EPILOG-NEXT: i64 24, label %exit1.loopexit3
|
|
; EPILOG-NEXT: i64 42, label %exit1.loopexit3
|
|
; EPILOG-NEXT: ]
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add nuw nsw i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %sum.next.epil = add i64 %sum.epil, %add
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %latchexit.epilog-lcssa, !llvm.loop !9
|
|
; EPILOG: latchexit.epilog-lcssa:
|
|
; EPILOG-NEXT: %sum.next.lcssa.ph1 = phi i64 [ %sum.next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: br label %latchexit
|
|
; EPILOG: latchexit:
|
|
; EPILOG-NEXT: %sum.next.lcssa = phi i64 [ %sum.next.lcssa.ph, %latchexit.unr-lcssa ], [ %sum.next.lcssa.ph1, %latchexit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i64 %sum.next.lcssa
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test5(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum = phi i64 [ 0, %entry.new ], [ %sum.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting
|
|
; EPILOG-BLOCK: loop_exiting:
|
|
; EPILOG-BLOCK-NEXT: %ivy = add i64 %iv, %add
|
|
; EPILOG-BLOCK-NEXT: switch i64 %sum, label %loop_latch [
|
|
; EPILOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-BLOCK-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-BLOCK-NEXT: ]
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-BLOCK-NEXT: %sum.next = add i64 %sum, %add
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting.1
|
|
; EPILOG-BLOCK: loop_exiting.1:
|
|
; EPILOG-BLOCK-NEXT: %ivy.1 = add i64 %iv_next, %add
|
|
; EPILOG-BLOCK-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; EPILOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; EPILOG-BLOCK-NEXT: i64 42, label %exit1.loopexit
|
|
; EPILOG-BLOCK-NEXT: ]
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %latchexit.unr-lcssa, !llvm.loop !9
|
|
; EPILOG-BLOCK: exit1.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %result.ph = phi i64 [ %ivy, %loop_exiting ], [ %ivy, %loop_exiting ], [ %ivy.1, %loop_exiting.1 ], [ %ivy.1, %loop_exiting.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: %result = phi i64 [ %ivy.epil, %loop_exiting.epil ], [ %ivy.epil, %loop_exiting.epil ], [ %result.ph, %exit1.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: ret i64 %result
|
|
; EPILOG-BLOCK: latchexit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %sum.next.lcssa.ph = phi i64 [ %sum.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %iv.unr = phi i64 [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.unr = phi i64 [ %sum.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %latchexit
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %latchexit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.epil.init = phi i64 [ 0, %entry ], [ %sum.unr, %latchexit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.epil, label %loop_exiting.epil
|
|
; EPILOG-BLOCK: loop_exiting.epil:
|
|
; EPILOG-BLOCK-NEXT: %ivy.epil = add i64 %iv.epil.init, %add
|
|
; EPILOG-BLOCK-NEXT: switch i64 %sum.epil.init, label %loop_latch.epil [
|
|
; EPILOG-BLOCK-NEXT: i64 24, label %exit1
|
|
; EPILOG-BLOCK-NEXT: i64 42, label %exit1
|
|
; EPILOG-BLOCK-NEXT: ]
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: %sum.next.epil = add i64 %sum.epil.init, %add
|
|
; EPILOG-BLOCK-NEXT: br label %latchexit
|
|
; EPILOG-BLOCK: latchexit:
|
|
; EPILOG-BLOCK-NEXT: %sum.next.lcssa = phi i64 [ %sum.next.lcssa.ph, %latchexit.unr-lcssa ], [ %sum.next.epil, %loop_latch.epil ]
|
|
; EPILOG-BLOCK-NEXT: ret i64 %sum.next.lcssa
|
|
;
|
|
; PROLOG-LABEL: @test5(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %sum.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %sum.next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.prol, label %loop_exiting.prol
|
|
; PROLOG: loop_exiting.prol:
|
|
; PROLOG-NEXT: %ivy.prol = add i64 %iv.prol, %add
|
|
; PROLOG-NEXT: switch i64 %sum.prol, label %loop_latch.prol [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit1
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit1
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add nuw nsw i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %sum.next.prol = add i64 %sum.prol, %add
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !9
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %sum.unr.ph = phi i64 [ %sum.next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %sum.next.lcssa.unr.ph = phi i64 [ %sum.next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.unr = phi i64 [ 0, %entry ], [ %sum.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.next.lcssa.unr = phi i64 [ poison, %entry ], [ %sum.next.lcssa.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %latchexit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: %sum = phi i64 [ %sum.unr, %entry.new ], [ %sum.next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting
|
|
; PROLOG: loop_exiting:
|
|
; PROLOG-NEXT: %ivy = add i64 %iv, %add
|
|
; PROLOG-NEXT: switch i64 %sum, label %loop_latch [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; PROLOG-NEXT: %sum.next = add i64 %sum, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting.1
|
|
; PROLOG: loop_exiting.1:
|
|
; PROLOG-NEXT: %ivy.1 = add i64 %iv_next, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; PROLOG-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.2, label %loop_exiting.2
|
|
; PROLOG: loop_exiting.2:
|
|
; PROLOG-NEXT: %ivy.2 = add i64 %iv_next.1, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next.1, label %loop_latch.2 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: %iv_next.2 = add nuw nsw i64 %iv, 3
|
|
; PROLOG-NEXT: %sum.next.2 = add i64 %sum.next.1, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.3, label %loop_exiting.3
|
|
; PROLOG: loop_exiting.3:
|
|
; PROLOG-NEXT: %ivy.3 = add i64 %iv_next.2, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next.2, label %loop_latch.3 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: %iv_next.3 = add nuw nsw i64 %iv, 4
|
|
; PROLOG-NEXT: %sum.next.3 = add i64 %sum.next.2, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.4, label %loop_exiting.4
|
|
; PROLOG: loop_exiting.4:
|
|
; PROLOG-NEXT: %ivy.4 = add i64 %iv_next.3, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next.3, label %loop_latch.4 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: %iv_next.4 = add nuw nsw i64 %iv, 5
|
|
; PROLOG-NEXT: %sum.next.4 = add i64 %sum.next.3, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.5, label %loop_exiting.5
|
|
; PROLOG: loop_exiting.5:
|
|
; PROLOG-NEXT: %ivy.5 = add i64 %iv_next.4, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next.4, label %loop_latch.5 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: %iv_next.5 = add nuw nsw i64 %iv, 6
|
|
; PROLOG-NEXT: %sum.next.5 = add i64 %sum.next.4, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.6, label %loop_exiting.6
|
|
; PROLOG: loop_exiting.6:
|
|
; PROLOG-NEXT: %ivy.6 = add i64 %iv_next.5, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next.5, label %loop_latch.6 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: %iv_next.6 = add nuw nsw i64 %iv, 7
|
|
; PROLOG-NEXT: %sum.next.6 = add i64 %sum.next.5, %add
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.7, label %loop_exiting.7
|
|
; PROLOG: loop_exiting.7:
|
|
; PROLOG-NEXT: %ivy.7 = add i64 %iv_next.6, %add
|
|
; PROLOG-NEXT: switch i64 %sum.next.6, label %loop_latch.7 [
|
|
; PROLOG-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-NEXT: ]
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add nuw nsw i64 %iv, 8
|
|
; PROLOG-NEXT: %sum.next.7 = add i64 %sum.next.6, %add
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %latchexit.unr-lcssa
|
|
; PROLOG: exit1.loopexit:
|
|
; PROLOG-NEXT: %result.ph = phi i64 [ %ivy, %loop_exiting ], [ %ivy, %loop_exiting ], [ %ivy.1, %loop_exiting.1 ], [ %ivy.1, %loop_exiting.1 ], [ %ivy.2, %loop_exiting.2 ], [ %ivy.2, %loop_exiting.2 ], [ %ivy.3, %loop_exiting.3 ], [ %ivy.3, %loop_exiting.3 ], [ %ivy.4, %loop_exiting.4 ], [ %ivy.4, %loop_exiting.4 ], [ %ivy.5, %loop_exiting.5 ], [ %ivy.5, %loop_exiting.5 ], [ %ivy.6, %loop_exiting.6 ], [ %ivy.6, %loop_exiting.6 ], [ %ivy.7, %loop_exiting.7 ], [ %ivy.7, %loop_exiting.7 ]
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1.loopexit1:
|
|
; PROLOG-NEXT: %result.ph2 = phi i64 [ %ivy.prol, %loop_exiting.prol ], [ %ivy.prol, %loop_exiting.prol ]
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: %result = phi i64 [ %result.ph, %exit1.loopexit ], [ %result.ph2, %exit1.loopexit1 ]
|
|
; PROLOG-NEXT: ret i64 %result
|
|
; PROLOG: latchexit.unr-lcssa:
|
|
; PROLOG-NEXT: %sum.next.lcssa.ph = phi i64 [ %sum.next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: br label %latchexit
|
|
; PROLOG: latchexit:
|
|
; PROLOG-NEXT: %sum.next.lcssa = phi i64 [ %sum.next.lcssa.unr, %loop_header.prol.loopexit ], [ %sum.next.lcssa.ph, %latchexit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i64 %sum.next.lcssa
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test5(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.prol, label %loop_exiting.prol
|
|
; PROLOG-BLOCK: loop_exiting.prol:
|
|
; PROLOG-BLOCK-NEXT: switch i64 0, label %loop_latch.prol [
|
|
; PROLOG-BLOCK-NEXT: i64 24, label %exit1
|
|
; PROLOG-BLOCK-NEXT: i64 42, label %exit1
|
|
; PROLOG-BLOCK-NEXT: ]
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.unr = phi i64 [ 0, %entry ], [ %add, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.next.lcssa.unr = phi i64 [ poison, %entry ], [ %add, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %latchexit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum = phi i64 [ %sum.unr, %entry.new ], [ %sum.next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %loop_exiting
|
|
; PROLOG-BLOCK: loop_exiting:
|
|
; PROLOG-BLOCK-NEXT: %ivy = add i64 %iv, %add
|
|
; PROLOG-BLOCK-NEXT: switch i64 %sum, label %loop_latch [
|
|
; PROLOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-BLOCK-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-BLOCK-NEXT: ]
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; PROLOG-BLOCK-NEXT: %sum.next = add i64 %sum, %add
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %loop_exiting.1
|
|
; PROLOG-BLOCK: loop_exiting.1:
|
|
; PROLOG-BLOCK-NEXT: %ivy.1 = add i64 %iv_next, %add
|
|
; PROLOG-BLOCK-NEXT: switch i64 %sum.next, label %loop_latch.1 [
|
|
; PROLOG-BLOCK-NEXT: i64 24, label %exit1.loopexit
|
|
; PROLOG-BLOCK-NEXT: i64 42, label %exit1.loopexit
|
|
; PROLOG-BLOCK-NEXT: ]
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %sum.next.1 = add i64 %sum.next, %add
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %latchexit.unr-lcssa, !llvm.loop !9
|
|
; PROLOG-BLOCK: exit1.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %result.ph = phi i64 [ %ivy, %loop_exiting ], [ %ivy, %loop_exiting ], [ %ivy.1, %loop_exiting.1 ], [ %ivy.1, %loop_exiting.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: %result = phi i64 [ %add, %loop_exiting.prol ], [ %add, %loop_exiting.prol ], [ %result.ph, %exit1.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: ret i64 %result
|
|
; PROLOG-BLOCK: latchexit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %sum.next.lcssa.ph = phi i64 [ %sum.next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latchexit
|
|
; PROLOG-BLOCK: latchexit:
|
|
; PROLOG-BLOCK-NEXT: %sum.next.lcssa = phi i64 [ %sum.next.lcssa.unr, %loop_header.prol.loopexit ], [ %sum.next.lcssa.ph, %latchexit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i64 %sum.next.lcssa
|
|
;
|
|
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
%sum = phi i64 [ 0, %entry ], [ %sum.next, %loop_latch ]
|
|
br i1 %cond, label %loop_latch, label %loop_exiting
|
|
|
|
loop_exiting:
|
|
%ivy = add i64 %iv, %add
|
|
switch i64 %sum, label %loop_latch [
|
|
i64 24, label %exit1
|
|
i64 42, label %exit1
|
|
]
|
|
|
|
loop_latch:
|
|
%iv_next = add nuw nsw i64 %iv, 1
|
|
%sum.next = add i64 %sum, %add
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %latchexit
|
|
|
|
exit1:
|
|
%result = phi i64 [ %ivy, %loop_exiting ], [ %ivy, %loop_exiting ]
|
|
ret i64 %result
|
|
|
|
latchexit:
|
|
ret i64 %sum.next
|
|
}
|
|
|
|
; test when exit blocks have successors.
|
|
define i32 @test6(ptr nocapture %a, i64 %n, i1 %cond, i32 %x) {
|
|
; EPILOG-LABEL: @test6(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG: for.exiting_block:
|
|
; EPILOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-NEXT: %load = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-NEXT: %add = add nsw i32 %load, %sum.02
|
|
; EPILOG-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG: for.exiting_block.1:
|
|
; EPILOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-NEXT: %load.1 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-NEXT: %add.1 = add nsw i32 %load.1, %add
|
|
; EPILOG-NEXT: %indvars.iv.next.1 = add nuw nsw i64 %indvars.iv, 2
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; EPILOG: for.exiting_block.2:
|
|
; EPILOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.2, label %for.exit2.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; EPILOG-NEXT: %load.2 = load i32, ptr %arrayidx.2, align 4
|
|
; EPILOG-NEXT: %add.2 = add nsw i32 %load.2, %add.1
|
|
; EPILOG-NEXT: %indvars.iv.next.2 = add nuw nsw i64 %indvars.iv, 3
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; EPILOG: for.exiting_block.3:
|
|
; EPILOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.3, label %for.exit2.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; EPILOG-NEXT: %load.3 = load i32, ptr %arrayidx.3, align 4
|
|
; EPILOG-NEXT: %add.3 = add nsw i32 %load.3, %add.2
|
|
; EPILOG-NEXT: %indvars.iv.next.3 = add nuw nsw i64 %indvars.iv, 4
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; EPILOG: for.exiting_block.4:
|
|
; EPILOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.4, label %for.exit2.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; EPILOG-NEXT: %load.4 = load i32, ptr %arrayidx.4, align 4
|
|
; EPILOG-NEXT: %add.4 = add nsw i32 %load.4, %add.3
|
|
; EPILOG-NEXT: %indvars.iv.next.4 = add nuw nsw i64 %indvars.iv, 5
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; EPILOG: for.exiting_block.5:
|
|
; EPILOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.5, label %for.exit2.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; EPILOG-NEXT: %load.5 = load i32, ptr %arrayidx.5, align 4
|
|
; EPILOG-NEXT: %add.5 = add nsw i32 %load.5, %add.4
|
|
; EPILOG-NEXT: %indvars.iv.next.5 = add nuw nsw i64 %indvars.iv, 6
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; EPILOG: for.exiting_block.6:
|
|
; EPILOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.6, label %for.exit2.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; EPILOG-NEXT: %load.6 = load i32, ptr %arrayidx.6, align 4
|
|
; EPILOG-NEXT: %add.6 = add nsw i32 %load.6, %add.5
|
|
; EPILOG-NEXT: %indvars.iv.next.6 = add nuw nsw i64 %indvars.iv, 7
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; EPILOG: for.exiting_block.7:
|
|
; EPILOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.7, label %for.exit2.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; EPILOG-NEXT: %load.7 = load i32, ptr %arrayidx.7, align 4
|
|
; EPILOG-NEXT: %add.7 = add nsw i32 %load.7, %add.6
|
|
; EPILOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp eq i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %latch_exit.unr-lcssa, label %header
|
|
; EPILOG: latch_exit.unr-lcssa:
|
|
; EPILOG-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %sum.02.unr = phi i32 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latch_exit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latch_exit.unr-lcssa ]
|
|
; EPILOG-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latch_exit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %indvars.iv.epil = phi i64 [ %indvars.iv.next.epil, %latch.epil ], [ %indvars.iv.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %sum.02.epil = phi i32 [ %add.epil, %latch.epil ], [ %sum.02.epil.init, %header.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: br i1 false, label %for.exit2.loopexit3, label %for.exiting_block.epil
|
|
; EPILOG: for.exiting_block.epil:
|
|
; EPILOG-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-NEXT: br i1 %cmp.epil, label %for.exit2.loopexit3, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil
|
|
; EPILOG-NEXT: %load.epil = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-NEXT: %add.epil = add nsw i32 %load.epil, %sum.02.epil
|
|
; EPILOG-NEXT: %indvars.iv.next.epil = add i64 %indvars.iv.epil, 1
|
|
; EPILOG-NEXT: %exitcond.epil = icmp eq i64 %indvars.iv.next.epil, %n
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latch_exit.epilog-lcssa, !llvm.loop !10
|
|
; EPILOG: latch_exit.epilog-lcssa:
|
|
; EPILOG-NEXT: %sum.0.lcssa.ph1 = phi i32 [ %add.epil, %latch.epil ]
|
|
; EPILOG-NEXT: br label %latch_exit
|
|
; EPILOG: latch_exit:
|
|
; EPILOG-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.ph, %latch_exit.unr-lcssa ], [ %sum.0.lcssa.ph1, %latch_exit.epilog-lcssa ]
|
|
; EPILOG-NEXT: ret i32 %sum.0.lcssa
|
|
; EPILOG: for.exit2.loopexit:
|
|
; EPILOG-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %latch ], [ 42, %for.exiting_block.1 ], [ %add.1, %latch.1 ], [ 42, %for.exiting_block.2 ], [ %add.2, %latch.2 ], [ 42, %for.exiting_block.3 ], [ %add.3, %latch.3 ], [ 42, %for.exiting_block.4 ], [ %add.4, %latch.4 ], [ 42, %for.exiting_block.5 ], [ %add.5, %latch.5 ], [ 42, %for.exiting_block.6 ], [ %add.6, %latch.6 ], [ 42, %for.exiting_block.7 ]
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2.loopexit3:
|
|
; EPILOG-NEXT: %retval.ph4 = phi i32 [ 42, %for.exiting_block.epil ], [ %sum.02.epil, %header.epil ]
|
|
; EPILOG-NEXT: br label %for.exit2
|
|
; EPILOG: for.exit2:
|
|
; EPILOG-NEXT: %retval = phi i32 [ %retval.ph, %for.exit2.loopexit ], [ %retval.ph4, %for.exit2.loopexit3 ]
|
|
; EPILOG-NEXT: %addx = add i32 %retval, %x
|
|
; EPILOG-NEXT: br i1 %cond, label %exit_true, label %exit_false
|
|
; EPILOG: exit_true:
|
|
; EPILOG-NEXT: ret i32 %retval
|
|
; EPILOG: exit_false:
|
|
; EPILOG-NEXT: ret i32 %addx
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test6(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv = phi i64 [ 0, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02 = phi i32 [ 0, %entry.new ], [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; EPILOG-BLOCK: for.exiting_block:
|
|
; EPILOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; EPILOG-BLOCK-NEXT: %load = load i32, ptr %arrayidx, align 4
|
|
; EPILOG-BLOCK-NEXT: %add = add nsw i32 %load, %sum.02
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; EPILOG-BLOCK: for.exiting_block.1:
|
|
; EPILOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; EPILOG-BLOCK-NEXT: %load.1 = load i32, ptr %arrayidx.1, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nsw i32 %load.1, %add
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp eq i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %latch_exit.unr-lcssa, label %header, !llvm.loop !10
|
|
; EPILOG-BLOCK: latch_exit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ %indvars.iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latch_exit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %indvars.iv.epil.init = phi i64 [ 0, %entry ], [ %indvars.iv.unr, %latch_exit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %sum.02.epil.init = phi i32 [ 0, %entry ], [ %sum.02.unr, %latch_exit.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod2 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod2)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %for.exit2, label %for.exiting_block.epil
|
|
; EPILOG-BLOCK: for.exiting_block.epil:
|
|
; EPILOG-BLOCK-NEXT: %cmp.epil = icmp eq i64 %n, 42
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp.epil, label %for.exit2, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: %arrayidx.epil = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.epil.init
|
|
; EPILOG-BLOCK-NEXT: %load.epil = load i32, ptr %arrayidx.epil, align 4
|
|
; EPILOG-BLOCK-NEXT: %add.epil = add nsw i32 %load.epil, %sum.02.epil.init
|
|
; EPILOG-BLOCK-NEXT: br label %latch_exit
|
|
; EPILOG-BLOCK: latch_exit:
|
|
; EPILOG-BLOCK-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.ph, %latch_exit.unr-lcssa ], [ %add.epil, %latch.epil ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %sum.0.lcssa
|
|
; EPILOG-BLOCK: for.exit2.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %latch ], [ 42, %for.exiting_block.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %for.exit2
|
|
; EPILOG-BLOCK: for.exit2:
|
|
; EPILOG-BLOCK-NEXT: %retval = phi i32 [ %sum.02.epil.init, %header.epil ], [ 42, %for.exiting_block.epil ], [ %retval.ph, %for.exit2.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: %addx = add i32 %retval, %x
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %exit_true, label %exit_false
|
|
; EPILOG-BLOCK: exit_true:
|
|
; EPILOG-BLOCK-NEXT: ret i32 %retval
|
|
; EPILOG-BLOCK: exit_false:
|
|
; EPILOG-BLOCK-NEXT: ret i32 %addx
|
|
;
|
|
; PROLOG-LABEL: @test6(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %indvars.iv.prol = phi i64 [ %indvars.iv.next.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %sum.02.prol = phi i32 [ %add.prol, %latch.prol ], [ 0, %header.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit1, label %for.exiting_block.prol
|
|
; PROLOG: for.exiting_block.prol:
|
|
; PROLOG-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.prol, label %for.exit2.loopexit1, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %arrayidx.prol = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.prol
|
|
; PROLOG-NEXT: %load.prol = load i32, ptr %arrayidx.prol, align 4
|
|
; PROLOG-NEXT: %add.prol = add nsw i32 %load.prol, %sum.02.prol
|
|
; PROLOG-NEXT: %indvars.iv.next.prol = add i64 %indvars.iv.prol, 1
|
|
; PROLOG-NEXT: %exitcond.prol = icmp eq i64 %indvars.iv.next.prol, %n
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !10
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %sum.0.lcssa.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %indvars.iv.unr.ph = phi i64 [ %indvars.iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %sum.02.unr.ph = phi i32 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %sum.0.lcssa.unr = phi i32 [ poison, %entry ], [ %sum.0.lcssa.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ %indvars.iv.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %sum.02.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %latch_exit, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.7, %latch.7 ]
|
|
; PROLOG-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG: for.exiting_block:
|
|
; PROLOG-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-NEXT: %load = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-NEXT: %add = add nsw i32 %load, %sum.02
|
|
; PROLOG-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG: for.exiting_block.1:
|
|
; PROLOG-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-NEXT: %load.1 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-NEXT: %add.1 = add nsw i32 %load.1, %add
|
|
; PROLOG-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.2
|
|
; PROLOG: for.exiting_block.2:
|
|
; PROLOG-NEXT: %cmp.2 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.2, label %for.exit2.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: %arrayidx.2 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.1
|
|
; PROLOG-NEXT: %load.2 = load i32, ptr %arrayidx.2, align 4
|
|
; PROLOG-NEXT: %add.2 = add nsw i32 %load.2, %add.1
|
|
; PROLOG-NEXT: %indvars.iv.next.2 = add i64 %indvars.iv, 3
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.3
|
|
; PROLOG: for.exiting_block.3:
|
|
; PROLOG-NEXT: %cmp.3 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.3, label %for.exit2.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: %arrayidx.3 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.2
|
|
; PROLOG-NEXT: %load.3 = load i32, ptr %arrayidx.3, align 4
|
|
; PROLOG-NEXT: %add.3 = add nsw i32 %load.3, %add.2
|
|
; PROLOG-NEXT: %indvars.iv.next.3 = add i64 %indvars.iv, 4
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.4
|
|
; PROLOG: for.exiting_block.4:
|
|
; PROLOG-NEXT: %cmp.4 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.4, label %for.exit2.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: %arrayidx.4 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.3
|
|
; PROLOG-NEXT: %load.4 = load i32, ptr %arrayidx.4, align 4
|
|
; PROLOG-NEXT: %add.4 = add nsw i32 %load.4, %add.3
|
|
; PROLOG-NEXT: %indvars.iv.next.4 = add i64 %indvars.iv, 5
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.5
|
|
; PROLOG: for.exiting_block.5:
|
|
; PROLOG-NEXT: %cmp.5 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.5, label %for.exit2.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: %arrayidx.5 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.4
|
|
; PROLOG-NEXT: %load.5 = load i32, ptr %arrayidx.5, align 4
|
|
; PROLOG-NEXT: %add.5 = add nsw i32 %load.5, %add.4
|
|
; PROLOG-NEXT: %indvars.iv.next.5 = add i64 %indvars.iv, 6
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.6
|
|
; PROLOG: for.exiting_block.6:
|
|
; PROLOG-NEXT: %cmp.6 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.6, label %for.exit2.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %arrayidx.6 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.5
|
|
; PROLOG-NEXT: %load.6 = load i32, ptr %arrayidx.6, align 4
|
|
; PROLOG-NEXT: %add.6 = add nsw i32 %load.6, %add.5
|
|
; PROLOG-NEXT: %indvars.iv.next.6 = add i64 %indvars.iv, 7
|
|
; PROLOG-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.7
|
|
; PROLOG: for.exiting_block.7:
|
|
; PROLOG-NEXT: %cmp.7 = icmp eq i64 %n, 42
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %for.exit2.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %arrayidx.7 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next.6
|
|
; PROLOG-NEXT: %load.7 = load i32, ptr %arrayidx.7, align 4
|
|
; PROLOG-NEXT: %add.7 = add nsw i32 %load.7, %add.6
|
|
; PROLOG-NEXT: %indvars.iv.next.7 = add i64 %indvars.iv, 8
|
|
; PROLOG-NEXT: %exitcond.7 = icmp eq i64 %indvars.iv.next.7, %n
|
|
; PROLOG-NEXT: br i1 %exitcond.7, label %latch_exit.unr-lcssa, label %header
|
|
; PROLOG: latch_exit.unr-lcssa:
|
|
; PROLOG-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br label %latch_exit
|
|
; PROLOG: latch_exit:
|
|
; PROLOG-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.unr, %header.prol.loopexit ], [ %sum.0.lcssa.ph, %latch_exit.unr-lcssa ]
|
|
; PROLOG-NEXT: ret i32 %sum.0.lcssa
|
|
; PROLOG: for.exit2.loopexit:
|
|
; PROLOG-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %latch ], [ 42, %for.exiting_block.1 ], [ %add.1, %latch.1 ], [ 42, %for.exiting_block.2 ], [ %add.2, %latch.2 ], [ 42, %for.exiting_block.3 ], [ %add.3, %latch.3 ], [ 42, %for.exiting_block.4 ], [ %add.4, %latch.4 ], [ 42, %for.exiting_block.5 ], [ %add.5, %latch.5 ], [ 42, %for.exiting_block.6 ], [ %add.6, %latch.6 ], [ 42, %for.exiting_block.7 ]
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2.loopexit1:
|
|
; PROLOG-NEXT: %retval.ph2 = phi i32 [ 42, %for.exiting_block.prol ], [ %sum.02.prol, %header.prol ]
|
|
; PROLOG-NEXT: br label %for.exit2
|
|
; PROLOG: for.exit2:
|
|
; PROLOG-NEXT: %retval = phi i32 [ %retval.ph, %for.exit2.loopexit ], [ %retval.ph2, %for.exit2.loopexit1 ]
|
|
; PROLOG-NEXT: %addx = add i32 %retval, %x
|
|
; PROLOG-NEXT: br i1 %cond, label %exit_true, label %exit_false
|
|
; PROLOG: exit_true:
|
|
; PROLOG-NEXT: ret i32 %retval
|
|
; PROLOG: exit_false:
|
|
; PROLOG-NEXT: ret i32 %addx
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test6(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %n
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %for.exit2, label %for.exiting_block.prol
|
|
; PROLOG-BLOCK: for.exiting_block.prol:
|
|
; PROLOG-BLOCK-NEXT: %cmp.prol = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.prol, label %for.exit2, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: %load.prol = load i32, ptr %a, align 4
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %sum.0.lcssa.unr = phi i32 [ poison, %entry ], [ %load.prol, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.unr = phi i64 [ 0, %entry ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02.unr = phi i32 [ 0, %entry ], [ %load.prol, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %latch_exit, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv = phi i64 [ %indvars.iv.unr, %entry.new ], [ %indvars.iv.next.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: %sum.02 = phi i32 [ %sum.02.unr, %entry.new ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block
|
|
; PROLOG-BLOCK: for.exiting_block:
|
|
; PROLOG-BLOCK-NEXT: %cmp = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp, label %for.exit2.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
; PROLOG-BLOCK-NEXT: %load = load i32, ptr %arrayidx, align 4
|
|
; PROLOG-BLOCK-NEXT: %add = add nsw i32 %load, %sum.02
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next = add i64 %indvars.iv, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %for.exit2.loopexit, label %for.exiting_block.1
|
|
; PROLOG-BLOCK: for.exiting_block.1:
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp eq i64 %n, 42
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %for.exit2.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %arrayidx.1 = getelementptr inbounds i32, ptr %a, i64 %indvars.iv.next
|
|
; PROLOG-BLOCK-NEXT: %load.1 = load i32, ptr %arrayidx.1, align 4
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nsw i32 %load.1, %add
|
|
; PROLOG-BLOCK-NEXT: %indvars.iv.next.1 = add i64 %indvars.iv, 2
|
|
; PROLOG-BLOCK-NEXT: %exitcond.1 = icmp eq i64 %indvars.iv.next.1, %n
|
|
; PROLOG-BLOCK-NEXT: br i1 %exitcond.1, label %latch_exit.unr-lcssa, label %header, !llvm.loop !10
|
|
; PROLOG-BLOCK: latch_exit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: %sum.0.lcssa.ph = phi i32 [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %latch_exit
|
|
; PROLOG-BLOCK: latch_exit:
|
|
; PROLOG-BLOCK-NEXT: %sum.0.lcssa = phi i32 [ %sum.0.lcssa.unr, %header.prol.loopexit ], [ %sum.0.lcssa.ph, %latch_exit.unr-lcssa ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %sum.0.lcssa
|
|
; PROLOG-BLOCK: for.exit2.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %retval.ph = phi i32 [ 42, %for.exiting_block ], [ %sum.02, %header ], [ %add, %latch ], [ 42, %for.exiting_block.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %for.exit2
|
|
; PROLOG-BLOCK: for.exit2:
|
|
; PROLOG-BLOCK-NEXT: %retval = phi i32 [ 0, %header.prol ], [ 42, %for.exiting_block.prol ], [ %retval.ph, %for.exit2.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: %addx = add i32 %retval, %x
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %exit_true, label %exit_false
|
|
; PROLOG-BLOCK: exit_true:
|
|
; PROLOG-BLOCK-NEXT: ret i32 %retval
|
|
; PROLOG-BLOCK: exit_false:
|
|
; PROLOG-BLOCK-NEXT: ret i32 %addx
|
|
;
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
header:
|
|
%indvars.iv = phi i64 [ %indvars.iv.next, %latch ], [ 0, %entry ]
|
|
%sum.02 = phi i32 [ %add, %latch ], [ 0, %entry ]
|
|
br i1 false, label %for.exit2, label %for.exiting_block
|
|
|
|
for.exiting_block:
|
|
%cmp = icmp eq i64 %n, 42
|
|
br i1 %cmp, label %for.exit2, label %latch
|
|
|
|
latch:
|
|
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %indvars.iv
|
|
%load = load i32, ptr %arrayidx, align 4
|
|
%add = add nsw i32 %load, %sum.02
|
|
%indvars.iv.next = add i64 %indvars.iv, 1
|
|
%exitcond = icmp eq i64 %indvars.iv.next, %n
|
|
br i1 %exitcond, label %latch_exit, label %header
|
|
|
|
latch_exit:
|
|
%sum.0.lcssa = phi i32 [ %add, %latch ]
|
|
ret i32 %sum.0.lcssa
|
|
|
|
for.exit2:
|
|
%retval = phi i32 [ %sum.02, %header ], [ 42, %for.exiting_block ]
|
|
%addx = add i32 %retval, %x
|
|
br i1 %cond, label %exit_true, label %exit_false
|
|
|
|
exit_true:
|
|
ret i32 %retval
|
|
|
|
exit_false:
|
|
ret i32 %addx
|
|
}
|
|
|
|
; test when value in exit block does not have VMap.
|
|
define i32 @test7(i32 %arg, i32 %arg1, i32 %arg2) {
|
|
; EPILOG-LABEL: @test7(
|
|
; EPILOG-NEXT: bb:
|
|
; EPILOG-NEXT: %i = icmp slt i32 undef, 2
|
|
; EPILOG-NEXT: %sext = sext i32 undef to i64
|
|
; EPILOG-NEXT: %shft = ashr exact i32 %arg, 16
|
|
; EPILOG-NEXT: br i1 %i, label %loopexit2, label %preheader
|
|
; EPILOG: preheader:
|
|
; EPILOG-NEXT: %0 = add nsw i64 %sext, -1
|
|
; EPILOG-NEXT: %1 = freeze i64 %0
|
|
; EPILOG-NEXT: %2 = add i64 %1, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %1, 7
|
|
; EPILOG-NEXT: %3 = icmp ult i64 %2, 7
|
|
; EPILOG-NEXT: br i1 %3, label %header.epil.preheader, label %preheader.new
|
|
; EPILOG: preheader.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %1, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %i6 = phi i64 [ 1, %preheader.new ], [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %preheader.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %add.7 = add nuw nsw i64 %i6, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %header, label %latchexit.unr-lcssa
|
|
; EPILOG: latchexit.unr-lcssa:
|
|
; EPILOG-NEXT: %i6.unr = phi i64 [ %add.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchexit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %i6.epil.init = phi i64 [ 1, %preheader ], [ %i6.unr, %latchexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %i6.epil = phi i64 [ %i6.epil.init, %header.epil.preheader ], [ %add.epil, %latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: br i1 false, label %loopexit1.loopexit2, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %add.epil = add nuw nsw i64 %i6.epil, 1
|
|
; EPILOG-NEXT: %i9.epil = icmp slt i64 %add.epil, %sext
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %latchexit.epilog-lcssa, !llvm.loop !11
|
|
; EPILOG: latchexit.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %latchexit
|
|
; EPILOG: latchexit:
|
|
; EPILOG-NEXT: unreachable
|
|
; EPILOG: loopexit2:
|
|
; EPILOG-NEXT: ret i32 %shft
|
|
; EPILOG: loopexit1.loopexit:
|
|
; EPILOG-NEXT: %sext3.ph = phi i32 [ %shft, %header ], [ %shft, %latch ], [ %shft, %latch.1 ], [ %shft, %latch.2 ], [ %shft, %latch.3 ], [ %shft, %latch.4 ], [ %shft, %latch.5 ], [ %shft, %latch.6 ]
|
|
; EPILOG-NEXT: br label %loopexit1
|
|
; EPILOG: loopexit1.loopexit2:
|
|
; EPILOG-NEXT: %sext3.ph3 = phi i32 [ %shft, %header.epil ]
|
|
; EPILOG-NEXT: br label %loopexit1
|
|
; EPILOG: loopexit1:
|
|
; EPILOG-NEXT: %sext3 = phi i32 [ %sext3.ph, %loopexit1.loopexit ], [ %sext3.ph3, %loopexit1.loopexit2 ]
|
|
; EPILOG-NEXT: ret i32 %sext3
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test7(
|
|
; EPILOG-BLOCK-NEXT: bb:
|
|
; EPILOG-BLOCK-NEXT: %i = icmp slt i32 undef, 2
|
|
; EPILOG-BLOCK-NEXT: %sext = sext i32 undef to i64
|
|
; EPILOG-BLOCK-NEXT: %shft = ashr exact i32 %arg, 16
|
|
; EPILOG-BLOCK-NEXT: br i1 %i, label %loopexit2, label %preheader
|
|
; EPILOG-BLOCK: preheader:
|
|
; EPILOG-BLOCK-NEXT: %0 = add nsw i64 %sext, -1
|
|
; EPILOG-BLOCK-NEXT: %1 = freeze i64 %0
|
|
; EPILOG-BLOCK-NEXT: %2 = add i64 %1, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: %3 = icmp ult i64 %2, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %3, label %header.epil.preheader, label %preheader.new
|
|
; EPILOG-BLOCK: preheader.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %1, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %i6 = phi i64 [ 1, %preheader.new ], [ %add.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %preheader.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loopexit1.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %add.1 = add nuw nsw i64 %i6, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %header, label %latchexit.unr-lcssa, !llvm.loop !11
|
|
; EPILOG-BLOCK: latchexit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %latchexit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %loopexit1, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %latchexit
|
|
; EPILOG-BLOCK: latchexit:
|
|
; EPILOG-BLOCK-NEXT: unreachable
|
|
; EPILOG-BLOCK: loopexit2:
|
|
; EPILOG-BLOCK-NEXT: ret i32 %shft
|
|
; EPILOG-BLOCK: loopexit1.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %sext3.ph = phi i32 [ %shft, %header ], [ %shft, %latch ]
|
|
; EPILOG-BLOCK-NEXT: br label %loopexit1
|
|
; EPILOG-BLOCK: loopexit1:
|
|
; EPILOG-BLOCK-NEXT: %sext3 = phi i32 [ %shft, %header.epil ], [ %sext3.ph, %loopexit1.loopexit ]
|
|
; EPILOG-BLOCK-NEXT: ret i32 %sext3
|
|
;
|
|
; PROLOG-LABEL: @test7(
|
|
; PROLOG-NEXT: bb:
|
|
; PROLOG-NEXT: %i = icmp slt i32 undef, 2
|
|
; PROLOG-NEXT: %sext = sext i32 undef to i64
|
|
; PROLOG-NEXT: %shft = ashr exact i32 %arg, 16
|
|
; PROLOG-NEXT: br i1 %i, label %loopexit2, label %preheader
|
|
; PROLOG: preheader:
|
|
; PROLOG-NEXT: %0 = add nsw i64 %sext, -1
|
|
; PROLOG-NEXT: %1 = freeze i64 %0
|
|
; PROLOG-NEXT: %2 = add i64 %1, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %1, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %i6.prol = phi i64 [ 1, %header.prol.preheader ], [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit1, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %add.prol = add nuw nsw i64 %i6.prol, 1
|
|
; PROLOG-NEXT: %i9.prol = icmp slt i64 %add.prol, %sext
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !11
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %i6.unr.ph = phi i64 [ %add.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %i6.unr = phi i64 [ 1, %preheader ], [ %i6.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i64 %2, 7
|
|
; PROLOG-NEXT: br i1 %3, label %latchexit, label %preheader.new
|
|
; PROLOG: preheader.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %i6 = phi i64 [ %i6.unr, %preheader.new ], [ %add.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %add.7 = add nuw nsw i64 %i6, 8
|
|
; PROLOG-NEXT: %i9.7 = icmp slt i64 %add.7, %sext
|
|
; PROLOG-NEXT: br i1 %i9.7, label %header, label %latchexit.unr-lcssa
|
|
; PROLOG: latchexit.unr-lcssa:
|
|
; PROLOG-NEXT: br label %latchexit
|
|
; PROLOG: latchexit:
|
|
; PROLOG-NEXT: unreachable
|
|
; PROLOG: loopexit2:
|
|
; PROLOG-NEXT: ret i32 %shft
|
|
; PROLOG: loopexit1.loopexit:
|
|
; PROLOG-NEXT: %sext3.ph = phi i32 [ %shft, %header ], [ %shft, %latch ], [ %shft, %latch.1 ], [ %shft, %latch.2 ], [ %shft, %latch.3 ], [ %shft, %latch.4 ], [ %shft, %latch.5 ], [ %shft, %latch.6 ]
|
|
; PROLOG-NEXT: br label %loopexit1
|
|
; PROLOG: loopexit1.loopexit1:
|
|
; PROLOG-NEXT: %sext3.ph2 = phi i32 [ %shft, %header.prol ]
|
|
; PROLOG-NEXT: br label %loopexit1
|
|
; PROLOG: loopexit1:
|
|
; PROLOG-NEXT: %sext3 = phi i32 [ %sext3.ph, %loopexit1.loopexit ], [ %sext3.ph2, %loopexit1.loopexit1 ]
|
|
; PROLOG-NEXT: ret i32 %sext3
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test7(
|
|
; PROLOG-BLOCK-NEXT: bb:
|
|
; PROLOG-BLOCK-NEXT: %i = icmp slt i32 undef, 2
|
|
; PROLOG-BLOCK-NEXT: %sext = sext i32 undef to i64
|
|
; PROLOG-BLOCK-NEXT: %shft = ashr exact i32 %arg, 16
|
|
; PROLOG-BLOCK-NEXT: br i1 %i, label %loopexit2, label %preheader
|
|
; PROLOG-BLOCK: preheader:
|
|
; PROLOG-BLOCK-NEXT: %0 = add nsw i64 %sext, -1
|
|
; PROLOG-BLOCK-NEXT: %1 = freeze i64 %0
|
|
; PROLOG-BLOCK-NEXT: %2 = add i64 %1, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loopexit1, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %i6.unr = phi i64 [ 1, %preheader ], [ 2, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i64 %2, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %latchexit, label %preheader.new
|
|
; PROLOG-BLOCK: preheader.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %i6 = phi i64 [ %i6.unr, %preheader.new ], [ %add.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loopexit1.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %loopexit1.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %add.1 = add nuw nsw i64 %i6, 2
|
|
; PROLOG-BLOCK-NEXT: %i9.1 = icmp slt i64 %add.1, %sext
|
|
; PROLOG-BLOCK-NEXT: br i1 %i9.1, label %header, label %latchexit.unr-lcssa, !llvm.loop !11
|
|
; PROLOG-BLOCK: latchexit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %latchexit
|
|
; PROLOG-BLOCK: latchexit:
|
|
; PROLOG-BLOCK-NEXT: unreachable
|
|
; PROLOG-BLOCK: loopexit2:
|
|
; PROLOG-BLOCK-NEXT: ret i32 %shft
|
|
; PROLOG-BLOCK: loopexit1.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %sext3.ph = phi i32 [ %shft, %header ], [ %shft, %latch ]
|
|
; PROLOG-BLOCK-NEXT: br label %loopexit1
|
|
; PROLOG-BLOCK: loopexit1:
|
|
; PROLOG-BLOCK-NEXT: %sext3 = phi i32 [ %shft, %header.prol ], [ %sext3.ph, %loopexit1.loopexit ]
|
|
; PROLOG-BLOCK-NEXT: ret i32 %sext3
|
|
;
|
|
bb:
|
|
%i = icmp slt i32 undef, 2
|
|
%sext = sext i32 undef to i64
|
|
%shft = ashr exact i32 %arg, 16
|
|
br i1 %i, label %loopexit2, label %preheader
|
|
|
|
preheader: ; preds = %bb2
|
|
br label %header
|
|
|
|
header: ; preds = %latch, %preheader
|
|
%i6 = phi i64 [ 1, %preheader ], [ %add, %latch ]
|
|
br i1 false, label %loopexit1, label %latch
|
|
|
|
latch: ; preds = %header
|
|
%add = add nuw nsw i64 %i6, 1
|
|
%i9 = icmp slt i64 %add, %sext
|
|
br i1 %i9, label %header, label %latchexit
|
|
|
|
latchexit: ; preds = %latch
|
|
unreachable
|
|
|
|
loopexit2: ; preds = %bb2
|
|
ret i32 %shft
|
|
|
|
loopexit1: ; preds = %header
|
|
%sext3 = phi i32 [ %shft, %header ]
|
|
ret i32 %sext3
|
|
}
|
|
|
|
; Nested loop and inner loop is unrolled. The tricky bit here is that
|
|
; several blocks in the inner loop fall out of the outer block when we
|
|
; use the epilogue block remainder strategy.
|
|
define void @test8() {
|
|
; EPILOG-LABEL: @test8(
|
|
; EPILOG-NEXT: bb:
|
|
; EPILOG-NEXT: br label %outerloop
|
|
; EPILOG: outerloop.loopexit.loopexit:
|
|
; EPILOG-NEXT: br label %outerloop.loopexit
|
|
; EPILOG: outerloop.loopexit.loopexit2:
|
|
; EPILOG-NEXT: br label %outerloop.loopexit
|
|
; EPILOG: outerloop.loopexit:
|
|
; EPILOG-NEXT: br label %outerloop
|
|
; EPILOG: outerloop:
|
|
; EPILOG-NEXT: %i = phi i64 [ 3, %bb ], [ 0, %outerloop.loopexit ]
|
|
; EPILOG-NEXT: %0 = sub i64 100, %i
|
|
; EPILOG-NEXT: %1 = sub i64 99, %i
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %innerH.epil.preheader, label %outerloop.new
|
|
; EPILOG: outerloop.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %innerH
|
|
; EPILOG: innerH:
|
|
; EPILOG-NEXT: %i3 = phi i64 [ %i, %outerloop.new ], [ %i4.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %outerloop.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.1
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.2
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.3
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.4
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.5
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.6
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: %i4.7 = add nuw nsw i64 %i3, 8
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.7
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %niter.next.7 = add nuw nsw i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %innerH, label %exit.unr-lcssa
|
|
; EPILOG: exit.unr-lcssa:
|
|
; EPILOG-NEXT: %i3.unr = phi i64 [ %i4.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %innerH.epil.preheader, label %exit.loopexit
|
|
; EPILOG: innerH.epil.preheader:
|
|
; EPILOG-NEXT: %i3.epil.init = phi i64 [ %i, %outerloop ], [ %i3.unr, %exit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %innerH.epil
|
|
; EPILOG: innerH.epil:
|
|
; EPILOG-NEXT: %i3.epil = phi i64 [ %i4.epil, %latch.epil ], [ %i3.epil.init, %innerH.epil.preheader ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %innerH.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: %i4.epil = add nuw nsw i64 %i3.epil, 1
|
|
; EPILOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit2, label %latch.epil
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %i6.epil = icmp ult i64 %i4.epil, 100
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %innerH.epil, label %exit.epilog-lcssa, !llvm.loop !12
|
|
; EPILOG: exit.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit
|
|
; EPILOG: exit.loopexit:
|
|
; EPILOG-NEXT: br label %exit
|
|
; EPILOG: exit:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test8(
|
|
; EPILOG-BLOCK-NEXT: bb:
|
|
; EPILOG-BLOCK-NEXT: br label %outerloop
|
|
; EPILOG-BLOCK: outerloop.loopexit.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %outerloop.loopexit
|
|
; EPILOG-BLOCK: outerloop.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %innerH.epil.preheader.1, label %outerloop.new.1
|
|
; EPILOG-BLOCK: outerloop.new.1:
|
|
; EPILOG-BLOCK-NEXT: br label %innerH.1
|
|
; EPILOG-BLOCK: innerH.1:
|
|
; EPILOG-BLOCK-NEXT: %i3.1 = phi i64 [ 0, %outerloop.new.1 ], [ %i4.1.1, %latch.1.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter.1 = phi i64 [ 0, %outerloop.new.1 ], [ %niter.next.1.1, %latch.1.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit.1, label %latch.13
|
|
; EPILOG-BLOCK: latch.13:
|
|
; EPILOG-BLOCK-NEXT: %i4.1.1 = add nuw nsw i64 %i3.1, 2
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit.1, label %latch.1.1
|
|
; EPILOG-BLOCK: latch.1.1:
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1.1 = add i64 %niter.1, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1.1 = icmp ne i64 %niter.next.1.1, 100
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1.1, label %innerH.1, label %exit.unr-lcssa.1, !llvm.loop !12
|
|
; EPILOG-BLOCK: exit.unr-lcssa.1:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %innerH.epil.preheader.1, label %exit.loopexit
|
|
; EPILOG-BLOCK: outerloop.loopexit.loopexit.1:
|
|
; EPILOG-BLOCK-NEXT: br label %outerloop.loopexit.1
|
|
; EPILOG-BLOCK: innerH.epil.preheader.1:
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 false)
|
|
; EPILOG-BLOCK-NEXT: br label %innerH.epil.1
|
|
; EPILOG-BLOCK: innerH.epil.1:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.1, label %latch.epil
|
|
; EPILOG-BLOCK: outerloop.loopexit.1:
|
|
; EPILOG-BLOCK-NEXT: br label %outerloop, !llvm.loop !13
|
|
; EPILOG-BLOCK: outerloop:
|
|
; EPILOG-BLOCK-NEXT: %i = phi i64 [ 3, %bb ], [ 0, %outerloop.loopexit.1 ]
|
|
; EPILOG-BLOCK-NEXT: %0 = sub i64 100, %i
|
|
; EPILOG-BLOCK-NEXT: %1 = sub i64 99, %i
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %innerH.epil.preheader, label %outerloop.new
|
|
; EPILOG-BLOCK: outerloop.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %innerH
|
|
; EPILOG-BLOCK: innerH:
|
|
; EPILOG-BLOCK-NEXT: %i3 = phi i64 [ %i, %outerloop.new ], [ %i4.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %outerloop.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: %i4.1 = add nuw nsw i64 %i3, 2
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.1
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %innerH, label %exit.unr-lcssa, !llvm.loop !12
|
|
; EPILOG-BLOCK: exit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %innerH.epil.preheader, label %exit.loopexit
|
|
; EPILOG-BLOCK: innerH.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %innerH.epil
|
|
; EPILOG-BLOCK: innerH.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit, label %latch.epil
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit
|
|
; EPILOG-BLOCK: exit.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit
|
|
; EPILOG-BLOCK: exit:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test8(
|
|
; PROLOG-NEXT: bb:
|
|
; PROLOG-NEXT: br label %outerloop
|
|
; PROLOG: outerloop.loopexit.loopexit:
|
|
; PROLOG-NEXT: br label %outerloop.loopexit
|
|
; PROLOG: outerloop.loopexit.loopexit1:
|
|
; PROLOG-NEXT: br label %outerloop.loopexit
|
|
; PROLOG: outerloop.loopexit:
|
|
; PROLOG-NEXT: br label %outerloop
|
|
; PROLOG: outerloop:
|
|
; PROLOG-NEXT: %i = phi i64 [ 3, %bb ], [ 0, %outerloop.loopexit ]
|
|
; PROLOG-NEXT: %0 = sub i64 100, %i
|
|
; PROLOG-NEXT: %1 = sub i64 99, %i
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %innerH.prol.preheader, label %innerH.prol.loopexit
|
|
; PROLOG: innerH.prol.preheader:
|
|
; PROLOG-NEXT: br label %innerH.prol
|
|
; PROLOG: innerH.prol:
|
|
; PROLOG-NEXT: %i3.prol = phi i64 [ %i4.prol, %latch.prol ], [ %i, %innerH.prol.preheader ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %innerH.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: %i4.prol = add nuw nsw i64 %i3.prol, 1
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit1, label %latch.prol
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %i6.prol = icmp ult i64 %i4.prol, 100
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %innerH.prol, label %innerH.prol.loopexit.unr-lcssa, !llvm.loop !12
|
|
; PROLOG: innerH.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %i3.unr.ph = phi i64 [ %i4.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %innerH.prol.loopexit
|
|
; PROLOG: innerH.prol.loopexit:
|
|
; PROLOG-NEXT: %i3.unr = phi i64 [ %i, %outerloop ], [ %i3.unr.ph, %innerH.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit.loopexit, label %outerloop.new
|
|
; PROLOG: outerloop.new:
|
|
; PROLOG-NEXT: br label %innerH
|
|
; PROLOG: innerH:
|
|
; PROLOG-NEXT: %i3 = phi i64 [ %i3.unr, %outerloop.new ], [ %i4.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.1
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.2
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.3
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.4
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.5
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.6
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %i4.7 = add nuw nsw i64 %i3, 8
|
|
; PROLOG-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.7
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %i6.7 = icmp ult i64 %i4.7, 100
|
|
; PROLOG-NEXT: br i1 %i6.7, label %innerH, label %exit.unr-lcssa
|
|
; PROLOG: exit.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit
|
|
; PROLOG: exit.loopexit:
|
|
; PROLOG-NEXT: br label %exit
|
|
; PROLOG: exit:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test8(
|
|
; PROLOG-BLOCK-NEXT: bb:
|
|
; PROLOG-BLOCK-NEXT: br label %outerloop
|
|
; PROLOG-BLOCK: outerloop.loopexit.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %outerloop.loopexit
|
|
; PROLOG-BLOCK: outerloop.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %innerH.prol.preheader.1, label %innerH.prol.loopexit.1
|
|
; PROLOG-BLOCK: innerH.prol.preheader.1:
|
|
; PROLOG-BLOCK-NEXT: br label %innerH.prol.1
|
|
; PROLOG-BLOCK: innerH.prol.1:
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.1, label %latch.prol.1
|
|
; PROLOG-BLOCK: latch.prol.1:
|
|
; PROLOG-BLOCK-NEXT: br label %innerH.prol.loopexit.1
|
|
; PROLOG-BLOCK: innerH.prol.loopexit.1:
|
|
; PROLOG-BLOCK-NEXT: %i3.unr.1 = phi i64 [ 0, %outerloop.loopexit ], [ 1, %latch.prol.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %exit.loopexit, label %outerloop.new.1
|
|
; PROLOG-BLOCK: outerloop.new.1:
|
|
; PROLOG-BLOCK-NEXT: br label %innerH.1
|
|
; PROLOG-BLOCK: innerH.1:
|
|
; PROLOG-BLOCK-NEXT: %i3.1 = phi i64 [ %i3.unr.1, %outerloop.new.1 ], [ %i4.1.1, %latch.1.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit.1, label %latch.11
|
|
; PROLOG-BLOCK: latch.11:
|
|
; PROLOG-BLOCK-NEXT: %i4.1.1 = add nuw nsw i64 %i3.1, 2
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit.1, label %latch.1.1
|
|
; PROLOG-BLOCK: latch.1.1:
|
|
; PROLOG-BLOCK-NEXT: %i6.1.1 = icmp ult i64 %i4.1.1, 100
|
|
; PROLOG-BLOCK-NEXT: br i1 %i6.1.1, label %innerH.1, label %exit.unr-lcssa.loopexit2, !llvm.loop !12
|
|
; PROLOG-BLOCK: outerloop.loopexit.loopexit.1:
|
|
; PROLOG-BLOCK-NEXT: br label %outerloop.loopexit.1
|
|
; PROLOG-BLOCK: outerloop.loopexit.1:
|
|
; PROLOG-BLOCK-NEXT: br label %outerloop, !llvm.loop !13
|
|
; PROLOG-BLOCK: outerloop:
|
|
; PROLOG-BLOCK-NEXT: %i = phi i64 [ 3, %bb ], [ 0, %outerloop.loopexit.1 ]
|
|
; PROLOG-BLOCK-NEXT: %0 = sub i64 100, %i
|
|
; PROLOG-BLOCK-NEXT: %1 = sub i64 99, %i
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %innerH.prol.preheader, label %innerH.prol.loopexit
|
|
; PROLOG-BLOCK: innerH.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %innerH.prol
|
|
; PROLOG-BLOCK: innerH.prol:
|
|
; PROLOG-BLOCK-NEXT: %i4.prol = add nuw nsw i64 %i, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit, label %latch.prol
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %innerH.prol.loopexit
|
|
; PROLOG-BLOCK: innerH.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %i3.unr = phi i64 [ %i, %outerloop ], [ %i4.prol, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit.loopexit, label %outerloop.new
|
|
; PROLOG-BLOCK: outerloop.new:
|
|
; PROLOG-BLOCK-NEXT: br label %innerH
|
|
; PROLOG-BLOCK: innerH:
|
|
; PROLOG-BLOCK-NEXT: %i3 = phi i64 [ %i3.unr, %outerloop.new ], [ %i4.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %i4.1 = add nuw nsw i64 %i3, 2
|
|
; PROLOG-BLOCK-NEXT: br i1 false, label %outerloop.loopexit.loopexit, label %latch.1
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %i6.1 = icmp ult i64 %i4.1, 100
|
|
; PROLOG-BLOCK-NEXT: br i1 %i6.1, label %innerH, label %exit.unr-lcssa.loopexit, !llvm.loop !12
|
|
; PROLOG-BLOCK: exit.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit.unr-lcssa
|
|
; PROLOG-BLOCK: exit.unr-lcssa.loopexit2:
|
|
; PROLOG-BLOCK-NEXT: br label %exit.unr-lcssa
|
|
; PROLOG-BLOCK: exit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit
|
|
; PROLOG-BLOCK: exit.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit
|
|
; PROLOG-BLOCK: exit:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
|
|
bb:
|
|
br label %outerloop
|
|
|
|
outerloop: ; preds = %innerH, %bb
|
|
%i = phi i64 [ 3, %bb ], [ 0, %innerH ]
|
|
br label %innerH
|
|
|
|
innerH: ; preds = %latch, %outerloop
|
|
%i3 = phi i64 [ %i4, %latch ], [ %i, %outerloop ]
|
|
%i4 = add nuw nsw i64 %i3, 1
|
|
br i1 false, label %outerloop, label %latch
|
|
|
|
latch: ; preds = %innerH
|
|
%i6 = icmp ult i64 %i4, 100
|
|
br i1 %i6, label %innerH, label %exit
|
|
|
|
exit: ; preds = %latch
|
|
ret void
|
|
}
|
|
|
|
declare ptr addrspace(1) @foo(i32)
|
|
; inner loop prolog unrolled
|
|
; a value from outer loop is used in exit block of inner loop.
|
|
; Don't create VMap entries for such values (%trip).
|
|
define ptr addrspace(1) @test9(ptr nocapture readonly %arg, i32 %n) {
|
|
; EPILOG-LABEL: @test9(
|
|
; EPILOG-NEXT: bb:
|
|
; EPILOG-NEXT: %0 = add i32 %n, -1
|
|
; EPILOG-NEXT: br label %outerloopHdr
|
|
; EPILOG: outerloopHdr:
|
|
; EPILOG-NEXT: %trip = add i32 %n, -1
|
|
; EPILOG-NEXT: %outercnd = icmp slt i32 0, %trip
|
|
; EPILOG-NEXT: br i1 %outercnd, label %preheader, label %outerLatch
|
|
; EPILOG: preheader:
|
|
; EPILOG-NEXT: %i4 = zext i32 0 to i64
|
|
; EPILOG-NEXT: %1 = freeze i32 %0
|
|
; EPILOG-NEXT: %2 = add i32 %1, -1
|
|
; EPILOG-NEXT: %xtraiter = and i32 %1, 7
|
|
; EPILOG-NEXT: %3 = icmp ult i32 %2, 7
|
|
; EPILOG-NEXT: br i1 %3, label %header.epil.preheader, label %preheader.new
|
|
; EPILOG: preheader.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i32 %1, %xtraiter
|
|
; EPILOG-NEXT: br label %header
|
|
; EPILOG: header:
|
|
; EPILOG-NEXT: %phi = phi i64 [ %i4, %preheader.new ], [ %iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i32 [ 0, %preheader.new ], [ %niter.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: br i1 true, label %latch, label %innerexit.loopexit
|
|
; EPILOG: innerexit.loopexit:
|
|
; EPILOG-NEXT: %trip.lcssa.ph = phi i32 [ %trip, %header ], [ %trip, %latch ], [ %trip, %latch.1 ], [ %trip, %latch.2 ], [ %trip, %latch.3 ], [ %trip, %latch.4 ], [ %trip, %latch.5 ], [ %trip, %latch.6 ]
|
|
; EPILOG-NEXT: br label %innerexit
|
|
; EPILOG: innerexit.loopexit2:
|
|
; EPILOG-NEXT: %trip.lcssa.ph3 = phi i32 [ %trip, %header.epil ]
|
|
; EPILOG-NEXT: br label %innerexit
|
|
; EPILOG: innerexit:
|
|
; EPILOG-NEXT: %trip.lcssa = phi i32 [ %trip.lcssa.ph, %innerexit.loopexit ], [ %trip.lcssa.ph3, %innerexit.loopexit2 ]
|
|
; EPILOG-NEXT: %i9 = call ptr addrspace(1) @foo(i32 %trip.lcssa)
|
|
; EPILOG-NEXT: ret ptr addrspace(1) %i9
|
|
; EPILOG: latch:
|
|
; EPILOG-NEXT: br i1 true, label %latch.1, label %innerexit.loopexit
|
|
; EPILOG: latch.1:
|
|
; EPILOG-NEXT: br i1 true, label %latch.2, label %innerexit.loopexit
|
|
; EPILOG: latch.2:
|
|
; EPILOG-NEXT: br i1 true, label %latch.3, label %innerexit.loopexit
|
|
; EPILOG: latch.3:
|
|
; EPILOG-NEXT: br i1 true, label %latch.4, label %innerexit.loopexit
|
|
; EPILOG: latch.4:
|
|
; EPILOG-NEXT: br i1 true, label %latch.5, label %innerexit.loopexit
|
|
; EPILOG: latch.5:
|
|
; EPILOG-NEXT: br i1 true, label %latch.6, label %innerexit.loopexit
|
|
; EPILOG: latch.6:
|
|
; EPILOG-NEXT: br i1 true, label %latch.7, label %innerexit.loopexit
|
|
; EPILOG: latch.7:
|
|
; EPILOG-NEXT: %iv.next.7 = add nuw nsw i64 %phi, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i32 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i32 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %header, label %outerLatch.loopexit.unr-lcssa
|
|
; EPILOG: outerLatch.loopexit.unr-lcssa:
|
|
; EPILOG-NEXT: %phi.unr = phi i64 [ %iv.next.7, %latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %outerLatch.loopexit
|
|
; EPILOG: header.epil.preheader:
|
|
; EPILOG-NEXT: %phi.epil.init = phi i64 [ %i4, %preheader ], [ %phi.unr, %outerLatch.loopexit.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %header.epil
|
|
; EPILOG: header.epil:
|
|
; EPILOG-NEXT: %phi.epil = phi i64 [ %phi.epil.init, %header.epil.preheader ], [ %iv.next.epil, %latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i32 [ 0, %header.epil.preheader ], [ %epil.iter.next, %latch.epil ]
|
|
; EPILOG-NEXT: %i7.epil = trunc i64 %phi.epil to i32
|
|
; EPILOG-NEXT: br i1 true, label %latch.epil, label %innerexit.loopexit2
|
|
; EPILOG: latch.epil:
|
|
; EPILOG-NEXT: %i11.epil = add nsw i32 %i7.epil, 1
|
|
; EPILOG-NEXT: %innercnd.epil = icmp slt i32 %i11.epil, %trip
|
|
; EPILOG-NEXT: %iv.next.epil = add nuw nsw i64 %phi.epil, 1
|
|
; EPILOG-NEXT: %epil.iter.next = add i32 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i32 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %header.epil, label %outerLatch.loopexit.epilog-lcssa, !llvm.loop !13
|
|
; EPILOG: outerLatch.loopexit.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %outerLatch.loopexit
|
|
; EPILOG: outerLatch.loopexit:
|
|
; EPILOG-NEXT: br label %outerLatch
|
|
; EPILOG: outerLatch:
|
|
; EPILOG-NEXT: br label %outerloopHdr
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test9(
|
|
; EPILOG-BLOCK-NEXT: bb:
|
|
; EPILOG-BLOCK-NEXT: %0 = add i32 %n, -1
|
|
; EPILOG-BLOCK-NEXT: br label %outerloopHdr
|
|
; EPILOG-BLOCK: outerloopHdr:
|
|
; EPILOG-BLOCK-NEXT: %trip = add i32 %n, -1
|
|
; EPILOG-BLOCK-NEXT: %outercnd = icmp slt i32 0, %trip
|
|
; EPILOG-BLOCK-NEXT: br i1 %outercnd, label %preheader, label %outerLatch
|
|
; EPILOG-BLOCK: preheader:
|
|
; EPILOG-BLOCK-NEXT: %1 = freeze i32 %0
|
|
; EPILOG-BLOCK-NEXT: %2 = add i32 %1, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i32 %1, 1
|
|
; EPILOG-BLOCK-NEXT: %3 = icmp ult i32 %2, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %3, label %header.epil.preheader, label %preheader.new
|
|
; EPILOG-BLOCK: preheader.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i32 %1, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %header
|
|
; EPILOG-BLOCK: header:
|
|
; EPILOG-BLOCK-NEXT: %phi = phi i64 [ 0, %preheader.new ], [ %iv.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i32 [ 0, %preheader.new ], [ %niter.next.1, %latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 true, label %latch, label %innerexit.loopexit.loopexit
|
|
; EPILOG-BLOCK: innerexit.loopexit.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %trip.lcssa.ph.ph = phi i32 [ %trip, %latch ], [ %trip, %header ]
|
|
; EPILOG-BLOCK-NEXT: br label %innerexit.loopexit
|
|
; EPILOG-BLOCK: innerexit.loopexit.loopexit5:
|
|
; EPILOG-BLOCK-NEXT: %trip.lcssa.ph.ph6 = phi i32 [ %trip.1, %latch.14 ], [ %trip.1, %header.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %innerexit.loopexit
|
|
; EPILOG-BLOCK: innerexit.loopexit:
|
|
; EPILOG-BLOCK-NEXT: %trip.lcssa.ph = phi i32 [ %trip.lcssa.ph.ph, %innerexit.loopexit.loopexit ], [ %trip.lcssa.ph.ph6, %innerexit.loopexit.loopexit5 ]
|
|
; EPILOG-BLOCK-NEXT: br label %innerexit
|
|
; EPILOG-BLOCK: innerexit.loopexit2:
|
|
; EPILOG-BLOCK-NEXT: %trip.lcssa.ph3 = phi i32 [ %trip, %header.epil ], [ %trip.1, %header.epil.1 ]
|
|
; EPILOG-BLOCK-NEXT: br label %innerexit
|
|
; EPILOG-BLOCK: innerexit:
|
|
; EPILOG-BLOCK-NEXT: %trip.lcssa = phi i32 [ %trip.lcssa.ph, %innerexit.loopexit ], [ %trip.lcssa.ph3, %innerexit.loopexit2 ]
|
|
; EPILOG-BLOCK-NEXT: %i9 = call ptr addrspace(1) @foo(i32 %trip.lcssa)
|
|
; EPILOG-BLOCK-NEXT: ret ptr addrspace(1) %i9
|
|
; EPILOG-BLOCK: latch:
|
|
; EPILOG-BLOCK-NEXT: br i1 true, label %latch.1, label %innerexit.loopexit.loopexit
|
|
; EPILOG-BLOCK: latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv.next.1 = add nuw nsw i64 %phi, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i32 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i32 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %header, label %outerLatch.loopexit.unr-lcssa, !llvm.loop !14
|
|
; EPILOG-BLOCK: outerLatch.loopexit.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.epil.preheader, label %outerLatch.loopexit
|
|
; EPILOG-BLOCK: header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i32 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil
|
|
; EPILOG-BLOCK: header.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 true, label %latch.epil, label %innerexit.loopexit2
|
|
; EPILOG-BLOCK: latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %outerLatch.loopexit
|
|
; EPILOG-BLOCK: outerLatch.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %outerLatch
|
|
; EPILOG-BLOCK: outerLatch:
|
|
; EPILOG-BLOCK-NEXT: %trip.1 = add i32 %n, -1
|
|
; EPILOG-BLOCK-NEXT: %outercnd.1 = icmp slt i32 0, %trip.1
|
|
; EPILOG-BLOCK-NEXT: br i1 %outercnd.1, label %preheader.1, label %outerLatch.1
|
|
; EPILOG-BLOCK: preheader.1:
|
|
; EPILOG-BLOCK-NEXT: %4 = freeze i32 %0
|
|
; EPILOG-BLOCK-NEXT: %5 = add i32 %4, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter.1 = and i32 %4, 1
|
|
; EPILOG-BLOCK-NEXT: %6 = icmp ult i32 %5, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %6, label %header.epil.preheader.1, label %preheader.new.1
|
|
; EPILOG-BLOCK: preheader.new.1:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter.1 = sub i32 %4, %xtraiter.1
|
|
; EPILOG-BLOCK-NEXT: br label %header.1
|
|
; EPILOG-BLOCK: header.1:
|
|
; EPILOG-BLOCK-NEXT: %phi.1 = phi i64 [ 0, %preheader.new.1 ], [ %iv.next.1.1, %latch.1.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter.1 = phi i32 [ 0, %preheader.new.1 ], [ %niter.next.1.1, %latch.1.1 ]
|
|
; EPILOG-BLOCK-NEXT: br i1 true, label %latch.14, label %innerexit.loopexit.loopexit5
|
|
; EPILOG-BLOCK: latch.14:
|
|
; EPILOG-BLOCK-NEXT: br i1 true, label %latch.1.1, label %innerexit.loopexit.loopexit5
|
|
; EPILOG-BLOCK: latch.1.1:
|
|
; EPILOG-BLOCK-NEXT: %iv.next.1.1 = add nuw nsw i64 %phi.1, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1.1 = add i32 %niter.1, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1.1 = icmp ne i32 %niter.next.1.1, %unroll_iter.1
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1.1, label %header.1, label %outerLatch.loopexit.unr-lcssa.1, !llvm.loop !14
|
|
; EPILOG-BLOCK: outerLatch.loopexit.unr-lcssa.1:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod.1 = icmp ne i32 %xtraiter.1, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod.1, label %header.epil.preheader.1, label %outerLatch.loopexit.1
|
|
; EPILOG-BLOCK: header.epil.preheader.1:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1.1 = icmp ne i32 %xtraiter.1, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1.1)
|
|
; EPILOG-BLOCK-NEXT: br label %header.epil.1
|
|
; EPILOG-BLOCK: header.epil.1:
|
|
; EPILOG-BLOCK-NEXT: br i1 true, label %latch.epil.1, label %innerexit.loopexit2
|
|
; EPILOG-BLOCK: latch.epil.1:
|
|
; EPILOG-BLOCK-NEXT: br label %outerLatch.loopexit.1
|
|
; EPILOG-BLOCK: outerLatch.loopexit.1:
|
|
; EPILOG-BLOCK-NEXT: br label %outerLatch.1
|
|
; EPILOG-BLOCK: outerLatch.1:
|
|
; EPILOG-BLOCK-NEXT: br label %outerloopHdr, !llvm.loop !15
|
|
;
|
|
; PROLOG-LABEL: @test9(
|
|
; PROLOG-NEXT: bb:
|
|
; PROLOG-NEXT: %0 = add i32 %n, -1
|
|
; PROLOG-NEXT: br label %outerloopHdr
|
|
; PROLOG: outerloopHdr:
|
|
; PROLOG-NEXT: %trip = add i32 %n, -1
|
|
; PROLOG-NEXT: %outercnd = icmp slt i32 0, %trip
|
|
; PROLOG-NEXT: br i1 %outercnd, label %preheader, label %outerLatch
|
|
; PROLOG: preheader:
|
|
; PROLOG-NEXT: %i4 = zext i32 0 to i64
|
|
; PROLOG-NEXT: %1 = freeze i32 %0
|
|
; PROLOG-NEXT: %2 = add i32 %1, -1
|
|
; PROLOG-NEXT: %xtraiter = and i32 %1, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG: header.prol.preheader:
|
|
; PROLOG-NEXT: br label %header.prol
|
|
; PROLOG: header.prol:
|
|
; PROLOG-NEXT: %phi.prol = phi i64 [ %i4, %header.prol.preheader ], [ %iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i32 [ 0, %header.prol.preheader ], [ %prol.iter.next, %latch.prol ]
|
|
; PROLOG-NEXT: %i7.prol = trunc i64 %phi.prol to i32
|
|
; PROLOG-NEXT: br i1 true, label %latch.prol, label %innerexit.loopexit1
|
|
; PROLOG: latch.prol:
|
|
; PROLOG-NEXT: %i11.prol = add nsw i32 %i7.prol, 1
|
|
; PROLOG-NEXT: %innercnd.prol = icmp slt i32 %i11.prol, %trip
|
|
; PROLOG-NEXT: %iv.next.prol = add nuw nsw i64 %phi.prol, 1
|
|
; PROLOG-NEXT: %prol.iter.next = add i32 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i32 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %header.prol, label %header.prol.loopexit.unr-lcssa, !llvm.loop !13
|
|
; PROLOG: header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %phi.unr.ph = phi i64 [ %iv.next.prol, %latch.prol ]
|
|
; PROLOG-NEXT: br label %header.prol.loopexit
|
|
; PROLOG: header.prol.loopexit:
|
|
; PROLOG-NEXT: %phi.unr = phi i64 [ %i4, %preheader ], [ %phi.unr.ph, %header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %3 = icmp ult i32 %2, 7
|
|
; PROLOG-NEXT: br i1 %3, label %outerLatch.loopexit, label %preheader.new
|
|
; PROLOG: preheader.new:
|
|
; PROLOG-NEXT: br label %header
|
|
; PROLOG: header:
|
|
; PROLOG-NEXT: %phi = phi i64 [ %phi.unr, %preheader.new ], [ %iv.next.7, %latch.7 ]
|
|
; PROLOG-NEXT: br i1 true, label %latch, label %innerexit.loopexit
|
|
; PROLOG: innerexit.loopexit:
|
|
; PROLOG-NEXT: %trip.lcssa.ph = phi i32 [ %trip, %header ], [ %trip, %latch ], [ %trip, %latch.1 ], [ %trip, %latch.2 ], [ %trip, %latch.3 ], [ %trip, %latch.4 ], [ %trip, %latch.5 ], [ %trip, %latch.6 ]
|
|
; PROLOG-NEXT: br label %innerexit
|
|
; PROLOG: innerexit.loopexit1:
|
|
; PROLOG-NEXT: %trip.lcssa.ph2 = phi i32 [ %trip, %header.prol ]
|
|
; PROLOG-NEXT: br label %innerexit
|
|
; PROLOG: innerexit:
|
|
; PROLOG-NEXT: %trip.lcssa = phi i32 [ %trip.lcssa.ph, %innerexit.loopexit ], [ %trip.lcssa.ph2, %innerexit.loopexit1 ]
|
|
; PROLOG-NEXT: %i9 = call ptr addrspace(1) @foo(i32 %trip.lcssa)
|
|
; PROLOG-NEXT: ret ptr addrspace(1) %i9
|
|
; PROLOG: latch:
|
|
; PROLOG-NEXT: br i1 true, label %latch.1, label %innerexit.loopexit
|
|
; PROLOG: latch.1:
|
|
; PROLOG-NEXT: br i1 true, label %latch.2, label %innerexit.loopexit
|
|
; PROLOG: latch.2:
|
|
; PROLOG-NEXT: br i1 true, label %latch.3, label %innerexit.loopexit
|
|
; PROLOG: latch.3:
|
|
; PROLOG-NEXT: br i1 true, label %latch.4, label %innerexit.loopexit
|
|
; PROLOG: latch.4:
|
|
; PROLOG-NEXT: br i1 true, label %latch.5, label %innerexit.loopexit
|
|
; PROLOG: latch.5:
|
|
; PROLOG-NEXT: br i1 true, label %latch.6, label %innerexit.loopexit
|
|
; PROLOG: latch.6:
|
|
; PROLOG-NEXT: %iv.next.6 = add nuw nsw i64 %phi, 7
|
|
; PROLOG-NEXT: %i7.7 = trunc i64 %iv.next.6 to i32
|
|
; PROLOG-NEXT: br i1 true, label %latch.7, label %innerexit.loopexit
|
|
; PROLOG: latch.7:
|
|
; PROLOG-NEXT: %i11.7 = add nsw i32 %i7.7, 1
|
|
; PROLOG-NEXT: %innercnd.7 = icmp slt i32 %i11.7, %trip
|
|
; PROLOG-NEXT: %iv.next.7 = add nuw nsw i64 %phi, 8
|
|
; PROLOG-NEXT: br i1 %innercnd.7, label %header, label %outerLatch.loopexit.unr-lcssa
|
|
; PROLOG: outerLatch.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: br label %outerLatch.loopexit
|
|
; PROLOG: outerLatch.loopexit:
|
|
; PROLOG-NEXT: br label %outerLatch
|
|
; PROLOG: outerLatch:
|
|
; PROLOG-NEXT: br label %outerloopHdr
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test9(
|
|
; PROLOG-BLOCK-NEXT: bb:
|
|
; PROLOG-BLOCK-NEXT: %0 = add i32 %n, -1
|
|
; PROLOG-BLOCK-NEXT: br label %outerloopHdr
|
|
; PROLOG-BLOCK: outerloopHdr:
|
|
; PROLOG-BLOCK-NEXT: %trip = add i32 %n, -1
|
|
; PROLOG-BLOCK-NEXT: %outercnd = icmp slt i32 0, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %outercnd, label %preheader, label %outerLatch
|
|
; PROLOG-BLOCK: preheader:
|
|
; PROLOG-BLOCK-NEXT: %1 = freeze i32 %0
|
|
; PROLOG-BLOCK-NEXT: %2 = add i32 %1, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i32 %1, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i32 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %header.prol.preheader, label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol
|
|
; PROLOG-BLOCK: header.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 true, label %latch.prol, label %innerexit.loopexit1
|
|
; PROLOG-BLOCK: latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit
|
|
; PROLOG-BLOCK: header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %phi.unr = phi i64 [ 0, %preheader ], [ 1, %latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %3 = icmp ult i32 %2, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %3, label %outerLatch.loopexit, label %preheader.new
|
|
; PROLOG-BLOCK: preheader.new:
|
|
; PROLOG-BLOCK-NEXT: br label %header
|
|
; PROLOG-BLOCK: header:
|
|
; PROLOG-BLOCK-NEXT: %phi = phi i64 [ %phi.unr, %preheader.new ], [ %iv.next.1, %latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 true, label %latch, label %innerexit.loopexit.loopexit
|
|
; PROLOG-BLOCK: innerexit.loopexit.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %trip.lcssa.ph.ph = phi i32 [ %trip, %latch ], [ %trip, %header ]
|
|
; PROLOG-BLOCK-NEXT: br label %innerexit.loopexit
|
|
; PROLOG-BLOCK: innerexit.loopexit.loopexit5:
|
|
; PROLOG-BLOCK-NEXT: %trip.lcssa.ph.ph6 = phi i32 [ %trip.1, %latch.14 ], [ %trip.1, %header.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %innerexit.loopexit
|
|
; PROLOG-BLOCK: innerexit.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %trip.lcssa.ph = phi i32 [ %trip.lcssa.ph.ph, %innerexit.loopexit.loopexit ], [ %trip.lcssa.ph.ph6, %innerexit.loopexit.loopexit5 ]
|
|
; PROLOG-BLOCK-NEXT: br label %innerexit
|
|
; PROLOG-BLOCK: innerexit.loopexit1:
|
|
; PROLOG-BLOCK-NEXT: %trip.lcssa.ph2 = phi i32 [ %trip, %header.prol ], [ %trip.1, %header.prol.1 ]
|
|
; PROLOG-BLOCK-NEXT: br label %innerexit
|
|
; PROLOG-BLOCK: innerexit:
|
|
; PROLOG-BLOCK-NEXT: %trip.lcssa = phi i32 [ %trip.lcssa.ph, %innerexit.loopexit ], [ %trip.lcssa.ph2, %innerexit.loopexit1 ]
|
|
; PROLOG-BLOCK-NEXT: %i9 = call ptr addrspace(1) @foo(i32 %trip.lcssa)
|
|
; PROLOG-BLOCK-NEXT: ret ptr addrspace(1) %i9
|
|
; PROLOG-BLOCK: latch:
|
|
; PROLOG-BLOCK-NEXT: %iv.next = add nuw nsw i64 %phi, 1
|
|
; PROLOG-BLOCK-NEXT: %i7.1 = trunc i64 %iv.next to i32
|
|
; PROLOG-BLOCK-NEXT: br i1 true, label %latch.1, label %innerexit.loopexit.loopexit
|
|
; PROLOG-BLOCK: latch.1:
|
|
; PROLOG-BLOCK-NEXT: %i11.1 = add nsw i32 %i7.1, 1
|
|
; PROLOG-BLOCK-NEXT: %innercnd.1 = icmp slt i32 %i11.1, %trip
|
|
; PROLOG-BLOCK-NEXT: %iv.next.1 = add nuw nsw i64 %phi, 2
|
|
; PROLOG-BLOCK-NEXT: br i1 %innercnd.1, label %header, label %outerLatch.loopexit.unr-lcssa, !llvm.loop !14
|
|
; PROLOG-BLOCK: outerLatch.loopexit.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %outerLatch.loopexit
|
|
; PROLOG-BLOCK: outerLatch.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %outerLatch
|
|
; PROLOG-BLOCK: outerLatch:
|
|
; PROLOG-BLOCK-NEXT: %trip.1 = add i32 %n, -1
|
|
; PROLOG-BLOCK-NEXT: %outercnd.1 = icmp slt i32 0, %trip.1
|
|
; PROLOG-BLOCK-NEXT: br i1 %outercnd.1, label %preheader.1, label %outerLatch.1
|
|
; PROLOG-BLOCK: preheader.1:
|
|
; PROLOG-BLOCK-NEXT: %4 = freeze i32 %0
|
|
; PROLOG-BLOCK-NEXT: %5 = add i32 %4, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter.1 = and i32 %4, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod.1 = icmp ne i32 %xtraiter.1, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod.1, label %header.prol.preheader.1, label %header.prol.loopexit.1
|
|
; PROLOG-BLOCK: header.prol.preheader.1:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.1
|
|
; PROLOG-BLOCK: header.prol.1:
|
|
; PROLOG-BLOCK-NEXT: br i1 true, label %latch.prol.1, label %innerexit.loopexit1
|
|
; PROLOG-BLOCK: latch.prol.1:
|
|
; PROLOG-BLOCK-NEXT: br label %header.prol.loopexit.1
|
|
; PROLOG-BLOCK: header.prol.loopexit.1:
|
|
; PROLOG-BLOCK-NEXT: %phi.unr.1 = phi i64 [ 0, %preheader.1 ], [ 1, %latch.prol.1 ]
|
|
; PROLOG-BLOCK-NEXT: %6 = icmp ult i32 %5, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %6, label %outerLatch.loopexit.1, label %preheader.new.1
|
|
; PROLOG-BLOCK: preheader.new.1:
|
|
; PROLOG-BLOCK-NEXT: br label %header.1
|
|
; PROLOG-BLOCK: header.1:
|
|
; PROLOG-BLOCK-NEXT: %phi.1 = phi i64 [ %phi.unr.1, %preheader.new.1 ], [ %iv.next.1.1, %latch.1.1 ]
|
|
; PROLOG-BLOCK-NEXT: br i1 true, label %latch.14, label %innerexit.loopexit.loopexit5
|
|
; PROLOG-BLOCK: latch.14:
|
|
; PROLOG-BLOCK-NEXT: %iv.next.13 = add nuw nsw i64 %phi.1, 1
|
|
; PROLOG-BLOCK-NEXT: %i7.1.1 = trunc i64 %iv.next.13 to i32
|
|
; PROLOG-BLOCK-NEXT: br i1 true, label %latch.1.1, label %innerexit.loopexit.loopexit5
|
|
; PROLOG-BLOCK: latch.1.1:
|
|
; PROLOG-BLOCK-NEXT: %i11.1.1 = add nsw i32 %i7.1.1, 1
|
|
; PROLOG-BLOCK-NEXT: %innercnd.1.1 = icmp slt i32 %i11.1.1, %trip.1
|
|
; PROLOG-BLOCK-NEXT: %iv.next.1.1 = add nuw nsw i64 %phi.1, 2
|
|
; PROLOG-BLOCK-NEXT: br i1 %innercnd.1.1, label %header.1, label %outerLatch.loopexit.unr-lcssa.1, !llvm.loop !14
|
|
; PROLOG-BLOCK: outerLatch.loopexit.unr-lcssa.1:
|
|
; PROLOG-BLOCK-NEXT: br label %outerLatch.loopexit.1
|
|
; PROLOG-BLOCK: outerLatch.loopexit.1:
|
|
; PROLOG-BLOCK-NEXT: br label %outerLatch.1
|
|
; PROLOG-BLOCK: outerLatch.1:
|
|
; PROLOG-BLOCK-NEXT: br label %outerloopHdr, !llvm.loop !15
|
|
;
|
|
bb:
|
|
br label %outerloopHdr
|
|
|
|
outerloopHdr: ; preds = %outerLatch, %bb
|
|
%trip = add i32 %n, -1
|
|
%outercnd = icmp slt i32 0, %trip
|
|
br i1 %outercnd, label %preheader, label %outerLatch
|
|
|
|
preheader: ; preds = %outerloopHdr
|
|
%i4 = zext i32 0 to i64
|
|
br label %header
|
|
|
|
header: ; preds = %latch, %preheader
|
|
%phi = phi i64 [ %i4, %preheader ], [ %iv.next, %latch ]
|
|
%i7 = trunc i64 %phi to i32
|
|
br i1 true, label %latch, label %innerexit
|
|
|
|
innerexit: ; preds = %header
|
|
%i9 = call ptr addrspace(1) @foo(i32 %trip)
|
|
ret ptr addrspace(1) %i9
|
|
|
|
latch: ; preds = %header
|
|
%i11 = add nsw i32 %i7, 1
|
|
%innercnd = icmp slt i32 %i11, %trip
|
|
%iv.next = add nuw nsw i64 %phi, 1
|
|
br i1 %innercnd, label %header, label %outerLatch
|
|
|
|
outerLatch: ; preds = %latch, %outerloopHdr
|
|
br label %outerloopHdr
|
|
}
|
|
|
|
declare void @bar()
|
|
|
|
; This is a case where we should be able to eliminate N-1 copies
|
|
; of the early exit test in the main loop when runtime unrolling
|
|
; by N.
|
|
define void @test10(i64 %trip, i64 %trip2) {
|
|
; EPILOG-LABEL: @test10(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early, label %loop_latch, label %exit1.loopexit
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.1, label %loop_latch.1, label %exit1.loopexit
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.2 = icmp ne i64 %iv_next.1, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.2, label %loop_latch.2, label %exit1.loopexit
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: %iv_next.2 = add nuw nsw i64 %iv, 3
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.3 = icmp ne i64 %iv_next.2, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.3, label %loop_latch.3, label %exit1.loopexit
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: %iv_next.3 = add nuw nsw i64 %iv, 4
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.4 = icmp ne i64 %iv_next.3, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.4, label %loop_latch.4, label %exit1.loopexit
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: %iv_next.4 = add nuw nsw i64 %iv, 5
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.5 = icmp ne i64 %iv_next.4, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.5, label %loop_latch.5, label %exit1.loopexit
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: %iv_next.5 = add nuw nsw i64 %iv, 6
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.6 = icmp ne i64 %iv_next.5, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.6, label %loop_latch.6, label %exit1.loopexit
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: %iv_next.6 = add nuw nsw i64 %iv, 7
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.7 = icmp ne i64 %iv_next.6, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.7, label %loop_latch.7, label %exit1.loopexit
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit2.unr-lcssa
|
|
; EPILOG: exit1.loopexit:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
; EPILOG: exit2.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit2.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.epil = icmp ne i64 %iv.epil, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.epil, label %loop_latch.epil, label %exit1.loopexit2
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit2.epilog-lcssa, !llvm.loop !14
|
|
; EPILOG: exit2.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit2
|
|
; EPILOG: exit2:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test10(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early, label %loop_latch, label %exit1.loopexit
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early.1, label %loop_latch.1, label %exit1.loopexit
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit2.unr-lcssa, !llvm.loop !16
|
|
; EPILOG-BLOCK: exit1.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
; EPILOG-BLOCK: exit2.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %iv.unr = phi i64 [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit2.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early.epil = icmp ne i64 %iv.epil.init, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early.epil, label %loop_latch.epil, label %exit1
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit2
|
|
; EPILOG-BLOCK: exit2:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test10(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.prol = icmp ne i64 %iv.prol, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.prol, label %loop_latch.prol, label %exit1.loopexit1
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !14
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit2, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early, label %loop_latch, label %exit1.loopexit
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: %iv_next = add i64 %iv, 1
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.1, label %loop_latch.1, label %exit1.loopexit
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.2 = icmp ne i64 %iv_next.1, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.2, label %loop_latch.2, label %exit1.loopexit
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: %iv_next.2 = add i64 %iv, 3
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.3 = icmp ne i64 %iv_next.2, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.3, label %loop_latch.3, label %exit1.loopexit
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: %iv_next.3 = add i64 %iv, 4
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.4 = icmp ne i64 %iv_next.3, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.4, label %loop_latch.4, label %exit1.loopexit
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: %iv_next.4 = add i64 %iv, 5
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.5 = icmp ne i64 %iv_next.4, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.5, label %loop_latch.5, label %exit1.loopexit
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: %iv_next.5 = add i64 %iv, 6
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.6 = icmp ne i64 %iv_next.5, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.6, label %loop_latch.6, label %exit1.loopexit
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: %iv_next.6 = add i64 %iv, 7
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.7 = icmp ne i64 %iv_next.6, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.7, label %loop_latch.7, label %exit1.loopexit
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit2.unr-lcssa
|
|
; PROLOG: exit1.loopexit:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
; PROLOG: exit2.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit2
|
|
; PROLOG: exit2:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test10(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early.prol = icmp ne i64 0, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early.prol, label %loop_latch.prol, label %exit1
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit2, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early, label %loop_latch, label %exit1.loopexit
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: %iv_next = add i64 %iv, 1
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early.1, label %loop_latch.1, label %exit1.loopexit
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit2.unr-lcssa, !llvm.loop !16
|
|
; PROLOG-BLOCK: exit1.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
; PROLOG-BLOCK: exit2.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit2
|
|
; PROLOG-BLOCK: exit2:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
call void @bar()
|
|
%cmp_early = icmp ne i64 %iv, %trip2
|
|
br i1 %cmp_early, label %loop_latch, label %exit1
|
|
|
|
loop_latch:
|
|
%iv_next = add i64 %iv, 1
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit2
|
|
|
|
exit1:
|
|
ret void
|
|
|
|
exit2:
|
|
ret void
|
|
}
|
|
|
|
; With a loop invariant, we can eliminate the last N-1
|
|
; copies of the exit test in the unrolled main loop body.
|
|
define void @test11(i64 %trip, i1 %cond) {
|
|
; EPILOG-LABEL: @test11(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch, label %exit1.loopexit
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.loopexit
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.2, label %exit1.loopexit
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.3, label %exit1.loopexit
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.4, label %exit1.loopexit
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.5, label %exit1.loopexit
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.6, label %exit1.loopexit
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.7, label %exit1.loopexit
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit2.unr-lcssa
|
|
; EPILOG: exit1.loopexit:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
; EPILOG: exit2.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit2.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.epil, label %exit1.loopexit2
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit2.epilog-lcssa, !llvm.loop !15
|
|
; EPILOG: exit2.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit2
|
|
; EPILOG: exit2:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test11(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %exit1.loopexit
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.loopexit
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit2.unr-lcssa, !llvm.loop !17
|
|
; EPILOG-BLOCK: exit1.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
; EPILOG-BLOCK: exit2.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit2
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.epil, label %exit1
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit2
|
|
; EPILOG-BLOCK: exit2:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test11(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.prol, label %exit1.loopexit1
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !15
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit2, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch, label %exit1.loopexit
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.loopexit
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.2, label %exit1.loopexit
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.3, label %exit1.loopexit
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.4, label %exit1.loopexit
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.5, label %exit1.loopexit
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.6, label %exit1.loopexit
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.7, label %exit1.loopexit
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit2.unr-lcssa
|
|
; PROLOG: exit1.loopexit:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
; PROLOG: exit2.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit2
|
|
; PROLOG: exit2:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test11(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.prol, label %exit1
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit2, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %exit1.loopexit
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.loopexit
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit2.unr-lcssa, !llvm.loop !17
|
|
; PROLOG-BLOCK: exit1.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
; PROLOG-BLOCK: exit2.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit2
|
|
; PROLOG-BLOCK: exit2:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
call void @bar()
|
|
br i1 %cond, label %loop_latch, label %exit1
|
|
|
|
loop_latch:
|
|
%iv_next = add i64 %iv, 1
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit2
|
|
|
|
exit1:
|
|
ret void
|
|
|
|
exit2:
|
|
ret void
|
|
}
|
|
|
|
; Combine a computeable and invariant test to make sure
|
|
; the interaction of both doesn't do anything weird
|
|
define void @test12(i64 %trip, i64 %trip2, i1 %cond) {
|
|
; EPILOG-LABEL: @test12(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.1:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.2 = icmp ne i64 %iv_next.1, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.2, label %loop_exiting_bb2.2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.2:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: %iv_next.2 = add nuw nsw i64 %iv, 3
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.3 = icmp ne i64 %iv_next.2, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.3, label %loop_exiting_bb2.3, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.3:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.3, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: %iv_next.3 = add nuw nsw i64 %iv, 4
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.4 = icmp ne i64 %iv_next.3, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.4, label %loop_exiting_bb2.4, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.4:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.4, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: %iv_next.4 = add nuw nsw i64 %iv, 5
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.5 = icmp ne i64 %iv_next.4, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.5, label %loop_exiting_bb2.5, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.5:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.5, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: %iv_next.5 = add nuw nsw i64 %iv, 6
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.6 = icmp ne i64 %iv_next.5, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.6, label %loop_exiting_bb2.6, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.6:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.6, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: %iv_next.6 = add nuw nsw i64 %iv, 7
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.7 = icmp ne i64 %iv_next.6, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.7, label %loop_exiting_bb2.7, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.7:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.7, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit1.unr-lcssa
|
|
; EPILOG: exit1.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit1
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit1.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.epil = icmp ne i64 %iv.epil, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.epil, label %loop_exiting_bb2.epil, label %exit1.epilog-lcssa.loopexit2
|
|
; EPILOG: loop_exiting_bb2.epil:
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_latch.epil, label %exit1.epilog-lcssa.loopexit2
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit1.epilog-lcssa.loopexit2, !llvm.loop !16
|
|
; EPILOG: exit1.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG: exit1.epilog-lcssa.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG: exit1.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test12(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2.1:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit1.unr-lcssa, !llvm.loop !18
|
|
; EPILOG-BLOCK: exit1.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %iv.unr = phi i64 [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit1
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit1.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early.epil = icmp ne i64 %iv.epil.init, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early.epil, label %loop_exiting_bb2.epil, label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: loop_exiting_bb2.epil:
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.epil, label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: exit1.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: exit1.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test12(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.prol = icmp ne i64 %iv.prol, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.prol, label %loop_exiting_bb2.prol, label %exit1.unr-lcssa.loopexit1
|
|
; PROLOG: loop_exiting_bb2.prol:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.prol, label %exit1.unr-lcssa.loopexit1
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !16
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit1, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: %iv_next = add i64 %iv, 1
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.1:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.2 = icmp ne i64 %iv_next.1, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.2, label %loop_exiting_bb2.2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.2:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: %iv_next.2 = add i64 %iv, 3
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.3 = icmp ne i64 %iv_next.2, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.3, label %loop_exiting_bb2.3, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.3:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.3, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: %iv_next.3 = add i64 %iv, 4
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.4 = icmp ne i64 %iv_next.3, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.4, label %loop_exiting_bb2.4, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.4:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.4, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: %iv_next.4 = add i64 %iv, 5
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.5 = icmp ne i64 %iv_next.4, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.5, label %loop_exiting_bb2.5, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.5:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.5, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: %iv_next.5 = add i64 %iv, 6
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.6 = icmp ne i64 %iv_next.5, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.6, label %loop_exiting_bb2.6, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.6:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.6, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: %iv_next.6 = add i64 %iv, 7
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.7 = icmp ne i64 %iv_next.6, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.7, label %loop_exiting_bb2.7, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.7:
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_latch.7, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: exit1.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG: exit1.unr-lcssa.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG: exit1.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test12(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early.prol = icmp ne i64 0, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early.prol, label %loop_exiting_bb2.prol, label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: loop_exiting_bb2.prol:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.prol, label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit1, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: %iv_next = add i64 %iv, 1
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2.1:
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_latch.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit1.unr-lcssa.loopexit, !llvm.loop !18
|
|
; PROLOG-BLOCK: exit1.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: exit1.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
call void @bar()
|
|
%cmp_early = icmp ne i64 %iv, %trip2
|
|
br i1 %cmp_early, label %loop_exiting_bb2, label %exit1
|
|
|
|
loop_exiting_bb2:
|
|
br i1 %cond, label %loop_latch, label %exit1
|
|
|
|
loop_latch:
|
|
%iv_next = add i64 %iv, 1
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit1
|
|
|
|
exit1:
|
|
ret void
|
|
}
|
|
|
|
declare i1 @unknown_cond()
|
|
|
|
; Mix of computable and uncompatable exits
|
|
define void @test13(i64 %trip, i64 %trip2) {
|
|
; EPILOG-LABEL: @test13(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2:
|
|
; EPILOG-NEXT: %unknown = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown, label %loop_latch, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.1:
|
|
; EPILOG-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: %iv_next.1 = add nuw nsw i64 %iv, 2
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.2 = icmp ne i64 %iv_next.1, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.2, label %loop_exiting_bb2.2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.2:
|
|
; EPILOG-NEXT: %unknown.2 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.2, label %loop_latch.2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: %iv_next.2 = add nuw nsw i64 %iv, 3
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.3 = icmp ne i64 %iv_next.2, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.3, label %loop_exiting_bb2.3, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.3:
|
|
; EPILOG-NEXT: %unknown.3 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.3, label %loop_latch.3, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: %iv_next.3 = add nuw nsw i64 %iv, 4
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.4 = icmp ne i64 %iv_next.3, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.4, label %loop_exiting_bb2.4, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.4:
|
|
; EPILOG-NEXT: %unknown.4 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.4, label %loop_latch.4, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: %iv_next.4 = add nuw nsw i64 %iv, 5
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.5 = icmp ne i64 %iv_next.4, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.5, label %loop_exiting_bb2.5, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.5:
|
|
; EPILOG-NEXT: %unknown.5 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.5, label %loop_latch.5, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: %iv_next.5 = add nuw nsw i64 %iv, 6
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.6 = icmp ne i64 %iv_next.5, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.6, label %loop_exiting_bb2.6, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.6:
|
|
; EPILOG-NEXT: %unknown.6 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.6, label %loop_latch.6, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: %iv_next.6 = add nuw nsw i64 %iv, 7
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.7 = icmp ne i64 %iv_next.6, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.7, label %loop_exiting_bb2.7, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.7:
|
|
; EPILOG-NEXT: %unknown.7 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.7, label %loop_latch.7, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit1.unr-lcssa
|
|
; EPILOG: exit1.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit1
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit1.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: %cmp_early.epil = icmp ne i64 %iv.epil, %trip2
|
|
; EPILOG-NEXT: br i1 %cmp_early.epil, label %loop_exiting_bb2.epil, label %exit1.epilog-lcssa.loopexit2
|
|
; EPILOG: loop_exiting_bb2.epil:
|
|
; EPILOG-NEXT: %unknown.epil = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.epil, label %loop_latch.epil, label %exit1.epilog-lcssa.loopexit2
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit1.epilog-lcssa.loopexit2, !llvm.loop !17
|
|
; EPILOG: exit1.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG: exit1.epilog-lcssa.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG: exit1.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test13(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2:
|
|
; EPILOG-BLOCK-NEXT: %unknown = call i1 @unknown_cond()
|
|
; EPILOG-BLOCK-NEXT: br i1 %unknown, label %loop_latch, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: %iv_next = add nuw nsw i64 %iv, 1
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2.1:
|
|
; EPILOG-BLOCK-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; EPILOG-BLOCK-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit1.unr-lcssa, !llvm.loop !19
|
|
; EPILOG-BLOCK: exit1.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %iv.unr = phi i64 [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit1
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit1.unr-lcssa ]
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: %cmp_early.epil = icmp ne i64 %iv.epil.init, %trip2
|
|
; EPILOG-BLOCK-NEXT: br i1 %cmp_early.epil, label %loop_exiting_bb2.epil, label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: loop_exiting_bb2.epil:
|
|
; EPILOG-BLOCK-NEXT: %unknown.epil = call i1 @unknown_cond()
|
|
; EPILOG-BLOCK-NEXT: br i1 %unknown.epil, label %loop_latch.epil, label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: exit1.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: exit1.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test13(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.prol = icmp ne i64 %iv.prol, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.prol, label %loop_exiting_bb2.prol, label %exit1.unr-lcssa.loopexit1
|
|
; PROLOG: loop_exiting_bb2.prol:
|
|
; PROLOG-NEXT: %unknown.prol = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.prol, label %loop_latch.prol, label %exit1.unr-lcssa.loopexit1
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !17
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit1, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2:
|
|
; PROLOG-NEXT: %unknown = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown, label %loop_latch, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: %iv_next = add i64 %iv, 1
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.1:
|
|
; PROLOG-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.2 = icmp ne i64 %iv_next.1, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.2, label %loop_exiting_bb2.2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.2:
|
|
; PROLOG-NEXT: %unknown.2 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.2, label %loop_latch.2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: %iv_next.2 = add i64 %iv, 3
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.3 = icmp ne i64 %iv_next.2, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.3, label %loop_exiting_bb2.3, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.3:
|
|
; PROLOG-NEXT: %unknown.3 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.3, label %loop_latch.3, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: %iv_next.3 = add i64 %iv, 4
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.4 = icmp ne i64 %iv_next.3, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.4, label %loop_exiting_bb2.4, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.4:
|
|
; PROLOG-NEXT: %unknown.4 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.4, label %loop_latch.4, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: %iv_next.4 = add i64 %iv, 5
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.5 = icmp ne i64 %iv_next.4, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.5, label %loop_exiting_bb2.5, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.5:
|
|
; PROLOG-NEXT: %unknown.5 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.5, label %loop_latch.5, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: %iv_next.5 = add i64 %iv, 6
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.6 = icmp ne i64 %iv_next.5, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.6, label %loop_exiting_bb2.6, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.6:
|
|
; PROLOG-NEXT: %unknown.6 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.6, label %loop_latch.6, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: %iv_next.6 = add i64 %iv, 7
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: %cmp_early.7 = icmp ne i64 %iv_next.6, %trip2
|
|
; PROLOG-NEXT: br i1 %cmp_early.7, label %loop_exiting_bb2.7, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.7:
|
|
; PROLOG-NEXT: %unknown.7 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.7, label %loop_latch.7, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: exit1.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG: exit1.unr-lcssa.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG: exit1.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test13(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early.prol = icmp ne i64 0, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early.prol, label %loop_exiting_bb2.prol, label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: loop_exiting_bb2.prol:
|
|
; PROLOG-BLOCK-NEXT: %unknown.prol = call i1 @unknown_cond()
|
|
; PROLOG-BLOCK-NEXT: br i1 %unknown.prol, label %loop_latch.prol, label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit1, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early = icmp ne i64 %iv, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early, label %loop_exiting_bb2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2:
|
|
; PROLOG-BLOCK-NEXT: %unknown = call i1 @unknown_cond()
|
|
; PROLOG-BLOCK-NEXT: br i1 %unknown, label %loop_latch, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: %iv_next = add i64 %iv, 1
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: %cmp_early.1 = icmp ne i64 %iv_next, %trip2
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp_early.1, label %loop_exiting_bb2.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2.1:
|
|
; PROLOG-BLOCK-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; PROLOG-BLOCK-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit1.unr-lcssa.loopexit, !llvm.loop !19
|
|
; PROLOG-BLOCK: exit1.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: exit1.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
call void @bar()
|
|
%cmp_early = icmp ne i64 %iv, %trip2
|
|
br i1 %cmp_early, label %loop_exiting_bb2, label %exit1
|
|
|
|
loop_exiting_bb2:
|
|
%unknown = call i1 @unknown_cond()
|
|
br i1 %unknown, label %loop_latch, label %exit1
|
|
|
|
loop_latch:
|
|
%iv_next = add i64 %iv, 1
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit1
|
|
|
|
exit1:
|
|
ret void
|
|
}
|
|
|
|
; Mix of invariant and (even in theory) uncomputable exits
|
|
define void @test14(i64 %trip, i1 %cond) {
|
|
; EPILOG-LABEL: @test14(
|
|
; EPILOG-NEXT: entry:
|
|
; EPILOG-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; EPILOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; EPILOG-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG: entry.new:
|
|
; EPILOG-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-NEXT: br label %loop_header
|
|
; EPILOG: loop_header:
|
|
; EPILOG-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2:
|
|
; EPILOG-NEXT: %unknown = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown, label %loop_latch, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.1:
|
|
; EPILOG-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.1:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.2:
|
|
; EPILOG-NEXT: %unknown.2 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.2, label %loop_latch.2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.2:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.3, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.3:
|
|
; EPILOG-NEXT: %unknown.3 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.3, label %loop_latch.3, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.3:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.4, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.4:
|
|
; EPILOG-NEXT: %unknown.4 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.4, label %loop_latch.4, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.4:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.5, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.5:
|
|
; EPILOG-NEXT: %unknown.5 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.5, label %loop_latch.5, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.5:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.6, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.6:
|
|
; EPILOG-NEXT: %unknown.6 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.6, label %loop_latch.6, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.6:
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.7, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_exiting_bb2.7:
|
|
; EPILOG-NEXT: %unknown.7 = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.7, label %loop_latch.7, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG: loop_latch.7:
|
|
; EPILOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; EPILOG-NEXT: %niter.next.7 = add i64 %niter, 8
|
|
; EPILOG-NEXT: %niter.ncmp.7 = icmp ne i64 %niter.next.7, %unroll_iter
|
|
; EPILOG-NEXT: br i1 %niter.ncmp.7, label %loop_header, label %exit1.unr-lcssa
|
|
; EPILOG: exit1.unr-lcssa:
|
|
; EPILOG-NEXT: %iv.unr = phi i64 [ %iv_next.7, %loop_latch.7 ]
|
|
; EPILOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit1
|
|
; EPILOG: loop_header.epil.preheader:
|
|
; EPILOG-NEXT: %iv.epil.init = phi i64 [ 0, %entry ], [ %iv.unr, %exit1.unr-lcssa ]
|
|
; EPILOG-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-NEXT: br label %loop_header.epil
|
|
; EPILOG: loop_header.epil:
|
|
; EPILOG-NEXT: %iv.epil = phi i64 [ %iv.epil.init, %loop_header.epil.preheader ], [ %iv_next.epil, %loop_latch.epil ]
|
|
; EPILOG-NEXT: %epil.iter = phi i64 [ 0, %loop_header.epil.preheader ], [ %epil.iter.next, %loop_latch.epil ]
|
|
; EPILOG-NEXT: call void @bar()
|
|
; EPILOG-NEXT: br i1 %cond, label %loop_exiting_bb2.epil, label %exit1.epilog-lcssa.loopexit2
|
|
; EPILOG: loop_exiting_bb2.epil:
|
|
; EPILOG-NEXT: %unknown.epil = call i1 @unknown_cond()
|
|
; EPILOG-NEXT: br i1 %unknown.epil, label %loop_latch.epil, label %exit1.epilog-lcssa.loopexit2
|
|
; EPILOG: loop_latch.epil:
|
|
; EPILOG-NEXT: %iv_next.epil = add i64 %iv.epil, 1
|
|
; EPILOG-NEXT: %cmp.epil = icmp ne i64 %iv_next.epil, %trip
|
|
; EPILOG-NEXT: %epil.iter.next = add i64 %epil.iter, 1
|
|
; EPILOG-NEXT: %epil.iter.cmp = icmp ne i64 %epil.iter.next, %xtraiter
|
|
; EPILOG-NEXT: br i1 %epil.iter.cmp, label %loop_header.epil, label %exit1.epilog-lcssa.loopexit2, !llvm.loop !18
|
|
; EPILOG: exit1.epilog-lcssa.loopexit:
|
|
; EPILOG-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG: exit1.epilog-lcssa.loopexit2:
|
|
; EPILOG-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG: exit1.epilog-lcssa:
|
|
; EPILOG-NEXT: br label %exit1
|
|
; EPILOG: exit1:
|
|
; EPILOG-NEXT: ret void
|
|
;
|
|
; EPILOG-BLOCK-LABEL: @test14(
|
|
; EPILOG-BLOCK-NEXT: entry:
|
|
; EPILOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; EPILOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; EPILOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; EPILOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; EPILOG-BLOCK-NEXT: br i1 %2, label %loop_header.epil.preheader, label %entry.new
|
|
; EPILOG-BLOCK: entry.new:
|
|
; EPILOG-BLOCK-NEXT: %unroll_iter = sub i64 %0, %xtraiter
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header
|
|
; EPILOG-BLOCK: loop_header:
|
|
; EPILOG-BLOCK-NEXT: %iv = phi i64 [ 0, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: %niter = phi i64 [ 0, %entry.new ], [ %niter.next.1, %loop_latch.1 ]
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_exiting_bb2, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2:
|
|
; EPILOG-BLOCK-NEXT: %unknown = call i1 @unknown_cond()
|
|
; EPILOG-BLOCK-NEXT: br i1 %unknown, label %loop_latch, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_latch:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_exiting_bb2.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_exiting_bb2.1:
|
|
; EPILOG-BLOCK-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; EPILOG-BLOCK-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.epilog-lcssa.loopexit
|
|
; EPILOG-BLOCK: loop_latch.1:
|
|
; EPILOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.next.1 = add i64 %niter, 2
|
|
; EPILOG-BLOCK-NEXT: %niter.ncmp.1 = icmp ne i64 %niter.next.1, %unroll_iter
|
|
; EPILOG-BLOCK-NEXT: br i1 %niter.ncmp.1, label %loop_header, label %exit1.unr-lcssa, !llvm.loop !20
|
|
; EPILOG-BLOCK: exit1.unr-lcssa:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.epil.preheader, label %exit1
|
|
; EPILOG-BLOCK: loop_header.epil.preheader:
|
|
; EPILOG-BLOCK-NEXT: %lcmp.mod1 = icmp ne i64 %xtraiter, 0
|
|
; EPILOG-BLOCK-NEXT: call void @llvm.assume(i1 %lcmp.mod1)
|
|
; EPILOG-BLOCK-NEXT: br label %loop_header.epil
|
|
; EPILOG-BLOCK: loop_header.epil:
|
|
; EPILOG-BLOCK-NEXT: call void @bar()
|
|
; EPILOG-BLOCK-NEXT: br i1 %cond, label %loop_exiting_bb2.epil, label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: loop_exiting_bb2.epil:
|
|
; EPILOG-BLOCK-NEXT: %unknown.epil = call i1 @unknown_cond()
|
|
; EPILOG-BLOCK-NEXT: br i1 %unknown.epil, label %loop_latch.epil, label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: loop_latch.epil:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: exit1.epilog-lcssa.loopexit:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1.epilog-lcssa
|
|
; EPILOG-BLOCK: exit1.epilog-lcssa:
|
|
; EPILOG-BLOCK-NEXT: br label %exit1
|
|
; EPILOG-BLOCK: exit1:
|
|
; EPILOG-BLOCK-NEXT: ret void
|
|
;
|
|
; PROLOG-LABEL: @test14(
|
|
; PROLOG-NEXT: entry:
|
|
; PROLOG-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-NEXT: %xtraiter = and i64 %0, 7
|
|
; PROLOG-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.preheader:
|
|
; PROLOG-NEXT: br label %loop_header.prol
|
|
; PROLOG: loop_header.prol:
|
|
; PROLOG-NEXT: %iv.prol = phi i64 [ 0, %loop_header.prol.preheader ], [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: %prol.iter = phi i64 [ 0, %loop_header.prol.preheader ], [ %prol.iter.next, %loop_latch.prol ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.prol, label %exit1.unr-lcssa.loopexit1
|
|
; PROLOG: loop_exiting_bb2.prol:
|
|
; PROLOG-NEXT: %unknown.prol = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.prol, label %loop_latch.prol, label %exit1.unr-lcssa.loopexit1
|
|
; PROLOG: loop_latch.prol:
|
|
; PROLOG-NEXT: %iv_next.prol = add i64 %iv.prol, 1
|
|
; PROLOG-NEXT: %cmp.prol = icmp ne i64 %iv_next.prol, %trip
|
|
; PROLOG-NEXT: %prol.iter.next = add i64 %prol.iter, 1
|
|
; PROLOG-NEXT: %prol.iter.cmp = icmp ne i64 %prol.iter.next, %xtraiter
|
|
; PROLOG-NEXT: br i1 %prol.iter.cmp, label %loop_header.prol, label %loop_header.prol.loopexit.unr-lcssa, !llvm.loop !18
|
|
; PROLOG: loop_header.prol.loopexit.unr-lcssa:
|
|
; PROLOG-NEXT: %iv.unr.ph = phi i64 [ %iv_next.prol, %loop_latch.prol ]
|
|
; PROLOG-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG: loop_header.prol.loopexit:
|
|
; PROLOG-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ %iv.unr.ph, %loop_header.prol.loopexit.unr-lcssa ]
|
|
; PROLOG-NEXT: %2 = icmp ult i64 %1, 7
|
|
; PROLOG-NEXT: br i1 %2, label %exit1, label %entry.new
|
|
; PROLOG: entry.new:
|
|
; PROLOG-NEXT: br label %loop_header
|
|
; PROLOG: loop_header:
|
|
; PROLOG-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.7, %loop_latch.7 ]
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2:
|
|
; PROLOG-NEXT: %unknown = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown, label %loop_latch, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.1:
|
|
; PROLOG-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.1:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.2:
|
|
; PROLOG-NEXT: %unknown.2 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.2, label %loop_latch.2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.2:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.3, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.3:
|
|
; PROLOG-NEXT: %unknown.3 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.3, label %loop_latch.3, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.3:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.4, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.4:
|
|
; PROLOG-NEXT: %unknown.4 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.4, label %loop_latch.4, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.4:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.5, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.5:
|
|
; PROLOG-NEXT: %unknown.5 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.5, label %loop_latch.5, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.5:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.6, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.6:
|
|
; PROLOG-NEXT: %unknown.6 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.6, label %loop_latch.6, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.6:
|
|
; PROLOG-NEXT: call void @bar()
|
|
; PROLOG-NEXT: br i1 %cond, label %loop_exiting_bb2.7, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_exiting_bb2.7:
|
|
; PROLOG-NEXT: %unknown.7 = call i1 @unknown_cond()
|
|
; PROLOG-NEXT: br i1 %unknown.7, label %loop_latch.7, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: loop_latch.7:
|
|
; PROLOG-NEXT: %iv_next.7 = add i64 %iv, 8
|
|
; PROLOG-NEXT: %cmp.7 = icmp ne i64 %iv_next.7, %trip
|
|
; PROLOG-NEXT: br i1 %cmp.7, label %loop_header, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG: exit1.unr-lcssa.loopexit:
|
|
; PROLOG-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG: exit1.unr-lcssa.loopexit1:
|
|
; PROLOG-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG: exit1.unr-lcssa:
|
|
; PROLOG-NEXT: br label %exit1
|
|
; PROLOG: exit1:
|
|
; PROLOG-NEXT: ret void
|
|
;
|
|
; PROLOG-BLOCK-LABEL: @test14(
|
|
; PROLOG-BLOCK-NEXT: entry:
|
|
; PROLOG-BLOCK-NEXT: %0 = freeze i64 %trip
|
|
; PROLOG-BLOCK-NEXT: %1 = add i64 %0, -1
|
|
; PROLOG-BLOCK-NEXT: %xtraiter = and i64 %0, 1
|
|
; PROLOG-BLOCK-NEXT: %lcmp.mod = icmp ne i64 %xtraiter, 0
|
|
; PROLOG-BLOCK-NEXT: br i1 %lcmp.mod, label %loop_header.prol.preheader, label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.preheader:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol
|
|
; PROLOG-BLOCK: loop_header.prol:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_exiting_bb2.prol, label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: loop_exiting_bb2.prol:
|
|
; PROLOG-BLOCK-NEXT: %unknown.prol = call i1 @unknown_cond()
|
|
; PROLOG-BLOCK-NEXT: br i1 %unknown.prol, label %loop_latch.prol, label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: loop_latch.prol:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header.prol.loopexit
|
|
; PROLOG-BLOCK: loop_header.prol.loopexit:
|
|
; PROLOG-BLOCK-NEXT: %iv.unr = phi i64 [ 0, %entry ], [ 1, %loop_latch.prol ]
|
|
; PROLOG-BLOCK-NEXT: %2 = icmp ult i64 %1, 1
|
|
; PROLOG-BLOCK-NEXT: br i1 %2, label %exit1, label %entry.new
|
|
; PROLOG-BLOCK: entry.new:
|
|
; PROLOG-BLOCK-NEXT: br label %loop_header
|
|
; PROLOG-BLOCK: loop_header:
|
|
; PROLOG-BLOCK-NEXT: %iv = phi i64 [ %iv.unr, %entry.new ], [ %iv_next.1, %loop_latch.1 ]
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_exiting_bb2, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2:
|
|
; PROLOG-BLOCK-NEXT: %unknown = call i1 @unknown_cond()
|
|
; PROLOG-BLOCK-NEXT: br i1 %unknown, label %loop_latch, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_latch:
|
|
; PROLOG-BLOCK-NEXT: call void @bar()
|
|
; PROLOG-BLOCK-NEXT: br i1 %cond, label %loop_exiting_bb2.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_exiting_bb2.1:
|
|
; PROLOG-BLOCK-NEXT: %unknown.1 = call i1 @unknown_cond()
|
|
; PROLOG-BLOCK-NEXT: br i1 %unknown.1, label %loop_latch.1, label %exit1.unr-lcssa.loopexit
|
|
; PROLOG-BLOCK: loop_latch.1:
|
|
; PROLOG-BLOCK-NEXT: %iv_next.1 = add i64 %iv, 2
|
|
; PROLOG-BLOCK-NEXT: %cmp.1 = icmp ne i64 %iv_next.1, %trip
|
|
; PROLOG-BLOCK-NEXT: br i1 %cmp.1, label %loop_header, label %exit1.unr-lcssa.loopexit, !llvm.loop !20
|
|
; PROLOG-BLOCK: exit1.unr-lcssa.loopexit:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1.unr-lcssa
|
|
; PROLOG-BLOCK: exit1.unr-lcssa:
|
|
; PROLOG-BLOCK-NEXT: br label %exit1
|
|
; PROLOG-BLOCK: exit1:
|
|
; PROLOG-BLOCK-NEXT: ret void
|
|
;
|
|
entry:
|
|
br label %loop_header
|
|
|
|
loop_header:
|
|
%iv = phi i64 [ 0, %entry ], [ %iv_next, %loop_latch ]
|
|
call void @bar()
|
|
br i1 %cond, label %loop_exiting_bb2, label %exit1
|
|
|
|
loop_exiting_bb2:
|
|
%unknown = call i1 @unknown_cond()
|
|
br i1 %unknown, label %loop_latch, label %exit1
|
|
|
|
loop_latch:
|
|
%iv_next = add i64 %iv, 1
|
|
%cmp = icmp ne i64 %iv_next, %trip
|
|
br i1 %cmp, label %loop_header, label %exit1
|
|
|
|
exit1:
|
|
ret void
|
|
}
|