
Support for translating the operations introduced in #144785 to LLVM-IR. In order to keep the lowering simple, `OpenMPIRBuider::unrollLoopHeuristic` is applied when encountering the `omp.unroll_heuristic` op. As a result, the operation that unrolling is applied to (`omp.canonical_loop`) must have been emitted before even though logically there is no such requirement. Eventually, all transformations on a loop must be applied directly after emitting `omp.canonical_loop`, i.e. future transformations must be looked-up when encountering `omp.canonical_loop` itself. This is because many OpenMPIRBuilder methods (e.g. `createParallel`) expect all the region code to be emitted withing a callback. In the case of `createParallel`, the region code is getting outlined into a new function. Therefore, making the operation order a formal requirement would not make the implementation any easier.
176 lines
6.3 KiB
MLIR
176 lines
6.3 KiB
MLIR
// Test lowering of standalone omp.canonical_loop
|
|
// RUN: mlir-translate -mlir-to-llvmir %s | FileCheck %s
|
|
|
|
// CHECK-LABEL: define void @anon_loop(
|
|
// CHECK-SAME: ptr %[[ptr:.+]],
|
|
// CHECK-SAME: i32 %[[tc:.+]]) {
|
|
// CHECK-NEXT: br label %omp_omp.loop.preheader
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.preheader:
|
|
// CHECK-NEXT: br label %omp_omp.loop.header
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.header:
|
|
// CHECK-NEXT: %omp_omp.loop.iv = phi i32 [ 0, %omp_omp.loop.preheader ], [ %omp_omp.loop.next, %omp_omp.loop.inc ]
|
|
// CHECK-NEXT: br label %omp_omp.loop.cond
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.cond:
|
|
// CHECK-NEXT: %omp_omp.loop.cmp = icmp ult i32 %omp_omp.loop.iv, %[[tc]]
|
|
// CHECK-NEXT: br i1 %omp_omp.loop.cmp, label %omp_omp.loop.body, label %omp_omp.loop.exit
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.body:
|
|
// CHECK-NEXT: br label %omp.loop.region
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.loop.region:
|
|
// CHECK-NEXT: store float 4.200000e+01, ptr %[[ptr]], align 4
|
|
// CHECK-NEXT: br label %omp.region.cont
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.region.cont:
|
|
// CHECK-NEXT: br label %omp_omp.loop.inc
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.inc:
|
|
// CHECK-NEXT: %omp_omp.loop.next = add nuw i32 %omp_omp.loop.iv, 1
|
|
// CHECK-NEXT: br label %omp_omp.loop.header
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.exit:
|
|
// CHECK-NEXT: br label %omp_omp.loop.after
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.after:
|
|
// CHECK-NEXT: ret void
|
|
// CHECK-NEXT: }
|
|
llvm.func @anon_loop(%ptr: !llvm.ptr, %tc : i32) -> () {
|
|
omp.canonical_loop %iv : i32 in range(%tc) {
|
|
%val = llvm.mlir.constant(42.0 : f32) : f32
|
|
llvm.store %val, %ptr : f32, !llvm.ptr
|
|
omp.terminator
|
|
}
|
|
llvm.return
|
|
}
|
|
|
|
|
|
|
|
// CHECK-LABEL: define void @trivial_loop(
|
|
// CHECK-SAME: ptr %[[ptr:.+]],
|
|
// CHECK-SAME: i32 %[[tc:.+]]) {
|
|
// CHECK-NEXT: br label %omp_omp.loop.preheader
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.preheader:
|
|
// CHECK-NEXT: br label %omp_omp.loop.header
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.header:
|
|
// CHECK-NEXT: %omp_omp.loop.iv = phi i32 [ 0, %omp_omp.loop.preheader ], [ %omp_omp.loop.next, %omp_omp.loop.inc ]
|
|
// CHECK-NEXT: br label %omp_omp.loop.cond
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.cond:
|
|
// CHECK-NEXT: %omp_omp.loop.cmp = icmp ult i32 %omp_omp.loop.iv, %[[tc]]
|
|
// CHECK-NEXT: br i1 %omp_omp.loop.cmp, label %omp_omp.loop.body, label %omp_omp.loop.exit
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.body:
|
|
// CHECK-NEXT: br label %omp.loop.region
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.loop.region:
|
|
// CHECK-NEXT: store float 4.200000e+01, ptr %[[ptr]], align 4
|
|
// CHECK-NEXT: br label %omp.region.cont
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.region.cont:
|
|
// CHECK-NEXT: br label %omp_omp.loop.inc
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.inc:
|
|
// CHECK-NEXT: %omp_omp.loop.next = add nuw i32 %omp_omp.loop.iv, 1
|
|
// CHECK-NEXT: br label %omp_omp.loop.header
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.exit:
|
|
// CHECK-NEXT: br label %omp_omp.loop.after
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.after:
|
|
// CHECK-NEXT: ret void
|
|
// CHECK-NEXT: }
|
|
llvm.func @trivial_loop(%ptr: !llvm.ptr, %tc : i32) -> () {
|
|
%cli = omp.new_cli
|
|
omp.canonical_loop(%cli) %iv : i32 in range(%tc) {
|
|
%val = llvm.mlir.constant(42.0 : f32) : f32
|
|
llvm.store %val, %ptr : f32, !llvm.ptr
|
|
omp.terminator
|
|
}
|
|
llvm.return
|
|
}
|
|
|
|
|
|
// CHECK-LABEL: define void @nested_loop(
|
|
// CHECK-SAME: ptr %[[ptr:.+]], i32 %[[outer_tc:.+]], i32 %[[inner_tc:.+]]) {
|
|
// CHECK-NEXT: br label %omp_omp.loop.preheader
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.preheader:
|
|
// CHECK-NEXT: br label %omp_omp.loop.header
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.header:
|
|
// CHECK-NEXT: %omp_omp.loop.iv = phi i32 [ 0, %omp_omp.loop.preheader ], [ %omp_omp.loop.next, %omp_omp.loop.inc ]
|
|
// CHECK-NEXT: br label %omp_omp.loop.cond
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.cond:
|
|
// CHECK-NEXT: %omp_omp.loop.cmp = icmp ult i32 %omp_omp.loop.iv, %[[outer_tc]]
|
|
// CHECK-NEXT: br i1 %omp_omp.loop.cmp, label %omp_omp.loop.body, label %omp_omp.loop.exit
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.body:
|
|
// CHECK-NEXT: br label %omp.loop.region
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.loop.region:
|
|
// CHECK-NEXT: br label %omp_omp.loop.preheader1
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.preheader1:
|
|
// CHECK-NEXT: br label %omp_omp.loop.header2
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.header2:
|
|
// CHECK-NEXT: %omp_omp.loop.iv8 = phi i32 [ 0, %omp_omp.loop.preheader1 ], [ %omp_omp.loop.next10, %omp_omp.loop.inc5 ]
|
|
// CHECK-NEXT: br label %omp_omp.loop.cond3
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.cond3:
|
|
// CHECK-NEXT: %omp_omp.loop.cmp9 = icmp ult i32 %omp_omp.loop.iv8, %[[inner_tc]]
|
|
// CHECK-NEXT: br i1 %omp_omp.loop.cmp9, label %omp_omp.loop.body4, label %omp_omp.loop.exit6
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.body4:
|
|
// CHECK-NEXT: br label %omp.loop.region12
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.loop.region12:
|
|
// CHECK-NEXT: store float 4.200000e+01, ptr %[[ptr]], align 4
|
|
// CHECK-NEXT: br label %omp.region.cont11
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.region.cont11:
|
|
// CHECK-NEXT: br label %omp_omp.loop.inc5
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.inc5:
|
|
// CHECK-NEXT: %omp_omp.loop.next10 = add nuw i32 %omp_omp.loop.iv8, 1
|
|
// CHECK-NEXT: br label %omp_omp.loop.header2
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.exit6:
|
|
// CHECK-NEXT: br label %omp_omp.loop.after7
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.after7:
|
|
// CHECK-NEXT: br label %omp.region.cont
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp.region.cont:
|
|
// CHECK-NEXT: br label %omp_omp.loop.inc
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.inc:
|
|
// CHECK-NEXT: %omp_omp.loop.next = add nuw i32 %omp_omp.loop.iv, 1
|
|
// CHECK-NEXT: br label %omp_omp.loop.header
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.exit:
|
|
// CHECK-NEXT: br label %omp_omp.loop.after
|
|
// CHECK-EMPTY:
|
|
// CHECK-NEXT: omp_omp.loop.after:
|
|
// CHECK-NEXT: ret void
|
|
// CHECK-NEXT: }
|
|
llvm.func @nested_loop(%ptr: !llvm.ptr, %outer_tc : i32, %inner_tc : i32) -> () {
|
|
%outer_cli = omp.new_cli
|
|
%inner_cli = omp.new_cli
|
|
omp.canonical_loop(%outer_cli) %outer_iv : i32 in range(%outer_tc) {
|
|
omp.canonical_loop(%inner_cli) %inner_iv : i32 in range(%inner_tc) {
|
|
%val = llvm.mlir.constant(42.0 : f32) : f32
|
|
llvm.store %val, %ptr : f32, !llvm.ptr
|
|
omp.terminator
|
|
}
|
|
omp.terminator
|
|
}
|
|
llvm.return
|
|
}
|