The semantics of the ops that implement the `OffsetSizeAndStrideOpInterface` are that if the number of offsets, sizes or strides is less than the rank of the source, then default values are filled in along the trailing dimensions (0 for offsets, the source dimension for sizes, and 1 for strides). This is confusing, especially with rank-reducing semantics. The immediate issue here is that the methods of `OffsetSizeAndStrideOpInterface` assume that the number of values is the same as the source rank. This causes out-of-bounds errors. So simplify the specification of `OffsetSizeAndStrideOpInterface` to make it invalid to specify a number of offsets/sizes/strides that is not equal to the source rank. Differential Revision: https://reviews.llvm.org/D115677
139 lines
8.7 KiB
MLIR
139 lines
8.7 KiB
MLIR
// RUN: mlir-opt %s | mlir-opt | FileCheck %s
|
|
// RUN: mlir-opt %s --mlir-print-op-generic | mlir-opt | FileCheck %s
|
|
|
|
// CHECK-DAG: #[[$BASE_MAP0:map[0-9]+]] = affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2)>
|
|
// CHECK-DAG: #[[$BASE_MAP3:map[0-9]+]] = affine_map<(d0, d1, d2)[s0, s1, s2, s3] -> (d0 * s1 + s0 + d1 * s2 + d2 * s3)>
|
|
|
|
// CHECK-DAG: #[[$BASE_MAP1:map[0-9]+]] = affine_map<(d0)[s0] -> (d0 + s0)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP1:map[0-9]+]] = affine_map<(d0)[s0, s1] -> (d0 * s1 + s0)>
|
|
|
|
// CHECK-DAG: #[[$BASE_MAP2:map[0-9]+]] = affine_map<(d0, d1) -> (d0 * 22 + d1)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP2:map[0-9]+]] = affine_map<(d0, d1)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP3:map[0-9]+]] = affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2 + 8)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP4:map[0-9]+]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP5:map[0-9]+]] = affine_map<(d0, d1)[s0] -> (d0 * 8 + s0 + d1 * 2)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP6:map[0-9]+]] = affine_map<(d0, d1, d2, d3, d4) -> (d0 * 36 + d1 * 36 + d2 * 4 + d3 * 4 + d4)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP7:map[0-9]+]] = affine_map<(d0, d1, d2, d3, d4, d5)[s0, s1, s2, s3, s4, s5, s6] -> (d0 * s1 + s0 + d1 * s2 + d2 * s3 + d3 * s4 + d4 * s5 + d5 * s6)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP8:map[0-9]+]] = affine_map<(d0, d1, d2, d3)[s0, s1, s2, s3, s4] -> (d0 * s1 + s0 + d1 * s2 + d2 * s3 + d3 * s4)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP9:map[0-9]+]] = affine_map<(d0, d1) -> (d0 * 3 + d1 + 6)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP10:map[0-9]+]] = affine_map<(d0) -> (d0 + 3)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP11:map[0-9]+]] = affine_map<() -> (4)>
|
|
// CHECK-DAG: #[[$SUBVIEW_MAP12:map[0-9]+]] = affine_map<()[s0] -> (s0)>
|
|
|
|
// CHECK-LABEL: func @memref_subview(%arg0
|
|
func @memref_subview(%arg0 : index, %arg1 : index, %arg2 : index) {
|
|
%c0 = arith.constant 0 : index
|
|
%c1 = arith.constant 1 : index
|
|
|
|
%0 = memref.alloc() : memref<8x16x4xf32, affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2)>>
|
|
// CHECK: subview %0[%c0, %c0, %c0] [%arg0, %arg1, %arg2] [%c1, %c1, %c1] :
|
|
// CHECK-SAME: memref<8x16x4xf32, #[[$BASE_MAP0]]>
|
|
// CHECK-SAME: to memref<?x?x?xf32, #[[$BASE_MAP3]]>
|
|
%1 = memref.subview %0[%c0, %c0, %c0][%arg0, %arg1, %arg2][%c1, %c1, %c1]
|
|
: memref<8x16x4xf32, offset:0, strides: [64, 4, 1]> to
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, ?]>
|
|
|
|
%2 = memref.alloc()[%arg2] : memref<64xf32, affine_map<(d0)[s0] -> (d0 + s0)>>
|
|
// CHECK: memref.subview %2[%c1] [%arg0] [%c1] :
|
|
// CHECK-SAME: memref<64xf32, #[[$BASE_MAP1]]>
|
|
// CHECK-SAME: to memref<?xf32, #[[$SUBVIEW_MAP1]]>
|
|
%3 = memref.subview %2[%c1][%arg0][%c1]
|
|
: memref<64xf32, affine_map<(d0)[s0] -> (d0 + s0)>> to
|
|
memref<?xf32, affine_map<(d0)[s0, s1] -> (d0 * s1 + s0)>>
|
|
|
|
%4 = memref.alloc() : memref<64x22xf32, affine_map<(d0, d1) -> (d0 * 22 + d1)>>
|
|
// CHECK: memref.subview %4[%c0, %c1] [%arg0, %arg1] [%c1, %c0] :
|
|
// CHECK-SAME: memref<64x22xf32, #[[$BASE_MAP2]]>
|
|
// CHECK-SAME: to memref<?x?xf32, #[[$SUBVIEW_MAP2]]>
|
|
%5 = memref.subview %4[%c0, %c1][%arg0, %arg1][%c1, %c0]
|
|
: memref<64x22xf32, offset:0, strides: [22, 1]> to
|
|
memref<?x?xf32, offset:?, strides: [?, ?]>
|
|
|
|
// CHECK: memref.subview %0[0, 2, 0] [4, 4, 4] [1, 1, 1] :
|
|
// CHECK-SAME: memref<8x16x4xf32, #[[$BASE_MAP0]]>
|
|
// CHECK-SAME: to memref<4x4x4xf32, #[[$SUBVIEW_MAP3]]>
|
|
%6 = memref.subview %0[0, 2, 0][4, 4, 4][1, 1, 1]
|
|
: memref<8x16x4xf32, offset:0, strides: [64, 4, 1]> to
|
|
memref<4x4x4xf32, offset:8, strides: [64, 4, 1]>
|
|
|
|
%7 = memref.alloc(%arg1, %arg2) : memref<?x?xf32>
|
|
// CHECK: memref.subview {{%.*}}[0, 0] [4, 4] [1, 1] :
|
|
// CHECK-SAME: memref<?x?xf32>
|
|
// CHECK-SAME: to memref<4x4xf32, #[[$SUBVIEW_MAP4]]>
|
|
%8 = memref.subview %7[0, 0][4, 4][1, 1]
|
|
: memref<?x?xf32> to memref<4x4xf32, offset: ?, strides:[?, 1]>
|
|
|
|
%9 = memref.alloc() : memref<16x4xf32>
|
|
// CHECK: memref.subview {{%.*}}[{{%.*}}, {{%.*}}] [4, 4] [{{%.*}}, {{%.*}}] :
|
|
// CHECK-SAME: memref<16x4xf32>
|
|
// CHECK-SAME: to memref<4x4xf32, #[[$SUBVIEW_MAP2]]
|
|
%10 = memref.subview %9[%arg1, %arg1][4, 4][%arg2, %arg2]
|
|
: memref<16x4xf32> to memref<4x4xf32, offset: ?, strides:[?, ?]>
|
|
|
|
// CHECK: memref.subview {{%.*}}[{{%.*}}, {{%.*}}] [4, 4] [2, 2] :
|
|
// CHECK-SAME: memref<16x4xf32>
|
|
// CHECK-SAME: to memref<4x4xf32, #[[$SUBVIEW_MAP5]]
|
|
%11 = memref.subview %9[%arg1, %arg2][4, 4][2, 2]
|
|
: memref<16x4xf32> to memref<4x4xf32, offset: ?, strides:[8, 2]>
|
|
|
|
%12 = memref.alloc() : memref<1x9x1x4x1xf32, affine_map<(d0, d1, d2, d3, d4) -> (36 * d0 + 36 * d1 + 4 * d2 + 4 * d3 + d4)>>
|
|
// CHECK: memref.subview %12[%arg1, %arg1, %arg1, %arg1, %arg1]
|
|
// CHECK-SAME: [1, 9, 1, 4, 1] [%arg2, %arg2, %arg2, %arg2, %arg2] :
|
|
// CHECK-SAME: memref<1x9x1x4x1xf32, #[[$SUBVIEW_MAP6]]> to memref<9x4xf32, #[[$SUBVIEW_MAP2]]>
|
|
%13 = memref.subview %12[%arg1, %arg1, %arg1, %arg1, %arg1][1, 9, 1, 4, 1][%arg2, %arg2, %arg2, %arg2, %arg2] : memref<1x9x1x4x1xf32, offset: 0, strides: [36, 36, 4, 4, 1]> to memref<9x4xf32, offset: ?, strides: [?, ?]>
|
|
// CHECK: memref.subview %12[%arg1, %arg1, %arg1, %arg1, %arg1]
|
|
// CHECK-SAME: [1, 9, 1, 4, 1] [%arg2, %arg2, %arg2, %arg2, %arg2] :
|
|
// CHECK-SAME: memref<1x9x1x4x1xf32, #[[$SUBVIEW_MAP6]]> to memref<1x9x4xf32, #[[$BASE_MAP3]]>
|
|
%14 = memref.subview %12[%arg1, %arg1, %arg1, %arg1, %arg1][1, 9, 1, 4, 1][%arg2, %arg2, %arg2, %arg2, %arg2] : memref<1x9x1x4x1xf32, offset: 0, strides: [36, 36, 4, 4, 1]> to memref<1x9x4xf32, offset: ?, strides: [?, ?, ?]>
|
|
|
|
%15 = memref.alloc(%arg1, %arg2)[%c0, %c1, %arg1, %arg0, %arg0, %arg2, %arg2] : memref<1x?x5x1x?x1xf32, affine_map<(d0, d1, d2, d3, d4, d5)[s0, s1, s2, s3, s4, s5, s6] -> (s0 + s1 * d0 + s2 * d1 + s3 * d2 + s4 * d3 + s5 * d4 + s6 * d5)>>
|
|
// CHECK: memref.subview %15[0, 0, 0, 0, 0, 0] [1, %arg1, 5, 1, %arg2, 1] [1, 1, 1, 1, 1, 1] :
|
|
// CHECK-SAME: memref<1x?x5x1x?x1xf32, #[[$SUBVIEW_MAP7]]> to memref<?x5x?xf32, #[[$BASE_MAP3]]>
|
|
%16 = memref.subview %15[0, 0, 0, 0, 0, 0][1, %arg1, 5, 1, %arg2, 1][1, 1, 1, 1, 1, 1] : memref<1x?x5x1x?x1xf32, offset: ?, strides: [?, ?, ?, ?, ?, ?]> to memref<?x5x?xf32, offset: ?, strides: [?, ?, ?]>
|
|
// CHECK: memref.subview %15[%arg1, %arg1, %arg1, %arg1, %arg1, %arg1] [1, %arg1, 5, 1, %arg2, 1] [1, 1, 1, 1, 1, 1] :
|
|
// CHECK-SAME: memref<1x?x5x1x?x1xf32, #[[$SUBVIEW_MAP7]]> to memref<?x5x?x1xf32, #[[$SUBVIEW_MAP8]]>
|
|
%17 = memref.subview %15[%arg1, %arg1, %arg1, %arg1, %arg1, %arg1][1, %arg1, 5, 1, %arg2, 1][1, 1, 1, 1, 1, 1] : memref<1x?x5x1x?x1xf32, offset: ?, strides: [?, ?, ?, ?, ?, ?]> to memref<?x5x?x1xf32, offset: ?, strides: [?, ?, ?, ?]>
|
|
|
|
%18 = memref.alloc() : memref<1x8xf32>
|
|
// CHECK: memref.subview %18[0, 0] [1, 8] [1, 1] : memref<1x8xf32> to memref<8xf32>
|
|
%19 = memref.subview %18[0, 0][1, 8][1, 1] : memref<1x8xf32> to memref<8xf32>
|
|
|
|
%20 = memref.alloc() : memref<8x16x4xf32>
|
|
// CHECK: memref.subview %20[0, 0, 0] [1, 16, 4] [1, 1, 1] : memref<8x16x4xf32> to memref<16x4xf32>
|
|
%21 = memref.subview %20[0, 0, 0][1, 16, 4][1, 1, 1] : memref<8x16x4xf32> to memref<16x4xf32>
|
|
|
|
%22 = memref.subview %20[3, 4, 2][1, 6, 3][1, 1, 1] : memref<8x16x4xf32> to memref<6x3xf32, offset: 210, strides: [4, 1]>
|
|
|
|
%23 = memref.alloc() : memref<f32>
|
|
%78 = memref.subview %23[] [] [] : memref<f32> to memref<f32>
|
|
|
|
/// Subview with offsets, sizes and strides given for every source dimension.
|
|
%24 = memref.alloc() : memref<5x3xf32>
|
|
// CHECK: memref.subview %{{.*}}[2, 0] [3, 3] [1, 1] : memref<5x3xf32> to memref<3x3xf32, #[[$SUBVIEW_MAP9]]>
|
|
%25 = memref.subview %24[2, 0][3, 3][1, 1]: memref<5x3xf32> to memref<3x3xf32, offset: 6, strides: [3, 1]>
|
|
|
|
/// Rank-reducing subview with offsets, sizes and strides given for every source dimension.
|
|
// CHECK: memref.subview %{{.*}}[1, 0] [1, 3] [1, 1] : memref<5x3xf32> to memref<3xf32, #[[$SUBVIEW_MAP10]]>
|
|
%26 = memref.subview %24[1, 0][1, 3][1, 1]: memref<5x3xf32> to memref<3xf32, offset: 3, strides: [1]>
|
|
|
|
// Corner-case of 0-D rank-reducing subview with an offset.
|
|
// CHECK: memref.subview %{{.*}}[1, 1] [1, 1] [1, 1] : memref<5x3xf32> to memref<f32, #[[$SUBVIEW_MAP11]]>
|
|
%27 = memref.subview %24[1, 1] [1, 1] [1, 1] : memref<5x3xf32> to memref<f32, affine_map<() -> (4)>>
|
|
|
|
// CHECK: memref.subview %{{.*}}[%{{.*}}, 1] [1, 1] [1, 1] : memref<5x3xf32> to memref<f32, #[[$SUBVIEW_MAP12]]>
|
|
%28 = memref.subview %24[%arg0, 1] [1, 1] [1, 1] : memref<5x3xf32> to memref<f32, affine_map<()[s0] -> (s0)>>
|
|
|
|
// CHECK: memref.subview %{{.*}}[0, %{{.*}}] [%{{.*}}, 1] [1, 1] : memref<?x?xf32> to memref<?xf32, #[[$SUBVIEW_MAP1]]>
|
|
%a30 = memref.alloc(%arg0, %arg0) : memref<?x?xf32>
|
|
%30 = memref.subview %a30[0, %arg1][%arg2, 1][1, 1] : memref<?x?xf32> to memref<?xf32, affine_map<(d0)[s0, s1] -> (d0 * s1 + s0)>>
|
|
|
|
%c8 = arith.constant 8 : index
|
|
%a40 = memref.alloc() : memref<16x16xf32>
|
|
// CHECK: memref.subview
|
|
%40 = memref.subview %a40[%c8, 8][8, 8][1, 1] :
|
|
memref<16x16xf32> to memref<8x8xf32, affine_map<(d0, d1)[s0] -> (d0 * 16 + d1 + s0)>>
|
|
|
|
return
|
|
}
|
|
|