forked from OSchip/llvm-project
636 lines
28 KiB
MLIR
636 lines
28 KiB
MLIR
// RUN: mlir-opt -split-input-file %s | FileCheck %s
|
|
// | mlir-opt | FileCheck %s
|
|
|
|
// TODO(pifon): Re-enable LLVM lowering test after IndexedGenericOp is lowered.
|
|
//
|
|
// Test that we can lower all the way to LLVM without crashing, don't check results here.
|
|
// DISABLED: mlir-opt %s --convert-linalg-to-llvm -o=/dev/null 2>&1
|
|
|
|
func @range(%arg0: index, %arg1: index, %arg2: index) {
|
|
%0 = linalg.range %arg0:%arg1:%arg2 : !linalg.range
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @range(%{{.*}}: index, %{{.*}}: index, %{{.*}}: index) {
|
|
// CHECK-NEXT: linalg.range %{{.*}} : %{{.*}} : %{{.*}} : !linalg.range
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided1D:.*]] = affine_map<(d0)[s0] -> (d0 + s0)>
|
|
// CHECK-DAG: #[[strided2D:.*]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
|
|
|
|
func @views(%arg0: index, %arg1: index, %arg2: index, %arg3: index, %arg4: index) {
|
|
%c0 = constant 0 : index
|
|
%0 = muli %arg0, %arg0 : index
|
|
%1 = alloc (%0) : memref<?xi8>
|
|
%2 = linalg.range %arg0:%arg1:%arg2 : !linalg.range
|
|
%3 = view %1[%c0][%arg0, %arg0] :
|
|
memref<?xi8> to memref<?x?xf32, offset: ?, strides: [?, 1]>
|
|
%4 = linalg.slice %3[%2, %2] :
|
|
memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
!linalg.range,
|
|
!linalg.range,
|
|
memref<?x?xf32, offset: ?, strides: [?, 1]>
|
|
%5 = linalg.slice %3[%2, %arg2] : memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
!linalg.range,
|
|
index,
|
|
memref<?xf32, offset: ?, strides: [1]>
|
|
%6 = linalg.slice %3[%arg2, %2] : memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
index,
|
|
!linalg.range,
|
|
memref<?xf32, offset: ?, strides: [1]>
|
|
%7 = linalg.slice %3[%arg2, %arg3] : memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
index,
|
|
index,
|
|
memref<f32>
|
|
%8 = view %1[%c0][%arg0, %arg0] :
|
|
memref<?xi8> to memref<?x?xvector<4x4xf32>, offset: ?, strides: [?, 1]>
|
|
dealloc %1 : memref<?xi8>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @views
|
|
// CHECK: muli %{{.*}}, %{{.*}} : index
|
|
// CHECK-NEXT: alloc(%{{.*}}) : memref<?xi8>
|
|
// CHECK-NEXT: range
|
|
// CHECK-NEXT: std.view %{{.*}}[%{{.*}}][%{{.*}}] :
|
|
// CHECK-SAME: memref<?xi8> to memref<?x?xf32, #[[strided2D]]>
|
|
// CHECK-NEXT: linalg.slice %{{.*}}[%{{.*}}, %{{.*}}] :
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: !linalg.range,
|
|
// CHECK-SAME: !linalg.range,
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>
|
|
// CHECK-NEXT: linalg.slice %{{.*}}[%{{.*}}, %{{.*}}] :
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: !linalg.range,
|
|
// CHECK-SAME: index,
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>
|
|
// CHECK-NEXT: linalg.slice %{{.*}}[%{{.*}}, %{{.*}}] :
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: index,
|
|
// CHECK-SAME: !linalg.range,
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>
|
|
// CHECK-NEXT: linalg.slice %{{.*}}[%{{.*}}, %{{.*}}] :
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: index,
|
|
// CHECK-SAME: index,
|
|
// CHECK-SAME: memref<f32>
|
|
// CHECK-NEXT: view %{{.*}}[%{{.*}}][%{{.*}}] :
|
|
// CHECK-SAME: memref<?xi8> to memref<?x?xvector<4x4xf32>, #[[strided2D]]>
|
|
// CHECK-NEXT: dealloc %{{.*}} : memref<?xi8>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided1D:.*]] = affine_map<(d0)[s0] -> (d0 + s0)>
|
|
// CHECK-DAG: #[[strided2D:.*]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
|
|
|
|
func @ops(%arg0: memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
%arg1: memref<?xf32, offset: ?, strides: [1]>,
|
|
%arg2: memref<?xf32, offset: ?, strides: [1]>,
|
|
%arg3: memref<f32>) {
|
|
linalg.matmul(%arg0, %arg0, %arg0) : memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
memref<?x?xf32, offset: ?, strides: [?, 1]>
|
|
linalg.matvec(%arg0, %arg1, %arg2) : memref<?x?xf32, offset: ?, strides: [?, 1]>,
|
|
memref<?xf32, offset: ?, strides: [1]>,
|
|
memref<?xf32, offset: ?, strides: [1]>
|
|
linalg.dot(%arg1, %arg2, %arg3) : memref<?xf32, offset: ?, strides: [1]>,
|
|
memref<?xf32, offset: ?, strides: [1]>,
|
|
memref<f32>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @ops(%
|
|
// CHECK-NEXT: linalg.matmul(%{{.*}}, %{{.*}}, %{{.*}}) :
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>
|
|
// CHECK-NEXT: linalg.matvec(%{{.*}}, %{{.*}}, %{{.*}}) :
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]>,
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>,
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>
|
|
// CHECK-NEXT: linalg.dot(%{{.*}}, %{{.*}}, %{{.*}}) :
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>,
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>,
|
|
// CHECK-SAME: memref<f32>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided1D:.*]] = affine_map<(d0)[s0] -> (d0 + s0)>
|
|
|
|
func @fill_view(%arg0: memref<?xf32, offset: ?, strides: [1]>, %arg1: f32) {
|
|
linalg.fill(%arg0, %arg1) : memref<?xf32, offset: ?, strides: [1]>, f32
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @fill_view(
|
|
// CHECK: %{{.*}}: memref<?xf32, #[[strided1D]]>, %{{.*}}: f32) {
|
|
// CHECK: linalg.fill(%{{.*}}, %{{.*}}) : memref<?xf32, #[[strided1D]]>, f32
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
|
|
func @transpose(%arg0: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
%0 = linalg.transpose %arg0 (i, j, k) -> (k, j, i) : memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @transpose
|
|
// CHECK: linalg.transpose %{{.*}} ([[i:.*]], [[j:.*]], [[k:.*]]) -> ([[k]], [[j]], [[i]]) :
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
|
|
func @fill_view3(%arg0: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>, %arg1: f32) {
|
|
linalg.fill(%arg0, %arg1) : memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>, f32
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @fill_view3(
|
|
// CHECK: %{{.*}}: memref<?x?x?xf32, #[[strided3D]]>, %{{.*}}: f32) {
|
|
// CHECK: linalg.fill(%{{.*}}, %{{.*}}) : memref<?x?x?xf32, #[[strided3D]]>, f32
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided1D:.*]] = affine_map<(d0)[s0] -> (d0 + s0)>
|
|
|
|
func @copy_view(%arg0: memref<?xf32, offset: ?, strides: [1]>,
|
|
%arg1: memref<?xf32, offset: ?, strides: [1]>) {
|
|
linalg.copy(%arg0, %arg1) : memref<?xf32, offset: ?, strides: [1]>,
|
|
memref<?xf32, offset: ?, strides: [1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @copy_view(
|
|
// CHECK: linalg.copy(%{{.*}}, %{{.*}}) :
|
|
// CHECK-SAME: memref<?xf32, #[[strided1D]]>, memref<?xf32, #[[strided1D]]>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
// CHECK-DAG: #[[map0:.*]] = affine_map<(d0, d1, d2) -> (d0, d2, d1)>
|
|
// CHECK-DAG: #[[map1:.*]] = affine_map<(d0, d1, d2) -> (d2, d1, d0)>
|
|
|
|
func @copy_view3(%arg0: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>,
|
|
%arg1: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
linalg.copy(%arg0, %arg1) {inputPermutation = affine_map<(i, j, k) -> (i, k, j)>,
|
|
outputPermutation = affine_map<(i, j, k) -> (k, j, i)>} :
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>, memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @copy_view3(
|
|
// CHECK: %{{.*}}: memref<?x?x?xf32, #[[strided3D]]>, %{{.*}}: memref<?x?x?xf32, #[[strided3D]]>) {
|
|
// CHECK: linalg.copy(%{{.*}}, %{{.*}}) {
|
|
// CHECK-SAME: inputPermutation = #[[map0]],
|
|
// CHECK-SAME: outputPermutation = #[[map1]]} :
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>,
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
|
|
func @conv_view3(%arg0: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>,
|
|
%arg1: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>,
|
|
%arg2: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
linalg.conv(%arg0, %arg1, %arg2) : memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>,
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>,
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @conv_view3(
|
|
// CHECK: linalg.conv(%{{.*}}, %{{.*}}, %{{.*}}) :
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>,
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>,
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided6D:.*]] = affine_map<(d0, d1, d2, d3, d4, d5)[s0, s1, s2, s3, s4, s5] -> (d0 * s1 + s0 + d1 * s2 + d2 * s3 + d3 * s4 + d4 * s5 + d5)>
|
|
|
|
func @conv_view6(%arg0: memref<?x?x?x?x?x?xf32, offset: ?, strides: [?, ?, ?, ?, ?, 1]>,
|
|
%arg1: memref<?x?x?x?x?x?xf32, offset: ?, strides: [?, ?, ?, ?, ?, 1]>,
|
|
%arg2: memref<?x?x?x?x?x?xf32, offset: ?, strides: [?, ?, ?, ?, ?, 1]>) {
|
|
linalg.conv(%arg0, %arg1, %arg2) {dilations = [4, 4, 5, 5], strides = [2, 2, 3, 3]} :
|
|
memref<?x?x?x?x?x?xf32, offset: ?, strides: [?, ?, ?, ?, ?, 1]>,
|
|
memref<?x?x?x?x?x?xf32, offset: ?, strides: [?, ?, ?, ?, ?, 1]>,
|
|
memref<?x?x?x?x?x?xf32, offset: ?, strides: [?, ?, ?, ?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @conv_view6(
|
|
// CHECK: linalg.conv(%{{.*}}, %{{.*}}, %{{.*}}) {
|
|
// CHECK-SAME: dilations = [4, 4, 5, 5], strides = [2, 2, 3, 3]} :
|
|
// CHECK-SAME: memref<?x?x?x?x?x?xf32, #[[strided6D]]>,
|
|
// CHECK-SAME: memref<?x?x?x?x?x?xf32, #[[strided6D]]>,
|
|
// CHECK-SAME: memref<?x?x?x?x?x?xf32, #[[strided6D]]>
|
|
|
|
// -----
|
|
|
|
func @conv_padding(%arg0: memref<?x?x?x?xf32>,
|
|
%arg1: memref<?x?x?x?xf32>,
|
|
%arg2: memref<?x?x?x?xf32>) {
|
|
linalg.conv(%arg0, %arg1, %arg2) {dilations = [1, 1],
|
|
padding = dense<[[0, 1], [1, 1]]> : tensor<2x2xi64>,
|
|
strides = [1, 1]} :
|
|
memref<?x?x?x?xf32>, memref<?x?x?x?xf32>, memref<?x?x?x?xf32>
|
|
return
|
|
}
|
|
|
|
// CHECK-LABEL: func @conv_padding(
|
|
// CHECK: linalg.conv(%{{.*}}, %{{.*}}, %{{.*}}) {
|
|
// CHECK-SAME: dilations = [1, 1],
|
|
// CHECK-SAME: padding = dense<[
|
|
// CHECK-SAME: [0, 1], [1, 1]]> : tensor<2x2xi64>,
|
|
// CHECK-SAME: strides = [1, 1]} :
|
|
// CHECK-SAME: memref<?x?x?x?xf32>,
|
|
// CHECK-SAME: memref<?x?x?x?xf32>,
|
|
// CHECK-SAME: memref<?x?x?x?xf32>
|
|
|
|
// -----
|
|
|
|
func @pooling_max(%arg0: memref<?x?x?xf32>,
|
|
%arg1: memref<?x?x?xi32>,
|
|
%arg2: memref<?x?x?xf32>) {
|
|
linalg.pooling_max(%arg0, %arg1, %arg2) {strides = [2, 1, 2]}:
|
|
memref<?x?x?xf32>, memref<?x?x?xi32>, memref<?x?x?xf32>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @pooling_max
|
|
// CHECK: linalg.pooling_max(%{{.*}}, %{{.*}}, %{{.*}})
|
|
// CHECK-SAME: {strides = [2, 1, 2]}
|
|
// CHECK-SAME: memref<?x?x?xf32>, memref<?x?x?xi32>, memref<?x?x?xf32>
|
|
|
|
// -----
|
|
|
|
func @pooling_min(%arg0: memref<?x?x?xf32>,
|
|
%arg1: memref<?x?x?xi32>,
|
|
%arg2: memref<?x?x?xf32>) {
|
|
linalg.pooling_min(%arg0, %arg1, %arg2) {strides = [2, 1, 2]}:
|
|
memref<?x?x?xf32>, memref<?x?x?xi32>, memref<?x?x?xf32>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @pooling_min
|
|
// CHECK: linalg.pooling_min(%{{.*}}, %{{.*}}, %{{.*}})
|
|
// CHECK-SAME: {strides = [2, 1, 2]}
|
|
// CHECK-SAME: memref<?x?x?xf32>, memref<?x?x?xi32>, memref<?x?x?xf32>
|
|
|
|
// -----
|
|
|
|
func @pooling_sum(%arg0: memref<?x?x?xf32>,
|
|
%arg1: memref<?x?x?xi32>,
|
|
%arg2: memref<?x?x?xf32>) {
|
|
linalg.pooling_sum(%arg0, %arg1, %arg2) {strides = [2, 1, 2]}:
|
|
memref<?x?x?xf32>, memref<?x?x?xi32>, memref<?x?x?xf32>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @pooling_sum
|
|
// CHECK: linalg.pooling_sum(%{{.*}}, %{{.*}}, %{{.*}})
|
|
// CHECK-SAME: {strides = [2, 1, 2]}
|
|
// CHECK-SAME: memref<?x?x?xf32>, memref<?x?x?xi32>, memref<?x?x?xf32>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided2D:.*]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
|
|
#accesses = [
|
|
affine_map<(i, j, k) -> (j, i)>,
|
|
affine_map<(i, j, k) -> (i, k, i + j)>
|
|
]
|
|
|
|
#trait = {
|
|
args_in = 1,
|
|
args_out = 1,
|
|
indexing_maps = #accesses,
|
|
iterator_types = ["parallel", "parallel", "parallel"],
|
|
library_call = "some_external_function_name_1"
|
|
}
|
|
|
|
func @generic(%arg0: memref<?x?xvector<3x4xi4>, offset: ?, strides: [?, 1]>,
|
|
%arg1: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
linalg.generic #trait {foo = 1} %arg0, %arg1 {
|
|
^bb(%0: vector<3x4xi4>, %1: f32) :
|
|
%f0 = constant 0.0 : f32
|
|
linalg.yield %f0 : f32
|
|
} : memref<?x?xvector<3x4xi4>, offset: ?, strides: [?, 1]>,
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @generic
|
|
// CHECK: linalg.generic {args_in = 1 : i64, args_out = 1 : i64,
|
|
// CHECK-SAME: indexing_maps = [#{{.*}}, #{{.*}}], iterator_types = ["parallel", "parallel", "parallel"],
|
|
// CHECK-SAME: library_call = "some_external_function_name_1"
|
|
// CHECK-SAME: {foo = 1 : i64}
|
|
// CHECK: memref<?x?xvector<3x4xi4>, #[[strided2D]]>, memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
func @generic_with_tensor_input(%arg0: tensor<?x?xvector<3x4xi4>>,
|
|
%arg1: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
linalg.generic #trait {foo = 1} %arg0, %arg1 {
|
|
^bb(%0: vector<3x4xi4>, %1: f32) :
|
|
%f0 = constant 0.0 : f32
|
|
linalg.yield %f0 : f32
|
|
} : tensor<?x?xvector<3x4xi4>>,
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @generic_with_tensor_input
|
|
// CHECK: linalg.generic {args_in = 1 : i64, args_out = 1 : i64,
|
|
// CHECK-SAME: indexing_maps = [#{{.*}}, #{{.*}}], iterator_types = ["parallel", "parallel", "parallel"],
|
|
// CHECK-SAME: library_call = "some_external_function_name_1"}
|
|
// CHECK-SAME: {foo = 1 : i64}
|
|
// CHECK: tensor<?x?xvector<3x4xi4>>, memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
// -----
|
|
|
|
#accesses = [
|
|
affine_map<(i, j, k) -> (j, i)>,
|
|
affine_map<(i, j, k) -> (i, k, i + j)>
|
|
]
|
|
|
|
#trait2 = {
|
|
args_in = 2,
|
|
args_out = 1,
|
|
indexing_maps = #accesses,
|
|
iterator_types = ["parallel", "parallel", "parallel"],
|
|
library_call = "some_external_function_name_1"
|
|
}
|
|
|
|
func @generic_with_tensor_input_and_output(
|
|
%arg0: tensor<?x?xvector<3x4xi4>>, %arg1: tensor<?x?x?xf32>)
|
|
-> (tensor<?x?x?xf32>) {
|
|
%0 = linalg.generic #trait2 {foo = 1} %arg0, %arg1 {
|
|
^bb(%0: vector<3x4xi4>, %1: f32) :
|
|
%f0 = constant 0.0 : f32
|
|
linalg.yield %f0 : f32
|
|
} : tensor<?x?xvector<3x4xi4>>, tensor<?x?x?xf32> -> tensor<?x?x?xf32>
|
|
return %0 : tensor<?x?x?xf32>
|
|
}
|
|
// CHECK-LABEL: func @generic_with_tensor_input_and_output
|
|
// CHECK: linalg.generic {args_in = 2 : i64, args_out = 1 : i64,
|
|
// CHECK-SAME: indexing_maps = [#{{.*}}, #{{.*}}], iterator_types = ["parallel", "parallel", "parallel"],
|
|
// CHECK-SAME: library_call = "some_external_function_name_1"}
|
|
// CHECK-SAME: {foo = 1 : i64}
|
|
// CHECK-SAME: %{{.*}}, %{{.*}}
|
|
// CHECK: tensor<?x?xvector<3x4xi4>>, tensor<?x?x?xf32> -> tensor<?x?x?xf32>
|
|
// CHECK: return {{.*}} : tensor<?x?x?xf32>
|
|
|
|
// -----
|
|
|
|
#accesses = [
|
|
affine_map<(i, j, k) -> (j, i)>,
|
|
affine_map<(i, j, k) -> (i, k, i + j)>
|
|
]
|
|
|
|
#trait2 = {
|
|
args_in = 2,
|
|
args_out = 1,
|
|
indexing_maps = #accesses,
|
|
iterator_types = ["parallel", "parallel", "parallel"],
|
|
library_call = "some_external_function_name_1"
|
|
}
|
|
|
|
func @indexed_generic_with_tensor_input_and_output(
|
|
%arg0: tensor<?x?xvector<3x4xi4>>, %arg1: tensor<?x?x?xf32>)
|
|
-> (tensor<?x?x?xf32>) {
|
|
%0 = linalg.indexed_generic #trait2 {foo = 1} %arg0, %arg1 {
|
|
^bb(%i: index, %j: index, %k: index, %0: vector<3x4xi4>, %1: f32) :
|
|
%f0 = constant 0.0 : f32
|
|
linalg.yield %f0 : f32
|
|
} : tensor<?x?xvector<3x4xi4>>, tensor<?x?x?xf32> -> tensor<?x?x?xf32>
|
|
return %0 : tensor<?x?x?xf32>
|
|
}
|
|
// CHECK-LABEL: func @indexed_generic_with_tensor_input_and_output
|
|
// CHECK: linalg.indexed_generic {args_in = 2 : i64, args_out = 1 : i64,
|
|
// CHECK-SAME: indexing_maps = [#{{.*}}, #{{.*}}], iterator_types = ["parallel", "parallel", "parallel"],
|
|
// CHECK-SAME: library_call = "some_external_function_name_1"}
|
|
// CHECK-SAME: {foo = 1 : i64}
|
|
// CHECK-SAME: %{{.*}}, %{{.*}}
|
|
// CHECK: tensor<?x?xvector<3x4xi4>>, tensor<?x?x?xf32> -> tensor<?x?x?xf32>
|
|
// CHECK: return {{.*}} : tensor<?x?x?xf32>
|
|
|
|
// -----
|
|
|
|
#broadcast_access = [
|
|
affine_map<(i, j) -> ()>,
|
|
affine_map<(i, j) -> (i, j)>
|
|
]
|
|
|
|
#trait_broadcast = {
|
|
args_in = 1,
|
|
args_out = 1,
|
|
indexing_maps = #broadcast_access,
|
|
iterator_types = ["parallel", "parallel"],
|
|
library_call = "some_broadcast_external_fn"
|
|
}
|
|
|
|
func @generic_op_zero_rank(%arg0: tensor<f32>) -> (tensor<3x4xf32>)
|
|
{
|
|
%0 = linalg.generic #trait_broadcast %arg0 {
|
|
^bb(%a: f32) :
|
|
linalg.yield %a : f32
|
|
} : tensor<f32> -> tensor<3x4xf32>
|
|
return %0 : tensor<3x4xf32>
|
|
}
|
|
|
|
func @indexed_generic_op_zero_rank(%arg0: tensor<f32>) -> (tensor<3x4xf32>)
|
|
{
|
|
%0 = linalg.indexed_generic #trait_broadcast %arg0 {
|
|
^bb(%i: index, %j: index, %a: f32) :
|
|
linalg.yield %a : f32
|
|
} : tensor<f32> -> tensor<3x4xf32>
|
|
return %0 : tensor<3x4xf32>
|
|
}
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided2D:.*]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
|
|
#accesses = [
|
|
affine_map<(i, j, k) -> (j, i)>,
|
|
affine_map<(i, j, k) -> (i, k, i + j)>
|
|
]
|
|
|
|
#trait3 = {
|
|
args_in = 1,
|
|
args_out = 1,
|
|
indexing_maps = #accesses,
|
|
iterator_types = ["parallel", "parallel", "parallel"],
|
|
library_call = "some_external_function_name_2"
|
|
}
|
|
|
|
func @generic_region(%arg0: memref<?x?xvector<3x4xi4>, offset: ?, strides: [?, 1]>,
|
|
%arg1: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
linalg.generic #trait3 {foo = 1} %arg0, %arg1 {
|
|
^bb(%a: vector<3x4xi4>, %b: f32) :
|
|
linalg.yield %b : f32
|
|
} : memref<?x?xvector<3x4xi4>, offset: ?, strides: [?, 1]>,
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @generic_region
|
|
// CHECK: linalg.generic {args_in = 1 : i64, args_out = 1 : i64,
|
|
// CHECK-SAME: indexing_maps = [#{{.*}}, #{{.*}}], iterator_types = ["parallel", "parallel", "parallel"],
|
|
// CHECK-SAME: library_call = "some_external_function_name_2"
|
|
// CHECK-SAME: {foo = 1 : i64}
|
|
// CHECK: ^{{.*}}(%{{.*}}: vector<3x4xi4>, %{{.*}}: f32):
|
|
// CHECK: linalg.yield %{{.*}} : f32
|
|
// CHECK: memref<?x?xvector<3x4xi4>, #[[strided2D]]>,
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
func @indexed_generic(%arg0: memref<?x?xvector<3x4xi4>, offset: ?, strides: [?, 1]>,
|
|
%arg1: memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>) {
|
|
linalg.indexed_generic #trait3 {foo = 1} %arg0, %arg1 {
|
|
^bb(%i: index, %j: index, %k: index, %a: vector<3x4xi4>, %b: f32) :
|
|
linalg.yield %b : f32
|
|
}: memref<?x?xvector<3x4xi4>, offset: ?, strides: [?, 1]>,
|
|
memref<?x?x?xf32, offset: ?, strides: [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @indexed_generic
|
|
// CHECK: linalg.indexed_generic {args_in = 1 : i64, args_out = 1 : i64,
|
|
// CHECK-SAME: indexing_maps = [#{{.*}}, #{{.*}}], iterator_types = ["parallel", "parallel", "parallel"],
|
|
// CHECK-SAME: library_call = "some_external_function_name_2"
|
|
// CHECK-SAME: {foo = 1 : i64}
|
|
// CHECK: ^{{.*}}(%{{.*}}: index, %{{.*}}: index, %{{.*}}: index, %{{.*}}: vector<3x4xi4>, %{{.*}}: f32):
|
|
// CHECK: linalg.yield %{{.*}} : f32
|
|
// CHECK: }: memref<?x?xvector<3x4xi4>, #[[strided2D]]>,
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[reshapeD01:.*]] = affine_map<(d0, d1, d2) -> (d0, d1)>
|
|
// CHECK-DAG: #[[reshapeD2:.*]] = affine_map<(d0, d1, d2) -> (d2)>
|
|
// CHECK-DAG: #[[reshapeD0:.*]] = affine_map<(d0, d1, d2) -> (d0)>
|
|
// CHECK-DAG: #[[reshapeD12:.*]] = affine_map<(d0, d1, d2) -> (d1, d2)>
|
|
// CHECK-DAG: #[[reshapeD012:.*]] = affine_map<(d0, d1, d2) -> (d0, d1, d2)>
|
|
// CHECK-DAG: #[[reshape5D01:.*]] = affine_map<(d0, d1, d2, d3, d4) -> (d0, d1)>
|
|
// CHECK-DAG: #[[reshape5D2:.*]] = affine_map<(d0, d1, d2, d3, d4) -> (d2)>
|
|
// CHECK-DAG: #[[reshape5D34:.*]] = affine_map<(d0, d1, d2, d3, d4) -> (d3, d4)>
|
|
|
|
func @reshape_static(%arg0: memref<3x4x5xf32>, %arg1: tensor<3x4x5xf32>, %arg2: tensor<3x?x5xf32>) {
|
|
// Reshapes that collapse and expand back a contiguous buffer.
|
|
%0 = linalg.reshape %arg0 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<3x4x5xf32> into memref<12x5xf32>
|
|
%r0 = linalg.reshape %0 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<12x5xf32> into memref<3x4x5xf32>
|
|
%1 = linalg.reshape %arg0 [affine_map<(i, j, k) -> (i)>,
|
|
affine_map<(i, j, k) -> (j, k)>] :
|
|
memref<3x4x5xf32> into memref<3x20xf32>
|
|
%r1 = linalg.reshape %1 [affine_map<(i, j, k) -> (i)>,
|
|
affine_map<(i, j, k) -> (j, k)>] :
|
|
memref<3x20xf32> into memref<3x4x5xf32>
|
|
%2 = linalg.reshape %arg0 [affine_map<(i, j, k) -> (i, j, k)>] :
|
|
memref<3x4x5xf32> into memref<60xf32>
|
|
%r2 = linalg.reshape %2 [affine_map<(i, j, k) -> (i, j, k)>] :
|
|
memref<60xf32> into memref<3x4x5xf32>
|
|
// Reshapes that expand and collapse back a contiguous buffer with some 1's.
|
|
%3 = linalg.reshape %arg0 [affine_map<(i, j, k, l, m) -> (i, j)>,
|
|
affine_map<(i, j, k, l, m) -> (k)>,
|
|
affine_map<(i, j, k, l, m) -> (l, m)>] :
|
|
memref<3x4x5xf32> into memref<1x3x4x1x5xf32>
|
|
%r3 = linalg.reshape %3 [affine_map<(i, j, k, l, m) -> (i, j)>,
|
|
affine_map<(i, j, k, l, m) -> (k)>,
|
|
affine_map<(i, j, k, l, m) -> (l, m)>] :
|
|
memref<1x3x4x1x5xf32> into memref<3x4x5xf32>
|
|
// Reshapes on tensors.
|
|
%t0 = linalg.tensor_reshape %arg1 [affine_map<(i, j, k, l, m) -> (i, j)>,
|
|
affine_map<(i, j, k, l, m) -> (k)>,
|
|
affine_map<(i, j, k, l, m) -> (l, m)>] :
|
|
tensor<3x4x5xf32> into tensor<1x3x4x1x5xf32>
|
|
%rt0 = linalg.tensor_reshape %t0 [affine_map<(i, j, k, l, m) -> (i, j)>,
|
|
affine_map<(i, j, k, l, m) -> (k)>,
|
|
affine_map<(i, j, k, l, m) -> (l, m)>] :
|
|
tensor<1x3x4x1x5xf32> into tensor<3x4x5xf32>
|
|
%t1 = linalg.tensor_reshape %arg2 [affine_map<(i, j, k, l, m) -> (i, j)>,
|
|
affine_map<(i, j, k, l, m) -> (k)>,
|
|
affine_map<(i, j, k, l, m) -> (l, m)>] :
|
|
tensor<3x?x5xf32> into tensor<1x3x?x1x5xf32>
|
|
%rt1 = linalg.tensor_reshape %t1 [affine_map<(i, j, k, l, m) -> (i)>,
|
|
affine_map<(i, j, k, l, m) -> (j, k)>,
|
|
affine_map<(i, j, k, l, m) -> (l, m)>] :
|
|
tensor<1x3x?x1x5xf32> into tensor<1x?x5xf32>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @reshape_static
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<3x4x5xf32> into memref<12x5xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<12x5xf32> into memref<3x4x5xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD0]], #[[reshapeD12]]]
|
|
// CHECK-SAME: memref<3x4x5xf32> into memref<3x20xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD0]], #[[reshapeD12]]]
|
|
// CHECK-SAME: memref<3x20xf32> into memref<3x4x5xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD012]]]
|
|
// CHECK-SAME: memref<3x4x5xf32> into memref<60xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD012]]]
|
|
// CHECK-SAME: memref<60xf32> into memref<3x4x5xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshape5D01]], #[[reshape5D2]], #[[reshape5D34]]]
|
|
// CHECK-SAME: memref<3x4x5xf32> into memref<1x3x4x1x5xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshape5D01]], #[[reshape5D2]], #[[reshape5D34]]]
|
|
// CHECK-SAME: memref<1x3x4x1x5xf32> into memref<3x4x5xf32>
|
|
//
|
|
// CHECK: linalg.tensor_reshape {{.*}}: tensor<3x4x5xf32> into tensor<1x3x4x1x5xf32>
|
|
// CHECK: linalg.tensor_reshape {{.*}}: tensor<1x3x4x1x5xf32> into tensor<3x4x5xf32>
|
|
// CHECK: linalg.tensor_reshape {{.*}}: tensor<3x?x5xf32> into tensor<1x3x?x1x5xf32>
|
|
// CHECK: linalg.tensor_reshape {{.*}}: tensor<1x3x?x1x5xf32> into tensor<1x?x5xf32>
|
|
|
|
// -----
|
|
|
|
// CHECK-DAG: #[[strided2D:.*]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + s0 + d1)>
|
|
// CHECK-DAG: #[[strided2DOFF0:.*]] = affine_map<(d0, d1)[s0] -> (d0 * s0 + d1)>
|
|
// CHECK-DAG: #[[strided3D:.*]] = affine_map<(d0, d1, d2)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2 + d2)>
|
|
// CHECK-DAG: #[[strided3DOFF0:.*]] = affine_map<(d0, d1, d2)[s0, s1] -> (d0 * s0 + d1 * s1 + d2)>
|
|
|
|
func @reshape_dynamic(%arg0: memref<?x?x?xf32>,
|
|
%arg1: memref<?x?x?xf32, offset : 0, strides : [?, ?, 1]>,
|
|
%arg2: memref<?x?x?xf32, offset : ?, strides : [?, ?, 1]>) {
|
|
%0 = linalg.reshape %arg0 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<?x?x?xf32> into memref<?x?xf32>
|
|
%r0 = linalg.reshape %0 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<?x?xf32> into memref<?x?x?xf32>
|
|
%1 = linalg.reshape %arg1 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<?x?x?xf32, offset : 0, strides : [?, ?, 1]> into
|
|
memref<?x?xf32, offset : 0, strides : [?, 1]>
|
|
%r1 = linalg.reshape %1 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<?x?xf32, offset : 0, strides : [?, 1]> into
|
|
memref<?x?x?xf32, offset : 0, strides : [?, ?, 1]>
|
|
%2 = linalg.reshape %arg2 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<?x?x?xf32, offset : ?, strides : [?, ?, 1]> into
|
|
memref<?x?xf32, offset : ?, strides : [?, 1]>
|
|
%r2 = linalg.reshape %2 [affine_map<(i, j, k) -> (i, j)>,
|
|
affine_map<(i, j, k) -> (k)>] :
|
|
memref<?x?xf32, offset : ?, strides : [?, 1]> into
|
|
memref<?x?x?xf32, offset : ?, strides : [?, ?, 1]>
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @reshape
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<?x?x?xf32> into memref<?x?xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<?x?xf32> into memref<?x?x?xf32>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3DOFF0]]> into memref<?x?xf32, #[[strided2DOFF0]]>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2DOFF0]]> into memref<?x?x?xf32, #[[strided3DOFF0]]>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<?x?x?xf32, #[[strided3D]]> into memref<?x?xf32, #[[strided2D]]>
|
|
// CHECK: linalg.reshape {{.*}} [#[[reshapeD01]], #[[reshapeD2]]]
|
|
// CHECK-SAME: memref<?x?xf32, #[[strided2D]]> into memref<?x?x?xf32, #[[strided3D]]>
|
|
|
|
|
|
// TODO: Return tensors need a semantics convention update.
|
|
func @named_ops(%a3: memref<?x?x?xf32>, %b3: memref<?x?x?xf32>, %c3: memref<?x?x?xf32>,
|
|
%ta3: tensor<?x?x?xf32>, %tb3: tensor<?x?x?xf32>, %tc3: tensor<?x?x?xf32>) {
|
|
linalg.batch_matmul %a3, %b3, %c3 : (memref<?x?x?xf32>, memref<?x?x?xf32>, memref<?x?x?xf32>) -> ()
|
|
linalg.batch_matmul %ta3, %tb3, %c3 : (tensor<?x?x?xf32>, tensor<?x?x?xf32>, memref<?x?x?xf32>) -> ()
|
|
return
|
|
}
|
|
// CHECK-LABEL: func @named_ops
|
|
// CHECK: linalg.batch_matmul
|
|
// CHECK: linalg.batch_matmul
|
|
|