2020-03-30 06:35:38 +08:00
|
|
|
// RUN: mlir-opt -allow-unregistered-dialect %s | FileCheck %s
|
2018-11-18 00:24:07 +08:00
|
|
|
// Verify the printed output can be parsed.
|
2020-03-30 06:35:38 +08:00
|
|
|
// RUN: mlir-opt -allow-unregistered-dialect %s | mlir-opt -allow-unregistered-dialect | FileCheck %s
|
2019-02-06 03:47:02 +08:00
|
|
|
// Verify the generic form can be parsed.
|
2020-03-30 06:35:38 +08:00
|
|
|
// RUN: mlir-opt -allow-unregistered-dialect -mlir-print-op-generic %s | mlir-opt -allow-unregistered-dialect | FileCheck %s
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
// CHECK: #map0 = affine_map<(d0) -> (d0 + 1)>
|
2018-07-29 00:36:25 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
// CHECK: #map1 = affine_map<()[s0] -> (s0 + 1)>
|
2019-11-07 03:25:16 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
// CHECK-DAG: #[[VIEW_MAP1:map[0-9]+]] = affine_map<(d0, d1) -> (d0 * 4 + d1)>
|
|
|
|
// CHECK-DAG: #[[VIEW_MAP2:map[0-9]+]] = affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + d1 + s0)>
|
|
|
|
// CHECK-DAG: #[[VIEW_MAP3:map[0-9]+]] = affine_map<(d0, d1)[s0] -> (d0 * s0 + d1)>
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
// CHECK-DAG: #[[BASE_MAP0:map[0-9]+]] = affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2)>
|
|
|
|
// CHECK-DAG: #[[BASE_MAP3:map[0-9]+]] = affine_map<(d0, d1, d2)[s0, s1, s2, s3] -> (d0 * s1 + s0 + d1 * s2 + d2 * s3)>
|
|
|
|
// CHECK-DAG: #[[SUBVIEW_MAP0:map[0-9]+]] = affine_map<(d0, d1, d2)[s0, s1, s2, s3] -> (d0 * s1 + d1 * s2 + d2 * s3 + s0)>
|
2019-11-12 02:32:52 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
// CHECK-DAG: #[[BASE_MAP1:map[0-9]+]] = affine_map<(d0)[s0] -> (d0 + s0)>
|
|
|
|
// CHECK-DAG: #[[SUBVIEW_MAP1:map[0-9]+]] = affine_map<(d0)[s0, s1] -> (d0 * s1 + s0)>
|
2019-11-12 02:32:52 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
// CHECK-DAG: #[[BASE_MAP2:map[0-9]+]] = affine_map<(d0, d1) -> (d0 * 22 + d1)>
|
|
|
|
// CHECK-DAG: #[[SUBVIEW_MAP2:map[0-9]+]] = affine_map<(d0, d1)[s0, s1, s2] -> (d0 * s1 + d1 * s2 + s0)>
|
|
|
|
// CHECK-DAG: #[[SUBVIEW_MAP3:map[0-9]+]] = affine_map<(d0, d1, d2) -> (d0 * 16 + d1 * 4 + d2 + 8)>
|
|
|
|
// CHECK-DAG: #[[SUBVIEW_MAP4:map[0-9]+]] = affine_map<(d0, d1)[s0, s1, s2] -> (d0 * s1 + s0 + d1 * s2)>
|
|
|
|
// CHECK-DAG: #[[SUBVIEW_MAP5:map[0-9]+]] = affine_map<(d0, d1)[s0] -> (d0 * 8 + s0 + d1 * 2)>
|
2019-11-12 02:32:52 +08:00
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @func_with_ops(%arg0: f32) {
|
|
|
|
func @func_with_ops(f32) {
|
2018-12-30 03:32:37 +08:00
|
|
|
^bb0(%a : f32):
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %0 = "getTensor"() : () -> tensor<4x4x?xf32>
|
2018-07-25 01:13:31 +08:00
|
|
|
%t = "getTensor"() : () -> tensor<4x4x?xf32>
|
|
|
|
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %1 = dim %0, 2 : tensor<4x4x?xf32>
|
2019-06-26 10:06:06 +08:00
|
|
|
%t2 = "std.dim"(%t){index = 2} : (tensor<4x4x?xf32>) -> index
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %2 = addf %arg0, %arg0 : f32
|
2019-03-03 10:03:03 +08:00
|
|
|
%x = "std.addf"(%a, %a) : (f32,f32) -> (f32)
|
2018-07-25 01:13:31 +08:00
|
|
|
|
|
|
|
// CHECK: return
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-10-04 07:36:43 +08:00
|
|
|
// CHECK-LABEL: func @standard_instrs(%arg0: tensor<4x4x?xf32>, %arg1: f32, %arg2: i32, %arg3: index, %arg4: i64, %arg5: f16) {
|
|
|
|
func @standard_instrs(tensor<4x4x?xf32>, f32, i32, index, i64, f16) {
|
|
|
|
^bb42(%t: tensor<4x4x?xf32>, %f: f32, %i: i32, %idx : index, %j: i64, %half: f16):
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %0 = dim %arg0, 2 : tensor<4x4x?xf32>
|
2019-06-26 10:06:06 +08:00
|
|
|
%a = "std.dim"(%t){index = 2} : (tensor<4x4x?xf32>) -> index
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %1 = dim %arg0, 2 : tensor<4x4x?xf32>
|
2018-07-26 02:15:20 +08:00
|
|
|
%a2 = dim %t, 2 : tensor<4x4x?xf32>
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %2 = addf %arg1, %arg1 : f32
|
2019-03-03 10:03:03 +08:00
|
|
|
%f2 = "std.addf"(%f, %f) : (f32,f32) -> f32
|
2018-07-25 01:41:30 +08:00
|
|
|
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %3 = addf %2, %2 : f32
|
2018-07-26 02:15:20 +08:00
|
|
|
%f3 = addf %f2, %f2 : f32
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
2018-10-04 00:43:13 +08:00
|
|
|
// CHECK: %4 = addi %arg2, %arg2 : i32
|
2019-03-03 10:03:03 +08:00
|
|
|
%i2 = "std.addi"(%i, %i) : (i32,i32) -> i32
|
2018-10-04 00:43:13 +08:00
|
|
|
|
|
|
|
// CHECK: %5 = addi %4, %4 : i32
|
|
|
|
%i3 = addi %i2, %i2 : i32
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = addi %arg3, %arg3 : index
|
|
|
|
%idx1 = addi %idx, %idx : index
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = addi %arg3, %{{[0-9]+}} : index
|
2019-03-03 10:03:03 +08:00
|
|
|
%idx2 = "std.addi"(%idx, %idx1) : (index, index) -> index
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
|
|
|
// CHECK: %8 = subf %arg1, %arg1 : f32
|
2019-03-03 10:03:03 +08:00
|
|
|
%f4 = "std.subf"(%f, %f) : (f32,f32) -> f32
|
2018-10-04 00:43:13 +08:00
|
|
|
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
// CHECK: %9 = subf %8, %8 : f32
|
2018-10-04 00:43:13 +08:00
|
|
|
%f5 = subf %f4, %f4 : f32
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
|
|
|
// CHECK: %10 = subi %arg2, %arg2 : i32
|
2019-03-03 10:03:03 +08:00
|
|
|
%i4 = "std.subi"(%i, %i) : (i32,i32) -> i32
|
2018-10-04 00:43:13 +08:00
|
|
|
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
// CHECK: %11 = subi %10, %10 : i32
|
2018-10-04 00:43:13 +08:00
|
|
|
%i5 = subi %i4, %i4 : i32
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
|
|
|
// CHECK: %12 = mulf %2, %2 : f32
|
2018-10-04 00:43:13 +08:00
|
|
|
%f6 = mulf %f2, %f2 : f32
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
|
|
|
// CHECK: %13 = muli %4, %4 : i32
|
2018-10-04 00:43:13 +08:00
|
|
|
%i6 = muli %i2, %i2 : i32
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %c42_i32 = constant 42 : i32
|
2019-06-26 10:06:06 +08:00
|
|
|
%x = "std.constant"(){value = 42 : i32} : () -> i32
|
2018-08-02 01:43:18 +08:00
|
|
|
|
|
|
|
// CHECK: %c42_i32_0 = constant 42 : i32
|
|
|
|
%7 = constant 42 : i32
|
2018-08-03 07:54:36 +08:00
|
|
|
|
2019-06-26 10:06:06 +08:00
|
|
|
// CHECK: %c43 = constant {crazy = "std.foo"} 43 : index
|
|
|
|
%8 = constant {crazy = "std.foo"} 43: index
|
2018-08-17 07:56:40 +08:00
|
|
|
|
2018-08-20 12:17:22 +08:00
|
|
|
// CHECK: %cst = constant 4.300000e+01 : bf16
|
2018-08-17 07:56:40 +08:00
|
|
|
%9 = constant 43.0 : bf16
|
2018-08-20 12:17:22 +08:00
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK: %f = constant @func_with_ops : (f32) -> ()
|
|
|
|
%10 = constant @func_with_ops : (f32) -> ()
|
2018-08-20 12:17:22 +08:00
|
|
|
|
|
|
|
// CHECK: %f_1 = constant @affine_apply : () -> ()
|
|
|
|
%11 = constant @affine_apply : () -> ()
|
|
|
|
|
2018-08-22 08:55:22 +08:00
|
|
|
// CHECK: %f_2 = constant @affine_apply : () -> ()
|
|
|
|
%12 = constant @affine_apply : () -> ()
|
|
|
|
|
2019-06-26 07:06:13 +08:00
|
|
|
// CHECK: %cst_3 = constant dense<0> : vector<4xi32>
|
|
|
|
%13 = constant dense<0> : vector<4 x i32>
|
2018-10-30 01:22:49 +08:00
|
|
|
|
2019-06-26 07:06:13 +08:00
|
|
|
// CHECK: %cst_4 = constant dense<0> : tensor<42xi32>
|
|
|
|
%tci32 = constant dense<0> : tensor<42 x i32>
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
2019-06-26 07:06:13 +08:00
|
|
|
// CHECK: %cst_5 = constant dense<0> : vector<42xi32>
|
|
|
|
%vci32 = constant dense<0> : vector<42 x i32>
|
2018-11-08 22:48:09 +08:00
|
|
|
|
2018-11-08 20:02:00 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "eq", %{{[0-9]+}}, %{{[0-9]+}} : i32
|
|
|
|
%14 = cmpi "eq", %i3, %i4 : i32
|
|
|
|
|
|
|
|
// Predicate 1 means inequality comparison.
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "ne", %{{[0-9]+}}, %{{[0-9]+}} : i32
|
2019-06-26 10:06:06 +08:00
|
|
|
%15 = "std.cmpi"(%i3, %i4) {predicate = 1} : (i32, i32) -> i1
|
2018-11-08 20:02:00 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "slt", %cst_3, %cst_3 : vector<4xi32>
|
|
|
|
%16 = cmpi "slt", %13, %13 : vector<4 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "ne", %cst_3, %cst_3 : vector<4xi32>
|
2019-06-26 10:06:06 +08:00
|
|
|
%17 = "std.cmpi"(%13, %13) {predicate = 1} : (vector<4 x i32>, vector<4 x i32>) -> vector<4 x i1>
|
2018-11-08 20:02:00 +08:00
|
|
|
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "slt", %arg3, %arg3 : index
|
|
|
|
%18 = cmpi "slt", %idx, %idx : index
|
|
|
|
|
2018-12-12 05:49:43 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "eq", %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%19 = cmpi "eq", %tci32, %tci32 : tensor<42 x i32>
|
Enable arithmetics for index types.
Arithmetic and comparison instructions are necessary to implement, e.g.,
control flow when lowering MLFunctions to CFGFunctions. (While it is possible
to replace some of the arithmetics by affine_apply instructions for loop
bounds, it is still necessary for loop bounds checking, steps, if-conditions,
non-trivial memref subscripts, etc.) Furthermore, working with indirect
accesses in, e.g., lookup tables for large embeddings, may require operating on
tensors of indexes. For example, the equivalents to C code "LUT[Index[i]]" or
"ResultIndex[i] = i + j" where i, j are loop induction variables require the
arithmetics on indices as well as the possibility to operate on tensors
thereof. Allow arithmetic and comparison operations to apply to index types by
declaring them integer-like. Allow tensors whose element type is index for
indirection purposes.
The absence of vectors with "index" element type is explicitly tested, but the
only justification for this restriction in the CL introducing the test is
"because we don't need them". Do NOT enable vectors of index types, although
it makes vector and tensor types inconsistent with respect to allowed element
types.
PiperOrigin-RevId: 220614055
2018-11-08 20:04:32 +08:00
|
|
|
|
2018-12-12 05:49:43 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = cmpi "eq", %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%20 = cmpi "eq", %vci32, %vci32 : vector<42 x i32>
|
2018-11-08 22:48:09 +08:00
|
|
|
|
2018-11-28 23:08:55 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = select %{{[0-9]+}}, %arg3, %arg3 : index
|
|
|
|
%21 = select %18, %idx, %idx : index
|
|
|
|
|
2018-12-12 05:49:43 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = select %{{[0-9]+}}, %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%22 = select %19, %tci32, %tci32 : tensor<42 x i32>
|
2018-11-28 23:08:55 +08:00
|
|
|
|
2018-12-12 05:49:43 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = select %{{[0-9]+}}, %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%23 = select %20, %vci32, %vci32 : vector<42 x i32>
|
2018-11-28 23:08:55 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = select %{{[0-9]+}}, %arg3, %arg3 : index
|
2019-03-03 10:03:03 +08:00
|
|
|
%24 = "std.select"(%18, %idx, %idx) : (i1, index, index) -> index
|
2018-11-28 23:08:55 +08:00
|
|
|
|
2018-12-12 05:49:43 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = select %{{[0-9]+}}, %cst_4, %cst_4 : tensor<42xi32>
|
2019-03-03 10:03:03 +08:00
|
|
|
%25 = "std.select"(%19, %tci32, %tci32) : (tensor<42 x i1>, tensor<42 x i32>, tensor<42 x i32>) -> tensor<42 x i32>
|
2018-11-28 23:08:55 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_signed %arg2, %arg2 : i32
|
|
|
|
%26 = divi_signed %i, %i : i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_signed %arg3, %arg3 : index
|
|
|
|
%27 = divi_signed %idx, %idx : index
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_signed %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%28 = divi_signed %vci32, %vci32 : vector<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_signed %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%29 = divi_signed %tci32, %tci32 : tensor<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_signed %arg2, %arg2 : i32
|
|
|
|
%30 = "std.divi_signed"(%i, %i) : (i32, i32) -> i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_unsigned %arg2, %arg2 : i32
|
|
|
|
%31 = divi_unsigned %i, %i : i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_unsigned %arg3, %arg3 : index
|
|
|
|
%32 = divi_unsigned %idx, %idx : index
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_unsigned %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%33 = divi_unsigned %vci32, %vci32 : vector<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_unsigned %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%34 = divi_unsigned %tci32, %tci32 : tensor<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divi_unsigned %arg2, %arg2 : i32
|
|
|
|
%35 = "std.divi_unsigned"(%i, %i) : (i32, i32) -> i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_signed %arg2, %arg2 : i32
|
|
|
|
%36 = remi_signed %i, %i : i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_signed %arg3, %arg3 : index
|
|
|
|
%37 = remi_signed %idx, %idx : index
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_signed %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%38 = remi_signed %vci32, %vci32 : vector<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_signed %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%39 = remi_signed %tci32, %tci32 : tensor<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_signed %arg2, %arg2 : i32
|
|
|
|
%40 = "std.remi_signed"(%i, %i) : (i32, i32) -> i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_unsigned %arg2, %arg2 : i32
|
|
|
|
%41 = remi_unsigned %i, %i : i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_unsigned %arg3, %arg3 : index
|
|
|
|
%42 = remi_unsigned %idx, %idx : index
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_unsigned %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%43 = remi_unsigned %vci32, %vci32 : vector<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_unsigned %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%44 = remi_unsigned %tci32, %tci32 : tensor<42 x i32>
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-12-23 02:01:35 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = remi_unsigned %arg2, %arg2 : i32
|
|
|
|
%45 = "std.remi_unsigned"(%i, %i) : (i32, i32) -> i32
|
2019-01-07 06:08:42 +08:00
|
|
|
|
2019-02-21 22:30:53 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = divf %arg1, %arg1 : f32
|
2019-03-03 10:03:03 +08:00
|
|
|
%46 = "std.divf"(%f, %f) : (f32,f32) -> f32
|
2019-02-21 22:30:53 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = divf %arg1, %arg1 : f32
|
|
|
|
%47 = divf %f, %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = divf %arg0, %arg0 : tensor<4x4x?xf32>
|
|
|
|
%48 = divf %t, %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = remf %arg1, %arg1 : f32
|
2019-03-03 10:03:03 +08:00
|
|
|
%49 = "std.remf"(%f, %f) : (f32,f32) -> f32
|
2019-02-21 22:30:53 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = remf %arg1, %arg1 : f32
|
|
|
|
%50 = remf %f, %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = remf %arg0, %arg0 : tensor<4x4x?xf32>
|
|
|
|
%51 = remf %t, %t : tensor<4x4x?xf32>
|
|
|
|
|
2019-04-08 15:00:46 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = and %arg2, %arg2 : i32
|
|
|
|
%52 = "std.and"(%i, %i) : (i32,i32) -> i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = and %arg2, %arg2 : i32
|
|
|
|
%53 = and %i, %i : i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = and %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%54 = std.and %vci32, %vci32 : vector<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = and %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%55 = and %tci32, %tci32 : tensor<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = or %arg2, %arg2 : i32
|
|
|
|
%56 = "std.or"(%i, %i) : (i32,i32) -> i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = or %arg2, %arg2 : i32
|
|
|
|
%57 = or %i, %i : i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = or %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%58 = std.or %vci32, %vci32 : vector<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = or %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%59 = or %tci32, %tci32 : tensor<42 x i32>
|
|
|
|
|
2019-04-08 20:53:59 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = xor %arg2, %arg2 : i32
|
|
|
|
%60 = "std.xor"(%i, %i) : (i32,i32) -> i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = xor %arg2, %arg2 : i32
|
|
|
|
%61 = xor %i, %i : i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = xor %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%62 = std.xor %vci32, %vci32 : vector<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = xor %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%63 = xor %tci32, %tci32 : tensor<42 x i32>
|
|
|
|
|
2019-06-26 07:06:13 +08:00
|
|
|
%64 = constant dense<0.> : vector<4 x f32>
|
|
|
|
%tcf32 = constant dense<0.> : tensor<42 x f32>
|
|
|
|
%vcf32 = constant dense<0.> : vector<4 x f32>
|
2019-05-07 08:51:08 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpf "ogt", %{{[0-9]+}}, %{{[0-9]+}} : f32
|
|
|
|
%65 = cmpf "ogt", %f3, %f4 : f32
|
|
|
|
|
|
|
|
// Predicate 0 means ordered equality comparison.
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpf "oeq", %{{[0-9]+}}, %{{[0-9]+}} : f32
|
2019-06-26 10:06:06 +08:00
|
|
|
%66 = "std.cmpf"(%f3, %f4) {predicate = 1} : (f32, f32) -> i1
|
2019-05-07 08:51:08 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpf "olt", %cst_8, %cst_8 : vector<4xf32>
|
|
|
|
%67 = cmpf "olt", %vcf32, %vcf32 : vector<4 x f32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpf "oeq", %cst_8, %cst_8 : vector<4xf32>
|
2019-06-26 10:06:06 +08:00
|
|
|
%68 = "std.cmpf"(%vcf32, %vcf32) {predicate = 1} : (vector<4 x f32>, vector<4 x f32>) -> vector<4 x i1>
|
2019-05-07 08:51:08 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpf "oeq", %cst_7, %cst_7 : tensor<42xf32>
|
|
|
|
%69 = cmpf "oeq", %tcf32, %tcf32 : tensor<42 x f32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cmpf "oeq", %cst_8, %cst_8 : vector<4xf32>
|
|
|
|
%70 = cmpf "oeq", %vcf32, %vcf32 : vector<4 x f32>
|
|
|
|
|
2019-05-30 00:22:30 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = rank %arg0 : tensor<4x4x?xf32>
|
|
|
|
%71 = "std.rank"(%t) : (tensor<4x4x?xf32>) -> index
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = rank %arg0 : tensor<4x4x?xf32>
|
|
|
|
%72 = rank %t : tensor<4x4x?xf32>
|
|
|
|
|
2019-06-02 01:10:24 +08:00
|
|
|
// CHECK: = constant unit
|
|
|
|
%73 = constant unit
|
|
|
|
|
2019-07-23 12:43:14 +08:00
|
|
|
// CHECK: constant true
|
|
|
|
%74 = constant true
|
|
|
|
|
|
|
|
// CHECK: constant false
|
|
|
|
%75 = constant false
|
|
|
|
|
2019-06-18 02:35:05 +08:00
|
|
|
// CHECK: = index_cast {{.*}} : index to i64
|
2019-07-23 12:43:14 +08:00
|
|
|
%76 = index_cast %idx : index to i64
|
2019-06-18 02:35:05 +08:00
|
|
|
|
|
|
|
// CHECK: = index_cast {{.*}} : i32 to index
|
2019-07-23 12:43:14 +08:00
|
|
|
%77 = index_cast %i : i32 to index
|
2019-06-18 02:35:05 +08:00
|
|
|
|
2019-07-24 02:23:14 +08:00
|
|
|
// CHECK: = sitofp {{.*}} : i32 to f32
|
|
|
|
%78 = sitofp %i : i32 to f32
|
|
|
|
|
|
|
|
// CHECK: = sitofp {{.*}} : i32 to f64
|
|
|
|
%79 = sitofp %i : i32 to f64
|
|
|
|
|
|
|
|
// CHECK: = sitofp {{.*}} : i64 to f32
|
|
|
|
%80 = sitofp %j : i64 to f32
|
|
|
|
|
|
|
|
// CHECK: = sitofp {{.*}} : i64 to f64
|
|
|
|
%81 = sitofp %j : i64 to f64
|
|
|
|
|
2019-09-22 07:14:07 +08:00
|
|
|
// CHECK: = sexti %arg2 : i32 to i64
|
|
|
|
%82 = "std.sexti"(%i) : (i32) -> i64
|
|
|
|
|
|
|
|
// CHECK: = sexti %arg2 : i32 to i64
|
|
|
|
%83 = sexti %i : i32 to i64
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = sexti %cst_5 : vector<42xi32>
|
|
|
|
%84 = sexti %vci32 : vector<42 x i32> to vector<42 x i64>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = sexti %cst_4 : tensor<42xi32>
|
|
|
|
%85 = sexti %tci32 : tensor<42 x i32> to tensor<42 x i64>
|
|
|
|
|
|
|
|
// CHECK: = zexti %arg2 : i32 to i64
|
|
|
|
%86 = "std.zexti"(%i) : (i32) -> i64
|
|
|
|
|
|
|
|
// CHECK: = zexti %arg2 : i32 to i64
|
|
|
|
%87 = zexti %i : i32 to i64
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = zexti %cst_5 : vector<42xi32>
|
|
|
|
%88 = zexti %vci32 : vector<42 x i32> to vector<42 x i64>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = zexti %cst_4 : tensor<42xi32>
|
|
|
|
%89 = zexti %tci32 : tensor<42 x i32> to tensor<42 x i64>
|
|
|
|
|
|
|
|
// CHECK: = trunci %arg2 : i32 to i16
|
|
|
|
%90 = "std.trunci"(%i) : (i32) -> i16
|
|
|
|
|
|
|
|
// CHECK: = trunci %arg2 : i32 to i16
|
|
|
|
%91 = trunci %i : i32 to i16
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = trunci %cst_5 : vector<42xi32>
|
|
|
|
%92 = trunci %vci32 : vector<42 x i32> to vector<42 x i16>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = trunci %cst_4 : tensor<42xi32>
|
|
|
|
%93 = trunci %tci32 : tensor<42 x i32> to tensor<42 x i16>
|
|
|
|
|
2019-10-04 07:36:43 +08:00
|
|
|
// CHECK: = fpext {{.*}} : f16 to f32
|
|
|
|
%94 = fpext %half : f16 to f32
|
|
|
|
|
|
|
|
// CHECK: = fptrunc {{.*}} : f32 to f16
|
|
|
|
%95 = fptrunc %f : f32 to f16
|
|
|
|
|
2019-10-11 20:13:18 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = exp %arg1 : f32
|
|
|
|
%96 = "std.exp"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = exp %arg1 : f32
|
|
|
|
%97 = exp %f : f32
|
|
|
|
|
2019-12-04 23:17:01 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = exp %cst_8 : vector<4xf32>
|
|
|
|
%98 = exp %vcf32 : vector<4xf32>
|
|
|
|
|
2019-10-11 20:13:18 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = exp %arg0 : tensor<4x4x?xf32>
|
2019-12-04 23:17:01 +08:00
|
|
|
%99 = exp %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = absf %arg1 : f32
|
|
|
|
%100 = "std.absf"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = absf %arg1 : f32
|
|
|
|
%101 = absf %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = absf %cst_8 : vector<4xf32>
|
|
|
|
%102 = absf %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = absf %arg0 : tensor<4x4x?xf32>
|
|
|
|
%103 = absf %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = ceilf %arg1 : f32
|
|
|
|
%104 = "std.ceilf"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = ceilf %arg1 : f32
|
|
|
|
%105 = ceilf %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = ceilf %cst_8 : vector<4xf32>
|
|
|
|
%106 = ceilf %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = ceilf %arg0 : tensor<4x4x?xf32>
|
|
|
|
%107 = ceilf %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cos %arg1 : f32
|
|
|
|
%108 = "std.cos"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cos %arg1 : f32
|
|
|
|
%109 = cos %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cos %cst_8 : vector<4xf32>
|
|
|
|
%110 = cos %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = cos %arg0 : tensor<4x4x?xf32>
|
|
|
|
%111 = cos %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = negf %arg1 : f32
|
|
|
|
%112 = "std.negf"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = negf %arg1 : f32
|
|
|
|
%113 = negf %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = negf %cst_8 : vector<4xf32>
|
|
|
|
%114 = negf %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = negf %arg0 : tensor<4x4x?xf32>
|
|
|
|
%115 = negf %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = copysign %arg1, %arg1 : f32
|
|
|
|
%116 = "std.copysign"(%f, %f) : (f32, f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = copysign %arg1, %arg1 : f32
|
|
|
|
%117 = copysign %f, %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = copysign %cst_8, %cst_8 : vector<4xf32>
|
|
|
|
%118 = copysign %vcf32, %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = copysign %arg0, %arg0 : tensor<4x4x?xf32>
|
|
|
|
%119 = copysign %t, %t : tensor<4x4x?xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = tanh %arg1 : f32
|
|
|
|
%120 = "std.tanh"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = tanh %arg1 : f32
|
|
|
|
%121 = tanh %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = tanh %cst_8 : vector<4xf32>
|
|
|
|
%122 = tanh %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = tanh %arg0 : tensor<4x4x?xf32>
|
|
|
|
%123 = tanh %t : tensor<4x4x?xf32>
|
2019-12-23 02:01:35 +08:00
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_left %arg2, %arg2 : i32
|
|
|
|
%124 = "std.shift_left"(%i, %i) : (i32, i32) -> i32
|
|
|
|
|
|
|
|
// CHECK:%{{[0-9]+}} = shift_left %4, %4 : i32
|
|
|
|
%125 = shift_left %i2, %i2 : i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_left %arg3, %arg3 : index
|
|
|
|
%126 = shift_left %idx, %idx : index
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_left %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%127 = shift_left %vci32, %vci32 : vector<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_left %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%128 = shift_left %tci32, %tci32 : tensor<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_signed %arg2, %arg2 : i32
|
|
|
|
%129 = "std.shift_right_signed"(%i, %i) : (i32, i32) -> i32
|
|
|
|
|
|
|
|
// CHECK:%{{[0-9]+}} = shift_right_signed %4, %4 : i32
|
|
|
|
%130 = shift_right_signed %i2, %i2 : i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_signed %arg3, %arg3 : index
|
|
|
|
%131 = shift_right_signed %idx, %idx : index
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_signed %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%132 = shift_right_signed %vci32, %vci32 : vector<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_signed %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%133 = shift_right_signed %tci32, %tci32 : tensor<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_unsigned %arg2, %arg2 : i32
|
|
|
|
%134 = "std.shift_right_unsigned"(%i, %i) : (i32, i32) -> i32
|
|
|
|
|
|
|
|
// CHECK:%{{[0-9]+}} = shift_right_unsigned %4, %4 : i32
|
|
|
|
%135 = shift_right_unsigned %i2, %i2 : i32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_unsigned %arg3, %arg3 : index
|
|
|
|
%136 = shift_right_unsigned %idx, %idx : index
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_unsigned %cst_5, %cst_5 : vector<42xi32>
|
|
|
|
%137 = shift_right_unsigned %vci32, %vci32 : vector<42 x i32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = shift_right_unsigned %cst_4, %cst_4 : tensor<42xi32>
|
|
|
|
%138 = shift_right_unsigned %tci32, %tci32 : tensor<42 x i32>
|
|
|
|
|
[MLIR] Add the sqrt operation to mlir.
Summary: Add and pipe through the sqrt operation for Standard and LLVM dialects.
Reviewers: nicolasvasilache, ftynse
Reviewed By: ftynse
Subscribers: frej, ftynse, merge_guards_bot, flaub, mehdi_amini, rriddle, jpienaar, burmako, shauheen, antiagainst, arpith-jacob, mgester, lucyrfox, aartbik, liufengdb, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D73571
2020-01-30 23:44:44 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = sqrt %arg1 : f32
|
|
|
|
%139 = "std.sqrt"(%f) : (f32) -> f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = sqrt %arg1 : f32
|
|
|
|
%140 = sqrt %f : f32
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = sqrt %cst_8 : vector<4xf32>
|
|
|
|
%141 = sqrt %vcf32 : vector<4xf32>
|
|
|
|
|
|
|
|
// CHECK: %{{[0-9]+}} = sqrt %arg0 : tensor<4x4x?xf32>
|
|
|
|
%142 = sqrt %t : tensor<4x4x?xf32>
|
|
|
|
|
2020-02-26 07:48:23 +08:00
|
|
|
// CHECK: = fpext {{.*}} : vector<4xf32> to vector<4xf64>
|
|
|
|
%143 = fpext %vcf32 : vector<4xf32> to vector<4xf64>
|
|
|
|
|
|
|
|
// CHECK: = fptrunc {{.*}} : vector<4xf32> to vector<4xf16>
|
|
|
|
%144 = fptrunc %vcf32 : vector<4xf32> to vector<4xf16>
|
|
|
|
|
2020-02-28 22:57:38 +08:00
|
|
|
// CHECK: %{{[0-9]+}} = rsqrt %arg1 : f32
|
|
|
|
%145 = rsqrt %f : f32
|
|
|
|
|
2018-07-25 01:13:31 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @affine_apply() {
|
|
|
|
func @affine_apply() {
|
2019-06-26 10:06:06 +08:00
|
|
|
%i = "std.constant"() {value = 0: index} : () -> index
|
|
|
|
%j = "std.constant"() {value = 1: index} : () -> index
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2019-02-07 03:08:18 +08:00
|
|
|
// CHECK: affine.apply #map0(%c0)
|
2020-01-14 05:12:37 +08:00
|
|
|
%a = "affine.apply" (%i) { map = affine_map<(d0) -> (d0 + 1)> } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
2018-07-25 01:13:31 +08:00
|
|
|
|
2019-02-07 03:08:18 +08:00
|
|
|
// CHECK: affine.apply #map1()[%c0]
|
2020-01-14 05:12:37 +08:00
|
|
|
%b = affine.apply affine_map<()[x] -> (x+1)>()[%i]
|
2018-07-29 00:36:25 +08:00
|
|
|
|
2018-07-25 01:13:31 +08:00
|
|
|
return
|
2018-07-26 02:15:20 +08:00
|
|
|
}
|
|
|
|
|
2019-12-19 01:59:37 +08:00
|
|
|
// CHECK-LABEL: func @load_store_prefetch
|
|
|
|
func @load_store_prefetch(memref<4x4xi32>, index) {
|
2018-12-30 03:32:37 +08:00
|
|
|
^bb0(%0: memref<4x4xi32>, %1: index):
|
2018-08-02 01:43:18 +08:00
|
|
|
// CHECK: %0 = load %arg0[%arg1, %arg1] : memref<4x4xi32>
|
2019-03-03 10:03:03 +08:00
|
|
|
%2 = "std.load"(%0, %1, %1) : (memref<4x4xi32>, index, index)->i32
|
2018-07-26 02:15:20 +08:00
|
|
|
|
2019-12-19 01:59:37 +08:00
|
|
|
// CHECK: %{{.*}} = load %arg0[%arg1, %arg1] : memref<4x4xi32>
|
2018-07-26 03:55:50 +08:00
|
|
|
%3 = load %0[%1, %1] : memref<4x4xi32>
|
2018-07-26 02:15:20 +08:00
|
|
|
|
2019-12-19 01:59:37 +08:00
|
|
|
// CHECK: prefetch %arg0[%arg1, %arg1], write, locality<1>, data : memref<4x4xi32>
|
|
|
|
prefetch %0[%1, %1], write, locality<1>, data : memref<4x4xi32>
|
|
|
|
|
|
|
|
// CHECK: prefetch %arg0[%arg1, %arg1], read, locality<3>, instr : memref<4x4xi32>
|
|
|
|
prefetch %0[%1, %1], read, locality<3>, instr : memref<4x4xi32>
|
|
|
|
|
2018-07-26 02:15:20 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-08-08 01:31:14 +08:00
|
|
|
// Test with zero-dimensional operands using no index in load/store.
|
|
|
|
// CHECK-LABEL: func @zero_dim_no_idx
|
|
|
|
func @zero_dim_no_idx(%arg0 : memref<i32>, %arg1 : memref<i32>, %arg2 : memref<i32>) {
|
|
|
|
%0 = std.load %arg0[] : memref<i32>
|
|
|
|
std.store %0, %arg1[] : memref<i32>
|
|
|
|
return
|
|
|
|
// CHECK: %0 = load %{{.*}}[] : memref<i32>
|
|
|
|
// CHECK: store %{{.*}}, %{{.*}}[] : memref<i32>
|
|
|
|
}
|
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @return_op(%arg0: i32) -> i32 {
|
|
|
|
func @return_op(%a : i32) -> i32 {
|
2018-08-10 03:28:58 +08:00
|
|
|
// CHECK: return %arg0 : i32
|
2019-03-03 10:03:03 +08:00
|
|
|
"std.return" (%a) : (i32)->()
|
2018-08-10 03:28:58 +08:00
|
|
|
}
|
2018-08-22 08:55:22 +08:00
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @calls(%arg0: i32) {
|
|
|
|
func @calls(%arg0: i32) {
|
2018-08-22 08:55:22 +08:00
|
|
|
// CHECK: %0 = call @return_op(%arg0) : (i32) -> i32
|
|
|
|
%x = call @return_op(%arg0) : (i32) -> i32
|
|
|
|
// CHECK: %1 = call @return_op(%0) : (i32) -> i32
|
|
|
|
%y = call @return_op(%x) : (i32) -> i32
|
|
|
|
// CHECK: %2 = call @return_op(%0) : (i32) -> i32
|
2019-06-26 10:06:06 +08:00
|
|
|
%z = "std.call"(%x) {callee = @return_op} : (i32) -> i32
|
2018-08-22 08:55:22 +08:00
|
|
|
|
|
|
|
// CHECK: %f = constant @affine_apply : () -> ()
|
|
|
|
%f = constant @affine_apply : () -> ()
|
|
|
|
|
|
|
|
// CHECK: call_indirect %f() : () -> ()
|
|
|
|
call_indirect %f() : () -> ()
|
|
|
|
|
|
|
|
// CHECK: %f_0 = constant @return_op : (i32) -> i32
|
|
|
|
%f_0 = constant @return_op : (i32) -> i32
|
|
|
|
|
|
|
|
// CHECK: %3 = call_indirect %f_0(%arg0) : (i32) -> i32
|
|
|
|
%2 = call_indirect %f_0(%arg0) : (i32) -> i32
|
|
|
|
|
|
|
|
// CHECK: %4 = call_indirect %f_0(%arg0) : (i32) -> i32
|
2019-03-03 10:03:03 +08:00
|
|
|
%3 = "std.call_indirect"(%f_0, %arg0) : ((i32) -> i32, i32) -> i32
|
2018-08-22 08:55:22 +08:00
|
|
|
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @extract_element(%arg0: tensor<*xi32>, %arg1: tensor<4x4xf32>) -> i32 {
|
|
|
|
func @extract_element(%arg0: tensor<*xi32>, %arg1 : tensor<4x4xf32>) -> i32 {
|
2019-06-26 10:06:06 +08:00
|
|
|
%c0 = "std.constant"() {value = 0: index} : () -> index
|
2018-08-24 00:58:23 +08:00
|
|
|
|
2018-09-14 01:43:35 +08:00
|
|
|
// CHECK: %0 = extract_element %arg0[%c0, %c0, %c0, %c0] : tensor<*xi32>
|
|
|
|
%0 = extract_element %arg0[%c0, %c0, %c0, %c0] : tensor<*xi32>
|
2018-08-24 00:58:23 +08:00
|
|
|
|
|
|
|
// CHECK: %1 = extract_element %arg1[%c0, %c0] : tensor<4x4xf32>
|
|
|
|
%1 = extract_element %arg1[%c0, %c0] : tensor<4x4xf32>
|
|
|
|
|
|
|
|
return %0 : i32
|
|
|
|
}
|
2018-08-22 08:55:22 +08:00
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @tensor_cast(%arg0
|
|
|
|
func @tensor_cast(%arg0: tensor<*xf32>, %arg1 : tensor<4x4xf32>, %arg2: tensor<?x?xf32>) {
|
2018-10-25 00:52:06 +08:00
|
|
|
// CHECK: %0 = tensor_cast %arg0 : tensor<*xf32> to tensor<?x?xf32>
|
|
|
|
%0 = tensor_cast %arg0 : tensor<*xf32> to tensor<?x?xf32>
|
2018-09-14 00:16:32 +08:00
|
|
|
|
2018-10-25 00:52:06 +08:00
|
|
|
// CHECK: %1 = tensor_cast %arg1 : tensor<4x4xf32> to tensor<*xf32>
|
|
|
|
%1 = tensor_cast %arg1 : tensor<4x4xf32> to tensor<*xf32>
|
2018-09-14 00:16:32 +08:00
|
|
|
|
2018-10-25 00:52:06 +08:00
|
|
|
// CHECK: %2 = tensor_cast %arg2 : tensor<?x?xf32> to tensor<4x?xf32>
|
|
|
|
%2 = tensor_cast %arg2 : tensor<?x?xf32> to tensor<4x?xf32>
|
2018-09-14 00:16:32 +08:00
|
|
|
|
2018-10-25 00:52:06 +08:00
|
|
|
// CHECK: %3 = tensor_cast %2 : tensor<4x?xf32> to tensor<?x?xf32>
|
|
|
|
%3 = tensor_cast %2 : tensor<4x?xf32> to tensor<?x?xf32>
|
2018-09-14 00:16:32 +08:00
|
|
|
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @memref_cast(%arg0
|
2019-11-26 02:10:58 +08:00
|
|
|
func @memref_cast(%arg0: memref<4xf32>, %arg1 : memref<?xf32>, %arg2 : memref<64x16x4xf32, offset: 0, strides: [64, 4, 1]>) {
|
2018-10-23 00:00:03 +08:00
|
|
|
// CHECK: %0 = memref_cast %arg0 : memref<4xf32> to memref<?xf32>
|
|
|
|
%0 = memref_cast %arg0 : memref<4xf32> to memref<?xf32>
|
|
|
|
|
|
|
|
// CHECK: %1 = memref_cast %arg1 : memref<?xf32> to memref<4xf32>
|
|
|
|
%1 = memref_cast %arg1 : memref<?xf32> to memref<4xf32>
|
2019-11-26 02:10:58 +08:00
|
|
|
|
|
|
|
// CHECK: {{%.*}} = memref_cast %arg2 : memref<64x16x4xf32, #[[BASE_MAP0]]> to memref<64x16x4xf32, #[[BASE_MAP3]]>
|
|
|
|
%2 = memref_cast %arg2 : memref<64x16x4xf32, offset: 0, strides: [64, 4, 1]> to memref<64x16x4xf32, offset: ?, strides: [?, ?, ?]>
|
|
|
|
|
|
|
|
// CHECK: {{%.*}} = memref_cast {{%.*}} : memref<64x16x4xf32, #[[BASE_MAP3]]> to memref<64x16x4xf32, #[[BASE_MAP0]]>
|
|
|
|
%3 = memref_cast %2 : memref<64x16x4xf32, offset: ?, strides: [?, ?, ?]> to memref<64x16x4xf32, offset: 0, strides: [64, 4, 1]>
|
|
|
|
|
2019-12-06 05:12:50 +08:00
|
|
|
// CHECK: memref_cast %{{.*}} : memref<4xf32> to memref<*xf32>
|
|
|
|
%4 = memref_cast %1 : memref<4xf32> to memref<*xf32>
|
|
|
|
|
|
|
|
// CHECK: memref_cast %{{.*}} : memref<*xf32> to memref<4xf32>
|
|
|
|
%5 = memref_cast %4 : memref<*xf32> to memref<4xf32>
|
2018-10-23 00:00:03 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-11-07 00:53:39 +08:00
|
|
|
// CHECK-LABEL: func @memref_view(%arg0
|
|
|
|
func @memref_view(%arg0 : index, %arg1 : index, %arg2 : index) {
|
|
|
|
%0 = alloc() : memref<2048xi8>
|
|
|
|
// Test two dynamic sizes and dynamic offset.
|
2019-11-08 02:19:54 +08:00
|
|
|
// CHECK: %{{.*}} = std.view %0[%arg2][%arg0, %arg1] : memref<2048xi8> to memref<?x?xf32, #[[VIEW_MAP2]]>
|
|
|
|
%1 = view %0[%arg2][%arg0, %arg1]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<2048xi8> to memref<?x?xf32, affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + d1 + s0)>>
|
2019-11-07 00:53:39 +08:00
|
|
|
|
|
|
|
// Test two dynamic sizes and static offset.
|
2019-11-08 02:19:54 +08:00
|
|
|
// CHECK: %{{.*}} = std.view %0[][%arg0, %arg1] : memref<2048xi8> to memref<?x?xf32, #[[VIEW_MAP3]]>
|
|
|
|
%2 = view %0[][%arg0, %arg1]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<2048xi8> to memref<?x?xf32, affine_map<(d0, d1)[s0] -> (d0 * s0 + d1)>>
|
2019-11-07 00:53:39 +08:00
|
|
|
|
|
|
|
// Test one dynamic size and dynamic offset.
|
2019-11-08 02:19:54 +08:00
|
|
|
// CHECK: %{{.*}} = std.view %0[%arg2][%arg1] : memref<2048xi8> to memref<4x?xf32, #[[VIEW_MAP2]]>
|
|
|
|
%3 = view %0[%arg2][%arg1]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<2048xi8> to memref<4x?xf32, affine_map<(d0, d1)[s0, s1] -> (d0 * s1 + d1 + s0)>>
|
2019-11-07 00:53:39 +08:00
|
|
|
|
|
|
|
// Test one dynamic size and static offset.
|
2019-11-08 02:19:54 +08:00
|
|
|
// CHECK: %{{.*}} = std.view %0[][%arg0] : memref<2048xi8> to memref<?x4xf32, #[[VIEW_MAP1]]>
|
|
|
|
%4 = view %0[][%arg0]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<2048xi8> to memref<?x4xf32, affine_map<(d0, d1) -> (d0 * 4 + d1)>>
|
2019-11-07 00:53:39 +08:00
|
|
|
|
|
|
|
// Test static sizes and static offset.
|
|
|
|
// CHECK: %{{.*}} = std.view %0[][] : memref<2048xi8> to memref<64x4xf32, #[[VIEW_MAP1]]>
|
|
|
|
%5 = view %0[][]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<2048xi8> to memref<64x4xf32, affine_map<(d0, d1) -> (d0 * 4 + d1)>>
|
2019-11-07 00:53:39 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-11-12 02:32:52 +08:00
|
|
|
// CHECK-LABEL: func @memref_subview(%arg0
|
|
|
|
func @memref_subview(%arg0 : index, %arg1 : index, %arg2 : index) {
|
|
|
|
%c0 = constant 0 : index
|
|
|
|
%c1 = constant 1 : index
|
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
%0 = alloc() : memref<8x16x4xf32, affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2)>>
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview %0[%c0, %c0, %c0] [%arg0, %arg1, %arg2] [%c1, %c1, %c1] : memref<8x16x4xf32, #[[BASE_MAP0]]> to memref<?x?x?xf32, #[[SUBVIEW_MAP0]]>
|
2019-11-12 02:32:52 +08:00
|
|
|
%1 = subview %0[%c0, %c0, %c0][%arg0, %arg1, %arg2][%c1, %c1, %c1]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<8x16x4xf32, affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2)>> to
|
2019-11-12 02:32:52 +08:00
|
|
|
memref<?x?x?xf32,
|
2020-01-14 05:12:37 +08:00
|
|
|
affine_map<(d0, d1, d2)[s0, s1, s2, s3] -> (d0 * s1 + d1 * s2 + d2 * s3 + s0)>>
|
2019-11-12 02:32:52 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
%2 = alloc()[%arg2] : memref<64xf32, affine_map<(d0)[s0] -> (d0 + s0)>>
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview %2[%c1] [%arg0] [%c1] : memref<64xf32, #[[BASE_MAP1]]> to memref<?xf32, #[[SUBVIEW_MAP1]]>
|
2019-11-12 02:32:52 +08:00
|
|
|
%3 = subview %2[%c1][%arg0][%c1]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<64xf32, affine_map<(d0)[s0] -> (d0 + s0)>> to
|
|
|
|
memref<?xf32, affine_map<(d0)[s0, s1] -> (d0 * s1 + s0)>>
|
2019-11-12 02:32:52 +08:00
|
|
|
|
2020-01-14 05:12:37 +08:00
|
|
|
%4 = alloc() : memref<64x22xf32, affine_map<(d0, d1) -> (d0 * 22 + d1)>>
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview %4[%c0, %c1] [%arg0, %arg1] [%c1, %c0] : memref<64x22xf32, #[[BASE_MAP2]]> to memref<?x?xf32, #[[SUBVIEW_MAP2]]>
|
2019-11-12 02:32:52 +08:00
|
|
|
%5 = subview %4[%c0, %c1][%arg0, %arg1][%c1, %c0]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<64x22xf32, affine_map<(d0, d1) -> (d0 * 22 + d1)>> to
|
|
|
|
memref<?x?xf32, affine_map<(d0, d1)[s0, s1, s2] -> (d0 * s1 + d1 * s2 + s0)>>
|
2019-11-15 04:22:28 +08:00
|
|
|
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview %0[] [] [] : memref<8x16x4xf32, #[[BASE_MAP0]]> to memref<4x4x4xf32, #[[SUBVIEW_MAP3]]>
|
2019-11-15 04:22:28 +08:00
|
|
|
%6 = subview %0[][][]
|
2020-01-14 05:12:37 +08:00
|
|
|
: memref<8x16x4xf32, affine_map<(d0, d1, d2) -> (d0 * 64 + d1 * 4 + d2)>> to
|
|
|
|
memref<4x4x4xf32, affine_map<(d0, d1, d2) -> (d0 * 16 + d1 * 4 + d2 + 8)>>
|
2019-11-15 04:22:28 +08:00
|
|
|
|
2019-11-21 03:16:37 +08:00
|
|
|
%7 = alloc(%arg1, %arg2) : memref<?x?xf32>
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview {{%.*}}[] [] [] : memref<?x?xf32> to memref<4x4xf32, #[[SUBVIEW_MAP4]]>
|
2019-11-21 03:16:37 +08:00
|
|
|
%8 = subview %7[][][]
|
|
|
|
: memref<?x?xf32> to memref<4x4xf32, offset: ?, strides:[?, ?]>
|
|
|
|
|
|
|
|
%9 = alloc() : memref<16x4xf32>
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview {{%.*}}[{{%.*}}, {{%.*}}] [] [{{%.*}}, {{%.*}}] : memref<16x4xf32> to memref<4x4xf32, #[[SUBVIEW_MAP4]]
|
2019-11-21 03:16:37 +08:00
|
|
|
%10 = subview %9[%arg1, %arg1][][%arg2, %arg2]
|
|
|
|
: memref<16x4xf32> to memref<4x4xf32, offset: ?, strides:[?, ?]>
|
2020-03-06 04:40:53 +08:00
|
|
|
// CHECK: subview {{%.*}}[{{%.*}}, {{%.*}}] [] [] : memref<16x4xf32> to memref<4x4xf32, #[[SUBVIEW_MAP5]]
|
2019-11-21 03:16:37 +08:00
|
|
|
%11 = subview %9[%arg1, %arg2][][]
|
|
|
|
: memref<16x4xf32> to memref<4x4xf32, offset: ?, strides:[8, 2]>
|
2019-11-12 02:32:52 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-01-03 02:20:00 +08:00
|
|
|
// CHECK-LABEL: func @test_dimop(%arg0
|
|
|
|
func @test_dimop(%arg0: tensor<4x4x?xf32>) {
|
2018-09-27 07:21:49 +08:00
|
|
|
// CHECK: %0 = dim %arg0, 2 : tensor<4x4x?xf32>
|
|
|
|
%0 = dim %arg0, 2 : tensor<4x4x?xf32>
|
2019-09-28 02:57:52 +08:00
|
|
|
// use dim as an index to ensure type correctness
|
2020-01-14 05:12:37 +08:00
|
|
|
%1 = affine.apply affine_map<(d0) -> (d0)>(%0)
|
2018-09-27 07:21:49 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-09-25 03:44:11 +08:00
|
|
|
// CHECK-LABEL: func @test_splat_op
|
|
|
|
// CHECK-SAME: [[S:%arg[0-9]+]]: f32
|
|
|
|
func @test_splat_op(%s : f32) {
|
|
|
|
%v = splat %s : vector<8xf32>
|
|
|
|
// CHECK: splat [[S]] : vector<8xf32>
|
|
|
|
%t = splat %s : tensor<8xf32>
|
|
|
|
// CHECK: splat [[S]] : tensor<8xf32>
|
|
|
|
%u = "std.splat"(%s) : (f32) -> vector<4xf32>
|
|
|
|
// CHECK: splat [[S]] : vector<4xf32>
|
|
|
|
return
|
|
|
|
}
|
[MLIR] Add VectorTransferOps
This CL implements and uses VectorTransferOps in lieu of the former custom
call op. Tests are updated accordingly.
VectorTransferOps come in 2 flavors: VectorTransferReadOp and
VectorTransferWriteOp.
VectorTransferOps can be thought of as a backend-independent
pseudo op/library call that needs to be legalized to MLIR (whiteboxed) before
it can be lowered to backend-dependent IR.
Note that the current implementation does not yet support a real permutation
map. Proper support will come in a followup CL.
VectorTransferReadOp
====================
VectorTransferReadOp performs a blocking read from a scalar memref
location into a super-vector of the same elemental type. This operation is
called 'read' by opposition to 'load' because the super-vector granularity
is generally not representable with a single hardware register. As a
consequence, memory transfers will generally be required when lowering
VectorTransferReadOp. A VectorTransferReadOp is thus a mid-level abstraction
that supports super-vectorization with non-effecting padding for full-tile
only code.
A vector transfer read has semantics similar to a vector load, with additional
support for:
1. an optional value of the elemental type of the MemRef. This value
supports non-effecting padding and is inserted in places where the
vector read exceeds the MemRef bounds. If the value is not specified,
the access is statically guaranteed to be within bounds;
2. an attribute of type AffineMap to specify a slice of the original
MemRef access and its transposition into the super-vector shape. The
permutation_map is an unbounded AffineMap that must represent a
permutation from the MemRef dim space projected onto the vector dim
space.
Example:
```mlir
%A = alloc(%size1, %size2, %size3, %size4) : memref<?x?x?x?xf32>
...
%val = `ssa-value` : f32
// let %i, %j, %k, %l be ssa-values of type index
%v0 = vector_transfer_read %src, %i, %j, %k, %l
{permutation_map: (d0, d1, d2, d3) -> (d3, d1, d2)} :
(memref<?x?x?x?xf32>, index, index, index, index) ->
vector<16x32x64xf32>
%v1 = vector_transfer_read %src, %i, %j, %k, %l, %val
{permutation_map: (d0, d1, d2, d3) -> (d3, d1, d2)} :
(memref<?x?x?x?xf32>, index, index, index, index, f32) ->
vector<16x32x64xf32>
```
VectorTransferWriteOp
=====================
VectorTransferWriteOp performs a blocking write from a super-vector to
a scalar memref of the same elemental type. This operation is
called 'write' by opposition to 'store' because the super-vector
granularity is generally not representable with a single hardware register. As
a consequence, memory transfers will generally be required when lowering
VectorTransferWriteOp. A VectorTransferWriteOp is thus a mid-level
abstraction that supports super-vectorization with non-effecting padding
for full-tile only code.
A vector transfer write has semantics similar to a vector store, with
additional support for handling out-of-bounds situations.
Example:
```mlir
%A = alloc(%size1, %size2, %size3, %size4) : memref<?x?x?x?xf32>.
%val = `ssa-value` : vector<16x32x64xf32>
// let %i, %j, %k, %l be ssa-values of type index
vector_transfer_write %val, %src, %i, %j, %k, %l
{permutation_map: (d0, d1, d2, d3) -> (d3, d1, d2)} :
(vector<16x32x64xf32>, memref<?x?x?x?xf32>, index, index, index, index)
```
PiperOrigin-RevId: 223873234
2018-12-04 07:21:27 +08:00
|
|
|
|
2019-08-29 02:25:19 +08:00
|
|
|
// CHECK-LABEL: func @tensor_load_store
|
|
|
|
func @tensor_load_store(%0 : memref<4x4xi32>) {
|
|
|
|
// CHECK: %[[TENSOR:.*]] = tensor_load %[[MEMREF:.*]] : memref<4x4xi32>
|
|
|
|
%1 = tensor_load %0 : memref<4x4xi32>
|
|
|
|
// CHECK: tensor_store %[[TENSOR]], %[[MEMREF]] : memref<4x4xi32>
|
|
|
|
tensor_store %1, %0 : memref<4x4xi32>
|
|
|
|
return
|
|
|
|
}
|
[MLIR] Add std.assume_alignment op.
Reviewers: ftynse, nicolasvasilache, andydavis1
Subscribers: bixia, sanjoy.google, mehdi_amini, rriddle, jpienaar, burmako, shauheen, antiagainst, arpith-jacob, mgester, lucyrfox, aartbik, liufengdb, Joonsoo, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D74378
2020-02-11 11:44:42 +08:00
|
|
|
|
2020-02-25 08:49:52 +08:00
|
|
|
// CHECK-LABEL: func @atomic_rmw
|
|
|
|
func @atomic_rmw(%I: memref<10xf32>, %val: f32, %i : index) {
|
|
|
|
// CHECK: %{{.*}} = atomic_rmw "addf" %{{.*}}, %{{.*}}[%{{.*}}]
|
|
|
|
%x = atomic_rmw "addf" %val, %I[%i] : (f32, memref<10xf32>) -> f32
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
[MLIR] Add std.assume_alignment op.
Reviewers: ftynse, nicolasvasilache, andydavis1
Subscribers: bixia, sanjoy.google, mehdi_amini, rriddle, jpienaar, burmako, shauheen, antiagainst, arpith-jacob, mgester, lucyrfox, aartbik, liufengdb, Joonsoo, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D74378
2020-02-11 11:44:42 +08:00
|
|
|
// CHECK-LABEL: func @assume_alignment
|
|
|
|
// CHECK-SAME: %[[MEMREF:.*]]: memref<4x4xf16>
|
|
|
|
func @assume_alignment(%0: memref<4x4xf16>) {
|
|
|
|
// CHECK: assume_alignment %[[MEMREF]], 16 : memref<4x4xf16>
|
|
|
|
assume_alignment %0, 16 : memref<4x4xf16>
|
|
|
|
return
|
|
|
|
}
|