2018-09-20 12:35:11 +08:00
|
|
|
// RUN: mlir-opt %s -loop-unroll -unroll-full | FileCheck %s
|
|
|
|
// RUN: mlir-opt %s -loop-unroll -unroll-full -unroll-full-threshold=2 | FileCheck %s --check-prefix SHORT
|
|
|
|
// RUN: mlir-opt %s -loop-unroll -unroll-factor=4 | FileCheck %s --check-prefix UNROLL-BY-4
|
2018-07-25 11:01:16 +08:00
|
|
|
|
2018-08-16 00:09:54 +08:00
|
|
|
// CHECK: #map0 = (d0) -> (d0 + 1)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK: #map1 = (d0) -> (d0 + 2)
|
|
|
|
// CHECK: #map2 = (d0) -> (d0 + 3)
|
|
|
|
// CHECK: #map3 = (d0) -> (d0 + 4)
|
|
|
|
// CHECK: #map4 = (d0, d1) -> (d0 + 1, d1 + 2)
|
|
|
|
// CHECK: #map5 = (d0, d1) -> (d0 + 3, d1 + 4)
|
|
|
|
// CHECK: #map6 = (d0)[s0] -> (d0 + s0 + 1)
|
|
|
|
// CHECK: #map7 = (d0) -> (d0 + 5)
|
|
|
|
// CHECK: #map8 = (d0) -> (d0 + 6)
|
|
|
|
// CHECK: #map9 = (d0) -> (d0 + 7)
|
|
|
|
// CHECK: #map10 = (d0, d1) -> (d0 * 16 + d1)
|
|
|
|
// CHECK: #map11 = (d0) -> (d0 + 8)
|
|
|
|
// CHECK: #map12 = (d0) -> (d0 + 9)
|
|
|
|
// CHECK: #map13 = (d0) -> (d0 + 10)
|
|
|
|
// CHECK: #map14 = (d0) -> (d0 + 15)
|
|
|
|
// CHECK: #map15 = (d0) -> (d0 + 20)
|
|
|
|
// CHECK: #map16 = (d0) -> (d0 + 25)
|
|
|
|
// CHECK: #map17 = (d0) -> (d0 + 30)
|
|
|
|
// CHECK: #map18 = (d0) -> (d0 + 35)
|
|
|
|
|
|
|
|
// SHORT: #map0 = (d0) -> (d0 + 1)
|
|
|
|
// SHORT: #map1 = (d0) -> (d0 + 2)
|
|
|
|
// SHORT: #map2 = (d0, d1) -> (d0 + 1, d1 + 2)
|
|
|
|
// SHORT: #map3 = (d0, d1) -> (d0 + 3, d1 + 4)
|
|
|
|
// SHORT: #map4 = (d0)[s0] -> (d0 + s0 + 1)
|
|
|
|
// SHORT: #map5 = (d0, d1) -> (d0 * 16 + d1)
|
|
|
|
|
|
|
|
// UNROLL-BY-4: #map0 = (d0) -> (d0 + 1)
|
|
|
|
// UNROLL-BY-4: #map1 = (d0) -> (d0 + 2)
|
|
|
|
// UNROLL-BY-4: #map2 = (d0) -> (d0 + 3)
|
|
|
|
// UNROLL-BY-4: #map3 = (d0, d1) -> (d0 + 1, d1 + 2)
|
|
|
|
// UNROLL-BY-4: #map4 = (d0, d1) -> (d0 + 3, d1 + 4)
|
|
|
|
// UNROLL-BY-4: #map5 = (d0)[s0] -> (d0 + s0 + 1)
|
|
|
|
// UNROLL-BY-4: #map6 = (d0, d1) -> (d0 * 16 + d1)
|
|
|
|
// UNROLL-BY-4: #map7 = (d0) -> (d0 + 5)
|
|
|
|
// UNROLL-BY-4: #map8 = (d0) -> (d0 + 10)
|
|
|
|
// UNROLL-BY-4: #map9 = (d0) -> (d0 + 15)
|
2018-08-16 00:09:54 +08:00
|
|
|
|
2018-08-04 04:22:26 +08:00
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_simplest() {
|
|
|
|
mlfunc @loop_nest_simplest() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %i = 0 to 100 step 2 {
|
2018-08-07 09:40:34 +08:00
|
|
|
// CHECK: %c1_i32 = constant 1 : i32
|
|
|
|
// CHECK-NEXT: %c1_i32_0 = constant 1 : i32
|
2018-08-02 13:36:12 +08:00
|
|
|
// CHECK-NEXT: %c1_i32_1 = constant 1 : i32
|
|
|
|
// CHECK-NEXT: %c1_i32_2 = constant 1 : i32
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 4 {
|
2018-08-02 13:36:12 +08:00
|
|
|
%x = constant 1 : i32
|
2018-07-25 11:01:16 +08:00
|
|
|
}
|
|
|
|
} // CHECK: }
|
|
|
|
return // CHECK: return
|
|
|
|
} // CHECK }
|
2018-08-02 13:36:12 +08:00
|
|
|
|
2018-08-04 04:22:26 +08:00
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_simple_iv_use() {
|
|
|
|
mlfunc @loop_nest_simple_iv_use() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %c0 = constant 0 : index
|
|
|
|
// CHECK-NEXT: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %i = 0 to 100 step 2 {
|
|
|
|
// CHECK: %0 = "addi32"(%c0, %c0) : (index, index) -> i32
|
|
|
|
// CHECK: %1 = affine_apply #map0(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %2 = "addi32"(%1, %1) : (index, index) -> i32
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %3 = affine_apply #map1(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %4 = "addi32"(%3, %3) : (index, index) -> i32
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %5 = affine_apply #map2(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %6 = "addi32"(%5, %5) : (index, index) -> i32
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 4 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%x = "addi32"(%j, %j) : (index, index) -> i32
|
2018-08-04 04:22:26 +08:00
|
|
|
}
|
|
|
|
} // CHECK: }
|
|
|
|
return // CHECK: return
|
|
|
|
} // CHECK }
|
|
|
|
|
2018-08-07 09:40:34 +08:00
|
|
|
// Operations in the loop body have results that are used therein.
|
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_body_def_use() {
|
|
|
|
mlfunc @loop_nest_body_def_use() {
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK: %c0 = constant 0 : index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %i = 0 to 100 step 2 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK: %c0_0 = constant 0 : index
|
|
|
|
%c0 = constant 0 : index
|
2018-08-16 00:09:54 +08:00
|
|
|
// CHECK: %0 = affine_apply #map0(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %1 = "addi32"(%0, %c0_0) : (index, index) -> index
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %2 = affine_apply #map0(%c0)
|
|
|
|
// CHECK-NEXT: %3 = affine_apply #map0(%2)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %4 = "addi32"(%3, %c0_0) : (index, index) -> index
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %5 = affine_apply #map1(%c0)
|
|
|
|
// CHECK-NEXT: %6 = affine_apply #map0(%5)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %7 = "addi32"(%6, %c0_0) : (index, index) -> index
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %8 = affine_apply #map2(%c0)
|
|
|
|
// CHECK-NEXT: %9 = affine_apply #map0(%8)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %10 = "addi32"(%9, %c0_0) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 4 {
|
2018-08-07 09:40:34 +08:00
|
|
|
%x = "affine_apply" (%j) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
|
|
|
%y = "addi32"(%x, %c0) : (index, index) -> index
|
2018-08-07 09:40:34 +08:00
|
|
|
}
|
|
|
|
} // CHECK: }
|
|
|
|
return // CHECK: return
|
|
|
|
} // CHECK }
|
|
|
|
|
2018-08-04 04:22:26 +08:00
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_strided() {
|
|
|
|
mlfunc @loop_nest_strided() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %c2 = constant 2 : index
|
|
|
|
// CHECK-NEXT: %c2_0 = constant 2 : index
|
|
|
|
// CHECK-NEXT: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
|
|
|
// CHECK: %0 = affine_apply #map0(%c2_0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %1 = "addi32"(%0, %0) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %2 = affine_apply #map1(%c2_0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %3 = affine_apply #map0(%2)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %4 = "addi32"(%3, %3) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 2 to 6 step 2 {
|
2018-08-04 04:22:26 +08:00
|
|
|
%x = "affine_apply" (%j) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
|
|
|
%y = "addi32"(%x, %x) : (index, index) -> index
|
2018-08-04 04:22:26 +08:00
|
|
|
}
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %5 = affine_apply #map0(%c2)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %6 = "addi32"(%5, %5) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %7 = affine_apply #map1(%c2)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %8 = affine_apply #map0(%7)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %9 = "addi32"(%8, %8) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %10 = affine_apply #map3(%c2)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %11 = affine_apply #map0(%10)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %12 = "addi32"(%11, %11) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
for %k = 2 to 7 step 2 {
|
2018-08-04 04:22:26 +08:00
|
|
|
%z = "affine_apply" (%k) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
|
|
|
%w = "addi32"(%z, %z) : (index, index) -> index
|
2018-08-04 04:22:26 +08:00
|
|
|
}
|
|
|
|
} // CHECK: }
|
|
|
|
return // CHECK: return
|
|
|
|
} // CHECK }
|
|
|
|
|
2018-08-07 09:40:34 +08:00
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_multiple_results() {
|
|
|
|
mlfunc @loop_nest_multiple_results() {
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK: %c0 = constant 0 : index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK: %0 = affine_apply #map4(%i0, %c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %1 = "addi32"(%0#0, %0#1) : (index, index) -> index
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %2 = affine_apply #map5(%i0, %c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %3 = "fma"(%2#0, %2#1, %0#0) : (index, index, index) -> (index, index)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %4 = affine_apply #map0(%c0)
|
|
|
|
// CHECK-NEXT: %5 = affine_apply #map4(%i0, %4)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %6 = "addi32"(%5#0, %5#1) : (index, index) -> index
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %7 = affine_apply #map5(%i0, %4)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %8 = "fma"(%7#0, %7#1, %5#0) : (index, index, index) -> (index, index)
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 2 step 1 {
|
2018-08-07 09:40:34 +08:00
|
|
|
%x = "affine_apply" (%i, %j) { map: (d0, d1) -> (d0 + 1, d1 + 2) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index, index) -> (index, index)
|
|
|
|
%y = "addi32"(%x#0, %x#1) : (index, index) -> index
|
2018-08-07 09:40:34 +08:00
|
|
|
%z = "affine_apply" (%i, %j) { map: (d0, d1) -> (d0 + 3, d1 + 4) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index, index) -> (index, index)
|
|
|
|
%w = "fma"(%z#0, %z#1, %x#0) : (index, index, index) -> (index, index)
|
2018-08-04 04:22:26 +08:00
|
|
|
}
|
|
|
|
} // CHECK: }
|
|
|
|
return // CHECK: return
|
|
|
|
} // CHECK }
|
|
|
|
|
|
|
|
|
|
|
|
// Imperfect loop nest. Unrolling innermost here yields a perfect nest.
|
2018-08-07 02:54:39 +08:00
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_seq_imperfect(%arg0 : memref<128x128xf32>) {
|
2018-08-04 04:22:26 +08:00
|
|
|
mlfunc @loop_nest_seq_imperfect(%a : memref<128x128xf32>) {
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %c0 = constant 0 : index
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %c128 = constant 128 : index
|
|
|
|
%c128 = constant 128 : index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK: %0 = "vld"(%i0) : (index) -> i32
|
|
|
|
%ld = "vld"(%i) : (index) -> i32
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %1 = affine_apply #map0(%c0)
|
|
|
|
// CHECK-NEXT: %2 = "vmulf"(%c0, %1) : (index, index) -> index
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %3 = "vaddf"(%2, %2) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %4 = affine_apply #map0(%c0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %5 = affine_apply #map0(%4)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %6 = "vmulf"(%4, %5) : (index, index) -> index
|
|
|
|
// CHECK-NEXT: %7 = "vaddf"(%6, %6) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %8 = affine_apply #map1(%c0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %9 = affine_apply #map0(%8)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %10 = "vmulf"(%8, %9) : (index, index) -> index
|
|
|
|
// CHECK-NEXT: %11 = "vaddf"(%10, %10) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %12 = affine_apply #map2(%c0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %13 = affine_apply #map0(%12)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: %14 = "vmulf"(%12, %13) : (index, index) -> index
|
|
|
|
// CHECK-NEXT: %15 = "vaddf"(%14, %14) : (index, index) -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 4 {
|
2018-08-02 13:36:12 +08:00
|
|
|
%x = "affine_apply" (%j) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
|
|
|
%y = "vmulf"(%j, %x) : (index, index) -> index
|
|
|
|
%z = "vaddf"(%y, %y) : (index, index) -> index
|
2018-08-02 13:36:12 +08:00
|
|
|
}
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK: %16 = "scale"(%c128, %i0) : (index, index) -> index
|
|
|
|
%addr = "scale"(%c128, %i) : (index, index) -> index
|
|
|
|
// CHECK: "vst"(%16, %i0) : (index, index) -> ()
|
|
|
|
"vst"(%addr, %i) : (index, index) -> ()
|
2018-08-04 04:22:26 +08:00
|
|
|
} // CHECK }
|
|
|
|
return // CHECK: return
|
|
|
|
}
|
|
|
|
|
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_seq_multiple() {
|
|
|
|
mlfunc @loop_nest_seq_multiple() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: %c0 = constant 0 : index
|
|
|
|
// CHECK-NEXT: %c0_0 = constant 0 : index
|
|
|
|
// CHECK-NEXT: %0 = affine_apply #map0(%c0_0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: "mul"(%0, %0) : (index, index) -> ()
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %1 = affine_apply #map0(%c0_0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %2 = affine_apply #map0(%1)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: "mul"(%2, %2) : (index, index) -> ()
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %3 = affine_apply #map1(%c0_0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %4 = affine_apply #map0(%3)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: "mul"(%4, %4) : (index, index) -> ()
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %5 = affine_apply #map2(%c0_0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %6 = affine_apply #map0(%5)
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK-NEXT: "mul"(%6, %6) : (index, index) -> ()
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 4 {
|
2018-08-04 04:22:26 +08:00
|
|
|
%x = "affine_apply" (%j) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
|
|
|
"mul"(%x, %x) : (index, index) -> ()
|
2018-08-04 04:22:26 +08:00
|
|
|
}
|
2018-08-02 13:36:12 +08:00
|
|
|
|
2018-10-07 08:21:53 +08:00
|
|
|
// CHECK: %c99 = constant 99 : index
|
|
|
|
%k = "constant"(){value: 99} : () -> index
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %m = 0 to 100 step 2 {
|
|
|
|
// CHECK: %7 = affine_apply #map0(%c0)
|
|
|
|
// CHECK-NEXT: %8 = affine_apply #map6(%c0)[%c99]
|
|
|
|
// CHECK-NEXT: %9 = affine_apply #map0(%c0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %10 = affine_apply #map0(%9)
|
|
|
|
// CHECK-NEXT: %11 = affine_apply #map6(%9)[%c99]
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %12 = affine_apply #map1(%c0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %13 = affine_apply #map0(%12)
|
|
|
|
// CHECK-NEXT: %14 = affine_apply #map6(%12)[%c99]
|
2018-11-07 21:44:50 +08:00
|
|
|
// CHECK-NEXT: %15 = affine_apply #map2(%c0)
|
2018-09-08 05:47:21 +08:00
|
|
|
// CHECK-NEXT: %16 = affine_apply #map0(%15)
|
|
|
|
// CHECK-NEXT: %17 = affine_apply #map6(%15)[%c99]
|
2018-11-07 21:44:50 +08:00
|
|
|
for %n = 0 to 4 {
|
2018-08-02 13:36:12 +08:00
|
|
|
%y = "affine_apply" (%n) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
2018-08-02 13:36:12 +08:00
|
|
|
%z = "affine_apply" (%n, %k) { map: (d0) [s0] -> (d0 + s0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index, index) -> (index)
|
2018-08-02 13:36:12 +08:00
|
|
|
} // CHECK }
|
|
|
|
} // CHECK }
|
|
|
|
return // CHECK: return
|
|
|
|
} // CHECK }
|
2018-08-07 09:40:34 +08:00
|
|
|
|
|
|
|
// SHORT-LABEL: mlfunc @loop_nest_outer_unroll() {
|
|
|
|
mlfunc @loop_nest_outer_unroll() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// SHORT: for %i0 = 0 to 4 {
|
2018-08-16 00:09:54 +08:00
|
|
|
// SHORT-NEXT: %0 = affine_apply #map0(%i0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// SHORT-NEXT: %1 = "addi32"(%0, %0) : (index, index) -> index
|
2018-08-07 09:40:34 +08:00
|
|
|
// SHORT-NEXT: }
|
2018-11-07 21:44:50 +08:00
|
|
|
// SHORT-NEXT: for %i1 = 0 to 4 {
|
2018-08-16 00:09:54 +08:00
|
|
|
// SHORT-NEXT: %2 = affine_apply #map0(%i1)
|
2018-10-07 08:21:53 +08:00
|
|
|
// SHORT-NEXT: %3 = "addi32"(%2, %2) : (index, index) -> index
|
2018-08-07 09:40:34 +08:00
|
|
|
// SHORT-NEXT: }
|
2018-11-07 21:44:50 +08:00
|
|
|
for %i = 0 to 2 {
|
|
|
|
for %j = 0 to 4 {
|
2018-08-07 09:40:34 +08:00
|
|
|
%x = "affine_apply" (%j) { map: (d0) -> (d0 + 1) } :
|
2018-10-07 08:21:53 +08:00
|
|
|
(index) -> (index)
|
|
|
|
%y = "addi32"(%x, %x) : (index, index) -> index
|
2018-08-07 09:40:34 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return // SHORT: return
|
|
|
|
} // SHORT }
|
2018-08-17 04:51:44 +08:00
|
|
|
|
|
|
|
// We aren't doing any file check here. We just need this test case to
|
|
|
|
// successfully run. Both %i0 and %i1 will get unrolled here with the min trip
|
|
|
|
// count threshold set to 2.
|
|
|
|
// SHORT-LABEL: mlfunc @loop_nest_seq_long() -> i32 {
|
|
|
|
mlfunc @loop_nest_seq_long() -> i32 {
|
|
|
|
%A = alloc() : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
%B = alloc() : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
%C = alloc() : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
|
|
|
|
%zero = constant 0 : i32
|
|
|
|
%one = constant 1 : i32
|
|
|
|
%two = constant 2 : i32
|
|
|
|
|
2018-10-07 08:21:53 +08:00
|
|
|
%zero_idx = constant 0 : index
|
2018-08-17 04:51:44 +08:00
|
|
|
|
|
|
|
for %n0 = 0 to 512 {
|
2018-11-07 21:44:50 +08:00
|
|
|
for %n1 = 0 to 8 {
|
2018-08-17 04:51:44 +08:00
|
|
|
store %one, %A[%n0, %n1] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
store %two, %B[%n0, %n1] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
store %zero, %C[%n0, %n1] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-11-07 21:44:50 +08:00
|
|
|
for %i0 = 0 to 2 {
|
|
|
|
for %i1 = 0 to 2 {
|
|
|
|
for %i2 = 0 to 8 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%b2 = "affine_apply" (%i1, %i2) {map: (d0, d1) -> (16*d0 + d1)} : (index, index) -> index
|
2018-08-17 04:51:44 +08:00
|
|
|
%x = load %B[%i0, %b2] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
"op1"(%x) : (i32) -> ()
|
|
|
|
}
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j1 = 0 to 8 {
|
|
|
|
for %j2 = 0 to 8 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%a2 = "affine_apply" (%i1, %j2) {map: (d0, d1) -> (16*d0 + d1)} : (index, index) -> index
|
2018-08-17 04:51:44 +08:00
|
|
|
%v203 = load %A[%j1, %a2] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
"op2"(%v203) : (i32) -> ()
|
|
|
|
}
|
2018-11-07 21:44:50 +08:00
|
|
|
for %k2 = 0 to 8 {
|
2018-08-17 04:51:44 +08:00
|
|
|
%s0 = "op3"() : () -> i32
|
2018-10-07 08:21:53 +08:00
|
|
|
%c2 = "affine_apply" (%i0, %k2) {map: (d0, d1) -> (16*d0 + d1)} : (index, index) -> index
|
2018-08-17 04:51:44 +08:00
|
|
|
%s1 = load %C[%j1, %c2] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
%s2 = "addi32"(%s0, %s1) : (i32, i32) -> i32
|
|
|
|
store %s2, %C[%j1, %c2] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
}
|
|
|
|
}
|
|
|
|
"op4"() : () -> ()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
%ret = load %C[%zero_idx, %zero_idx] : memref<512 x 512 x i32, (d0, d1) -> (d0, d1), 2>
|
|
|
|
return %ret : i32
|
|
|
|
}
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
|
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @unroll_unit_stride_no_cleanup() {
|
|
|
|
mlfunc @unroll_unit_stride_no_cleanup() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
|
|
|
// UNROLL-BY-4: for [[L1:%i[0-9]+]] = 0 to 8 step 4 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %0 = "addi32"([[L1]], [[L1]]) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %1 = "addi32"(%0, %0) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %2 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %3 = "addi32"(%2, %2) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %4 = "addi32"(%3, %3) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %5 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %6 = "addi32"(%5, %5) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %7 = "addi32"(%6, %6) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %8 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %9 = "addi32"(%8, %8) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %10 = "addi32"(%9, %9) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 8 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%x = "addi32"(%j, %j) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
%y = "addi32"(%x, %x) : (i32, i32) -> i32
|
|
|
|
}
|
|
|
|
// empty loop
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i2 = 0 to 8 {
|
|
|
|
for %k = 0 to 8 {
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @unroll_unit_stride_cleanup() {
|
|
|
|
mlfunc @unroll_unit_stride_cleanup() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
|
|
|
// UNROLL-BY-4: for [[L1:%i[0-9]+]] = 0 to 7 step 4 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %0 = "addi32"([[L1]], [[L1]]) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %1 = "addi32"(%0, %0) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %2 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %3 = "addi32"(%2, %2) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %4 = "addi32"(%3, %3) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %5 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %6 = "addi32"(%5, %5) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %7 = "addi32"(%6, %6) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %8 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %9 = "addi32"(%8, %8) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %10 = "addi32"(%9, %9) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4-NEXT: for [[L2:%i[0-9]+]] = 8 to 10 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %11 = "addi32"([[L2]], [[L2]]) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %12 = "addi32"(%11, %11) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 10 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%x = "addi32"(%j, %j) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
%y = "addi32"(%x, %x) : (i32, i32) -> i32
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @unroll_non_unit_stride_cleanup() {
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
mlfunc @unroll_non_unit_stride_cleanup() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4: for [[L1:%i[0-9]+]] = 2 to 37 step 20 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %0 = "addi32"([[L1]], [[L1]]) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %1 = "addi32"(%0, %0) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %2 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %3 = "addi32"(%2, %2) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %4 = "addi32"(%3, %3) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %5 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %6 = "addi32"(%5, %5) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %7 = "addi32"(%6, %6) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %8 = affine_apply #map{{[0-9]+}}([[L1]])
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %9 = "addi32"(%8, %8) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %10 = "addi32"(%9, %9) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
|
|
|
// UNROLL-BY-4-NEXT: for [[L2:%i[0-9]+]] = 42 to 48 step 5 {
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %11 = "addi32"([[L2]], [[L2]]) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %12 = "addi32"(%11, %11) : (i32, i32) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
|
|
|
for %j = 2 to 48 step 5 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%x = "addi32"(%j, %j) : (index, index) -> i32
|
Extend loop unrolling to unroll by a given factor; add builder for affine
apply op.
- add builder for AffineApplyOp (first one for an operation that has
non-zero operands)
- add support for loop unrolling by a given factor; uses the affine apply op
builder.
While on this, change 'step' of ForStmt to be 'unsigned' instead of
AffineConstantExpr *. Add setters for ForStmt lb, ub, step.
Sample Input:
// CHECK-LABEL: mlfunc @loop_nest_unroll_cleanup() {
mlfunc @loop_nest_unroll_cleanup() {
for %i = 1 to 100 {
for %j = 0 to 17 {
%x = "addi32"(%j, %j) : (affineint, affineint) -> i32
%y = "addi32"(%x, %x) : (i32, i32) -> i32
}
}
return
}
Output:
$ mlir-opt -loop-unroll -unroll-factor=4 /tmp/single2.mlir
#map0 = (d0) -> (d0 + 1)
#map1 = (d0) -> (d0 + 2)
#map2 = (d0) -> (d0 + 3)
mlfunc @loop_nest_unroll_cleanup() {
for %i0 = 1 to 100 {
for %i1 = 0 to 17 step 4 {
%0 = "addi32"(%i1, %i1) : (affineint, affineint) -> i32
%1 = "addi32"(%0, %0) : (i32, i32) -> i32
%2 = affine_apply #map0(%i1)
%3 = "addi32"(%2, %2) : (affineint, affineint) -> i32
%4 = affine_apply #map1(%i1)
%5 = "addi32"(%4, %4) : (affineint, affineint) -> i32
%6 = affine_apply #map2(%i1)
%7 = "addi32"(%6, %6) : (affineint, affineint) -> i32
}
for %i2 = 16 to 17 {
%8 = "addi32"(%i2, %i2) : (affineint, affineint) -> i32
%9 = "addi32"(%8, %8) : (i32, i32) -> i32
}
}
return
}
PiperOrigin-RevId: 209676220
2018-08-22 07:01:23 +08:00
|
|
|
%y = "addi32"(%x, %x) : (i32, i32) -> i32
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
2018-09-08 05:47:21 +08:00
|
|
|
|
|
|
|
// Both the unrolled loop and the cleanup loop are single iteration loops.
|
2018-10-07 08:21:53 +08:00
|
|
|
mlfunc @loop_nest_single_iteration_after_unroll(%N: index) {
|
|
|
|
// UNROLL-BY-4: %c0 = constant 0 : index
|
|
|
|
// UNROLL-BY-4: %c4 = constant 4 : index
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to %arg0 {
|
|
|
|
for %i = 0 to %N {
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4: %0 = "addi32"(%c0, %c0) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %1 = affine_apply #map0(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %2 = "addi32"(%1, %1) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %3 = affine_apply #map1(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %4 = "addi32"(%3, %3) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %5 = affine_apply #map2(%c0)
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %6 = "addi32"(%5, %5) : (index, index) -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %7 = "addi32"(%c4, %c4) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
// UNROLL-BY-4-NOT: for
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = 0 to 5 {
|
2018-10-07 08:21:53 +08:00
|
|
|
%x = "addi32"(%j, %j) : (index, index) -> i32
|
2018-09-08 05:47:21 +08:00
|
|
|
} // UNROLL-BY-4-NOT: }
|
|
|
|
} // UNROLL-BY-4: }
|
|
|
|
return
|
|
|
|
}
|
2018-09-13 01:21:23 +08:00
|
|
|
|
|
|
|
// Test cases with loop bound operands.
|
|
|
|
|
|
|
|
// No cleanup will be generated here.
|
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @loop_nest_operand1() {
|
|
|
|
mlfunc @loop_nest_operand1() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %i = 0 to 100 step 2 {
|
2018-09-13 01:21:23 +08:00
|
|
|
// UNROLL-BY-4: %0 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4: %1 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4: %2 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4: %3 = "foo"() : () -> i32
|
|
|
|
for %j = (d0) -> (0) (%i) to (d0) -> (d0 - d0 mod 4 - 1) (%i) {
|
|
|
|
%x = "foo"() : () -> i32
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// No cleanup will be generated here.
|
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @loop_nest_operand2() {
|
|
|
|
mlfunc @loop_nest_operand2() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %i = 0 to 100 step 2 {
|
2018-09-13 01:21:23 +08:00
|
|
|
// UNROLL-BY-4: %0 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4: %1 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4: %2 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4: %3 = "foo"() : () -> i32
|
|
|
|
for %j = (d0) -> (d0) (%i) to (d0) -> (5*d0 + 3) (%i) {
|
|
|
|
%x = "foo"() : () -> i32
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Difference between loop bounds is constant, but not a multiple of unroll
|
2018-09-19 01:22:03 +08:00
|
|
|
// factor. The cleanup loop happens to be a single iteration one and is promoted.
|
2018-09-13 01:21:23 +08:00
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @loop_nest_operand3() {
|
|
|
|
mlfunc @loop_nest_operand3() {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 step 2 {
|
|
|
|
for %i = 0 to 100 step 2 {
|
2018-09-26 08:15:54 +08:00
|
|
|
// UNROLL-BY-4: for %i1 = (d0) -> (d0)(%i0) to #map{{[0-9]+}}(%i0) step 4 {
|
2018-09-13 01:21:23 +08:00
|
|
|
// UNROLL-BY-4-NEXT: %0 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %1 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %2 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %3 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
|
|
|
// UNROLL-BY-4-NEXT: %4 = "foo"() : () -> i32
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = (d0) -> (d0) (%i) to (d0) -> (d0 + 9) (%i) {
|
2018-09-13 01:21:23 +08:00
|
|
|
%x = "foo"() : () -> i32
|
|
|
|
}
|
|
|
|
} // UNROLL-BY-4: }
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2018-10-07 08:21:53 +08:00
|
|
|
// UNROLL-BY-4-LABEL: mlfunc @loop_nest_operand4(%arg0 : index) {
|
|
|
|
mlfunc @loop_nest_operand4(%N : index) {
|
2018-11-07 21:44:50 +08:00
|
|
|
// UNROLL-BY-4: for %i0 = 0 to 100 {
|
|
|
|
for %i = 0 to 100 {
|
|
|
|
// UNROLL-BY-4: for %i1 = ()[s0] -> (0)()[%arg0] to #map{{[0-9]+}}()[%arg0] step 4 {
|
2018-09-19 01:22:03 +08:00
|
|
|
// UNROLL-BY-4: %0 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %1 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %2 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: %3 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
|
|
|
// A cleanup loop will be generated here.
|
|
|
|
// UNROLL-BY-4-NEXT: for %i2 = #map{{[0-9]+}}()[%arg0] to %arg0 {
|
|
|
|
// UNROLL-BY-4-NEXT: %4 = "foo"() : () -> i32
|
|
|
|
// UNROLL-BY-4-NEXT: }
|
|
|
|
// Specify the lower bound so that both lb and ub operands match.
|
2018-11-07 21:44:50 +08:00
|
|
|
for %j = ()[s0] -> (0)()[%N] to %N {
|
2018-09-13 01:21:23 +08:00
|
|
|
%x = "foo"() : () -> i32
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
2018-09-28 02:54:55 +08:00
|
|
|
|
|
|
|
// CHECK-LABEL: mlfunc @loop_nest_unroll_full() {
|
|
|
|
mlfunc @loop_nest_unroll_full() {
|
|
|
|
// CHECK-NEXT: %0 = "foo"() : () -> i32
|
|
|
|
// CHECK-NEXT: %1 = "bar"() : () -> i32
|
|
|
|
// CHECK-NEXT: return
|
2018-11-07 21:44:50 +08:00
|
|
|
for %i = 0 to 1 {
|
2018-09-28 02:54:55 +08:00
|
|
|
%x = "foo"() : () -> i32
|
|
|
|
%y = "bar"() : () -> i32
|
|
|
|
}
|
|
|
|
return
|
|
|
|
} // CHECK: }
|