[MLIR] Remove dead affine.applys while generating pointwise copies

This makes no impact on the test cases because affine-data-copy-generate
runs whole function canonicalization at its end; however, the latter
will be removed in a pending revision. It is thus useful to clean up
these affine.applys right here, and eventually, not even generate
these (when the right API to compose by construction is in place).

Differential Revision: https://reviews.llvm.org/D78055
This commit is contained in:
Uday Bondhugula 2020-04-14 01:18:37 +05:30
parent 2f60fbce6c
commit ac047d9fce
1 changed files with 8 additions and 1 deletions

View File

@ -1492,6 +1492,7 @@ generatePointWiseCopy(Location loc, Value memref, Value fastMemRef,
SmallVector<AffineExpr, 4> fastBufExprs; SmallVector<AffineExpr, 4> fastBufExprs;
SmallVector<Value, 4> fastBufMapOperands; SmallVector<Value, 4> fastBufMapOperands;
AffineForOp copyNestRoot; AffineForOp copyNestRoot;
SmallVector<AffineApplyOp, 4> mayBeDeadApplys;
for (unsigned d = 0; d < rank; ++d) { for (unsigned d = 0; d < rank; ++d) {
auto forOp = createCanonicalizedAffineForOp(b, loc, lbOperands, lbMaps[d], auto forOp = createCanonicalizedAffineForOp(b, loc, lbOperands, lbMaps[d],
ubOperands, ubMaps[d]); ubOperands, ubMaps[d]);
@ -1510,6 +1511,7 @@ generatePointWiseCopy(Location loc, Value memref, Value fastMemRef,
b.getAffineDimExpr(2 * d)); b.getAffineDimExpr(2 * d));
fastBufMapOperands.push_back(offset); fastBufMapOperands.push_back(offset);
fastBufMapOperands.push_back(forOp.getInductionVar()); fastBufMapOperands.push_back(forOp.getInductionVar());
mayBeDeadApplys.push_back(offset);
// Subscript for the slow memref being copied. // Subscript for the slow memref being copied.
memIndices.push_back(forOp.getInductionVar()); memIndices.push_back(forOp.getInductionVar());
@ -1520,6 +1522,11 @@ generatePointWiseCopy(Location loc, Value memref, Value fastMemRef,
fastBufMap = simplifyAffineMap(fastBufMap); fastBufMap = simplifyAffineMap(fastBufMap);
canonicalizeMapAndOperands(&fastBufMap, &fastBufMapOperands); canonicalizeMapAndOperands(&fastBufMap, &fastBufMapOperands);
// Drop any dead affine.applys.
for (auto applyOp : mayBeDeadApplys)
if (applyOp.use_empty())
applyOp.erase();
if (!isCopyOut) { if (!isCopyOut) {
// Copy in. // Copy in.
auto load = b.create<AffineLoadOp>(loc, memref, memIndices); auto load = b.create<AffineLoadOp>(loc, memref, memIndices);
@ -2191,7 +2198,7 @@ static AffineIfOp createSeparationCondition(MutableArrayRef<AffineForOp> loops,
// larger (and resp. smaller) than any other lower (or upper bound). // larger (and resp. smaller) than any other lower (or upper bound).
SmallVector<int64_t, 8> fullTileLb, fullTileUb; SmallVector<int64_t, 8> fullTileLb, fullTileUb;
for (auto loop : loops) { for (auto loop : loops) {
(void) loop; (void)loop;
// TODO: Non-unit stride is not an issue to generalize to. // TODO: Non-unit stride is not an issue to generalize to.
assert(loop.getStep() == 1 && "point loop step expected to be one"); assert(loop.getStep() == 1 && "point loop step expected to be one");
// Mark everything symbols for the purpose of finding a constant diff pair. // Mark everything symbols for the purpose of finding a constant diff pair.