2016-06-28 09:37:20 +08:00
|
|
|
//===--------- ScopInfo.cpp ----------------------------------------------===//
|
2011-04-29 14:27:02 +08:00
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// Create a polyhedral description for a static control flow region.
|
|
|
|
//
|
|
|
|
// The pass creates a polyhedral description of the Scops detected by the Scop
|
|
|
|
// detection derived from their LLVM-IR code.
|
|
|
|
//
|
2014-10-30 03:58:28 +08:00
|
|
|
// This representation is shared among several tools in the polyhedral
|
2011-04-29 14:27:02 +08:00
|
|
|
// community, which are e.g. Cloog, Pluto, Loopo, Graphite.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2015-12-21 20:38:56 +08:00
|
|
|
#include "polly/ScopInfo.h"
|
2011-04-29 14:27:02 +08:00
|
|
|
#include "polly/LinkAllPasses.h"
|
2014-06-18 01:31:36 +08:00
|
|
|
#include "polly/Options.h"
|
2016-06-28 09:37:28 +08:00
|
|
|
#include "polly/ScopBuilder.h"
|
2011-04-29 14:27:02 +08:00
|
|
|
#include "polly/Support/GICHelper.h"
|
2011-11-08 23:41:28 +08:00
|
|
|
#include "polly/Support/SCEVValidator.h"
|
2013-05-07 16:11:54 +08:00
|
|
|
#include "polly/Support/ScopHelper.h"
|
2015-11-22 19:06:51 +08:00
|
|
|
#include "llvm/ADT/DepthFirstIterator.h"
|
2015-04-05 21:11:54 +08:00
|
|
|
#include "llvm/ADT/MapVector.h"
|
2015-09-25 17:49:19 +08:00
|
|
|
#include "llvm/ADT/PostOrderIterator.h"
|
|
|
|
#include "llvm/ADT/STLExtras.h"
|
2015-05-09 17:13:42 +08:00
|
|
|
#include "llvm/ADT/SetVector.h"
|
2013-05-07 16:11:54 +08:00
|
|
|
#include "llvm/ADT/Statistic.h"
|
|
|
|
#include "llvm/ADT/StringExtras.h"
|
2014-09-18 19:17:17 +08:00
|
|
|
#include "llvm/Analysis/AliasAnalysis.h"
|
2017-03-17 21:56:53 +08:00
|
|
|
#include "llvm/Analysis/AssumptionCache.h"
|
2016-04-23 20:59:18 +08:00
|
|
|
#include "llvm/Analysis/Loads.h"
|
2015-05-09 17:13:42 +08:00
|
|
|
#include "llvm/Analysis/LoopInfo.h"
|
2015-09-25 17:49:19 +08:00
|
|
|
#include "llvm/Analysis/LoopIterator.h"
|
2011-04-29 14:27:02 +08:00
|
|
|
#include "llvm/Analysis/RegionIterator.h"
|
2013-05-07 16:11:54 +08:00
|
|
|
#include "llvm/Analysis/ScalarEvolutionExpressions.h"
|
2015-11-12 10:32:32 +08:00
|
|
|
#include "llvm/IR/DiagnosticInfo.h"
|
2011-04-29 14:27:02 +08:00
|
|
|
#include "llvm/Support/Debug.h"
|
2011-08-18 14:31:50 +08:00
|
|
|
#include "isl/aff.h"
|
2015-05-09 17:13:42 +08:00
|
|
|
#include "isl/constraint.h"
|
2011-10-06 08:03:35 +08:00
|
|
|
#include "isl/local_space.h"
|
2015-05-09 17:13:42 +08:00
|
|
|
#include "isl/map.h"
|
2011-12-07 15:42:51 +08:00
|
|
|
#include "isl/options.h"
|
2015-05-09 17:13:42 +08:00
|
|
|
#include "isl/printer.h"
|
2015-07-14 17:33:13 +08:00
|
|
|
#include "isl/schedule.h"
|
|
|
|
#include "isl/schedule_node.h"
|
2015-05-09 17:13:42 +08:00
|
|
|
#include "isl/set.h"
|
|
|
|
#include "isl/union_map.h"
|
2015-05-09 17:36:38 +08:00
|
|
|
#include "isl/union_set.h"
|
2013-06-21 14:41:31 +08:00
|
|
|
#include "isl/val.h"
|
2011-04-29 14:27:02 +08:00
|
|
|
#include <sstream>
|
|
|
|
#include <string>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
using namespace polly;
|
|
|
|
|
2014-04-22 11:30:19 +08:00
|
|
|
#define DEBUG_TYPE "polly-scops"
|
|
|
|
|
2016-11-18 22:37:08 +08:00
|
|
|
STATISTIC(AssumptionsAliasing, "Number of aliasing assumptions taken.");
|
|
|
|
STATISTIC(AssumptionsInbounds, "Number of inbounds assumptions taken.");
|
|
|
|
STATISTIC(AssumptionsWrapping, "Number of wrapping assumptions taken.");
|
|
|
|
STATISTIC(AssumptionsUnsigned, "Number of unsigned assumptions taken.");
|
|
|
|
STATISTIC(AssumptionsComplexity, "Number of too complex SCoPs.");
|
|
|
|
STATISTIC(AssumptionsUnprofitable, "Number of unprofitable SCoPs.");
|
|
|
|
STATISTIC(AssumptionsErrorBlock, "Number of error block assumptions taken.");
|
|
|
|
STATISTIC(AssumptionsInfiniteLoop, "Number of bounded loop assumptions taken.");
|
|
|
|
STATISTIC(AssumptionsInvariantLoad,
|
2016-11-18 05:41:08 +08:00
|
|
|
"Number of invariant loads assumptions taken.");
|
2016-11-18 22:37:08 +08:00
|
|
|
STATISTIC(AssumptionsDelinearization,
|
2016-11-18 05:41:08 +08:00
|
|
|
"Number of delinearization assumptions taken.");
|
|
|
|
|
2017-02-17 16:12:36 +08:00
|
|
|
STATISTIC(NumLoopsInScop, "Number of loops in scops");
|
|
|
|
STATISTIC(NumScopsDepthOne, "Number of scops with maximal loop depth 1");
|
|
|
|
STATISTIC(NumScopsDepthTwo, "Number of scops with maximal loop depth 2");
|
|
|
|
STATISTIC(NumScopsDepthThree, "Number of scops with maximal loop depth 3");
|
|
|
|
STATISTIC(NumScopsDepthFour, "Number of scops with maximal loop depth 4");
|
|
|
|
STATISTIC(NumScopsDepthFive, "Number of scops with maximal loop depth 5");
|
|
|
|
STATISTIC(NumScopsDepthLarger,
|
|
|
|
"Number of scops with maximal loop depth 6 and larger");
|
|
|
|
STATISTIC(MaxNumLoopsInScop, "Maximal number of loops in scops");
|
|
|
|
|
2015-12-20 21:31:48 +08:00
|
|
|
// The maximal number of basic sets we allow during domain construction to
|
|
|
|
// be created. More complex scops will result in very high compile time and
|
|
|
|
// are also unlikely to result in good code
|
2017-02-17 03:11:33 +08:00
|
|
|
static int const MaxDisjunctsInDomain = 20;
|
2015-12-20 21:31:48 +08:00
|
|
|
|
2017-02-17 03:11:25 +08:00
|
|
|
// The number of disjunct in the context after which we stop to add more
|
|
|
|
// disjuncts. This parameter is there to avoid exponential growth in the
|
|
|
|
// number of disjunct when adding non-convex sets to the context.
|
|
|
|
static int const MaxDisjunctsInContext = 4;
|
|
|
|
|
2017-05-19 11:45:00 +08:00
|
|
|
static cl::opt<int> OptComputeOut(
|
|
|
|
"polly-analysis-computeout",
|
|
|
|
cl::desc("Bound the dependence analysis by a maximal amount of "
|
|
|
|
"computational steps (0 means no bound)"),
|
|
|
|
cl::Hidden, cl::init(1000000), cl::ZeroOrMore, cl::cat(PollyCategory));
|
|
|
|
|
2016-04-13 00:09:44 +08:00
|
|
|
static cl::opt<bool> PollyRemarksMinimal(
|
|
|
|
"polly-remarks-minimal",
|
|
|
|
cl::desc("Do not emit remarks about assumptions that are known"),
|
|
|
|
cl::Hidden, cl::ZeroOrMore, cl::init(false), cl::cat(PollyCategory));
|
|
|
|
|
2014-08-18 08:40:13 +08:00
|
|
|
// Multiplicative reductions can be disabled separately as these kind of
|
2014-06-18 01:31:36 +08:00
|
|
|
// operations can overflow easily. Additive reductions and bit operations
|
|
|
|
// are in contrast pretty stable.
|
2014-07-09 18:50:10 +08:00
|
|
|
static cl::opt<bool> DisableMultiplicativeReductions(
|
|
|
|
"polly-disable-multiplicative-reductions",
|
|
|
|
cl::desc("Disable multiplicative reductions"), cl::Hidden, cl::ZeroOrMore,
|
|
|
|
cl::init(false), cl::cat(PollyCategory));
|
2014-06-18 01:31:36 +08:00
|
|
|
|
2014-09-27 19:02:39 +08:00
|
|
|
static cl::opt<unsigned> RunTimeChecksMaxParameters(
|
|
|
|
"polly-rtc-max-parameters",
|
|
|
|
cl::desc("The maximal number of parameters allowed in RTCs."), cl::Hidden,
|
|
|
|
cl::ZeroOrMore, cl::init(8), cl::cat(PollyCategory));
|
|
|
|
|
2015-03-28 23:11:14 +08:00
|
|
|
static cl::opt<unsigned> RunTimeChecksMaxArraysPerGroup(
|
|
|
|
"polly-rtc-max-arrays-per-group",
|
|
|
|
cl::desc("The maximal number of arrays to compare in each alias group."),
|
|
|
|
cl::Hidden, cl::ZeroOrMore, cl::init(20), cl::cat(PollyCategory));
|
2016-06-02 19:06:54 +08:00
|
|
|
|
2015-08-16 18:19:29 +08:00
|
|
|
static cl::opt<std::string> UserContextStr(
|
|
|
|
"polly-context", cl::value_desc("isl parameter set"),
|
|
|
|
cl::desc("Provide additional constraints on the context parameters"),
|
|
|
|
cl::init(""), cl::cat(PollyCategory));
|
2015-03-28 23:11:14 +08:00
|
|
|
|
2015-08-21 03:08:11 +08:00
|
|
|
static cl::opt<bool> DetectReductions("polly-detect-reductions",
|
|
|
|
cl::desc("Detect and exploit reductions"),
|
|
|
|
cl::Hidden, cl::ZeroOrMore,
|
|
|
|
cl::init(true), cl::cat(PollyCategory));
|
|
|
|
|
2016-04-29 19:43:20 +08:00
|
|
|
static cl::opt<bool>
|
|
|
|
IslOnErrorAbort("polly-on-isl-error-abort",
|
|
|
|
cl::desc("Abort if an isl error is encountered"),
|
|
|
|
cl::init(true), cl::cat(PollyCategory));
|
|
|
|
|
[ScopInfo] Simplify inbounds assumptions under domain constraints
Without this simplification for a loop nest:
void foo(long n1_a, long n1_b, long n1_c, long n1_d,
long p1_b, long p1_c, long p1_d,
float A_1[][p1_b][p1_c][p1_d]) {
for (long i = 0; i < n1_a; i++)
for (long j = 0; j < n1_b; j++)
for (long k = 0; k < n1_c; k++)
for (long l = 0; l < n1_d; l++)
A_1[i][j][k][l] += i + j + k + l;
}
the assumption:
n1_a <= 0 or (n1_a > 0 and n1_b <= 0) or
(n1_a > 0 and n1_b > 0 and n1_c <= 0) or
(n1_a > 0 and n1_b > 0 and n1_c > 0 and n1_d <= 0) or
(n1_a > 0 and n1_b > 0 and n1_c > 0 and n1_d > 0 and
p1_b >= n1_b and p1_c >= n1_c and p1_d >= n1_d)
is taken rather than the simpler assumption:
p9_b >= n9_b and p9_c >= n9_c and p9_d >= n9_d.
The former is less strict, as it allows arbitrary values of p1_* in case, the
loop is not executed at all. However, in practice these precise constraints
explode when combined across different accesses and loops. For now it seems
to make more sense to take less precise, but more scalable constraints by
default. In case we find a practical example where more precise constraints
are needed, we can think about allowing such precise constraints in specific
situations where they help.
This change speeds up the new test case from taking very long (waited at least
a minute, but it probably takes a lot more) to below a second.
llvm-svn: 296456
2017-02-28 17:45:54 +08:00
|
|
|
static cl::opt<bool> PollyPreciseInbounds(
|
|
|
|
"polly-precise-inbounds",
|
|
|
|
cl::desc("Take more precise inbounds assumptions (do not scale well)"),
|
|
|
|
cl::Hidden, cl::init(false), cl::cat(PollyCategory));
|
|
|
|
|
2017-03-17 20:26:58 +08:00
|
|
|
static cl::opt<bool>
|
|
|
|
PollyIgnoreInbounds("polly-ignore-inbounds",
|
|
|
|
cl::desc("Do not take inbounds assumptions at all"),
|
|
|
|
cl::Hidden, cl::init(false), cl::cat(PollyCategory));
|
|
|
|
|
2017-03-17 21:00:53 +08:00
|
|
|
static cl::opt<bool> PollyIgnoreParamBounds(
|
|
|
|
"polly-ignore-parameter-bounds",
|
|
|
|
cl::desc(
|
|
|
|
"Do not add parameter bounds and do no gist simplify sets accordingly"),
|
|
|
|
cl::Hidden, cl::init(false), cl::cat(PollyCategory));
|
|
|
|
|
[ScopInfo] Disable memory folding in case it results in multi-disjunct relations
Multi-disjunct access maps can easily result in inbound assumptions which
explode in case of many memory accesses and many parameters. This change reduces
compilation time of some larger kernel from over 15 minutes to less than 16
seconds.
Interesting is the test case test/ScopInfo/multidim_param_in_subscript.ll
which has a memory access
[n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, -1 + n - i1] }
which requires folding, but where only a single disjunct remains. We can still
model this test case even when only using limited memory folding.
For people only reading commit messages, here the comment that explains what
memory folding is:
To recover memory accesses with array size parameters in the subscript
expression we post-process the delinearization results.
We would normally recover from an access A[exp0(i) * N + exp1(i)] into an
array A[][N] the 2D access A[exp0(i)][exp1(i)]. However, another valid
delinearization is A[exp0(i) - 1][exp1(i) + N] which - depending on the
range of exp1(i) - may be preferrable. Specifically, for cases where we
know exp1(i) is negative, we want to choose the latter expression.
As we commonly do not have any information about the range of exp1(i),
we do not choose one of the two options, but instead create a piecewise
access function that adds the (-1, N) offsets as soon as exp1(i) becomes
negative. For a 2D array such an access function is created by applying
the piecewise map:
[i,j] -> [i, j] : j >= 0
[i,j] -> [i-1, j+N] : j < 0
After this patch we generate only the first case, except for situations where
we can proove the first case to be invalid and can consequently select the
second without introducing disjuncts.
llvm-svn: 296679
2017-03-02 05:11:27 +08:00
|
|
|
static cl::opt<bool> PollyPreciseFoldAccesses(
|
|
|
|
"polly-precise-fold-accesses",
|
2017-04-03 20:03:38 +08:00
|
|
|
cl::desc("Fold memory accesses to model more possible delinearizations "
|
|
|
|
"(does not scale well)"),
|
[ScopInfo] Disable memory folding in case it results in multi-disjunct relations
Multi-disjunct access maps can easily result in inbound assumptions which
explode in case of many memory accesses and many parameters. This change reduces
compilation time of some larger kernel from over 15 minutes to less than 16
seconds.
Interesting is the test case test/ScopInfo/multidim_param_in_subscript.ll
which has a memory access
[n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, -1 + n - i1] }
which requires folding, but where only a single disjunct remains. We can still
model this test case even when only using limited memory folding.
For people only reading commit messages, here the comment that explains what
memory folding is:
To recover memory accesses with array size parameters in the subscript
expression we post-process the delinearization results.
We would normally recover from an access A[exp0(i) * N + exp1(i)] into an
array A[][N] the 2D access A[exp0(i)][exp1(i)]. However, another valid
delinearization is A[exp0(i) - 1][exp1(i) + N] which - depending on the
range of exp1(i) - may be preferrable. Specifically, for cases where we
know exp1(i) is negative, we want to choose the latter expression.
As we commonly do not have any information about the range of exp1(i),
we do not choose one of the two options, but instead create a piecewise
access function that adds the (-1, N) offsets as soon as exp1(i) becomes
negative. For a 2D array such an access function is created by applying
the piecewise map:
[i,j] -> [i, j] : j >= 0
[i,j] -> [i-1, j+N] : j < 0
After this patch we generate only the first case, except for situations where
we can proove the first case to be invalid and can consequently select the
second without introducing disjuncts.
llvm-svn: 296679
2017-03-02 05:11:27 +08:00
|
|
|
cl::Hidden, cl::init(false), cl::cat(PollyCategory));
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
|
2017-05-06 22:03:58 +08:00
|
|
|
bool polly::UseInstructionNames;
|
|
|
|
static cl::opt<bool, true> XUseInstructionNames(
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
"polly-use-llvm-names",
|
2017-05-06 22:03:58 +08:00
|
|
|
cl::desc("Use LLVM-IR names when deriving statement names"),
|
|
|
|
cl::location(UseInstructionNames), cl::Hidden, cl::init(false),
|
|
|
|
cl::ZeroOrMore, cl::cat(PollyCategory));
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
|
2015-09-10 20:46:52 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2015-08-10 21:01:57 +08:00
|
|
|
// Create a sequence of two schedules. Either argument may be null and is
|
|
|
|
// interpreted as the empty schedule. Can also return null if both schedules are
|
|
|
|
// empty.
|
|
|
|
static __isl_give isl_schedule *
|
|
|
|
combineInSequence(__isl_take isl_schedule *Prev,
|
|
|
|
__isl_take isl_schedule *Succ) {
|
|
|
|
if (!Prev)
|
|
|
|
return Succ;
|
|
|
|
if (!Succ)
|
|
|
|
return Prev;
|
|
|
|
|
|
|
|
return isl_schedule_sequence(Prev, Succ);
|
|
|
|
}
|
|
|
|
|
2015-02-24 19:58:30 +08:00
|
|
|
static __isl_give isl_set *addRangeBoundsToSet(__isl_take isl_set *S,
|
|
|
|
const ConstantRange &Range,
|
|
|
|
int dim,
|
|
|
|
enum isl_dim_type type) {
|
|
|
|
isl_val *V;
|
2017-02-17 02:39:18 +08:00
|
|
|
isl_ctx *Ctx = isl_set_get_ctx(S);
|
2015-02-24 19:58:30 +08:00
|
|
|
|
2017-02-17 02:39:14 +08:00
|
|
|
// The upper and lower bound for a parameter value is derived either from
|
|
|
|
// the data type of the parameter or from the - possibly more restrictive -
|
|
|
|
// range metadata.
|
2017-02-17 02:39:18 +08:00
|
|
|
V = isl_valFromAPInt(Ctx, Range.getSignedMin(), true);
|
2017-02-17 02:39:14 +08:00
|
|
|
S = isl_set_lower_bound_val(S, type, dim, V);
|
2017-02-17 02:39:18 +08:00
|
|
|
V = isl_valFromAPInt(Ctx, Range.getSignedMax(), true);
|
2017-02-17 02:39:14 +08:00
|
|
|
S = isl_set_upper_bound_val(S, type, dim, V);
|
|
|
|
|
|
|
|
if (Range.isFullSet())
|
|
|
|
return S;
|
|
|
|
|
2017-02-17 03:11:25 +08:00
|
|
|
if (isl_set_n_basic_set(S) > MaxDisjunctsInContext)
|
|
|
|
return S;
|
|
|
|
|
2017-02-17 02:39:14 +08:00
|
|
|
// In case of signed wrapping, we can refine the set of valid values by
|
|
|
|
// excluding the part not covered by the wrapping range.
|
|
|
|
if (Range.isSignWrappedSet()) {
|
2017-02-17 02:39:18 +08:00
|
|
|
V = isl_valFromAPInt(Ctx, Range.getLower(), true);
|
2017-02-17 02:39:14 +08:00
|
|
|
isl_set *SLB = isl_set_lower_bound_val(isl_set_copy(S), type, dim, V);
|
|
|
|
|
2017-02-17 02:39:18 +08:00
|
|
|
V = isl_valFromAPInt(Ctx, Range.getUpper(), true);
|
2015-03-09 03:49:50 +08:00
|
|
|
V = isl_val_sub_ui(V, 1);
|
2017-02-17 02:39:14 +08:00
|
|
|
isl_set *SUB = isl_set_upper_bound_val(S, type, dim, V);
|
|
|
|
S = isl_set_union(SLB, SUB);
|
|
|
|
}
|
2015-02-24 19:58:30 +08:00
|
|
|
|
2017-02-17 02:39:14 +08:00
|
|
|
return S;
|
2015-02-24 19:58:30 +08:00
|
|
|
}
|
|
|
|
|
2015-08-21 02:04:22 +08:00
|
|
|
static const ScopArrayInfo *identifyBasePtrOriginSAI(Scop *S, Value *BasePtr) {
|
|
|
|
LoadInst *BasePtrLI = dyn_cast<LoadInst>(BasePtr);
|
|
|
|
if (!BasePtrLI)
|
|
|
|
return nullptr;
|
|
|
|
|
2016-05-23 20:40:48 +08:00
|
|
|
if (!S->contains(BasePtrLI))
|
2015-08-21 02:04:22 +08:00
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
ScalarEvolution &SE = *S->getSE();
|
|
|
|
|
|
|
|
auto *OriginBaseSCEV =
|
|
|
|
SE.getPointerBase(SE.getSCEV(BasePtrLI->getPointerOperand()));
|
|
|
|
if (!OriginBaseSCEV)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
auto *OriginBaseSCEVUnknown = dyn_cast<SCEVUnknown>(OriginBaseSCEV);
|
|
|
|
if (!OriginBaseSCEVUnknown)
|
|
|
|
return nullptr;
|
|
|
|
|
2015-11-11 01:31:31 +08:00
|
|
|
return S->getScopArrayInfo(OriginBaseSCEVUnknown->getValue(),
|
2017-01-15 04:25:44 +08:00
|
|
|
MemoryKind::Array);
|
2015-08-21 02:04:22 +08:00
|
|
|
}
|
|
|
|
|
2015-05-20 16:05:31 +08:00
|
|
|
ScopArrayInfo::ScopArrayInfo(Value *BasePtr, Type *ElementType, isl_ctx *Ctx,
|
2017-01-16 00:47:26 +08:00
|
|
|
ArrayRef<const SCEV *> Sizes, MemoryKind Kind,
|
2016-07-30 17:25:51 +08:00
|
|
|
const DataLayout &DL, Scop *S,
|
|
|
|
const char *BaseName)
|
2015-11-13 04:15:08 +08:00
|
|
|
: BasePtr(BasePtr), ElementType(ElementType), Kind(Kind), DL(DL), S(*S) {
|
2015-07-28 22:53:44 +08:00
|
|
|
std::string BasePtrName =
|
2017-01-15 04:25:44 +08:00
|
|
|
BaseName ? BaseName
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
: getIslCompatibleName("MemRef", BasePtr, S->getNextArrayIdx(),
|
|
|
|
Kind == MemoryKind::PHI ? "__phi" : "",
|
|
|
|
UseInstructionNames);
|
2014-10-05 19:32:18 +08:00
|
|
|
Id = isl_id_alloc(Ctx, BasePtrName.c_str(), this);
|
2015-08-21 02:04:22 +08:00
|
|
|
|
2016-02-15 06:31:39 +08:00
|
|
|
updateSizes(Sizes);
|
2016-07-30 17:25:51 +08:00
|
|
|
|
2017-01-15 04:25:44 +08:00
|
|
|
if (!BasePtr || Kind != MemoryKind::Array) {
|
2016-07-30 17:25:51 +08:00
|
|
|
BasePtrOriginSAI = nullptr;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2015-08-21 02:04:22 +08:00
|
|
|
BasePtrOriginSAI = identifyBasePtrOriginSAI(S, BasePtr);
|
|
|
|
if (BasePtrOriginSAI)
|
|
|
|
const_cast<ScopArrayInfo *>(BasePtrOriginSAI)->addDerivedSAI(this);
|
2014-10-05 19:32:18 +08:00
|
|
|
}
|
|
|
|
|
2015-09-26 16:55:54 +08:00
|
|
|
__isl_give isl_space *ScopArrayInfo::getSpace() const {
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *Space =
|
2015-09-26 16:55:54 +08:00
|
|
|
isl_space_set_alloc(isl_id_get_ctx(Id), 0, getNumberOfDimensions());
|
|
|
|
Space = isl_space_set_tuple_id(Space, isl_dim_set, isl_id_copy(Id));
|
|
|
|
return Space;
|
|
|
|
}
|
|
|
|
|
2016-09-18 03:22:18 +08:00
|
|
|
bool ScopArrayInfo::isReadOnly() {
|
|
|
|
isl_union_set *WriteSet = isl_union_map_range(S.getWrites());
|
|
|
|
isl_space *Space = getSpace();
|
|
|
|
WriteSet = isl_union_set_intersect(
|
|
|
|
WriteSet, isl_union_set_from_set(isl_set_universe(Space)));
|
|
|
|
|
|
|
|
bool IsReadOnly = isl_union_set_is_empty(WriteSet);
|
|
|
|
isl_union_set_free(WriteSet);
|
|
|
|
|
|
|
|
return IsReadOnly;
|
|
|
|
}
|
|
|
|
|
2017-05-10 18:59:58 +08:00
|
|
|
bool ScopArrayInfo::isCompatibleWith(const ScopArrayInfo *Array) const {
|
|
|
|
if (Array->getElementType() != getElementType())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (Array->getNumberOfDimensions() != getNumberOfDimensions())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
for (unsigned i = 0; i < getNumberOfDimensions(); i++)
|
|
|
|
if (Array->getDimensionSize(i) != getDimensionSize(i))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2016-02-15 06:31:39 +08:00
|
|
|
void ScopArrayInfo::updateElementType(Type *NewElementType) {
|
|
|
|
if (NewElementType == ElementType)
|
|
|
|
return;
|
|
|
|
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
auto OldElementSize = DL.getTypeAllocSizeInBits(ElementType);
|
|
|
|
auto NewElementSize = DL.getTypeAllocSizeInBits(NewElementType);
|
|
|
|
|
2016-02-25 22:08:48 +08:00
|
|
|
if (NewElementSize == OldElementSize || NewElementSize == 0)
|
2016-02-15 06:31:39 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
if (NewElementSize % OldElementSize == 0 && NewElementSize < OldElementSize) {
|
|
|
|
ElementType = NewElementType;
|
|
|
|
} else {
|
|
|
|
auto GCD = GreatestCommonDivisor64(NewElementSize, OldElementSize);
|
|
|
|
ElementType = IntegerType::get(ElementType->getContext(), GCD);
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
}
|
2016-02-15 06:31:39 +08:00
|
|
|
}
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
|
2016-12-02 16:10:56 +08:00
|
|
|
bool ScopArrayInfo::updateSizes(ArrayRef<const SCEV *> NewSizes,
|
|
|
|
bool CheckConsistency) {
|
2015-09-26 16:55:54 +08:00
|
|
|
int SharedDims = std::min(NewSizes.size(), DimensionSizes.size());
|
|
|
|
int ExtraDimsNew = NewSizes.size() - SharedDims;
|
|
|
|
int ExtraDimsOld = DimensionSizes.size() - SharedDims;
|
2016-09-13 01:08:31 +08:00
|
|
|
|
2016-12-02 16:10:56 +08:00
|
|
|
if (CheckConsistency) {
|
|
|
|
for (int i = 0; i < SharedDims; i++) {
|
|
|
|
auto *NewSize = NewSizes[i + ExtraDimsNew];
|
|
|
|
auto *KnownSize = DimensionSizes[i + ExtraDimsOld];
|
|
|
|
if (NewSize && KnownSize && NewSize != KnownSize)
|
|
|
|
return false;
|
|
|
|
}
|
2015-11-02 19:29:32 +08:00
|
|
|
|
2016-12-02 16:10:56 +08:00
|
|
|
if (DimensionSizes.size() >= NewSizes.size())
|
|
|
|
return true;
|
|
|
|
}
|
2015-09-26 16:55:54 +08:00
|
|
|
|
|
|
|
DimensionSizes.clear();
|
|
|
|
DimensionSizes.insert(DimensionSizes.begin(), NewSizes.begin(),
|
|
|
|
NewSizes.end());
|
|
|
|
for (isl_pw_aff *Size : DimensionSizesPw)
|
|
|
|
isl_pw_aff_free(Size);
|
|
|
|
DimensionSizesPw.clear();
|
|
|
|
for (const SCEV *Expr : DimensionSizes) {
|
2016-09-13 01:08:31 +08:00
|
|
|
if (!Expr) {
|
|
|
|
DimensionSizesPw.push_back(nullptr);
|
|
|
|
continue;
|
|
|
|
}
|
2016-04-23 22:31:17 +08:00
|
|
|
isl_pw_aff *Size = S.getPwAffOnly(Expr);
|
2015-09-26 16:55:54 +08:00
|
|
|
DimensionSizesPw.push_back(Size);
|
|
|
|
}
|
2015-11-02 19:29:32 +08:00
|
|
|
return true;
|
2015-09-26 16:55:54 +08:00
|
|
|
}
|
|
|
|
|
2015-08-12 23:27:16 +08:00
|
|
|
ScopArrayInfo::~ScopArrayInfo() {
|
|
|
|
isl_id_free(Id);
|
|
|
|
for (isl_pw_aff *Size : DimensionSizesPw)
|
|
|
|
isl_pw_aff_free(Size);
|
|
|
|
}
|
2014-10-05 19:32:18 +08:00
|
|
|
|
2015-05-20 16:05:31 +08:00
|
|
|
std::string ScopArrayInfo::getName() const { return isl_id_get_name(Id); }
|
|
|
|
|
|
|
|
int ScopArrayInfo::getElemSizeInBytes() const {
|
2015-11-13 04:15:08 +08:00
|
|
|
return DL.getTypeAllocSize(ElementType);
|
2015-05-20 16:05:31 +08:00
|
|
|
}
|
|
|
|
|
2016-04-10 05:55:23 +08:00
|
|
|
__isl_give isl_id *ScopArrayInfo::getBasePtrId() const {
|
|
|
|
return isl_id_copy(Id);
|
|
|
|
}
|
2014-10-05 19:32:18 +08:00
|
|
|
|
|
|
|
void ScopArrayInfo::dump() const { print(errs()); }
|
|
|
|
|
2015-08-12 23:27:16 +08:00
|
|
|
void ScopArrayInfo::print(raw_ostream &OS, bool SizeAsPwAff) const {
|
2015-11-10 22:02:54 +08:00
|
|
|
OS.indent(8) << *getElementType() << " " << getName();
|
2016-09-13 01:08:31 +08:00
|
|
|
unsigned u = 0;
|
|
|
|
if (getNumberOfDimensions() > 0 && !getDimensionSize(0)) {
|
2015-11-10 22:02:54 +08:00
|
|
|
OS << "[*]";
|
2016-09-13 01:08:31 +08:00
|
|
|
u++;
|
|
|
|
}
|
|
|
|
for (; u < getNumberOfDimensions(); u++) {
|
2015-08-12 23:27:16 +08:00
|
|
|
OS << "[";
|
|
|
|
|
2015-11-10 22:24:21 +08:00
|
|
|
if (SizeAsPwAff) {
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *Size = getDimensionSizePw(u);
|
2015-11-10 22:24:21 +08:00
|
|
|
OS << " " << Size << " ";
|
|
|
|
isl_pw_aff_free(Size);
|
|
|
|
} else {
|
|
|
|
OS << *getDimensionSize(u);
|
|
|
|
}
|
2015-08-12 23:27:16 +08:00
|
|
|
|
|
|
|
OS << "]";
|
|
|
|
}
|
|
|
|
|
2015-11-10 22:02:54 +08:00
|
|
|
OS << ";";
|
|
|
|
|
2015-08-21 02:04:22 +08:00
|
|
|
if (BasePtrOriginSAI)
|
|
|
|
OS << " [BasePtrOrigin: " << BasePtrOriginSAI->getName() << "]";
|
|
|
|
|
2015-05-20 16:05:31 +08:00
|
|
|
OS << " // Element size " << getElemSizeInBytes() << "\n";
|
2014-10-05 19:32:18 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
const ScopArrayInfo *
|
|
|
|
ScopArrayInfo::getFromAccessFunction(__isl_keep isl_pw_multi_aff *PMA) {
|
|
|
|
isl_id *Id = isl_pw_multi_aff_get_tuple_id(PMA, isl_dim_out);
|
|
|
|
assert(Id && "Output dimension didn't have an ID");
|
|
|
|
return getFromId(Id);
|
|
|
|
}
|
|
|
|
|
2016-09-01 17:03:27 +08:00
|
|
|
const ScopArrayInfo *ScopArrayInfo::getFromId(__isl_take isl_id *Id) {
|
2014-10-05 19:32:18 +08:00
|
|
|
void *User = isl_id_get_user(Id);
|
|
|
|
const ScopArrayInfo *SAI = static_cast<ScopArrayInfo *>(User);
|
|
|
|
isl_id_free(Id);
|
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
|
2016-04-11 22:34:08 +08:00
|
|
|
void MemoryAccess::wrapConstantDimensions() {
|
|
|
|
auto *SAI = getScopArrayInfo();
|
|
|
|
auto *ArraySpace = SAI->getSpace();
|
|
|
|
auto *Ctx = isl_space_get_ctx(ArraySpace);
|
|
|
|
unsigned DimsArray = SAI->getNumberOfDimensions();
|
|
|
|
|
|
|
|
auto *DivModAff = isl_multi_aff_identity(isl_space_map_from_domain_and_range(
|
|
|
|
isl_space_copy(ArraySpace), isl_space_copy(ArraySpace)));
|
|
|
|
auto *LArraySpace = isl_local_space_from_space(ArraySpace);
|
|
|
|
|
|
|
|
// Begin with last dimension, to iteratively carry into higher dimensions.
|
|
|
|
for (int i = DimsArray - 1; i > 0; i--) {
|
|
|
|
auto *DimSize = SAI->getDimensionSize(i);
|
|
|
|
auto *DimSizeCst = dyn_cast<SCEVConstant>(DimSize);
|
|
|
|
|
|
|
|
// This transformation is not applicable to dimensions with dynamic size.
|
|
|
|
if (!DimSizeCst)
|
|
|
|
continue;
|
|
|
|
|
2017-02-17 12:48:52 +08:00
|
|
|
// This transformation is not applicable to dimensions of size zero.
|
|
|
|
if (DimSize->isZero())
|
|
|
|
continue;
|
|
|
|
|
2016-04-11 22:34:08 +08:00
|
|
|
auto *DimSizeVal = isl_valFromAPInt(Ctx, DimSizeCst->getAPInt(), false);
|
|
|
|
auto *Var = isl_aff_var_on_domain(isl_local_space_copy(LArraySpace),
|
|
|
|
isl_dim_set, i);
|
|
|
|
auto *PrevVar = isl_aff_var_on_domain(isl_local_space_copy(LArraySpace),
|
|
|
|
isl_dim_set, i - 1);
|
|
|
|
|
|
|
|
// Compute: index % size
|
|
|
|
// Modulo must apply in the divide of the previous iteration, if any.
|
|
|
|
auto *Modulo = isl_aff_copy(Var);
|
|
|
|
Modulo = isl_aff_mod_val(Modulo, isl_val_copy(DimSizeVal));
|
|
|
|
Modulo = isl_aff_pullback_multi_aff(Modulo, isl_multi_aff_copy(DivModAff));
|
|
|
|
|
|
|
|
// Compute: floor(index / size)
|
|
|
|
auto *Divide = Var;
|
|
|
|
Divide = isl_aff_div(
|
|
|
|
Divide,
|
|
|
|
isl_aff_val_on_domain(isl_local_space_copy(LArraySpace), DimSizeVal));
|
|
|
|
Divide = isl_aff_floor(Divide);
|
|
|
|
Divide = isl_aff_add(Divide, PrevVar);
|
|
|
|
Divide = isl_aff_pullback_multi_aff(Divide, isl_multi_aff_copy(DivModAff));
|
|
|
|
|
|
|
|
// Apply Modulo and Divide.
|
|
|
|
DivModAff = isl_multi_aff_set_aff(DivModAff, i, Modulo);
|
|
|
|
DivModAff = isl_multi_aff_set_aff(DivModAff, i - 1, Divide);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Apply all modulo/divides on the accesses.
|
|
|
|
AccessRelation =
|
|
|
|
isl_map_apply_range(AccessRelation, isl_map_from_multi_aff(DivModAff));
|
|
|
|
AccessRelation = isl_map_detect_equalities(AccessRelation);
|
|
|
|
isl_local_space_free(LArraySpace);
|
|
|
|
}
|
|
|
|
|
2015-09-26 16:55:54 +08:00
|
|
|
void MemoryAccess::updateDimensionality() {
|
2016-02-19 00:50:12 +08:00
|
|
|
auto *SAI = getScopArrayInfo();
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *ArraySpace = SAI->getSpace();
|
|
|
|
auto *AccessSpace = isl_space_range(isl_map_get_space(AccessRelation));
|
2016-02-19 00:50:12 +08:00
|
|
|
auto *Ctx = isl_space_get_ctx(AccessSpace);
|
2015-09-26 16:55:54 +08:00
|
|
|
|
|
|
|
auto DimsArray = isl_space_dim(ArraySpace, isl_dim_set);
|
|
|
|
auto DimsAccess = isl_space_dim(AccessSpace, isl_dim_set);
|
|
|
|
auto DimsMissing = DimsArray - DimsAccess;
|
|
|
|
|
2016-02-25 06:08:24 +08:00
|
|
|
auto *BB = getStatement()->getEntryBlock();
|
2016-02-22 03:13:19 +08:00
|
|
|
auto &DL = BB->getModule()->getDataLayout();
|
2016-02-19 00:50:12 +08:00
|
|
|
unsigned ArrayElemSize = SAI->getElemSizeInBytes();
|
2016-02-22 03:13:19 +08:00
|
|
|
unsigned ElemBytes = DL.getTypeAllocSize(getElementType());
|
2016-02-19 00:50:12 +08:00
|
|
|
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *Map = isl_map_from_domain_and_range(
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
isl_set_universe(AccessSpace),
|
|
|
|
isl_set_universe(isl_space_copy(ArraySpace)));
|
2015-09-26 16:55:54 +08:00
|
|
|
|
|
|
|
for (unsigned i = 0; i < DimsMissing; i++)
|
|
|
|
Map = isl_map_fix_si(Map, isl_dim_out, i, 0);
|
|
|
|
|
|
|
|
for (unsigned i = DimsMissing; i < DimsArray; i++)
|
|
|
|
Map = isl_map_equate(Map, isl_dim_in, i - DimsMissing, isl_dim_out, i);
|
|
|
|
|
|
|
|
AccessRelation = isl_map_apply_range(AccessRelation, Map);
|
2016-01-08 22:01:59 +08:00
|
|
|
|
2016-02-19 00:50:12 +08:00
|
|
|
// For the non delinearized arrays, divide the access function of the last
|
|
|
|
// subscript by the size of the elements in the array.
|
|
|
|
//
|
|
|
|
// A stride one array access in C expressed as A[i] is expressed in
|
|
|
|
// LLVM-IR as something like A[i * elementsize]. This hides the fact that
|
|
|
|
// two subsequent values of 'i' index two values that are stored next to
|
|
|
|
// each other in memory. By this division we make this characteristic
|
|
|
|
// obvious again. If the base pointer was accessed with offsets not divisible
|
2016-08-03 13:28:09 +08:00
|
|
|
// by the accesses element size, we will have chosen a smaller ArrayElemSize
|
2016-02-19 00:50:12 +08:00
|
|
|
// that divides the offsets of all accesses to this base pointer.
|
|
|
|
if (DimsAccess == 1) {
|
|
|
|
isl_val *V = isl_val_int_from_si(Ctx, ArrayElemSize);
|
|
|
|
AccessRelation = isl_map_floordiv_val(AccessRelation, V);
|
|
|
|
}
|
|
|
|
|
2016-04-11 22:34:08 +08:00
|
|
|
// We currently do this only if we added at least one dimension, which means
|
|
|
|
// some dimension's indices have not been specified, an indicator that some
|
|
|
|
// index values have been added together.
|
|
|
|
// TODO: Investigate general usefulness; Effect on unit tests is to make index
|
|
|
|
// expressions more complicated.
|
|
|
|
if (DimsMissing)
|
|
|
|
wrapConstantDimensions();
|
|
|
|
|
2016-02-19 00:50:12 +08:00
|
|
|
if (!isAffine())
|
|
|
|
computeBoundsOnAccessRelation(ArrayElemSize);
|
|
|
|
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
// Introduce multi-element accesses in case the type loaded by this memory
|
|
|
|
// access is larger than the canonical element type of the array.
|
|
|
|
//
|
|
|
|
// An access ((float *)A)[i] to an array char *A is modeled as
|
|
|
|
// {[i] -> A[o] : 4 i <= o <= 4 i + 3
|
|
|
|
if (ElemBytes > ArrayElemSize) {
|
|
|
|
assert(ElemBytes % ArrayElemSize == 0 &&
|
|
|
|
"Loaded element size should be multiple of canonical element size");
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *Map = isl_map_from_domain_and_range(
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
isl_set_universe(isl_space_copy(ArraySpace)),
|
|
|
|
isl_set_universe(isl_space_copy(ArraySpace)));
|
|
|
|
for (unsigned i = 0; i < DimsArray - 1; i++)
|
|
|
|
Map = isl_map_equate(Map, isl_dim_in, i, isl_dim_out, i);
|
|
|
|
|
|
|
|
isl_constraint *C;
|
|
|
|
isl_local_space *LS;
|
|
|
|
|
|
|
|
LS = isl_local_space_from_space(isl_map_get_space(Map));
|
|
|
|
int Num = ElemBytes / getScopArrayInfo()->getElemSizeInBytes();
|
|
|
|
|
|
|
|
C = isl_constraint_alloc_inequality(isl_local_space_copy(LS));
|
|
|
|
C = isl_constraint_set_constant_val(C, isl_val_int_from_si(Ctx, Num - 1));
|
2016-02-19 00:50:12 +08:00
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_in, DimsArray - 1, 1);
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_out, DimsArray - 1, -1);
|
|
|
|
Map = isl_map_add_constraint(Map, C);
|
|
|
|
|
|
|
|
C = isl_constraint_alloc_inequality(LS);
|
2016-02-19 00:50:12 +08:00
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_in, DimsArray - 1, -1);
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_out, DimsArray - 1, 1);
|
|
|
|
C = isl_constraint_set_constant_val(C, isl_val_int_from_si(Ctx, 0));
|
|
|
|
Map = isl_map_add_constraint(Map, C);
|
|
|
|
AccessRelation = isl_map_apply_range(AccessRelation, Map);
|
|
|
|
}
|
|
|
|
|
|
|
|
isl_space_free(ArraySpace);
|
2015-09-26 16:55:54 +08:00
|
|
|
}
|
|
|
|
|
2014-08-01 16:13:25 +08:00
|
|
|
const std::string
|
|
|
|
MemoryAccess::getReductionOperatorStr(MemoryAccess::ReductionType RT) {
|
|
|
|
switch (RT) {
|
|
|
|
case MemoryAccess::RT_NONE:
|
|
|
|
llvm_unreachable("Requested a reduction operator string for a memory "
|
|
|
|
"access which isn't a reduction");
|
|
|
|
case MemoryAccess::RT_ADD:
|
|
|
|
return "+";
|
|
|
|
case MemoryAccess::RT_MUL:
|
|
|
|
return "*";
|
|
|
|
case MemoryAccess::RT_BOR:
|
|
|
|
return "|";
|
|
|
|
case MemoryAccess::RT_BXOR:
|
|
|
|
return "^";
|
|
|
|
case MemoryAccess::RT_BAND:
|
|
|
|
return "&";
|
|
|
|
}
|
|
|
|
llvm_unreachable("Unknown reduction type");
|
|
|
|
return "";
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Return the reduction type for a given binary operator.
|
2014-07-02 04:52:51 +08:00
|
|
|
static MemoryAccess::ReductionType getReductionType(const BinaryOperator *BinOp,
|
|
|
|
const Instruction *Load) {
|
|
|
|
if (!BinOp)
|
|
|
|
return MemoryAccess::RT_NONE;
|
|
|
|
switch (BinOp->getOpcode()) {
|
|
|
|
case Instruction::FAdd:
|
|
|
|
if (!BinOp->hasUnsafeAlgebra())
|
|
|
|
return MemoryAccess::RT_NONE;
|
|
|
|
// Fall through
|
|
|
|
case Instruction::Add:
|
|
|
|
return MemoryAccess::RT_ADD;
|
|
|
|
case Instruction::Or:
|
|
|
|
return MemoryAccess::RT_BOR;
|
|
|
|
case Instruction::Xor:
|
|
|
|
return MemoryAccess::RT_BXOR;
|
|
|
|
case Instruction::And:
|
|
|
|
return MemoryAccess::RT_BAND;
|
|
|
|
case Instruction::FMul:
|
|
|
|
if (!BinOp->hasUnsafeAlgebra())
|
|
|
|
return MemoryAccess::RT_NONE;
|
|
|
|
// Fall through
|
|
|
|
case Instruction::Mul:
|
|
|
|
if (DisableMultiplicativeReductions)
|
|
|
|
return MemoryAccess::RT_NONE;
|
|
|
|
return MemoryAccess::RT_MUL;
|
|
|
|
default:
|
|
|
|
return MemoryAccess::RT_NONE;
|
|
|
|
}
|
|
|
|
}
|
2015-09-18 01:28:15 +08:00
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
MemoryAccess::~MemoryAccess() {
|
2015-05-15 17:58:32 +08:00
|
|
|
isl_id_free(Id);
|
2016-04-23 22:32:34 +08:00
|
|
|
isl_set_free(InvalidDomain);
|
2011-08-18 14:31:46 +08:00
|
|
|
isl_map_free(AccessRelation);
|
2015-09-05 15:46:40 +08:00
|
|
|
isl_map_free(NewAccessRelation);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 03:53:31 +08:00
|
|
|
const ScopArrayInfo *MemoryAccess::getOriginalScopArrayInfo() const {
|
2014-10-05 19:32:18 +08:00
|
|
|
isl_id *ArrayId = getArrayId();
|
|
|
|
void *User = isl_id_get_user(ArrayId);
|
|
|
|
const ScopArrayInfo *SAI = static_cast<ScopArrayInfo *>(User);
|
|
|
|
isl_id_free(ArrayId);
|
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
|
2016-09-02 03:53:31 +08:00
|
|
|
const ScopArrayInfo *MemoryAccess::getLatestScopArrayInfo() const {
|
|
|
|
isl_id *ArrayId = getLatestArrayId();
|
|
|
|
void *User = isl_id_get_user(ArrayId);
|
|
|
|
const ScopArrayInfo *SAI = static_cast<ScopArrayInfo *>(User);
|
|
|
|
isl_id_free(ArrayId);
|
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
|
|
|
|
__isl_give isl_id *MemoryAccess::getOriginalArrayId() const {
|
2014-07-29 16:37:55 +08:00
|
|
|
return isl_map_get_tuple_id(AccessRelation, isl_dim_out);
|
|
|
|
}
|
|
|
|
|
2016-09-02 03:53:31 +08:00
|
|
|
__isl_give isl_id *MemoryAccess::getLatestArrayId() const {
|
|
|
|
if (!hasNewAccessRelation())
|
|
|
|
return getOriginalArrayId();
|
|
|
|
return isl_map_get_tuple_id(NewAccessRelation, isl_dim_out);
|
|
|
|
}
|
|
|
|
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
__isl_give isl_map *MemoryAccess::getAddressFunction() const {
|
|
|
|
return isl_map_lexmin(getAccessRelation());
|
|
|
|
}
|
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_pw_multi_aff *MemoryAccess::applyScheduleToAccessRelation(
|
|
|
|
__isl_take isl_union_map *USchedule) const {
|
2014-10-13 20:58:03 +08:00
|
|
|
isl_map *Schedule, *ScheduledAccRel;
|
|
|
|
isl_union_set *UDomain;
|
|
|
|
|
|
|
|
UDomain = isl_union_set_from_set(getStatement()->getDomain());
|
|
|
|
USchedule = isl_union_map_intersect_domain(USchedule, UDomain);
|
|
|
|
Schedule = isl_map_from_union_map(USchedule);
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
ScheduledAccRel = isl_map_apply_domain(getAddressFunction(), Schedule);
|
2014-10-13 20:58:03 +08:00
|
|
|
return isl_pw_multi_aff_from_map(ScheduledAccRel);
|
|
|
|
}
|
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_map *MemoryAccess::getOriginalAccessRelation() const {
|
2011-10-06 08:04:11 +08:00
|
|
|
return isl_map_copy(AccessRelation);
|
|
|
|
}
|
|
|
|
|
2014-10-13 20:58:03 +08:00
|
|
|
std::string MemoryAccess::getOriginalAccessRelationStr() const {
|
2011-10-06 08:04:11 +08:00
|
|
|
return stringFromIslObj(AccessRelation);
|
|
|
|
}
|
|
|
|
|
2014-10-13 20:58:03 +08:00
|
|
|
__isl_give isl_space *MemoryAccess::getOriginalAccessRelationSpace() const {
|
2014-07-03 01:47:48 +08:00
|
|
|
return isl_map_get_space(AccessRelation);
|
|
|
|
}
|
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_map *MemoryAccess::getNewAccessRelation() const {
|
2015-09-05 15:46:40 +08:00
|
|
|
return isl_map_copy(NewAccessRelation);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2015-09-05 15:46:47 +08:00
|
|
|
std::string MemoryAccess::getNewAccessRelationStr() const {
|
|
|
|
return stringFromIslObj(NewAccessRelation);
|
|
|
|
}
|
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_basic_map *
|
|
|
|
MemoryAccess::createBasicAccessMap(ScopStmt *Statement) {
|
2012-05-29 17:29:44 +08:00
|
|
|
isl_space *Space = isl_space_set_alloc(Statement->getIslCtx(), 0, 1);
|
2012-09-11 21:50:21 +08:00
|
|
|
Space = isl_space_align_params(Space, Statement->getDomainSpace());
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2012-05-29 17:29:44 +08:00
|
|
|
return isl_basic_map_from_domain_and_range(
|
2013-02-05 20:09:06 +08:00
|
|
|
isl_basic_set_universe(Statement->getDomainSpace()),
|
|
|
|
isl_basic_set_universe(Space));
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2014-07-03 01:47:48 +08:00
|
|
|
// Formalize no out-of-bound access assumption
|
|
|
|
//
|
|
|
|
// When delinearizing array accesses we optimistically assume that the
|
|
|
|
// delinearized accesses do not access out of bound locations (the subscript
|
|
|
|
// expression of each array evaluates for each statement instance that is
|
|
|
|
// executed to a value that is larger than zero and strictly smaller than the
|
|
|
|
// size of the corresponding dimension). The only exception is the outermost
|
2014-08-04 05:07:30 +08:00
|
|
|
// dimension for which we do not need to assume any upper bound. At this point
|
|
|
|
// we formalize this assumption to ensure that at code generation time the
|
|
|
|
// relevant run-time checks can be generated.
|
2014-07-03 01:47:48 +08:00
|
|
|
//
|
|
|
|
// To find the set of constraints necessary to avoid out of bound accesses, we
|
|
|
|
// first build the set of data locations that are not within array bounds. We
|
|
|
|
// then apply the reverse access relation to obtain the set of iterations that
|
|
|
|
// may contain invalid accesses and reduce this set of iterations to the ones
|
|
|
|
// that are actually executed by intersecting them with the domain of the
|
|
|
|
// statement. If we now project out all loop dimensions, we obtain a set of
|
|
|
|
// parameters that may cause statement instances to be executed that may
|
|
|
|
// possibly yield out of bound memory accesses. The complement of these
|
|
|
|
// constraints is the set of constraints that needs to be assumed to ensure such
|
|
|
|
// statement instances are never executed.
|
2015-09-19 03:59:43 +08:00
|
|
|
void MemoryAccess::assumeNoOutOfBound() {
|
2017-03-17 20:26:58 +08:00
|
|
|
if (PollyIgnoreInbounds)
|
|
|
|
return;
|
2016-02-07 21:57:32 +08:00
|
|
|
auto *SAI = getScopArrayInfo();
|
2014-10-13 20:58:03 +08:00
|
|
|
isl_space *Space = isl_space_range(getOriginalAccessRelationSpace());
|
2014-07-03 01:47:48 +08:00
|
|
|
isl_set *Outside = isl_set_empty(isl_space_copy(Space));
|
2016-01-08 22:01:59 +08:00
|
|
|
for (int i = 1, Size = isl_space_dim(Space, isl_dim_set); i < Size; ++i) {
|
2014-07-03 01:47:48 +08:00
|
|
|
isl_local_space *LS = isl_local_space_from_space(isl_space_copy(Space));
|
|
|
|
isl_pw_aff *Var =
|
|
|
|
isl_pw_aff_var_on_domain(isl_local_space_copy(LS), isl_dim_set, i);
|
|
|
|
isl_pw_aff *Zero = isl_pw_aff_zero_on_domain(LS);
|
|
|
|
|
|
|
|
isl_set *DimOutside;
|
|
|
|
|
2014-08-04 05:07:30 +08:00
|
|
|
DimOutside = isl_pw_aff_lt_set(isl_pw_aff_copy(Var), Zero);
|
2016-02-07 21:57:32 +08:00
|
|
|
isl_pw_aff *SizeE = SAI->getDimensionSizePw(i);
|
2014-08-04 05:07:30 +08:00
|
|
|
SizeE = isl_pw_aff_add_dims(SizeE, isl_dim_in,
|
|
|
|
isl_space_dim(Space, isl_dim_set));
|
|
|
|
SizeE = isl_pw_aff_set_tuple_id(SizeE, isl_dim_in,
|
|
|
|
isl_space_get_tuple_id(Space, isl_dim_set));
|
|
|
|
|
|
|
|
DimOutside = isl_set_union(DimOutside, isl_pw_aff_le_set(SizeE, Var));
|
2014-07-03 01:47:48 +08:00
|
|
|
|
|
|
|
Outside = isl_set_union(Outside, DimOutside);
|
|
|
|
}
|
|
|
|
|
|
|
|
Outside = isl_set_apply(Outside, isl_map_reverse(getAccessRelation()));
|
|
|
|
Outside = isl_set_intersect(Outside, Statement->getDomain());
|
|
|
|
Outside = isl_set_params(Outside);
|
2015-06-26 20:09:28 +08:00
|
|
|
|
|
|
|
// Remove divs to avoid the construction of overly complicated assumptions.
|
|
|
|
// Doing so increases the set of parameter combinations that are assumed to
|
|
|
|
// not appear. This is always save, but may make the resulting run-time check
|
|
|
|
// bail out more often than strictly necessary.
|
|
|
|
Outside = isl_set_remove_divs(Outside);
|
2014-07-03 01:47:48 +08:00
|
|
|
Outside = isl_set_complement(Outside);
|
2016-04-11 21:24:29 +08:00
|
|
|
const auto &Loc = getAccessInstruction()
|
|
|
|
? getAccessInstruction()->getDebugLoc()
|
|
|
|
: DebugLoc();
|
[ScopInfo] Simplify inbounds assumptions under domain constraints
Without this simplification for a loop nest:
void foo(long n1_a, long n1_b, long n1_c, long n1_d,
long p1_b, long p1_c, long p1_d,
float A_1[][p1_b][p1_c][p1_d]) {
for (long i = 0; i < n1_a; i++)
for (long j = 0; j < n1_b; j++)
for (long k = 0; k < n1_c; k++)
for (long l = 0; l < n1_d; l++)
A_1[i][j][k][l] += i + j + k + l;
}
the assumption:
n1_a <= 0 or (n1_a > 0 and n1_b <= 0) or
(n1_a > 0 and n1_b > 0 and n1_c <= 0) or
(n1_a > 0 and n1_b > 0 and n1_c > 0 and n1_d <= 0) or
(n1_a > 0 and n1_b > 0 and n1_c > 0 and n1_d > 0 and
p1_b >= n1_b and p1_c >= n1_c and p1_d >= n1_d)
is taken rather than the simpler assumption:
p9_b >= n9_b and p9_c >= n9_c and p9_d >= n9_d.
The former is less strict, as it allows arbitrary values of p1_* in case, the
loop is not executed at all. However, in practice these precise constraints
explode when combined across different accesses and loops. For now it seems
to make more sense to take less precise, but more scalable constraints by
default. In case we find a practical example where more precise constraints
are needed, we can think about allowing such precise constraints in specific
situations where they help.
This change speeds up the new test case from taking very long (waited at least
a minute, but it probably takes a lot more) to below a second.
llvm-svn: 296456
2017-02-28 17:45:54 +08:00
|
|
|
if (!PollyPreciseInbounds)
|
|
|
|
Outside = isl_set_gist(Outside, isl_set_params(Statement->getDomain()));
|
2016-04-12 21:27:35 +08:00
|
|
|
Statement->getParent()->recordAssumption(INBOUNDS, Outside, Loc,
|
|
|
|
AS_ASSUMPTION);
|
2014-07-03 01:47:48 +08:00
|
|
|
isl_space_free(Space);
|
|
|
|
}
|
|
|
|
|
2016-02-22 03:13:19 +08:00
|
|
|
void MemoryAccess::buildMemIntrinsicAccessRelation() {
|
2016-11-18 06:11:56 +08:00
|
|
|
assert(isMemoryIntrinsic());
|
2016-09-13 01:08:31 +08:00
|
|
|
assert(Subscripts.size() == 2 && Sizes.size() == 1);
|
2016-02-22 03:13:19 +08:00
|
|
|
|
2016-04-12 21:26:45 +08:00
|
|
|
auto *SubscriptPWA = getPwAff(Subscripts[0]);
|
2016-02-22 03:13:19 +08:00
|
|
|
auto *SubscriptMap = isl_map_from_pw_aff(SubscriptPWA);
|
2016-02-25 22:08:48 +08:00
|
|
|
|
|
|
|
isl_map *LengthMap;
|
|
|
|
if (Subscripts[1] == nullptr) {
|
|
|
|
LengthMap = isl_map_universe(isl_map_get_space(SubscriptMap));
|
|
|
|
} else {
|
2016-04-12 21:26:45 +08:00
|
|
|
auto *LengthPWA = getPwAff(Subscripts[1]);
|
2016-02-25 22:08:48 +08:00
|
|
|
LengthMap = isl_map_from_pw_aff(LengthPWA);
|
|
|
|
auto *RangeSpace = isl_space_range(isl_map_get_space(LengthMap));
|
|
|
|
LengthMap = isl_map_apply_range(LengthMap, isl_map_lex_gt(RangeSpace));
|
|
|
|
}
|
|
|
|
LengthMap = isl_map_lower_bound_si(LengthMap, isl_dim_out, 0, 0);
|
|
|
|
LengthMap = isl_map_align_params(LengthMap, isl_map_get_space(SubscriptMap));
|
2016-02-22 03:13:19 +08:00
|
|
|
SubscriptMap =
|
|
|
|
isl_map_align_params(SubscriptMap, isl_map_get_space(LengthMap));
|
|
|
|
LengthMap = isl_map_sum(LengthMap, SubscriptMap);
|
|
|
|
AccessRelation = isl_map_set_tuple_id(LengthMap, isl_dim_in,
|
|
|
|
getStatement()->getDomainId());
|
|
|
|
}
|
|
|
|
|
2015-02-24 19:58:30 +08:00
|
|
|
void MemoryAccess::computeBoundsOnAccessRelation(unsigned ElementSize) {
|
|
|
|
ScalarEvolution *SE = Statement->getParent()->getSE();
|
|
|
|
|
2016-02-22 03:13:19 +08:00
|
|
|
auto MAI = MemAccInst(getAccessInstruction());
|
2016-02-27 09:49:58 +08:00
|
|
|
if (isa<MemIntrinsic>(MAI))
|
2016-02-22 03:13:19 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
Value *Ptr = MAI.getPointerOperand();
|
2015-02-24 19:58:30 +08:00
|
|
|
if (!Ptr || !SE->isSCEVable(Ptr->getType()))
|
|
|
|
return;
|
|
|
|
|
|
|
|
auto *PtrSCEV = SE->getSCEV(Ptr);
|
|
|
|
if (isa<SCEVCouldNotCompute>(PtrSCEV))
|
|
|
|
return;
|
|
|
|
|
|
|
|
auto *BasePtrSCEV = SE->getPointerBase(PtrSCEV);
|
|
|
|
if (BasePtrSCEV && !isa<SCEVCouldNotCompute>(BasePtrSCEV))
|
|
|
|
PtrSCEV = SE->getMinusSCEV(PtrSCEV, BasePtrSCEV);
|
|
|
|
|
|
|
|
const ConstantRange &Range = SE->getSignedRange(PtrSCEV);
|
|
|
|
if (Range.isFullSet())
|
|
|
|
return;
|
|
|
|
|
2017-05-19 05:55:36 +08:00
|
|
|
if (Range.isWrappedSet() || Range.isSignWrappedSet())
|
2017-02-12 16:11:12 +08:00
|
|
|
return;
|
|
|
|
|
2015-03-09 03:49:50 +08:00
|
|
|
bool isWrapping = Range.isSignWrappedSet();
|
2017-02-12 16:11:12 +08:00
|
|
|
|
2015-02-24 19:58:30 +08:00
|
|
|
unsigned BW = Range.getBitWidth();
|
2016-02-07 21:59:03 +08:00
|
|
|
const auto One = APInt(BW, 1);
|
2015-03-09 03:49:50 +08:00
|
|
|
const auto LB = isWrapping ? Range.getLower() : Range.getSignedMin();
|
2016-02-07 21:59:03 +08:00
|
|
|
const auto UB = isWrapping ? (Range.getUpper() - One) : Range.getSignedMax();
|
2015-03-09 03:49:50 +08:00
|
|
|
|
|
|
|
auto Min = LB.sdiv(APInt(BW, ElementSize));
|
2016-02-07 21:59:03 +08:00
|
|
|
auto Max = UB.sdiv(APInt(BW, ElementSize)) + One;
|
2015-02-24 19:58:30 +08:00
|
|
|
|
2017-02-12 16:11:12 +08:00
|
|
|
assert(Min.sle(Max) && "Minimum expected to be less or equal than max");
|
|
|
|
|
2015-02-24 19:58:30 +08:00
|
|
|
isl_set *AccessRange = isl_map_range(isl_map_copy(AccessRelation));
|
|
|
|
AccessRange =
|
|
|
|
addRangeBoundsToSet(AccessRange, ConstantRange(Min, Max), 0, isl_dim_set);
|
|
|
|
AccessRelation = isl_map_intersect_range(AccessRelation, AccessRange);
|
|
|
|
}
|
|
|
|
|
2016-12-02 13:21:22 +08:00
|
|
|
void MemoryAccess::foldAccessRelation() {
|
|
|
|
if (Sizes.size() < 2 || isa<SCEVConstant>(Sizes[1]))
|
|
|
|
return;
|
|
|
|
|
2015-09-19 03:59:43 +08:00
|
|
|
int Size = Subscripts.size();
|
2015-03-31 01:22:28 +08:00
|
|
|
|
[ScopInfo] Disable memory folding in case it results in multi-disjunct relations
Multi-disjunct access maps can easily result in inbound assumptions which
explode in case of many memory accesses and many parameters. This change reduces
compilation time of some larger kernel from over 15 minutes to less than 16
seconds.
Interesting is the test case test/ScopInfo/multidim_param_in_subscript.ll
which has a memory access
[n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, -1 + n - i1] }
which requires folding, but where only a single disjunct remains. We can still
model this test case even when only using limited memory folding.
For people only reading commit messages, here the comment that explains what
memory folding is:
To recover memory accesses with array size parameters in the subscript
expression we post-process the delinearization results.
We would normally recover from an access A[exp0(i) * N + exp1(i)] into an
array A[][N] the 2D access A[exp0(i)][exp1(i)]. However, another valid
delinearization is A[exp0(i) - 1][exp1(i) + N] which - depending on the
range of exp1(i) - may be preferrable. Specifically, for cases where we
know exp1(i) is negative, we want to choose the latter expression.
As we commonly do not have any information about the range of exp1(i),
we do not choose one of the two options, but instead create a piecewise
access function that adds the (-1, N) offsets as soon as exp1(i) becomes
negative. For a 2D array such an access function is created by applying
the piecewise map:
[i,j] -> [i, j] : j >= 0
[i,j] -> [i-1, j+N] : j < 0
After this patch we generate only the first case, except for situations where
we can proove the first case to be invalid and can consequently select the
second without introducing disjuncts.
llvm-svn: 296679
2017-03-02 05:11:27 +08:00
|
|
|
isl_map *OldAccessRelation = isl_map_copy(AccessRelation);
|
|
|
|
|
2015-03-31 01:22:28 +08:00
|
|
|
for (int i = Size - 2; i >= 0; --i) {
|
|
|
|
isl_space *Space;
|
|
|
|
isl_map *MapOne, *MapTwo;
|
2016-09-13 01:08:31 +08:00
|
|
|
isl_pw_aff *DimSize = getPwAff(Sizes[i + 1]);
|
2015-03-31 01:22:28 +08:00
|
|
|
|
|
|
|
isl_space *SpaceSize = isl_pw_aff_get_space(DimSize);
|
|
|
|
isl_pw_aff_free(DimSize);
|
|
|
|
isl_id *ParamId = isl_space_get_dim_id(SpaceSize, isl_dim_param, 0);
|
|
|
|
|
|
|
|
Space = isl_map_get_space(AccessRelation);
|
|
|
|
Space = isl_space_map_from_set(isl_space_range(Space));
|
|
|
|
Space = isl_space_align_params(Space, SpaceSize);
|
|
|
|
|
|
|
|
int ParamLocation = isl_space_find_dim_by_id(Space, isl_dim_param, ParamId);
|
|
|
|
isl_id_free(ParamId);
|
|
|
|
|
|
|
|
MapOne = isl_map_universe(isl_space_copy(Space));
|
|
|
|
for (int j = 0; j < Size; ++j)
|
|
|
|
MapOne = isl_map_equate(MapOne, isl_dim_in, j, isl_dim_out, j);
|
|
|
|
MapOne = isl_map_lower_bound_si(MapOne, isl_dim_in, i + 1, 0);
|
|
|
|
|
|
|
|
MapTwo = isl_map_universe(isl_space_copy(Space));
|
|
|
|
for (int j = 0; j < Size; ++j)
|
|
|
|
if (j < i || j > i + 1)
|
|
|
|
MapTwo = isl_map_equate(MapTwo, isl_dim_in, j, isl_dim_out, j);
|
|
|
|
|
|
|
|
isl_local_space *LS = isl_local_space_from_space(Space);
|
|
|
|
isl_constraint *C;
|
|
|
|
C = isl_equality_alloc(isl_local_space_copy(LS));
|
|
|
|
C = isl_constraint_set_constant_si(C, -1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_in, i, 1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_out, i, -1);
|
|
|
|
MapTwo = isl_map_add_constraint(MapTwo, C);
|
|
|
|
C = isl_equality_alloc(LS);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_in, i + 1, 1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_out, i + 1, -1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_param, ParamLocation, 1);
|
|
|
|
MapTwo = isl_map_add_constraint(MapTwo, C);
|
|
|
|
MapTwo = isl_map_upper_bound_si(MapTwo, isl_dim_in, i + 1, -1);
|
|
|
|
|
|
|
|
MapOne = isl_map_union(MapOne, MapTwo);
|
|
|
|
AccessRelation = isl_map_apply_range(AccessRelation, MapOne);
|
|
|
|
}
|
2016-12-02 13:21:22 +08:00
|
|
|
|
|
|
|
isl_id *BaseAddrId = getScopArrayInfo()->getBasePtrId();
|
|
|
|
auto Space = Statement->getDomainSpace();
|
|
|
|
AccessRelation = isl_map_set_tuple_id(
|
|
|
|
AccessRelation, isl_dim_in, isl_space_get_tuple_id(Space, isl_dim_set));
|
|
|
|
AccessRelation =
|
|
|
|
isl_map_set_tuple_id(AccessRelation, isl_dim_out, BaseAddrId);
|
|
|
|
AccessRelation = isl_map_gist_domain(AccessRelation, Statement->getDomain());
|
[ScopInfo] Disable memory folding in case it results in multi-disjunct relations
Multi-disjunct access maps can easily result in inbound assumptions which
explode in case of many memory accesses and many parameters. This change reduces
compilation time of some larger kernel from over 15 minutes to less than 16
seconds.
Interesting is the test case test/ScopInfo/multidim_param_in_subscript.ll
which has a memory access
[n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, -1 + n - i1] }
which requires folding, but where only a single disjunct remains. We can still
model this test case even when only using limited memory folding.
For people only reading commit messages, here the comment that explains what
memory folding is:
To recover memory accesses with array size parameters in the subscript
expression we post-process the delinearization results.
We would normally recover from an access A[exp0(i) * N + exp1(i)] into an
array A[][N] the 2D access A[exp0(i)][exp1(i)]. However, another valid
delinearization is A[exp0(i) - 1][exp1(i) + N] which - depending on the
range of exp1(i) - may be preferrable. Specifically, for cases where we
know exp1(i) is negative, we want to choose the latter expression.
As we commonly do not have any information about the range of exp1(i),
we do not choose one of the two options, but instead create a piecewise
access function that adds the (-1, N) offsets as soon as exp1(i) becomes
negative. For a 2D array such an access function is created by applying
the piecewise map:
[i,j] -> [i, j] : j >= 0
[i,j] -> [i-1, j+N] : j < 0
After this patch we generate only the first case, except for situations where
we can proove the first case to be invalid and can consequently select the
second without introducing disjuncts.
llvm-svn: 296679
2017-03-02 05:11:27 +08:00
|
|
|
|
|
|
|
// Access dimension folding might in certain cases increase the number of
|
|
|
|
// disjuncts in the memory access, which can possibly complicate the generated
|
|
|
|
// run-time checks and can lead to costly compilation.
|
|
|
|
if (!PollyPreciseFoldAccesses && isl_map_n_basic_map(AccessRelation) >
|
|
|
|
isl_map_n_basic_map(OldAccessRelation)) {
|
|
|
|
isl_map_free(AccessRelation);
|
|
|
|
AccessRelation = OldAccessRelation;
|
|
|
|
} else {
|
|
|
|
isl_map_free(OldAccessRelation);
|
|
|
|
}
|
|
|
|
|
2016-12-02 13:21:22 +08:00
|
|
|
isl_space_free(Space);
|
2015-03-31 01:22:28 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Check if @p Expr is divisible by @p Size.
|
2015-11-13 04:15:32 +08:00
|
|
|
static bool isDivisible(const SCEV *Expr, unsigned Size, ScalarEvolution &SE) {
|
2016-02-25 22:08:48 +08:00
|
|
|
assert(Size != 0);
|
2016-02-19 00:50:12 +08:00
|
|
|
if (Size == 1)
|
|
|
|
return true;
|
2015-11-13 04:15:32 +08:00
|
|
|
|
|
|
|
// Only one factor needs to be divisible.
|
|
|
|
if (auto *MulExpr = dyn_cast<SCEVMulExpr>(Expr)) {
|
|
|
|
for (auto *FactorExpr : MulExpr->operands())
|
|
|
|
if (isDivisible(FactorExpr, Size, SE))
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
// For other n-ary expressions (Add, AddRec, Max,...) all operands need
|
|
|
|
// to be divisble.
|
|
|
|
if (auto *NAryExpr = dyn_cast<SCEVNAryExpr>(Expr)) {
|
|
|
|
for (auto *OpExpr : NAryExpr->operands())
|
|
|
|
if (!isDivisible(OpExpr, Size, SE))
|
|
|
|
return false;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
auto *SizeSCEV = SE.getConstant(Expr->getType(), Size);
|
|
|
|
auto *UDivSCEV = SE.getUDivExpr(Expr, SizeSCEV);
|
|
|
|
auto *MulSCEV = SE.getMulExpr(UDivSCEV, SizeSCEV);
|
|
|
|
return MulSCEV == Expr;
|
|
|
|
}
|
|
|
|
|
2015-09-19 03:59:43 +08:00
|
|
|
void MemoryAccess::buildAccessRelation(const ScopArrayInfo *SAI) {
|
|
|
|
assert(!AccessRelation && "AccessReltation already built");
|
2014-10-05 19:32:18 +08:00
|
|
|
|
2016-04-23 22:32:34 +08:00
|
|
|
// Initialize the invalid domain which describes all iterations for which the
|
|
|
|
// access relation is not modeled correctly.
|
2016-04-25 21:36:23 +08:00
|
|
|
auto *StmtInvalidDomain = getStatement()->getInvalidDomain();
|
|
|
|
InvalidDomain = isl_set_empty(isl_set_get_space(StmtInvalidDomain));
|
|
|
|
isl_set_free(StmtInvalidDomain);
|
2016-04-23 22:32:34 +08:00
|
|
|
|
2015-09-19 03:59:43 +08:00
|
|
|
isl_ctx *Ctx = isl_id_get_ctx(Id);
|
2014-10-05 19:32:18 +08:00
|
|
|
isl_id *BaseAddrId = SAI->getBasePtrId();
|
2011-11-10 06:34:34 +08:00
|
|
|
|
2016-11-02 04:53:11 +08:00
|
|
|
if (getAccessInstruction() && isa<MemIntrinsic>(getAccessInstruction())) {
|
|
|
|
buildMemIntrinsicAccessRelation();
|
|
|
|
AccessRelation =
|
|
|
|
isl_map_set_tuple_id(AccessRelation, isl_dim_out, BaseAddrId);
|
|
|
|
return;
|
|
|
|
}
|
2016-02-22 03:13:19 +08:00
|
|
|
|
2016-11-02 04:53:11 +08:00
|
|
|
if (!isAffine()) {
|
2013-06-23 13:21:18 +08:00
|
|
|
// We overapproximate non-affine accesses with a possible access to the
|
|
|
|
// whole array. For read accesses it does not make a difference, if an
|
|
|
|
// access must or may happen. However, for write accesses it is important to
|
|
|
|
// differentiate between writes that must happen and writes that may happen.
|
2016-02-22 03:13:19 +08:00
|
|
|
if (!AccessRelation)
|
|
|
|
AccessRelation = isl_map_from_basic_map(createBasicAccessMap(Statement));
|
|
|
|
|
2014-07-29 16:37:55 +08:00
|
|
|
AccessRelation =
|
|
|
|
isl_map_set_tuple_id(AccessRelation, isl_dim_out, BaseAddrId);
|
2011-12-20 18:43:14 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-07-29 16:37:55 +08:00
|
|
|
isl_space *Space = isl_space_alloc(Ctx, 0, Statement->getNumIterators(), 0);
|
2014-04-10 16:38:02 +08:00
|
|
|
AccessRelation = isl_map_universe(Space);
|
2014-04-09 05:20:44 +08:00
|
|
|
|
2015-09-19 03:59:43 +08:00
|
|
|
for (int i = 0, Size = Subscripts.size(); i < Size; ++i) {
|
2016-04-12 21:26:45 +08:00
|
|
|
isl_pw_aff *Affine = getPwAff(Subscripts[i]);
|
2014-04-09 05:20:44 +08:00
|
|
|
isl_map *SubscriptMap = isl_map_from_pw_aff(Affine);
|
2014-04-10 16:38:02 +08:00
|
|
|
AccessRelation = isl_map_flat_range_product(AccessRelation, SubscriptMap);
|
2014-04-09 05:20:44 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2014-04-10 16:38:02 +08:00
|
|
|
Space = Statement->getDomainSpace();
|
2013-02-05 20:09:06 +08:00
|
|
|
AccessRelation = isl_map_set_tuple_id(
|
|
|
|
AccessRelation, isl_dim_in, isl_space_get_tuple_id(Space, isl_dim_set));
|
2014-07-29 16:37:55 +08:00
|
|
|
AccessRelation =
|
|
|
|
isl_map_set_tuple_id(AccessRelation, isl_dim_out, BaseAddrId);
|
|
|
|
|
2015-03-30 08:07:50 +08:00
|
|
|
AccessRelation = isl_map_gist_domain(AccessRelation, Statement->getDomain());
|
2014-07-29 16:37:55 +08:00
|
|
|
isl_space_free(Space);
|
2011-11-08 23:41:08 +08:00
|
|
|
}
|
2011-08-18 15:51:37 +08:00
|
|
|
|
2015-10-02 21:53:07 +08:00
|
|
|
MemoryAccess::MemoryAccess(ScopStmt *Stmt, Instruction *AccessInst,
|
2016-02-22 03:13:19 +08:00
|
|
|
AccessType AccType, Value *BaseAddress,
|
|
|
|
Type *ElementType, bool Affine,
|
2015-09-19 03:59:43 +08:00
|
|
|
ArrayRef<const SCEV *> Subscripts,
|
|
|
|
ArrayRef<const SCEV *> Sizes, Value *AccessValue,
|
2017-05-03 16:02:32 +08:00
|
|
|
MemoryKind Kind)
|
2016-02-22 03:13:19 +08:00
|
|
|
: Kind(Kind), AccType(AccType), RedType(RT_NONE), Statement(Stmt),
|
2017-05-03 15:57:35 +08:00
|
|
|
InvalidDomain(nullptr), BaseAddr(BaseAddress), ElementType(ElementType),
|
|
|
|
Sizes(Sizes.begin(), Sizes.end()), AccessInstruction(AccessInst),
|
|
|
|
AccessValue(AccessValue), IsAffine(Affine),
|
2015-09-19 03:59:43 +08:00
|
|
|
Subscripts(Subscripts.begin(), Subscripts.end()), AccessRelation(nullptr),
|
2017-05-10 21:11:20 +08:00
|
|
|
NewAccessRelation(nullptr), FAD(nullptr) {
|
2016-02-20 11:40:15 +08:00
|
|
|
static const std::string TypeStrings[] = {"", "_Read", "_Write", "_MayWrite"};
|
2017-05-03 15:57:35 +08:00
|
|
|
const std::string Access = TypeStrings[AccType] + utostr(Stmt->size());
|
2015-11-06 04:15:37 +08:00
|
|
|
|
2017-05-03 15:57:35 +08:00
|
|
|
std::string IdName = Stmt->getBaseName() + Access;
|
2015-11-06 04:15:37 +08:00
|
|
|
Id = isl_id_alloc(Stmt->getParent()->getIslCtx(), IdName.c_str(), this);
|
|
|
|
}
|
2015-09-19 03:59:43 +08:00
|
|
|
|
2016-09-14 14:26:09 +08:00
|
|
|
MemoryAccess::MemoryAccess(ScopStmt *Stmt, AccessType AccType,
|
|
|
|
__isl_take isl_map *AccRel)
|
2017-01-15 04:25:44 +08:00
|
|
|
: Kind(MemoryKind::Array), AccType(AccType), RedType(RT_NONE),
|
|
|
|
Statement(Stmt), InvalidDomain(nullptr), AccessInstruction(nullptr),
|
2017-05-10 21:11:20 +08:00
|
|
|
IsAffine(true), AccessRelation(nullptr), NewAccessRelation(AccRel),
|
|
|
|
FAD(nullptr) {
|
2016-09-14 14:26:09 +08:00
|
|
|
auto *ArrayInfoId = isl_map_get_tuple_id(NewAccessRelation, isl_dim_out);
|
|
|
|
auto *SAI = ScopArrayInfo::getFromId(ArrayInfoId);
|
|
|
|
Sizes.push_back(nullptr);
|
|
|
|
for (unsigned i = 1; i < SAI->getNumberOfDimensions(); i++)
|
|
|
|
Sizes.push_back(SAI->getDimensionSize(i));
|
|
|
|
ElementType = SAI->getElementType();
|
|
|
|
BaseAddr = SAI->getBasePtr();
|
|
|
|
static const std::string TypeStrings[] = {"", "_Read", "_Write", "_MayWrite"};
|
2017-05-03 15:57:35 +08:00
|
|
|
const std::string Access = TypeStrings[AccType] + utostr(Stmt->size());
|
2016-09-14 14:26:09 +08:00
|
|
|
|
2017-05-03 15:57:35 +08:00
|
|
|
std::string IdName = Stmt->getBaseName() + Access;
|
2016-09-14 14:26:09 +08:00
|
|
|
Id = isl_id_alloc(Stmt->getParent()->getIslCtx(), IdName.c_str(), this);
|
|
|
|
}
|
|
|
|
|
2011-11-08 23:41:08 +08:00
|
|
|
void MemoryAccess::realignParams() {
|
2016-05-10 20:18:22 +08:00
|
|
|
auto *Ctx = Statement->getParent()->getContext();
|
|
|
|
InvalidDomain = isl_set_gist_params(InvalidDomain, isl_set_copy(Ctx));
|
|
|
|
AccessRelation = isl_map_gist_params(AccessRelation, Ctx);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2014-08-01 16:13:25 +08:00
|
|
|
const std::string MemoryAccess::getReductionOperatorStr() const {
|
|
|
|
return MemoryAccess::getReductionOperatorStr(getReductionType());
|
|
|
|
}
|
|
|
|
|
2015-05-15 17:58:32 +08:00
|
|
|
__isl_give isl_id *MemoryAccess::getId() const { return isl_id_copy(Id); }
|
|
|
|
|
2014-07-02 04:52:51 +08:00
|
|
|
raw_ostream &polly::operator<<(raw_ostream &OS,
|
|
|
|
MemoryAccess::ReductionType RT) {
|
2014-08-01 16:13:25 +08:00
|
|
|
if (RT == MemoryAccess::RT_NONE)
|
2014-07-02 04:52:51 +08:00
|
|
|
OS << "NONE";
|
2014-08-01 16:13:25 +08:00
|
|
|
else
|
|
|
|
OS << MemoryAccess::getReductionOperatorStr(RT);
|
2014-07-02 04:52:51 +08:00
|
|
|
return OS;
|
|
|
|
}
|
|
|
|
|
2017-05-15 16:41:30 +08:00
|
|
|
void MemoryAccess::setFortranArrayDescriptor(Value *FAD) { this->FAD = FAD; }
|
2017-05-10 21:11:20 +08:00
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
void MemoryAccess::print(raw_ostream &OS) const {
|
2014-10-08 18:11:33 +08:00
|
|
|
switch (AccType) {
|
2013-07-14 04:41:24 +08:00
|
|
|
case READ:
|
2014-06-27 02:47:03 +08:00
|
|
|
OS.indent(12) << "ReadAccess :=\t";
|
2013-06-23 13:21:18 +08:00
|
|
|
break;
|
2013-07-14 04:41:24 +08:00
|
|
|
case MUST_WRITE:
|
2014-06-27 02:47:03 +08:00
|
|
|
OS.indent(12) << "MustWriteAccess :=\t";
|
2013-06-23 13:21:18 +08:00
|
|
|
break;
|
2013-07-14 04:41:24 +08:00
|
|
|
case MAY_WRITE:
|
2014-06-27 02:47:03 +08:00
|
|
|
OS.indent(12) << "MayWriteAccess :=\t";
|
2013-06-23 13:21:18 +08:00
|
|
|
break;
|
|
|
|
}
|
2017-05-10 21:11:20 +08:00
|
|
|
|
2015-02-07 04:13:15 +08:00
|
|
|
OS << "[Reduction Type: " << getReductionType() << "] ";
|
2017-05-10 21:11:20 +08:00
|
|
|
|
|
|
|
if (FAD) {
|
|
|
|
OS << "[Fortran array descriptor: " << FAD->getName();
|
|
|
|
OS << "] ";
|
|
|
|
};
|
|
|
|
|
ScopInfo: Harmonize the different array kinds
Over time different vocabulary has been introduced to describe the different
memory objects in Polly, resulting in different - often inconsistent - naming
schemes in different parts of Polly. We now standartize this to the following
scheme:
KindArray, KindValue, KindPHI, KindExitPHI
| ------- isScalar -----------|
In most cases this naming scheme has already been used previously (this
minimizes changes and ensures we remain consistent with previous publications).
The main change is that we remove KindScalar to clearify the difference between
a scalar as a memory object of kind Value, PHI or ExitPHI and a value (former
KindScalar) which is a memory object modeling a llvm::Value.
We also move all documentation to the Kind* enum in the ScopArrayInfo class,
remove the second enum in the MemoryAccess class and update documentation to be
formulated from the perspective of the memory object, rather than the memory
access. The terms "Implicit"/"Explicit", formerly used to describe memory
accesses, have been dropped. From the perspective of memory accesses they
described the different memory kinds well - especially from the perspective of
code generation - but just from the perspective of a memory object it seems more
straightforward to talk about scalars and arrays, rather than explicit and
implicit arrays. The last comment is clearly subjective, though. A less
subjective reason to go for these terms is the historic use both in mailing list
discussions and publications.
llvm-svn: 255467
2015-12-14 03:59:01 +08:00
|
|
|
OS << "[Scalar: " << isScalarKind() << "]\n";
|
2015-12-14 03:35:26 +08:00
|
|
|
OS.indent(16) << getOriginalAccessRelationStr() << ";\n";
|
2015-09-05 15:46:47 +08:00
|
|
|
if (hasNewAccessRelation())
|
|
|
|
OS.indent(11) << "new: " << getNewAccessRelationStr() << ";\n";
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2013-01-15 06:40:23 +08:00
|
|
|
void MemoryAccess::dump() const { print(errs()); }
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2016-04-12 21:26:45 +08:00
|
|
|
__isl_give isl_pw_aff *MemoryAccess::getPwAff(const SCEV *E) {
|
|
|
|
auto *Stmt = getStatement();
|
2016-04-23 22:32:34 +08:00
|
|
|
PWACtx PWAC = Stmt->getParent()->getPwAff(E, Stmt->getEntryBlock());
|
2016-07-11 20:01:26 +08:00
|
|
|
isl_set *StmtDom = isl_set_reset_tuple_id(getStatement()->getDomain());
|
|
|
|
isl_set *NewInvalidDom = isl_set_intersect(StmtDom, PWAC.second);
|
|
|
|
InvalidDomain = isl_set_union(InvalidDomain, NewInvalidDom);
|
2016-04-23 22:32:34 +08:00
|
|
|
return PWAC.first;
|
2016-04-12 21:26:45 +08:00
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
// Create a map in the size of the provided set domain, that maps from the
|
|
|
|
// one element of the provided set domain to another element of the provided
|
|
|
|
// set domain.
|
|
|
|
// The mapping is limited to all points that are equal in all but the last
|
|
|
|
// dimension and for which the last dimension of the input is strict smaller
|
|
|
|
// than the last dimension of the output.
|
|
|
|
//
|
|
|
|
// getEqualAndLarger(set[i0, i1, ..., iX]):
|
|
|
|
//
|
|
|
|
// set[i0, i1, ..., iX] -> set[o0, o1, ..., oX]
|
|
|
|
// : i0 = o0, i1 = o1, ..., i(X-1) = o(X-1), iX < oX
|
|
|
|
//
|
2016-09-08 19:18:56 +08:00
|
|
|
static isl_map *getEqualAndLarger(__isl_take isl_space *setDomain) {
|
2012-02-01 22:23:36 +08:00
|
|
|
isl_space *Space = isl_space_map_from_set(setDomain);
|
2015-05-22 03:02:44 +08:00
|
|
|
isl_map *Map = isl_map_universe(Space);
|
2013-10-05 01:14:53 +08:00
|
|
|
unsigned lastDimension = isl_map_dim(Map, isl_dim_in) - 1;
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
// Set all but the last dimension to be equal for the input and output
|
|
|
|
//
|
|
|
|
// input[i0, i1, ..., iX] -> output[o0, o1, ..., oX]
|
|
|
|
// : i0 = o0, i1 = o1, ..., i(X-1) = o(X-1)
|
2013-10-05 01:14:53 +08:00
|
|
|
for (unsigned i = 0; i < lastDimension; ++i)
|
2012-02-01 22:23:36 +08:00
|
|
|
Map = isl_map_equate(Map, isl_dim_in, i, isl_dim_out, i);
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
// Set the last dimension of the input to be strict smaller than the
|
|
|
|
// last dimension of the output.
|
|
|
|
//
|
|
|
|
// input[?,?,?,...,iX] -> output[?,?,?,...,oX] : iX < oX
|
2015-05-22 03:02:44 +08:00
|
|
|
Map = isl_map_order_lt(Map, isl_dim_in, lastDimension, isl_dim_out,
|
|
|
|
lastDimension);
|
2012-02-01 22:23:36 +08:00
|
|
|
return Map;
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_set *
|
|
|
|
MemoryAccess::getStride(__isl_take const isl_map *Schedule) const {
|
2013-02-05 20:09:06 +08:00
|
|
|
isl_map *S = const_cast<isl_map *>(Schedule);
|
2014-10-13 20:58:03 +08:00
|
|
|
isl_map *AccessRelation = getAccessRelation();
|
2012-12-18 15:46:06 +08:00
|
|
|
isl_space *Space = isl_space_range(isl_map_get_space(S));
|
|
|
|
isl_map *NextScatt = getEqualAndLarger(Space);
|
|
|
|
|
|
|
|
S = isl_map_reverse(S);
|
|
|
|
NextScatt = isl_map_lexmin(NextScatt);
|
|
|
|
|
|
|
|
NextScatt = isl_map_apply_range(NextScatt, isl_map_copy(S));
|
|
|
|
NextScatt = isl_map_apply_range(NextScatt, isl_map_copy(AccessRelation));
|
|
|
|
NextScatt = isl_map_apply_domain(NextScatt, S);
|
|
|
|
NextScatt = isl_map_apply_domain(NextScatt, AccessRelation);
|
|
|
|
|
|
|
|
isl_set *Deltas = isl_map_deltas(NextScatt);
|
|
|
|
return Deltas;
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2012-12-18 15:46:06 +08:00
|
|
|
bool MemoryAccess::isStrideX(__isl_take const isl_map *Schedule,
|
2012-01-25 00:42:16 +08:00
|
|
|
int StrideWidth) const {
|
|
|
|
isl_set *Stride, *StrideX;
|
|
|
|
bool IsStrideX;
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2012-12-18 15:46:06 +08:00
|
|
|
Stride = getStride(Schedule);
|
2012-01-25 00:42:16 +08:00
|
|
|
StrideX = isl_set_universe(isl_set_get_space(Stride));
|
2015-08-25 06:20:46 +08:00
|
|
|
for (unsigned i = 0; i < isl_set_dim(StrideX, isl_dim_set) - 1; i++)
|
|
|
|
StrideX = isl_set_fix_si(StrideX, isl_dim_set, i, 0);
|
|
|
|
StrideX = isl_set_fix_si(StrideX, isl_dim_set,
|
|
|
|
isl_set_dim(StrideX, isl_dim_set) - 1, StrideWidth);
|
2015-08-19 00:12:05 +08:00
|
|
|
IsStrideX = isl_set_is_subset(Stride, StrideX);
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2012-01-25 00:42:16 +08:00
|
|
|
isl_set_free(StrideX);
|
2012-01-18 04:34:27 +08:00
|
|
|
isl_set_free(Stride);
|
2011-08-20 19:11:25 +08:00
|
|
|
|
2012-01-25 00:42:16 +08:00
|
|
|
return IsStrideX;
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2016-09-01 17:03:27 +08:00
|
|
|
bool MemoryAccess::isStrideZero(__isl_take const isl_map *Schedule) const {
|
2012-12-18 15:46:06 +08:00
|
|
|
return isStrideX(Schedule, 0);
|
2012-01-25 00:42:16 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2016-09-01 17:03:27 +08:00
|
|
|
bool MemoryAccess::isStrideOne(__isl_take const isl_map *Schedule) const {
|
2012-12-18 15:46:06 +08:00
|
|
|
return isStrideX(Schedule, 1);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2016-12-02 16:10:56 +08:00
|
|
|
void MemoryAccess::setAccessRelation(__isl_take isl_map *NewAccess) {
|
|
|
|
isl_map_free(AccessRelation);
|
|
|
|
AccessRelation = NewAccess;
|
|
|
|
}
|
|
|
|
|
2016-09-01 17:03:27 +08:00
|
|
|
void MemoryAccess::setNewAccessRelation(__isl_take isl_map *NewAccess) {
|
2016-09-02 03:16:58 +08:00
|
|
|
assert(NewAccess);
|
|
|
|
|
|
|
|
#ifndef NDEBUG
|
|
|
|
// Check domain space compatibility.
|
|
|
|
auto *NewSpace = isl_map_get_space(NewAccess);
|
|
|
|
auto *NewDomainSpace = isl_space_domain(isl_space_copy(NewSpace));
|
|
|
|
auto *OriginalDomainSpace = getStatement()->getDomainSpace();
|
|
|
|
assert(isl_space_has_equal_tuples(OriginalDomainSpace, NewDomainSpace));
|
|
|
|
isl_space_free(NewDomainSpace);
|
|
|
|
isl_space_free(OriginalDomainSpace);
|
|
|
|
|
|
|
|
// Check whether there is an access for every statement instance.
|
|
|
|
auto *StmtDomain = getStatement()->getDomain();
|
|
|
|
StmtDomain = isl_set_intersect_params(
|
|
|
|
StmtDomain, getStatement()->getParent()->getContext());
|
|
|
|
auto *NewDomain = isl_map_domain(isl_map_copy(NewAccess));
|
|
|
|
assert(isl_set_is_subset(StmtDomain, NewDomain) &&
|
|
|
|
"Partial accesses not supported");
|
|
|
|
isl_set_free(NewDomain);
|
|
|
|
isl_set_free(StmtDomain);
|
|
|
|
|
|
|
|
auto *NewAccessSpace = isl_space_range(NewSpace);
|
|
|
|
assert(isl_space_has_tuple_id(NewAccessSpace, isl_dim_set) &&
|
|
|
|
"Must specify the array that is accessed");
|
|
|
|
auto *NewArrayId = isl_space_get_tuple_id(NewAccessSpace, isl_dim_set);
|
|
|
|
auto *SAI = static_cast<ScopArrayInfo *>(isl_id_get_user(NewArrayId));
|
|
|
|
assert(SAI && "Must set a ScopArrayInfo");
|
Relax assert when setting access functions with invariant base pointers
Summary:
Instead of forbidding such access functions completely, we verify that their
base pointer has been hoisted and only assert in case the base pointer was
not hoisted.
I was trying for a little while to get a test case that ensures the assert is
correctly fired in case of invariant load hoisting being disabled, but I could
not find a good way to do so, as llvm-lit immediately aborts if a command
yields a non-zero return value. As we do not generally test our asserts,
not having a test case here seems OK.
This resolves http://llvm.org/PR31494
Suggested-by: Michael Kruse <llvm@meinersbur.de>
Reviewers: efriedma, jdoerfert, Meinersbur, gareevroman, sebpop, zinob, huihuiz, pollydev
Reviewed By: Meinersbur
Differential Revision: https://reviews.llvm.org/D28798
llvm-svn: 292213
2017-01-17 20:00:42 +08:00
|
|
|
|
|
|
|
if (SAI->isArrayKind() && SAI->getBasePtrOriginSAI()) {
|
|
|
|
InvariantEquivClassTy *EqClass =
|
|
|
|
getStatement()->getParent()->lookupInvariantEquivClass(
|
|
|
|
SAI->getBasePtr());
|
|
|
|
assert(EqClass &&
|
|
|
|
"Access functions to indirect arrays must have an invariant and "
|
|
|
|
"hoisted base pointer");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check whether access dimensions correspond to number of dimensions of the
|
|
|
|
// accesses array.
|
2016-09-02 03:16:58 +08:00
|
|
|
auto Dims = SAI->getNumberOfDimensions();
|
|
|
|
assert(isl_space_dim(NewAccessSpace, isl_dim_set) == Dims &&
|
|
|
|
"Access dims must match array dims");
|
|
|
|
isl_space_free(NewAccessSpace);
|
|
|
|
isl_id_free(NewArrayId);
|
|
|
|
#endif
|
|
|
|
|
2015-09-05 15:46:40 +08:00
|
|
|
isl_map_free(NewAccessRelation);
|
|
|
|
NewAccessRelation = NewAccess;
|
2011-07-13 01:14:03 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
2011-10-06 08:04:05 +08:00
|
|
|
|
2016-04-10 05:55:23 +08:00
|
|
|
__isl_give isl_map *ScopStmt::getSchedule() const {
|
2015-07-14 17:33:13 +08:00
|
|
|
isl_set *Domain = getDomain();
|
|
|
|
if (isl_set_is_empty(Domain)) {
|
|
|
|
isl_set_free(Domain);
|
|
|
|
return isl_map_from_aff(
|
|
|
|
isl_aff_zero_on_domain(isl_local_space_from_space(getDomainSpace())));
|
|
|
|
}
|
|
|
|
auto *Schedule = getParent()->getSchedule();
|
2016-09-14 14:26:09 +08:00
|
|
|
if (!Schedule) {
|
|
|
|
isl_set_free(Domain);
|
|
|
|
return nullptr;
|
|
|
|
}
|
2015-07-14 17:33:13 +08:00
|
|
|
Schedule = isl_union_map_intersect_domain(
|
|
|
|
Schedule, isl_union_set_from_set(isl_set_copy(Domain)));
|
|
|
|
if (isl_union_map_is_empty(Schedule)) {
|
|
|
|
isl_set_free(Domain);
|
|
|
|
isl_union_map_free(Schedule);
|
|
|
|
return isl_map_from_aff(
|
|
|
|
isl_aff_zero_on_domain(isl_local_space_from_space(getDomainSpace())));
|
|
|
|
}
|
|
|
|
auto *M = isl_map_from_union_map(Schedule);
|
|
|
|
M = isl_map_coalesce(M);
|
|
|
|
M = isl_map_gist_domain(M, Domain);
|
|
|
|
M = isl_map_coalesce(M);
|
|
|
|
return M;
|
|
|
|
}
|
2011-10-06 08:04:05 +08:00
|
|
|
|
2016-04-29 18:44:41 +08:00
|
|
|
__isl_give isl_pw_aff *ScopStmt::getPwAff(const SCEV *E, bool NonNegative) {
|
|
|
|
PWACtx PWAC = getParent()->getPwAff(E, getEntryBlock(), NonNegative);
|
2016-04-23 22:31:17 +08:00
|
|
|
InvalidDomain = isl_set_union(InvalidDomain, PWAC.second);
|
|
|
|
return PWAC.first;
|
2015-08-12 18:19:50 +08:00
|
|
|
}
|
|
|
|
|
2014-02-21 05:43:54 +08:00
|
|
|
void ScopStmt::restrictDomain(__isl_take isl_set *NewDomain) {
|
|
|
|
assert(isl_set_is_subset(NewDomain, Domain) &&
|
|
|
|
"New domain is not a subset of old domain!");
|
|
|
|
isl_set_free(Domain);
|
|
|
|
Domain = NewDomain;
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2015-10-02 21:53:07 +08:00
|
|
|
void ScopStmt::buildAccessRelations() {
|
2016-02-07 21:57:32 +08:00
|
|
|
Scop &S = *getParent();
|
2015-10-02 21:53:07 +08:00
|
|
|
for (MemoryAccess *Access : MemAccs) {
|
2016-02-22 03:13:19 +08:00
|
|
|
Type *ElementType = Access->getElementType();
|
2014-10-05 19:32:18 +08:00
|
|
|
|
2017-01-15 04:25:44 +08:00
|
|
|
MemoryKind Ty;
|
ScopInfo: Harmonize the different array kinds
Over time different vocabulary has been introduced to describe the different
memory objects in Polly, resulting in different - often inconsistent - naming
schemes in different parts of Polly. We now standartize this to the following
scheme:
KindArray, KindValue, KindPHI, KindExitPHI
| ------- isScalar -----------|
In most cases this naming scheme has already been used previously (this
minimizes changes and ensures we remain consistent with previous publications).
The main change is that we remove KindScalar to clearify the difference between
a scalar as a memory object of kind Value, PHI or ExitPHI and a value (former
KindScalar) which is a memory object modeling a llvm::Value.
We also move all documentation to the Kind* enum in the ScopArrayInfo class,
remove the second enum in the MemoryAccess class and update documentation to be
formulated from the perspective of the memory object, rather than the memory
access. The terms "Implicit"/"Explicit", formerly used to describe memory
accesses, have been dropped. From the perspective of memory accesses they
described the different memory kinds well - especially from the perspective of
code generation - but just from the perspective of a memory object it seems more
straightforward to talk about scalars and arrays, rather than explicit and
implicit arrays. The last comment is clearly subjective, though. A less
subjective reason to go for these terms is the historic use both in mailing list
discussions and publications.
llvm-svn: 255467
2015-12-14 03:59:01 +08:00
|
|
|
if (Access->isPHIKind())
|
2017-01-15 04:25:44 +08:00
|
|
|
Ty = MemoryKind::PHI;
|
ScopInfo: Harmonize the different array kinds
Over time different vocabulary has been introduced to describe the different
memory objects in Polly, resulting in different - often inconsistent - naming
schemes in different parts of Polly. We now standartize this to the following
scheme:
KindArray, KindValue, KindPHI, KindExitPHI
| ------- isScalar -----------|
In most cases this naming scheme has already been used previously (this
minimizes changes and ensures we remain consistent with previous publications).
The main change is that we remove KindScalar to clearify the difference between
a scalar as a memory object of kind Value, PHI or ExitPHI and a value (former
KindScalar) which is a memory object modeling a llvm::Value.
We also move all documentation to the Kind* enum in the ScopArrayInfo class,
remove the second enum in the MemoryAccess class and update documentation to be
formulated from the perspective of the memory object, rather than the memory
access. The terms "Implicit"/"Explicit", formerly used to describe memory
accesses, have been dropped. From the perspective of memory accesses they
described the different memory kinds well - especially from the perspective of
code generation - but just from the perspective of a memory object it seems more
straightforward to talk about scalars and arrays, rather than explicit and
implicit arrays. The last comment is clearly subjective, though. A less
subjective reason to go for these terms is the historic use both in mailing list
discussions and publications.
llvm-svn: 255467
2015-12-14 03:59:01 +08:00
|
|
|
else if (Access->isExitPHIKind())
|
2017-01-15 04:25:44 +08:00
|
|
|
Ty = MemoryKind::ExitPHI;
|
ScopInfo: Harmonize the different array kinds
Over time different vocabulary has been introduced to describe the different
memory objects in Polly, resulting in different - often inconsistent - naming
schemes in different parts of Polly. We now standartize this to the following
scheme:
KindArray, KindValue, KindPHI, KindExitPHI
| ------- isScalar -----------|
In most cases this naming scheme has already been used previously (this
minimizes changes and ensures we remain consistent with previous publications).
The main change is that we remove KindScalar to clearify the difference between
a scalar as a memory object of kind Value, PHI or ExitPHI and a value (former
KindScalar) which is a memory object modeling a llvm::Value.
We also move all documentation to the Kind* enum in the ScopArrayInfo class,
remove the second enum in the MemoryAccess class and update documentation to be
formulated from the perspective of the memory object, rather than the memory
access. The terms "Implicit"/"Explicit", formerly used to describe memory
accesses, have been dropped. From the perspective of memory accesses they
described the different memory kinds well - especially from the perspective of
code generation - but just from the perspective of a memory object it seems more
straightforward to talk about scalars and arrays, rather than explicit and
implicit arrays. The last comment is clearly subjective, though. A less
subjective reason to go for these terms is the historic use both in mailing list
discussions and publications.
llvm-svn: 255467
2015-12-14 03:59:01 +08:00
|
|
|
else if (Access->isValueKind())
|
2017-01-15 04:25:44 +08:00
|
|
|
Ty = MemoryKind::Value;
|
2015-11-11 01:31:31 +08:00
|
|
|
else
|
2017-01-15 04:25:44 +08:00
|
|
|
Ty = MemoryKind::Array;
|
2015-11-11 01:31:31 +08:00
|
|
|
|
2017-02-10 18:09:46 +08:00
|
|
|
auto *SAI = S.getOrCreateScopArrayInfo(Access->getOriginalBaseAddr(),
|
|
|
|
ElementType, Access->Sizes, Ty);
|
2015-10-02 21:53:07 +08:00
|
|
|
Access->buildAccessRelation(SAI);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-05-12 06:56:46 +08:00
|
|
|
MemoryAccess *ScopStmt::lookupPHIReadOf(PHINode *PHI) const {
|
|
|
|
for (auto *MA : *this) {
|
|
|
|
if (!MA->isRead())
|
|
|
|
continue;
|
|
|
|
if (!MA->isLatestAnyPHIKind())
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (MA->getAccessInstruction() == PHI)
|
|
|
|
return MA;
|
|
|
|
}
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2015-10-02 21:53:07 +08:00
|
|
|
void ScopStmt::addAccess(MemoryAccess *Access) {
|
|
|
|
Instruction *AccessInst = Access->getAccessInstruction();
|
|
|
|
|
2015-12-23 07:25:11 +08:00
|
|
|
if (Access->isArrayKind()) {
|
|
|
|
MemoryAccessList &MAL = InstructionToAccess[AccessInst];
|
|
|
|
MAL.emplace_front(Access);
|
2016-01-26 21:33:10 +08:00
|
|
|
} else if (Access->isValueKind() && Access->isWrite()) {
|
|
|
|
Instruction *AccessVal = cast<Instruction>(Access->getAccessValue());
|
2016-02-25 06:08:19 +08:00
|
|
|
assert(Parent.getStmtFor(AccessVal) == this);
|
2016-01-26 21:33:10 +08:00
|
|
|
assert(!ValueWrites.lookup(AccessVal));
|
|
|
|
|
|
|
|
ValueWrites[AccessVal] = Access;
|
2016-01-26 21:33:15 +08:00
|
|
|
} else if (Access->isValueKind() && Access->isRead()) {
|
|
|
|
Value *AccessVal = Access->getAccessValue();
|
|
|
|
assert(!ValueReads.lookup(AccessVal));
|
|
|
|
|
|
|
|
ValueReads[AccessVal] = Access;
|
2016-01-26 21:33:27 +08:00
|
|
|
} else if (Access->isAnyPHIKind() && Access->isWrite()) {
|
2017-02-10 18:09:44 +08:00
|
|
|
PHINode *PHI = cast<PHINode>(Access->getAccessValue());
|
2016-01-26 21:33:27 +08:00
|
|
|
assert(!PHIWrites.lookup(PHI));
|
|
|
|
|
|
|
|
PHIWrites[PHI] = Access;
|
2015-12-23 07:25:11 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
MemAccs.push_back(Access);
|
2015-10-02 21:53:07 +08:00
|
|
|
}
|
|
|
|
|
2011-11-08 23:41:08 +08:00
|
|
|
void ScopStmt::realignParams() {
|
2014-06-14 02:01:45 +08:00
|
|
|
for (MemoryAccess *MA : *this)
|
|
|
|
MA->realignParams();
|
2011-11-08 23:41:08 +08:00
|
|
|
|
2016-05-10 20:18:22 +08:00
|
|
|
auto *Ctx = Parent.getContext();
|
|
|
|
InvalidDomain = isl_set_gist_params(InvalidDomain, isl_set_copy(Ctx));
|
|
|
|
Domain = isl_set_gist_params(Domain, Ctx);
|
2011-11-08 23:41:08 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Add @p BSet to the set @p User if @p BSet is bounded.
|
2015-09-10 21:00:06 +08:00
|
|
|
static isl_stat collectBoundedParts(__isl_take isl_basic_set *BSet,
|
|
|
|
void *User) {
|
|
|
|
isl_set **BoundedParts = static_cast<isl_set **>(User);
|
|
|
|
if (isl_basic_set_is_bounded(BSet))
|
|
|
|
*BoundedParts = isl_set_union(*BoundedParts, isl_set_from_basic_set(BSet));
|
|
|
|
else
|
|
|
|
isl_basic_set_free(BSet);
|
|
|
|
return isl_stat_ok;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Return the bounded parts of @p S.
|
2015-09-10 21:00:06 +08:00
|
|
|
static __isl_give isl_set *collectBoundedParts(__isl_take isl_set *S) {
|
|
|
|
isl_set *BoundedParts = isl_set_empty(isl_set_get_space(S));
|
|
|
|
isl_set_foreach_basic_set(S, collectBoundedParts, &BoundedParts);
|
|
|
|
isl_set_free(S);
|
|
|
|
return BoundedParts;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Compute the (un)bounded parts of @p S wrt. to dimension @p Dim.
|
2015-09-10 21:00:06 +08:00
|
|
|
///
|
|
|
|
/// @returns A separation of @p S into first an unbounded then a bounded subset,
|
|
|
|
/// both with regards to the dimension @p Dim.
|
|
|
|
static std::pair<__isl_give isl_set *, __isl_give isl_set *>
|
|
|
|
partitionSetParts(__isl_take isl_set *S, unsigned Dim) {
|
|
|
|
|
|
|
|
for (unsigned u = 0, e = isl_set_n_dim(S); u < e; u++)
|
2015-09-21 00:15:32 +08:00
|
|
|
S = isl_set_lower_bound_si(S, isl_dim_set, u, 0);
|
2015-09-10 21:00:06 +08:00
|
|
|
|
|
|
|
unsigned NumDimsS = isl_set_n_dim(S);
|
2015-09-21 00:15:32 +08:00
|
|
|
isl_set *OnlyDimS = isl_set_copy(S);
|
2015-09-10 21:00:06 +08:00
|
|
|
|
|
|
|
// Remove dimensions that are greater than Dim as they are not interesting.
|
|
|
|
assert(NumDimsS >= Dim + 1);
|
|
|
|
OnlyDimS =
|
|
|
|
isl_set_project_out(OnlyDimS, isl_dim_set, Dim + 1, NumDimsS - Dim - 1);
|
|
|
|
|
|
|
|
// Create artificial parametric upper bounds for dimensions smaller than Dim
|
|
|
|
// as we are not interested in them.
|
|
|
|
OnlyDimS = isl_set_insert_dims(OnlyDimS, isl_dim_param, 0, Dim);
|
|
|
|
for (unsigned u = 0; u < Dim; u++) {
|
|
|
|
isl_constraint *C = isl_inequality_alloc(
|
|
|
|
isl_local_space_from_space(isl_set_get_space(OnlyDimS)));
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_param, u, 1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_set, u, -1);
|
|
|
|
OnlyDimS = isl_set_add_constraint(OnlyDimS, C);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Collect all bounded parts of OnlyDimS.
|
|
|
|
isl_set *BoundedParts = collectBoundedParts(OnlyDimS);
|
|
|
|
|
|
|
|
// Create the dimensions greater than Dim again.
|
|
|
|
BoundedParts = isl_set_insert_dims(BoundedParts, isl_dim_set, Dim + 1,
|
|
|
|
NumDimsS - Dim - 1);
|
|
|
|
|
|
|
|
// Remove the artificial upper bound parameters again.
|
|
|
|
BoundedParts = isl_set_remove_dims(BoundedParts, isl_dim_param, 0, Dim);
|
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
isl_set *UnboundedParts = isl_set_subtract(S, isl_set_copy(BoundedParts));
|
2015-09-10 21:00:06 +08:00
|
|
|
return std::make_pair(UnboundedParts, BoundedParts);
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Set the dimension Ids from @p From in @p To.
|
2015-09-28 17:33:22 +08:00
|
|
|
static __isl_give isl_set *setDimensionIds(__isl_keep isl_set *From,
|
|
|
|
__isl_take isl_set *To) {
|
|
|
|
for (unsigned u = 0, e = isl_set_n_dim(From); u < e; u++) {
|
|
|
|
isl_id *DimId = isl_set_get_dim_id(From, isl_dim_set, u);
|
|
|
|
To = isl_set_set_dim_id(To, isl_dim_set, u, DimId);
|
|
|
|
}
|
|
|
|
return To;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Create the conditions under which @p L @p Pred @p R is true.
|
2015-08-31 05:13:53 +08:00
|
|
|
static __isl_give isl_set *buildConditionSet(ICmpInst::Predicate Pred,
|
2015-09-28 17:33:22 +08:00
|
|
|
__isl_take isl_pw_aff *L,
|
|
|
|
__isl_take isl_pw_aff *R) {
|
2015-08-31 05:13:53 +08:00
|
|
|
switch (Pred) {
|
|
|
|
case ICmpInst::ICMP_EQ:
|
|
|
|
return isl_pw_aff_eq_set(L, R);
|
|
|
|
case ICmpInst::ICMP_NE:
|
|
|
|
return isl_pw_aff_ne_set(L, R);
|
|
|
|
case ICmpInst::ICMP_SLT:
|
|
|
|
return isl_pw_aff_lt_set(L, R);
|
|
|
|
case ICmpInst::ICMP_SLE:
|
|
|
|
return isl_pw_aff_le_set(L, R);
|
|
|
|
case ICmpInst::ICMP_SGT:
|
|
|
|
return isl_pw_aff_gt_set(L, R);
|
|
|
|
case ICmpInst::ICMP_SGE:
|
|
|
|
return isl_pw_aff_ge_set(L, R);
|
|
|
|
case ICmpInst::ICMP_ULT:
|
|
|
|
return isl_pw_aff_lt_set(L, R);
|
|
|
|
case ICmpInst::ICMP_UGT:
|
|
|
|
return isl_pw_aff_gt_set(L, R);
|
|
|
|
case ICmpInst::ICMP_ULE:
|
|
|
|
return isl_pw_aff_le_set(L, R);
|
|
|
|
case ICmpInst::ICMP_UGE:
|
|
|
|
return isl_pw_aff_ge_set(L, R);
|
|
|
|
default:
|
|
|
|
llvm_unreachable("Non integer predicate not supported");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Create the conditions under which @p L @p Pred @p R is true.
|
2015-09-28 17:33:22 +08:00
|
|
|
///
|
|
|
|
/// Helper function that will make sure the dimensions of the result have the
|
|
|
|
/// same isl_id's as the @p Domain.
|
|
|
|
static __isl_give isl_set *buildConditionSet(ICmpInst::Predicate Pred,
|
|
|
|
__isl_take isl_pw_aff *L,
|
|
|
|
__isl_take isl_pw_aff *R,
|
|
|
|
__isl_keep isl_set *Domain) {
|
|
|
|
isl_set *ConsequenceCondSet = buildConditionSet(Pred, L, R);
|
|
|
|
return setDimensionIds(Domain, ConsequenceCondSet);
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Build the conditions sets for the switch @p SI in the @p Domain.
|
2015-08-31 05:13:53 +08:00
|
|
|
///
|
|
|
|
/// This will fill @p ConditionSets with the conditions under which control
|
2015-09-28 17:33:22 +08:00
|
|
|
/// will be moved from @p SI to its successors. Hence, @p ConditionSets will
|
|
|
|
/// have as many elements as @p SI has successors.
|
2016-05-10 21:06:42 +08:00
|
|
|
static bool
|
2016-04-19 22:53:13 +08:00
|
|
|
buildConditionSets(ScopStmt &Stmt, SwitchInst *SI, Loop *L,
|
|
|
|
__isl_keep isl_set *Domain,
|
2015-08-31 05:13:53 +08:00
|
|
|
SmallVectorImpl<__isl_give isl_set *> &ConditionSets) {
|
|
|
|
|
2015-09-28 17:33:22 +08:00
|
|
|
Value *Condition = getConditionFromTerminator(SI);
|
|
|
|
assert(Condition && "No condition for switch");
|
|
|
|
|
2016-04-19 22:53:13 +08:00
|
|
|
Scop &S = *Stmt.getParent();
|
2015-09-28 17:33:22 +08:00
|
|
|
ScalarEvolution &SE = *S.getSE();
|
|
|
|
isl_pw_aff *LHS, *RHS;
|
2016-04-19 22:53:13 +08:00
|
|
|
LHS = Stmt.getPwAff(SE.getSCEVAtScope(Condition, L));
|
2015-09-28 17:33:22 +08:00
|
|
|
|
|
|
|
unsigned NumSuccessors = SI->getNumSuccessors();
|
|
|
|
ConditionSets.resize(NumSuccessors);
|
|
|
|
for (auto &Case : SI->cases()) {
|
|
|
|
unsigned Idx = Case.getSuccessorIndex();
|
|
|
|
ConstantInt *CaseValue = Case.getCaseValue();
|
|
|
|
|
2016-04-19 22:53:13 +08:00
|
|
|
RHS = Stmt.getPwAff(SE.getSCEV(CaseValue));
|
2015-09-28 17:33:22 +08:00
|
|
|
isl_set *CaseConditionSet =
|
|
|
|
buildConditionSet(ICmpInst::ICMP_EQ, isl_pw_aff_copy(LHS), RHS, Domain);
|
|
|
|
ConditionSets[Idx] = isl_set_coalesce(
|
|
|
|
isl_set_intersect(CaseConditionSet, isl_set_copy(Domain)));
|
|
|
|
}
|
|
|
|
|
|
|
|
assert(ConditionSets[0] == nullptr && "Default condition set was set");
|
|
|
|
isl_set *ConditionSetUnion = isl_set_copy(ConditionSets[1]);
|
|
|
|
for (unsigned u = 2; u < NumSuccessors; u++)
|
|
|
|
ConditionSetUnion =
|
|
|
|
isl_set_union(ConditionSetUnion, isl_set_copy(ConditionSets[u]));
|
|
|
|
ConditionSets[0] = setDimensionIds(
|
|
|
|
Domain, isl_set_subtract(isl_set_copy(Domain), ConditionSetUnion));
|
|
|
|
|
|
|
|
isl_pw_aff_free(LHS);
|
2016-05-10 21:06:42 +08:00
|
|
|
|
|
|
|
return true;
|
2015-09-28 17:33:22 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Build the conditions sets for the branch condition @p Condition in
|
|
|
|
/// the @p Domain.
|
2015-09-28 17:33:22 +08:00
|
|
|
///
|
|
|
|
/// This will fill @p ConditionSets with the conditions under which control
|
|
|
|
/// will be moved from @p TI to its successors. Hence, @p ConditionSets will
|
2015-11-12 11:25:01 +08:00
|
|
|
/// have as many elements as @p TI has successors. If @p TI is nullptr the
|
|
|
|
/// context under which @p Condition is true/false will be returned as the
|
|
|
|
/// new elements of @p ConditionSets.
|
2016-05-10 21:06:42 +08:00
|
|
|
static bool
|
2016-04-19 22:53:13 +08:00
|
|
|
buildConditionSets(ScopStmt &Stmt, Value *Condition, TerminatorInst *TI,
|
|
|
|
Loop *L, __isl_keep isl_set *Domain,
|
2015-09-28 17:33:22 +08:00
|
|
|
SmallVectorImpl<__isl_give isl_set *> &ConditionSets) {
|
|
|
|
|
2016-04-19 22:53:13 +08:00
|
|
|
Scop &S = *Stmt.getParent();
|
2015-08-31 05:13:53 +08:00
|
|
|
isl_set *ConsequenceCondSet = nullptr;
|
|
|
|
if (auto *CCond = dyn_cast<ConstantInt>(Condition)) {
|
|
|
|
if (CCond->isZero())
|
|
|
|
ConsequenceCondSet = isl_set_empty(isl_set_get_space(Domain));
|
|
|
|
else
|
|
|
|
ConsequenceCondSet = isl_set_universe(isl_set_get_space(Domain));
|
2015-10-11 21:21:03 +08:00
|
|
|
} else if (BinaryOperator *BinOp = dyn_cast<BinaryOperator>(Condition)) {
|
|
|
|
auto Opcode = BinOp->getOpcode();
|
|
|
|
assert(Opcode == Instruction::And || Opcode == Instruction::Or);
|
|
|
|
|
2016-05-10 22:01:21 +08:00
|
|
|
bool Valid = buildConditionSets(Stmt, BinOp->getOperand(0), TI, L, Domain,
|
|
|
|
ConditionSets) &&
|
|
|
|
buildConditionSets(Stmt, BinOp->getOperand(1), TI, L, Domain,
|
|
|
|
ConditionSets);
|
|
|
|
if (!Valid) {
|
|
|
|
while (!ConditionSets.empty())
|
|
|
|
isl_set_free(ConditionSets.pop_back_val());
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2016-05-10 22:01:21 +08:00
|
|
|
}
|
2015-10-11 21:21:03 +08:00
|
|
|
|
|
|
|
isl_set_free(ConditionSets.pop_back_val());
|
|
|
|
isl_set *ConsCondPart0 = ConditionSets.pop_back_val();
|
|
|
|
isl_set_free(ConditionSets.pop_back_val());
|
|
|
|
isl_set *ConsCondPart1 = ConditionSets.pop_back_val();
|
|
|
|
|
|
|
|
if (Opcode == Instruction::And)
|
|
|
|
ConsequenceCondSet = isl_set_intersect(ConsCondPart0, ConsCondPart1);
|
|
|
|
else
|
|
|
|
ConsequenceCondSet = isl_set_union(ConsCondPart0, ConsCondPart1);
|
2015-08-31 05:13:53 +08:00
|
|
|
} else {
|
|
|
|
auto *ICond = dyn_cast<ICmpInst>(Condition);
|
|
|
|
assert(ICond &&
|
|
|
|
"Condition of exiting branch was neither constant nor ICmp!");
|
|
|
|
|
|
|
|
ScalarEvolution &SE = *S.getSE();
|
|
|
|
isl_pw_aff *LHS, *RHS;
|
2016-04-29 18:44:41 +08:00
|
|
|
// For unsigned comparisons we assumed the signed bit of neither operand
|
|
|
|
// to be set. The comparison is equal to a signed comparison under this
|
|
|
|
// assumption.
|
|
|
|
bool NonNeg = ICond->isUnsigned();
|
|
|
|
LHS = Stmt.getPwAff(SE.getSCEVAtScope(ICond->getOperand(0), L), NonNeg);
|
|
|
|
RHS = Stmt.getPwAff(SE.getSCEVAtScope(ICond->getOperand(1), L), NonNeg);
|
2015-09-28 17:33:22 +08:00
|
|
|
ConsequenceCondSet =
|
|
|
|
buildConditionSet(ICond->getPredicate(), LHS, RHS, Domain);
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
|
2015-11-12 11:25:01 +08:00
|
|
|
// If no terminator was given we are only looking for parameter constraints
|
|
|
|
// under which @p Condition is true/false.
|
|
|
|
if (!TI)
|
|
|
|
ConsequenceCondSet = isl_set_params(ConsequenceCondSet);
|
2015-08-31 05:13:53 +08:00
|
|
|
assert(ConsequenceCondSet);
|
2016-04-04 15:59:41 +08:00
|
|
|
ConsequenceCondSet = isl_set_coalesce(
|
|
|
|
isl_set_intersect(ConsequenceCondSet, isl_set_copy(Domain)));
|
|
|
|
|
2016-04-26 17:20:41 +08:00
|
|
|
isl_set *AlternativeCondSet = nullptr;
|
2016-05-02 20:25:36 +08:00
|
|
|
bool TooComplex =
|
2017-02-17 03:11:33 +08:00
|
|
|
isl_set_n_basic_set(ConsequenceCondSet) >= MaxDisjunctsInDomain;
|
2016-04-26 17:20:41 +08:00
|
|
|
|
2016-05-02 20:25:36 +08:00
|
|
|
if (!TooComplex) {
|
2016-04-04 15:59:41 +08:00
|
|
|
AlternativeCondSet = isl_set_subtract(isl_set_copy(Domain),
|
|
|
|
isl_set_copy(ConsequenceCondSet));
|
2016-05-02 20:25:36 +08:00
|
|
|
TooComplex =
|
2017-02-17 03:11:33 +08:00
|
|
|
isl_set_n_basic_set(AlternativeCondSet) >= MaxDisjunctsInDomain;
|
2016-04-26 17:20:41 +08:00
|
|
|
}
|
|
|
|
|
2016-05-02 20:25:36 +08:00
|
|
|
if (TooComplex) {
|
2016-04-04 15:59:41 +08:00
|
|
|
S.invalidate(COMPLEXITY, TI ? TI->getDebugLoc() : DebugLoc());
|
2016-04-26 17:20:41 +08:00
|
|
|
isl_set_free(AlternativeCondSet);
|
|
|
|
isl_set_free(ConsequenceCondSet);
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2016-04-04 15:59:41 +08:00
|
|
|
}
|
2015-08-31 05:13:53 +08:00
|
|
|
|
2016-04-04 15:59:41 +08:00
|
|
|
ConditionSets.push_back(ConsequenceCondSet);
|
|
|
|
ConditionSets.push_back(isl_set_coalesce(AlternativeCondSet));
|
2016-05-10 21:06:42 +08:00
|
|
|
|
|
|
|
return true;
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Build the conditions sets for the terminator @p TI in the @p Domain.
|
2015-10-11 21:21:03 +08:00
|
|
|
///
|
|
|
|
/// This will fill @p ConditionSets with the conditions under which control
|
|
|
|
/// will be moved from @p TI to its successors. Hence, @p ConditionSets will
|
|
|
|
/// have as many elements as @p TI has successors.
|
2016-05-10 21:06:42 +08:00
|
|
|
static bool
|
2016-04-19 22:53:13 +08:00
|
|
|
buildConditionSets(ScopStmt &Stmt, TerminatorInst *TI, Loop *L,
|
2015-10-11 21:21:03 +08:00
|
|
|
__isl_keep isl_set *Domain,
|
|
|
|
SmallVectorImpl<__isl_give isl_set *> &ConditionSets) {
|
|
|
|
|
|
|
|
if (SwitchInst *SI = dyn_cast<SwitchInst>(TI))
|
2016-04-19 22:53:13 +08:00
|
|
|
return buildConditionSets(Stmt, SI, L, Domain, ConditionSets);
|
2015-10-11 21:21:03 +08:00
|
|
|
|
|
|
|
assert(isa<BranchInst>(TI) && "Terminator was neither branch nor switch.");
|
|
|
|
|
|
|
|
if (TI->getNumSuccessors() == 1) {
|
|
|
|
ConditionSets.push_back(isl_set_copy(Domain));
|
2016-05-10 21:06:42 +08:00
|
|
|
return true;
|
2015-10-11 21:21:03 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
Value *Condition = getConditionFromTerminator(TI);
|
|
|
|
assert(Condition && "No condition for Terminator");
|
|
|
|
|
2016-04-19 22:53:13 +08:00
|
|
|
return buildConditionSets(Stmt, Condition, TI, L, Domain, ConditionSets);
|
2015-10-11 21:21:03 +08:00
|
|
|
}
|
|
|
|
|
2015-09-10 21:12:02 +08:00
|
|
|
void ScopStmt::buildDomain() {
|
2016-02-25 06:08:08 +08:00
|
|
|
isl_id *Id = isl_id_alloc(getIslCtx(), getBaseName(), this);
|
2012-05-29 17:29:44 +08:00
|
|
|
|
2015-09-10 21:00:06 +08:00
|
|
|
Domain = getParent()->getDomainConditions(this);
|
2012-05-29 17:29:44 +08:00
|
|
|
Domain = isl_set_set_tuple_id(Domain, Id);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2015-09-10 23:27:46 +08:00
|
|
|
void ScopStmt::collectSurroundingLoops() {
|
|
|
|
for (unsigned u = 0, e = isl_set_n_dim(Domain); u < e; u++) {
|
|
|
|
isl_id *DimId = isl_set_get_dim_id(Domain, isl_dim_set, u);
|
|
|
|
NestLoops.push_back(static_cast<Loop *>(isl_id_get_user(DimId)));
|
|
|
|
isl_id_free(DimId);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
ScopStmt::ScopStmt(Scop &parent, Region &R, Loop *SurroundingLoop)
|
2016-04-23 21:02:23 +08:00
|
|
|
: Parent(parent), InvalidDomain(nullptr), Domain(nullptr), BB(nullptr),
|
2017-03-16 06:16:43 +08:00
|
|
|
R(&R), Build(nullptr), SurroundingLoop(SurroundingLoop) {
|
2015-02-24 20:00:50 +08:00
|
|
|
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
BaseName = getIslCompatibleName(
|
|
|
|
"Stmt", R.getNameStr(), parent.getNextStmtIdx(), "", UseInstructionNames);
|
2015-02-24 20:00:50 +08:00
|
|
|
}
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
ScopStmt::ScopStmt(Scop &parent, BasicBlock &bb, Loop *SurroundingLoop)
|
2016-04-23 21:02:23 +08:00
|
|
|
: Parent(parent), InvalidDomain(nullptr), Domain(nullptr), BB(&bb),
|
2017-03-16 06:16:43 +08:00
|
|
|
R(nullptr), Build(nullptr), SurroundingLoop(SurroundingLoop) {
|
2011-04-29 14:27:02 +08:00
|
|
|
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
BaseName = getIslCompatibleName("Stmt", &bb, parent.getNextStmtIdx(), "",
|
|
|
|
UseInstructionNames);
|
2015-10-02 21:53:07 +08:00
|
|
|
}
|
|
|
|
|
2016-09-14 14:26:09 +08:00
|
|
|
ScopStmt::ScopStmt(Scop &parent, __isl_take isl_map *SourceRel,
|
|
|
|
__isl_take isl_map *TargetRel, __isl_take isl_set *NewDomain)
|
|
|
|
: Parent(parent), InvalidDomain(nullptr), Domain(NewDomain), BB(nullptr),
|
|
|
|
R(nullptr), Build(nullptr) {
|
|
|
|
BaseName = getIslCompatibleName("CopyStmt_", "",
|
|
|
|
std::to_string(parent.getCopyStmtsNum()));
|
|
|
|
auto *Id = isl_id_alloc(getIslCtx(), getBaseName(), this);
|
|
|
|
Domain = isl_set_set_tuple_id(Domain, isl_id_copy(Id));
|
|
|
|
TargetRel = isl_map_set_tuple_id(TargetRel, isl_dim_in, Id);
|
|
|
|
auto *Access =
|
|
|
|
new MemoryAccess(this, MemoryAccess::AccessType::MUST_WRITE, TargetRel);
|
|
|
|
parent.addAccessFunction(Access);
|
|
|
|
addAccess(Access);
|
|
|
|
SourceRel = isl_map_set_tuple_id(SourceRel, isl_dim_in, isl_id_copy(Id));
|
|
|
|
Access = new MemoryAccess(this, MemoryAccess::AccessType::READ, SourceRel);
|
|
|
|
parent.addAccessFunction(Access);
|
|
|
|
addAccess(Access);
|
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
void ScopStmt::init(LoopInfo &LI) {
|
2015-10-02 21:53:07 +08:00
|
|
|
assert(!Domain && "init must be called only once");
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2015-09-10 21:12:02 +08:00
|
|
|
buildDomain();
|
2015-09-10 23:27:46 +08:00
|
|
|
collectSurroundingLoops();
|
2015-10-02 21:53:07 +08:00
|
|
|
buildAccessRelations();
|
|
|
|
|
2015-08-21 03:08:11 +08:00
|
|
|
if (DetectReductions)
|
|
|
|
checkForReductions();
|
2014-06-28 04:31:28 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Collect loads which might form a reduction chain with @p StoreMA.
|
2014-06-28 04:31:28 +08:00
|
|
|
///
|
2015-02-25 00:00:29 +08:00
|
|
|
/// Check if the stored value for @p StoreMA is a binary operator with one or
|
|
|
|
/// two loads as operands. If the binary operand is commutative & associative,
|
2014-06-28 04:31:28 +08:00
|
|
|
/// used only once (by @p StoreMA) and its load operands are also used only
|
|
|
|
/// once, we have found a possible reduction chain. It starts at an operand
|
|
|
|
/// load and includes the binary operator and @p StoreMA.
|
|
|
|
///
|
2015-02-25 00:00:29 +08:00
|
|
|
/// Note: We allow only one use to ensure the load and binary operator cannot
|
2014-06-28 04:31:28 +08:00
|
|
|
/// escape this block or into any other store except @p StoreMA.
|
|
|
|
void ScopStmt::collectCandiateReductionLoads(
|
|
|
|
MemoryAccess *StoreMA, SmallVectorImpl<MemoryAccess *> &Loads) {
|
|
|
|
auto *Store = dyn_cast<StoreInst>(StoreMA->getAccessInstruction());
|
|
|
|
if (!Store)
|
2014-06-18 01:31:36 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
// Skip if there is not one binary operator between the load and the store
|
|
|
|
auto *BinOp = dyn_cast<BinaryOperator>(Store->getValueOperand());
|
2014-06-28 04:31:28 +08:00
|
|
|
if (!BinOp)
|
2014-06-18 01:31:36 +08:00
|
|
|
return;
|
|
|
|
|
2014-06-28 04:31:28 +08:00
|
|
|
// Skip if the binary operators has multiple uses
|
|
|
|
if (BinOp->getNumUses() != 1)
|
2014-06-18 01:31:36 +08:00
|
|
|
return;
|
|
|
|
|
2015-02-25 00:00:29 +08:00
|
|
|
// Skip if the opcode of the binary operator is not commutative/associative
|
2014-06-28 04:31:28 +08:00
|
|
|
if (!BinOp->isCommutative() || !BinOp->isAssociative())
|
2014-06-18 01:31:36 +08:00
|
|
|
return;
|
|
|
|
|
2014-07-01 08:32:29 +08:00
|
|
|
// Skip if the binary operator is outside the current SCoP
|
|
|
|
if (BinOp->getParent() != Store->getParent())
|
|
|
|
return;
|
|
|
|
|
2014-06-18 01:31:36 +08:00
|
|
|
// Skip if it is a multiplicative reduction and we disabled them
|
|
|
|
if (DisableMultiplicativeReductions &&
|
|
|
|
(BinOp->getOpcode() == Instruction::Mul ||
|
|
|
|
BinOp->getOpcode() == Instruction::FMul))
|
|
|
|
return;
|
|
|
|
|
2014-06-28 04:31:28 +08:00
|
|
|
// Check the binary operator operands for a candidate load
|
|
|
|
auto *PossibleLoad0 = dyn_cast<LoadInst>(BinOp->getOperand(0));
|
|
|
|
auto *PossibleLoad1 = dyn_cast<LoadInst>(BinOp->getOperand(1));
|
|
|
|
if (!PossibleLoad0 && !PossibleLoad1)
|
|
|
|
return;
|
|
|
|
|
|
|
|
// A load is only a candidate if it cannot escape (thus has only this use)
|
|
|
|
if (PossibleLoad0 && PossibleLoad0->getNumUses() == 1)
|
2014-07-01 08:32:29 +08:00
|
|
|
if (PossibleLoad0->getParent() == Store->getParent())
|
2015-12-16 07:50:04 +08:00
|
|
|
Loads.push_back(&getArrayAccessFor(PossibleLoad0));
|
2014-06-28 04:31:28 +08:00
|
|
|
if (PossibleLoad1 && PossibleLoad1->getNumUses() == 1)
|
2014-07-01 08:32:29 +08:00
|
|
|
if (PossibleLoad1->getParent() == Store->getParent())
|
2015-12-16 07:50:04 +08:00
|
|
|
Loads.push_back(&getArrayAccessFor(PossibleLoad1));
|
2014-06-28 04:31:28 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Check for reductions in this ScopStmt.
|
2014-06-28 04:31:28 +08:00
|
|
|
///
|
2015-02-25 00:00:29 +08:00
|
|
|
/// Iterate over all store memory accesses and check for valid binary reduction
|
|
|
|
/// like chains. For all candidates we check if they have the same base address
|
|
|
|
/// and there are no other accesses which overlap with them. The base address
|
|
|
|
/// check rules out impossible reductions candidates early. The overlap check,
|
|
|
|
/// together with the "only one user" check in collectCandiateReductionLoads,
|
2014-06-28 04:31:28 +08:00
|
|
|
/// guarantees that none of the intermediate results will escape during
|
|
|
|
/// execution of the loop nest. We basically check here that no other memory
|
|
|
|
/// access can access the same memory as the potential reduction.
|
|
|
|
void ScopStmt::checkForReductions() {
|
|
|
|
SmallVector<MemoryAccess *, 2> Loads;
|
|
|
|
SmallVector<std::pair<MemoryAccess *, MemoryAccess *>, 4> Candidates;
|
|
|
|
|
2015-02-25 00:00:29 +08:00
|
|
|
// First collect candidate load-store reduction chains by iterating over all
|
2014-06-28 04:31:28 +08:00
|
|
|
// stores and collecting possible reduction loads.
|
|
|
|
for (MemoryAccess *StoreMA : MemAccs) {
|
|
|
|
if (StoreMA->isRead())
|
|
|
|
continue;
|
|
|
|
|
|
|
|
Loads.clear();
|
|
|
|
collectCandiateReductionLoads(StoreMA, Loads);
|
|
|
|
for (MemoryAccess *LoadMA : Loads)
|
|
|
|
Candidates.push_back(std::make_pair(LoadMA, StoreMA));
|
|
|
|
}
|
|
|
|
|
|
|
|
// Then check each possible candidate pair.
|
|
|
|
for (const auto &CandidatePair : Candidates) {
|
|
|
|
bool Valid = true;
|
|
|
|
isl_map *LoadAccs = CandidatePair.first->getAccessRelation();
|
|
|
|
isl_map *StoreAccs = CandidatePair.second->getAccessRelation();
|
|
|
|
|
|
|
|
// Skip those with obviously unequal base addresses.
|
|
|
|
if (!isl_map_has_equal_space(LoadAccs, StoreAccs)) {
|
|
|
|
isl_map_free(LoadAccs);
|
|
|
|
isl_map_free(StoreAccs);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// And check if the remaining for overlap with other memory accesses.
|
|
|
|
isl_map *AllAccsRel = isl_map_union(LoadAccs, StoreAccs);
|
|
|
|
AllAccsRel = isl_map_intersect_domain(AllAccsRel, getDomain());
|
|
|
|
isl_set *AllAccs = isl_map_range(AllAccsRel);
|
|
|
|
|
|
|
|
for (MemoryAccess *MA : MemAccs) {
|
|
|
|
if (MA == CandidatePair.first || MA == CandidatePair.second)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
isl_map *AccRel =
|
|
|
|
isl_map_intersect_domain(MA->getAccessRelation(), getDomain());
|
|
|
|
isl_set *Accs = isl_map_range(AccRel);
|
|
|
|
|
2016-09-08 22:08:07 +08:00
|
|
|
if (isl_set_has_equal_space(AllAccs, Accs)) {
|
2014-06-28 04:31:28 +08:00
|
|
|
isl_set *OverlapAccs = isl_set_intersect(Accs, isl_set_copy(AllAccs));
|
|
|
|
Valid = Valid && isl_set_is_empty(OverlapAccs);
|
|
|
|
isl_set_free(OverlapAccs);
|
2016-09-08 22:08:07 +08:00
|
|
|
} else {
|
|
|
|
isl_set_free(Accs);
|
2014-06-28 04:31:28 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
isl_set_free(AllAccs);
|
|
|
|
if (!Valid)
|
|
|
|
continue;
|
|
|
|
|
2014-07-02 04:52:51 +08:00
|
|
|
const LoadInst *Load =
|
|
|
|
dyn_cast<const LoadInst>(CandidatePair.first->getAccessInstruction());
|
|
|
|
MemoryAccess::ReductionType RT =
|
|
|
|
getReductionType(dyn_cast<BinaryOperator>(Load->user_back()), Load);
|
|
|
|
|
2014-06-28 04:31:28 +08:00
|
|
|
// If no overlapping access was found we mark the load and store as
|
|
|
|
// reduction like.
|
2014-07-02 04:52:51 +08:00
|
|
|
CandidatePair.first->markAsReductionLike(RT);
|
|
|
|
CandidatePair.second->markAsReductionLike(RT);
|
2014-06-28 04:31:28 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2013-01-15 06:40:23 +08:00
|
|
|
std::string ScopStmt::getDomainStr() const { return stringFromIslObj(Domain); }
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2015-04-21 19:37:25 +08:00
|
|
|
std::string ScopStmt::getScheduleStr() const {
|
2015-07-14 17:33:13 +08:00
|
|
|
auto *S = getSchedule();
|
2016-09-14 14:26:09 +08:00
|
|
|
if (!S)
|
|
|
|
return "";
|
2015-07-14 17:33:13 +08:00
|
|
|
auto Str = stringFromIslObj(S);
|
|
|
|
isl_map_free(S);
|
|
|
|
return Str;
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
void ScopStmt::setInvalidDomain(__isl_take isl_set *ID) {
|
|
|
|
isl_set_free(InvalidDomain);
|
|
|
|
InvalidDomain = ID;
|
2016-04-12 17:57:34 +08:00
|
|
|
}
|
|
|
|
|
2016-02-25 06:08:24 +08:00
|
|
|
BasicBlock *ScopStmt::getEntryBlock() const {
|
|
|
|
if (isBlockStmt())
|
|
|
|
return getBasicBlock();
|
|
|
|
return getRegion()->getEntry();
|
|
|
|
}
|
|
|
|
|
2015-02-20 06:16:12 +08:00
|
|
|
unsigned ScopStmt::getNumIterators() const { return NestLoops.size(); }
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
const char *ScopStmt::getBaseName() const { return BaseName.c_str(); }
|
|
|
|
|
2016-05-10 22:00:57 +08:00
|
|
|
Loop *ScopStmt::getLoopForDimension(unsigned Dimension) const {
|
2013-02-16 05:26:44 +08:00
|
|
|
return NestLoops[Dimension];
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2013-01-15 06:40:23 +08:00
|
|
|
isl_ctx *ScopStmt::getIslCtx() const { return Parent.getIslCtx(); }
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_set *ScopStmt::getDomain() const { return isl_set_copy(Domain); }
|
2011-05-07 03:52:19 +08:00
|
|
|
|
2015-03-30 20:22:39 +08:00
|
|
|
__isl_give isl_space *ScopStmt::getDomainSpace() const {
|
2012-01-18 04:34:23 +08:00
|
|
|
return isl_set_get_space(Domain);
|
|
|
|
}
|
|
|
|
|
2015-03-30 19:52:59 +08:00
|
|
|
__isl_give isl_id *ScopStmt::getDomainId() const {
|
|
|
|
return isl_set_get_tuple_id(Domain);
|
|
|
|
}
|
2012-08-30 19:49:38 +08:00
|
|
|
|
2016-04-12 17:57:34 +08:00
|
|
|
ScopStmt::~ScopStmt() {
|
|
|
|
isl_set_free(Domain);
|
2016-04-23 21:02:23 +08:00
|
|
|
isl_set_free(InvalidDomain);
|
2016-04-12 17:57:34 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
void ScopStmt::print(raw_ostream &OS) const {
|
|
|
|
OS << "\t" << getBaseName() << "\n";
|
|
|
|
OS.indent(12) << "Domain :=\n";
|
|
|
|
|
|
|
|
if (Domain) {
|
|
|
|
OS.indent(16) << getDomainStr() << ";\n";
|
|
|
|
} else
|
|
|
|
OS.indent(16) << "n/a\n";
|
|
|
|
|
2015-04-21 19:37:25 +08:00
|
|
|
OS.indent(12) << "Schedule :=\n";
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
if (Domain) {
|
2015-04-21 19:37:25 +08:00
|
|
|
OS.indent(16) << getScheduleStr() << ";\n";
|
2011-04-29 14:27:02 +08:00
|
|
|
} else
|
|
|
|
OS.indent(16) << "n/a\n";
|
|
|
|
|
2014-06-28 16:59:45 +08:00
|
|
|
for (MemoryAccess *Access : MemAccs)
|
|
|
|
Access->print(OS);
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void ScopStmt::dump() const { print(dbgs()); }
|
|
|
|
|
2017-05-12 06:56:12 +08:00
|
|
|
void ScopStmt::removeAccessData(MemoryAccess *MA) {
|
|
|
|
if (MA->isRead() && MA->isOriginalValueKind()) {
|
|
|
|
bool Found = ValueReads.erase(MA->getAccessValue());
|
|
|
|
(void)Found;
|
|
|
|
assert(Found && "Expected access data not found");
|
|
|
|
}
|
|
|
|
if (MA->isWrite() && MA->isOriginalValueKind()) {
|
|
|
|
bool Found = ValueWrites.erase(cast<Instruction>(MA->getAccessValue()));
|
|
|
|
(void)Found;
|
|
|
|
assert(Found && "Expected access data not found");
|
|
|
|
}
|
|
|
|
if (MA->isWrite() && MA->isOriginalAnyPHIKind()) {
|
|
|
|
bool Found = PHIWrites.erase(cast<PHINode>(MA->getAccessInstruction()));
|
|
|
|
(void)Found;
|
|
|
|
assert(Found && "Expected access data not found");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-05-23 22:45:58 +08:00
|
|
|
void ScopStmt::removeMemoryAccess(MemoryAccess *MA) {
|
2017-01-15 04:25:44 +08:00
|
|
|
// Remove the memory accesses from this statement together with all scalar
|
|
|
|
// accesses that were caused by it. MemoryKind::Value READs have no access
|
|
|
|
// instruction, hence would not be removed by this function. However, it is
|
|
|
|
// only used for invariant LoadInst accesses, its arguments are always affine,
|
|
|
|
// hence synthesizable, and therefore there are no MemoryKind::Value READ
|
|
|
|
// accesses to be removed.
|
2016-05-23 22:45:58 +08:00
|
|
|
auto Predicate = [&](MemoryAccess *Acc) {
|
|
|
|
return Acc->getAccessInstruction() == MA->getAccessInstruction();
|
|
|
|
};
|
2017-05-12 06:56:12 +08:00
|
|
|
for (auto *MA : MemAccs) {
|
|
|
|
if (Predicate(MA))
|
|
|
|
removeAccessData(MA);
|
|
|
|
}
|
2016-05-23 22:45:58 +08:00
|
|
|
MemAccs.erase(std::remove_if(MemAccs.begin(), MemAccs.end(), Predicate),
|
|
|
|
MemAccs.end());
|
|
|
|
InstructionToAccess.erase(MA->getAccessInstruction());
|
2015-09-30 07:47:21 +08:00
|
|
|
}
|
|
|
|
|
2017-03-11 00:05:24 +08:00
|
|
|
void ScopStmt::removeSingleMemoryAccess(MemoryAccess *MA) {
|
|
|
|
auto MAIt = std::find(MemAccs.begin(), MemAccs.end(), MA);
|
|
|
|
assert(MAIt != MemAccs.end());
|
|
|
|
MemAccs.erase(MAIt);
|
|
|
|
|
2017-05-12 06:56:12 +08:00
|
|
|
removeAccessData(MA);
|
|
|
|
|
2017-03-11 00:05:24 +08:00
|
|
|
auto It = InstructionToAccess.find(MA->getAccessInstruction());
|
|
|
|
if (It != InstructionToAccess.end()) {
|
|
|
|
It->second.remove(MA);
|
|
|
|
if (It->second.empty())
|
|
|
|
InstructionToAccess.erase(MA->getAccessInstruction());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
/// Scop class implement
|
2011-11-08 23:41:28 +08:00
|
|
|
|
2011-11-17 20:56:10 +08:00
|
|
|
void Scop::setContext(__isl_take isl_set *NewContext) {
|
2011-11-15 19:38:44 +08:00
|
|
|
NewContext = isl_set_align_params(NewContext, isl_set_get_space(Context));
|
|
|
|
isl_set_free(Context);
|
|
|
|
Context = NewContext;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Remap parameter values but keep AddRecs valid wrt. invariant loads.
|
2015-11-04 00:47:58 +08:00
|
|
|
struct SCEVSensitiveParameterRewriter
|
2016-11-27 01:58:40 +08:00
|
|
|
: public SCEVRewriteVisitor<SCEVSensitiveParameterRewriter> {
|
2015-11-04 00:47:58 +08:00
|
|
|
ValueToValueMap &VMap;
|
|
|
|
|
|
|
|
public:
|
|
|
|
SCEVSensitiveParameterRewriter(ValueToValueMap &VMap, ScalarEvolution &SE)
|
2016-11-27 01:58:40 +08:00
|
|
|
: SCEVRewriteVisitor(SE), VMap(VMap) {}
|
2015-11-04 00:47:58 +08:00
|
|
|
|
|
|
|
static const SCEV *rewrite(const SCEV *E, ScalarEvolution &SE,
|
|
|
|
ValueToValueMap &VMap) {
|
|
|
|
SCEVSensitiveParameterRewriter SSPR(VMap, SE);
|
|
|
|
return SSPR.visit(E);
|
|
|
|
}
|
|
|
|
|
|
|
|
const SCEV *visitAddRecExpr(const SCEVAddRecExpr *E) {
|
|
|
|
auto *Start = visit(E->getStart());
|
|
|
|
auto *AddRec = SE.getAddRecExpr(SE.getConstant(E->getType(), 0),
|
|
|
|
visit(E->getStepRecurrence(SE)),
|
|
|
|
E->getLoop(), SCEV::FlagAnyWrap);
|
|
|
|
return SE.getAddExpr(Start, AddRec);
|
|
|
|
}
|
|
|
|
|
|
|
|
const SCEV *visitUnknown(const SCEVUnknown *E) {
|
|
|
|
if (auto *NewValue = VMap.lookup(E->getValue()))
|
|
|
|
return SE.getUnknown(NewValue);
|
|
|
|
return E;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2015-10-18 20:39:19 +08:00
|
|
|
const SCEV *Scop::getRepresentingInvariantLoadSCEV(const SCEV *S) {
|
2015-11-04 00:47:58 +08:00
|
|
|
return SCEVSensitiveParameterRewriter::rewrite(S, *SE, InvEquivClassVMap);
|
2015-10-10 01:12:26 +08:00
|
|
|
}
|
|
|
|
|
2016-04-26 00:15:13 +08:00
|
|
|
void Scop::createParameterId(const SCEV *Parameter) {
|
|
|
|
assert(Parameters.count(Parameter));
|
|
|
|
assert(!ParameterIds.count(Parameter));
|
2011-11-07 20:58:59 +08:00
|
|
|
|
2016-04-26 00:15:13 +08:00
|
|
|
std::string ParameterName = "p_" + std::to_string(getNumParams() - 1);
|
2015-11-17 19:54:51 +08:00
|
|
|
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
if (UseInstructionNames) {
|
|
|
|
if (const SCEVUnknown *ValueParameter = dyn_cast<SCEVUnknown>(Parameter)) {
|
|
|
|
Value *Val = ValueParameter->getValue();
|
|
|
|
|
|
|
|
// If this parameter references a specific Value and this value has a name
|
|
|
|
// we use this name as it is likely to be unique and more useful than just
|
|
|
|
// a number.
|
|
|
|
if (Val->hasName())
|
|
|
|
ParameterName = Val->getName();
|
|
|
|
else if (LoadInst *LI = dyn_cast<LoadInst>(Val)) {
|
|
|
|
auto *LoadOrigin = LI->getPointerOperand()->stripInBoundsOffsets();
|
|
|
|
if (LoadOrigin->hasName()) {
|
|
|
|
ParameterName += "_loaded_from_";
|
|
|
|
ParameterName +=
|
|
|
|
LI->getPointerOperand()->stripInBoundsOffsets()->getName();
|
|
|
|
}
|
2015-11-17 19:54:51 +08:00
|
|
|
}
|
|
|
|
}
|
2011-11-15 19:38:55 +08:00
|
|
|
|
[ScopInfo] Do not use LLVM names to identify statements, arrays, and parameters
LLVM-IR names are commonly available in debug builds, but often not in release
builds. Hence, using LLVM-IR names to identify statements or memory reference
results makes the behavior of Polly depend on the compile mode. This is
undesirable. Hence, we now just number the statements instead of using LLVM-IR
names to identify them (this issue has previously been brought up by Zino
Benaissa).
However, as LLVM-IR names help in making test cases more readable, we add an
option '-polly-use-llvm-names' to still use LLVM-IR names. This flag is by
default set in the polly tests to make test cases more readable.
This change reduces the time in ScopInfo from 32 seconds to 2 seconds for the
following test case provided by Eli Friedman <efriedma@codeaurora.org> (already
used in one of the previous commits):
struct X { int x; };
void a();
#define SIG (int x, X **y, X **z)
typedef void (*fn)SIG;
#define FN { for (int i = 0; i < x; ++i) { (*y)[i].x += (*z)[i].x; } a(); }
#define FN5 FN FN FN FN FN
#define FN25 FN5 FN5 FN5 FN5
#define FN125 FN25 FN25 FN25 FN25 FN25
#define FN250 FN125 FN125
#define FN1250 FN250 FN250 FN250 FN250 FN250
void x SIG { FN1250 }
For a larger benchmark I have on-hand (10000 loops), this reduces the time for
running -polly-scops from 5 minutes to 4 minutes, a reduction by 20%.
The reason for this large speedup is that our previous use of printAsOperand
had a quadratic cost, as for each printed and unnamed operand the full function
was scanned to find the instruction number that identifies the operand.
We do not need to adjust the way memory reference ids are constructured, as
they do not use LLVM values.
Reviewed by: efriedma
Tags: #polly
Differential Revision: https://reviews.llvm.org/D32789
llvm-svn: 302072
2017-05-04 04:08:52 +08:00
|
|
|
ParameterName = getIslCompatibleName("", ParameterName, "");
|
|
|
|
}
|
2016-07-01 21:40:28 +08:00
|
|
|
|
2016-04-26 00:15:13 +08:00
|
|
|
auto *Id = isl_id_alloc(getIslCtx(), ParameterName.c_str(),
|
|
|
|
const_cast<void *>((const void *)Parameter));
|
|
|
|
ParameterIds[Parameter] = Id;
|
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::addParams(const ParameterSetTy &NewParameters) {
|
|
|
|
for (const SCEV *Parameter : NewParameters) {
|
|
|
|
// Normalize the SCEV to get the representing element for an invariant load.
|
|
|
|
Parameter = extractConstantFactor(Parameter, *SE).second;
|
|
|
|
Parameter = getRepresentingInvariantLoadSCEV(Parameter);
|
|
|
|
|
|
|
|
if (Parameters.insert(Parameter))
|
|
|
|
createParameterId(Parameter);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
__isl_give isl_id *Scop::getIdForParam(const SCEV *Parameter) {
|
|
|
|
// Normalize the SCEV to get the representing element for an invariant load.
|
|
|
|
Parameter = getRepresentingInvariantLoadSCEV(Parameter);
|
|
|
|
return isl_id_copy(ParameterIds.lookup(Parameter));
|
2011-11-07 20:58:59 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2016-09-01 17:03:27 +08:00
|
|
|
__isl_give isl_set *
|
|
|
|
Scop::addNonEmptyDomainConstraints(__isl_take isl_set *C) const {
|
2015-08-21 02:06:30 +08:00
|
|
|
isl_set *DomainContext = isl_union_set_params(getDomains());
|
|
|
|
return isl_set_intersect_params(C, DomainContext);
|
|
|
|
}
|
|
|
|
|
2016-05-23 20:43:44 +08:00
|
|
|
bool Scop::isDominatedBy(const DominatorTree &DT, BasicBlock *BB) const {
|
|
|
|
return DT.dominates(BB, getEntry());
|
|
|
|
}
|
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
void Scop::addUserAssumptions(AssumptionCache &AC, DominatorTree &DT,
|
|
|
|
LoopInfo &LI) {
|
2016-05-23 20:38:05 +08:00
|
|
|
auto &F = getFunction();
|
2017-03-17 21:56:53 +08:00
|
|
|
for (auto &Assumption : AC.assumptions()) {
|
|
|
|
auto *CI = dyn_cast_or_null<CallInst>(Assumption);
|
|
|
|
if (!CI || CI->getNumArgOperands() != 1)
|
|
|
|
continue;
|
2016-05-10 22:00:57 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
bool InScop = contains(CI);
|
|
|
|
if (!InScop && !isDominatedBy(DT, CI->getParent()))
|
2015-11-12 11:25:01 +08:00
|
|
|
continue;
|
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
auto *L = LI.getLoopFor(CI->getParent());
|
|
|
|
auto *Val = CI->getArgOperand(0);
|
|
|
|
ParameterSetTy DetectedParams;
|
|
|
|
if (!isAffineConstraint(Val, &R, L, *SE, DetectedParams)) {
|
|
|
|
emitOptimizationRemarkAnalysis(F.getContext(), DEBUG_TYPE, F,
|
|
|
|
CI->getDebugLoc(),
|
|
|
|
"Non-affine user assumption ignored.");
|
|
|
|
continue;
|
|
|
|
}
|
2015-11-12 11:25:01 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
// Collect all newly introduced parameters.
|
|
|
|
ParameterSetTy NewParams;
|
|
|
|
for (auto *Param : DetectedParams) {
|
|
|
|
Param = extractConstantFactor(Param, *SE).second;
|
|
|
|
Param = getRepresentingInvariantLoadSCEV(Param);
|
|
|
|
if (Parameters.count(Param))
|
2016-04-26 02:51:27 +08:00
|
|
|
continue;
|
2017-03-17 21:56:53 +08:00
|
|
|
NewParams.insert(Param);
|
|
|
|
}
|
2016-05-10 21:06:42 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
SmallVector<isl_set *, 2> ConditionSets;
|
|
|
|
auto *TI = InScop ? CI->getParent()->getTerminator() : nullptr;
|
|
|
|
auto &Stmt = InScop ? *getStmtFor(CI->getParent()) : *Stmts.begin();
|
|
|
|
auto *Dom = InScop ? getDomainConditions(&Stmt) : isl_set_copy(Context);
|
|
|
|
bool Valid = buildConditionSets(Stmt, Val, TI, L, Dom, ConditionSets);
|
|
|
|
isl_set_free(Dom);
|
2015-11-12 11:25:01 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
if (!Valid)
|
|
|
|
continue;
|
2016-04-26 02:51:27 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
isl_set *AssumptionCtx = nullptr;
|
|
|
|
if (InScop) {
|
|
|
|
AssumptionCtx = isl_set_complement(isl_set_params(ConditionSets[1]));
|
|
|
|
isl_set_free(ConditionSets[0]);
|
|
|
|
} else {
|
|
|
|
AssumptionCtx = isl_set_complement(ConditionSets[1]);
|
|
|
|
AssumptionCtx = isl_set_intersect(AssumptionCtx, ConditionSets[0]);
|
|
|
|
}
|
2016-04-26 02:51:27 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
// Project out newly introduced parameters as they are not otherwise useful.
|
|
|
|
if (!NewParams.empty()) {
|
|
|
|
for (unsigned u = 0; u < isl_set_n_param(AssumptionCtx); u++) {
|
|
|
|
auto *Id = isl_set_get_dim_id(AssumptionCtx, isl_dim_param, u);
|
|
|
|
auto *Param = static_cast<const SCEV *>(isl_id_get_user(Id));
|
|
|
|
isl_id_free(Id);
|
2016-04-26 02:51:27 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
if (!NewParams.count(Param))
|
|
|
|
continue;
|
2016-12-15 17:25:14 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
AssumptionCtx =
|
|
|
|
isl_set_project_out(AssumptionCtx, isl_dim_param, u--, 1);
|
2016-04-26 02:51:27 +08:00
|
|
|
}
|
2016-12-15 17:25:14 +08:00
|
|
|
}
|
2017-03-17 21:56:53 +08:00
|
|
|
|
|
|
|
emitOptimizationRemarkAnalysis(
|
|
|
|
F.getContext(), DEBUG_TYPE, F, CI->getDebugLoc(),
|
|
|
|
"Use user assumption: " + stringFromIslObj(AssumptionCtx));
|
|
|
|
Context = isl_set_intersect(Context, AssumptionCtx);
|
2015-11-12 11:25:01 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-08-16 18:19:29 +08:00
|
|
|
void Scop::addUserContext() {
|
|
|
|
if (UserContextStr.empty())
|
|
|
|
return;
|
|
|
|
|
2016-02-17 23:49:21 +08:00
|
|
|
isl_set *UserContext =
|
|
|
|
isl_set_read_from_str(getIslCtx(), UserContextStr.c_str());
|
2015-08-16 18:19:29 +08:00
|
|
|
isl_space *Space = getParamSpace();
|
|
|
|
if (isl_space_dim(Space, isl_dim_param) !=
|
|
|
|
isl_set_dim(UserContext, isl_dim_param)) {
|
|
|
|
auto SpaceStr = isl_space_to_str(Space);
|
|
|
|
errs() << "Error: the context provided in -polly-context has not the same "
|
|
|
|
<< "number of dimensions than the computed context. Due to this "
|
|
|
|
<< "mismatch, the -polly-context option is ignored. Please provide "
|
|
|
|
<< "the context in the parameter space: " << SpaceStr << ".\n";
|
|
|
|
free(SpaceStr);
|
|
|
|
isl_set_free(UserContext);
|
|
|
|
isl_space_free(Space);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (unsigned i = 0; i < isl_space_dim(Space, isl_dim_param); i++) {
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *NameContext = isl_set_get_dim_name(Context, isl_dim_param, i);
|
|
|
|
auto *NameUserContext = isl_set_get_dim_name(UserContext, isl_dim_param, i);
|
2015-08-16 18:19:29 +08:00
|
|
|
|
|
|
|
if (strcmp(NameContext, NameUserContext) != 0) {
|
|
|
|
auto SpaceStr = isl_space_to_str(Space);
|
|
|
|
errs() << "Error: the name of dimension " << i
|
|
|
|
<< " provided in -polly-context "
|
|
|
|
<< "is '" << NameUserContext << "', but the name in the computed "
|
|
|
|
<< "context is '" << NameContext
|
|
|
|
<< "'. Due to this name mismatch, "
|
|
|
|
<< "the -polly-context option is ignored. Please provide "
|
|
|
|
<< "the context in the parameter space: " << SpaceStr << ".\n";
|
|
|
|
free(SpaceStr);
|
|
|
|
isl_set_free(UserContext);
|
|
|
|
isl_space_free(Space);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
UserContext =
|
|
|
|
isl_set_set_dim_id(UserContext, isl_dim_param, i,
|
|
|
|
isl_space_get_dim_id(Space, isl_dim_param, i));
|
|
|
|
}
|
|
|
|
|
|
|
|
Context = isl_set_intersect(Context, UserContext);
|
|
|
|
isl_space_free(Space);
|
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
void Scop::buildInvariantEquivalenceClasses() {
|
2016-02-08 01:30:13 +08:00
|
|
|
DenseMap<std::pair<const SCEV *, Type *>, LoadInst *> EquivClasses;
|
2015-10-18 20:39:19 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
const InvariantLoadsSetTy &RIL = getRequiredInvariantLoads();
|
2015-10-10 01:12:26 +08:00
|
|
|
for (LoadInst *LInst : RIL) {
|
|
|
|
const SCEV *PointerSCEV = SE->getSCEV(LInst->getPointerOperand());
|
|
|
|
|
2016-02-08 01:30:13 +08:00
|
|
|
Type *Ty = LInst->getType();
|
|
|
|
LoadInst *&ClassRep = EquivClasses[std::make_pair(PointerSCEV, Ty)];
|
2015-11-11 12:30:07 +08:00
|
|
|
if (ClassRep) {
|
2015-10-18 20:39:19 +08:00
|
|
|
InvEquivClassVMap[LInst] = ClassRep;
|
2015-11-11 12:30:07 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
ClassRep = LInst;
|
2016-07-11 20:15:10 +08:00
|
|
|
InvariantEquivClasses.emplace_back(
|
|
|
|
InvariantEquivClassTy{PointerSCEV, MemoryAccessList(), nullptr, Ty});
|
2015-10-10 01:12:26 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-11-08 23:41:13 +08:00
|
|
|
void Scop::buildContext() {
|
2016-02-17 23:49:21 +08:00
|
|
|
isl_space *Space = isl_space_params_alloc(getIslCtx(), 0);
|
2013-10-30 05:05:49 +08:00
|
|
|
Context = isl_set_universe(isl_space_copy(Space));
|
2016-03-01 21:06:28 +08:00
|
|
|
InvalidContext = isl_set_empty(isl_space_copy(Space));
|
2013-10-30 05:05:49 +08:00
|
|
|
AssumedContext = isl_set_universe(Space);
|
2011-10-06 08:03:48 +08:00
|
|
|
}
|
|
|
|
|
2012-05-22 18:47:27 +08:00
|
|
|
void Scop::addParameterBounds() {
|
2016-04-26 00:15:13 +08:00
|
|
|
unsigned PDim = 0;
|
|
|
|
for (auto *Parameter : Parameters) {
|
|
|
|
ConstantRange SRange = SE->getSignedRange(Parameter);
|
|
|
|
Context = addRangeBoundsToSet(Context, SRange, PDim++, isl_dim_param);
|
2012-05-22 18:47:27 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-11-08 23:41:08 +08:00
|
|
|
void Scop::realignParams() {
|
2017-03-17 21:00:53 +08:00
|
|
|
if (PollyIgnoreParamBounds)
|
|
|
|
return;
|
|
|
|
|
2011-11-08 23:41:13 +08:00
|
|
|
// Add all parameters into a common model.
|
2016-02-17 23:49:21 +08:00
|
|
|
isl_space *Space = isl_space_params_alloc(getIslCtx(), ParameterIds.size());
|
2011-11-08 23:41:13 +08:00
|
|
|
|
2016-04-26 00:15:13 +08:00
|
|
|
unsigned PDim = 0;
|
|
|
|
for (const auto *Parameter : Parameters) {
|
2011-11-08 23:41:13 +08:00
|
|
|
isl_id *id = getIdForParam(Parameter);
|
2016-04-26 00:15:13 +08:00
|
|
|
Space = isl_space_set_dim_id(Space, isl_dim_param, PDim++, id);
|
2011-11-08 23:41:13 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Align the parameters of all data structures to the model.
|
|
|
|
Context = isl_set_align_params(Context, Space);
|
|
|
|
|
2016-05-10 20:18:22 +08:00
|
|
|
// As all parameters are known add bounds to them.
|
|
|
|
addParameterBounds();
|
|
|
|
|
2015-05-27 13:16:57 +08:00
|
|
|
for (ScopStmt &Stmt : *this)
|
|
|
|
Stmt.realignParams();
|
2016-06-02 23:07:41 +08:00
|
|
|
|
|
|
|
// Simplify the schedule according to the context too.
|
|
|
|
Schedule = isl_schedule_gist_domain_params(Schedule, getContext());
|
2011-11-08 23:41:08 +08:00
|
|
|
}
|
|
|
|
|
2015-09-16 06:52:53 +08:00
|
|
|
static __isl_give isl_set *
|
|
|
|
simplifyAssumptionContext(__isl_take isl_set *AssumptionContext,
|
|
|
|
const Scop &S) {
|
2017-01-07 01:30:34 +08:00
|
|
|
// If we have modeled all blocks in the SCoP that have side effects we can
|
|
|
|
// simplify the context with the constraints that are needed for anything to
|
|
|
|
// be executed at all. However, if we have error blocks in the SCoP we already
|
|
|
|
// assumed some parameter combinations cannot occur and removed them from the
|
2015-11-09 04:16:39 +08:00
|
|
|
// domains, thus we cannot use the remaining domain to simplify the
|
|
|
|
// assumptions.
|
|
|
|
if (!S.hasErrorBlock()) {
|
|
|
|
isl_set *DomainParameters = isl_union_set_params(S.getDomains());
|
|
|
|
AssumptionContext =
|
|
|
|
isl_set_gist_params(AssumptionContext, DomainParameters);
|
|
|
|
}
|
|
|
|
|
2015-09-16 06:52:53 +08:00
|
|
|
AssumptionContext = isl_set_gist_params(AssumptionContext, S.getContext());
|
|
|
|
return AssumptionContext;
|
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::simplifyContexts() {
|
2014-07-03 01:47:48 +08:00
|
|
|
// The parameter constraints of the iteration domains give us a set of
|
|
|
|
// constraints that need to hold for all cases where at least a single
|
|
|
|
// statement iteration is executed in the whole scop. We now simplify the
|
|
|
|
// assumed context under the assumption that such constraints hold and at
|
|
|
|
// least a single statement iteration is executed. For cases where no
|
|
|
|
// statement instances are executed, the assumptions we have taken about
|
|
|
|
// the executed code do not matter and can be changed.
|
|
|
|
//
|
|
|
|
// WARNING: This only holds if the assumptions we have taken do not reduce
|
|
|
|
// the set of statement instances that are executed. Otherwise we
|
|
|
|
// may run into a case where the iteration domains suggest that
|
2015-02-25 00:00:29 +08:00
|
|
|
// for a certain set of parameter constraints no code is executed,
|
2014-07-03 01:47:48 +08:00
|
|
|
// but in the original program some computation would have been
|
2015-02-25 00:00:29 +08:00
|
|
|
// performed. In such a case, modifying the run-time conditions and
|
|
|
|
// possibly influencing the run-time check may cause certain scops
|
2014-07-03 01:47:48 +08:00
|
|
|
// to not be executed.
|
|
|
|
//
|
|
|
|
// Example:
|
|
|
|
//
|
|
|
|
// When delinearizing the following code:
|
|
|
|
//
|
|
|
|
// for (long i = 0; i < 100; i++)
|
|
|
|
// for (long j = 0; j < m; j++)
|
|
|
|
// A[i+p][j] = 1.0;
|
|
|
|
//
|
|
|
|
// we assume that the condition m <= 0 or (m >= 1 and p >= 0) holds as
|
2015-02-25 00:00:29 +08:00
|
|
|
// otherwise we would access out of bound data. Now, knowing that code is
|
2014-07-03 01:47:48 +08:00
|
|
|
// only executed for the case m >= 0, it is sufficient to assume p >= 0.
|
2015-09-16 06:52:53 +08:00
|
|
|
AssumedContext = simplifyAssumptionContext(AssumedContext, *this);
|
2016-03-01 21:06:28 +08:00
|
|
|
InvalidContext = isl_set_align_params(InvalidContext, getParamSpace());
|
2014-07-03 01:47:48 +08:00
|
|
|
}
|
|
|
|
|
2017-05-19 11:45:00 +08:00
|
|
|
struct MinMaxData {
|
|
|
|
Scop::MinMaxVectorTy &MinMaxAccesses;
|
|
|
|
Scop &S;
|
|
|
|
};
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Add the minimal/maximal access in @p Set to @p User.
|
2015-05-28 21:32:11 +08:00
|
|
|
static isl_stat buildMinMaxAccess(__isl_take isl_set *Set, void *User) {
|
2017-05-19 11:45:00 +08:00
|
|
|
auto Data = (struct MinMaxData *)User;
|
|
|
|
Scop::MinMaxVectorTy *MinMaxAccesses = &Data->MinMaxAccesses;
|
2014-09-18 19:17:17 +08:00
|
|
|
isl_pw_multi_aff *MinPMA, *MaxPMA;
|
|
|
|
isl_pw_aff *LastDimAff;
|
|
|
|
isl_aff *OneAff;
|
|
|
|
unsigned Pos;
|
2017-05-19 11:45:00 +08:00
|
|
|
isl_ctx *Ctx = isl_set_get_ctx(Set);
|
2014-09-18 19:17:17 +08:00
|
|
|
|
2016-04-22 19:38:19 +08:00
|
|
|
Set = isl_set_remove_divs(Set);
|
|
|
|
|
2017-02-17 03:11:33 +08:00
|
|
|
if (isl_set_n_basic_set(Set) >= MaxDisjunctsInDomain) {
|
2016-04-22 19:38:19 +08:00
|
|
|
isl_set_free(Set);
|
|
|
|
return isl_stat_error;
|
|
|
|
}
|
|
|
|
|
2014-09-27 19:02:39 +08:00
|
|
|
// Restrict the number of parameters involved in the access as the lexmin/
|
|
|
|
// lexmax computation will take too long if this number is high.
|
|
|
|
//
|
|
|
|
// Experiments with a simple test case using an i7 4800MQ:
|
|
|
|
//
|
|
|
|
// #Parameters involved | Time (in sec)
|
|
|
|
// 6 | 0.01
|
|
|
|
// 7 | 0.04
|
|
|
|
// 8 | 0.12
|
|
|
|
// 9 | 0.40
|
|
|
|
// 10 | 1.54
|
|
|
|
// 11 | 6.78
|
|
|
|
// 12 | 30.38
|
|
|
|
//
|
|
|
|
if (isl_set_n_param(Set) > RunTimeChecksMaxParameters) {
|
|
|
|
unsigned InvolvedParams = 0;
|
|
|
|
for (unsigned u = 0, e = isl_set_n_param(Set); u < e; u++)
|
|
|
|
if (isl_set_involves_dims(Set, isl_dim_param, u, 1))
|
|
|
|
InvolvedParams++;
|
|
|
|
|
|
|
|
if (InvolvedParams > RunTimeChecksMaxParameters) {
|
|
|
|
isl_set_free(Set);
|
2015-05-28 21:32:11 +08:00
|
|
|
return isl_stat_error;
|
2014-09-27 19:02:39 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-05-19 11:45:00 +08:00
|
|
|
{
|
|
|
|
IslMaxOperationsGuard MaxOpGuard(isl_set_get_ctx(Set), OptComputeOut);
|
|
|
|
MinPMA = isl_set_lexmin_pw_multi_aff(isl_set_copy(Set));
|
|
|
|
MaxPMA = isl_set_lexmax_pw_multi_aff(isl_set_copy(Set));
|
|
|
|
}
|
|
|
|
|
|
|
|
if (isl_ctx_last_error(Ctx) == isl_error_quota) {
|
|
|
|
MinPMA = isl_pw_multi_aff_free(MinPMA);
|
|
|
|
MaxPMA = isl_pw_multi_aff_free(MaxPMA);
|
|
|
|
Set = isl_set_free(Set);
|
|
|
|
Data->S.invalidate(COMPLEXITY, DebugLoc());
|
|
|
|
return isl_stat_error;
|
|
|
|
}
|
2014-09-18 19:17:17 +08:00
|
|
|
|
2014-10-07 22:37:59 +08:00
|
|
|
MinPMA = isl_pw_multi_aff_coalesce(MinPMA);
|
|
|
|
MaxPMA = isl_pw_multi_aff_coalesce(MaxPMA);
|
|
|
|
|
2014-09-18 19:17:17 +08:00
|
|
|
// Adjust the last dimension of the maximal access by one as we want to
|
|
|
|
// enclose the accessed memory region by MinPMA and MaxPMA. The pointer
|
|
|
|
// we test during code generation might now point after the end of the
|
|
|
|
// allocated array but we will never dereference it anyway.
|
|
|
|
assert(isl_pw_multi_aff_dim(MaxPMA, isl_dim_out) &&
|
|
|
|
"Assumed at least one output dimension");
|
|
|
|
Pos = isl_pw_multi_aff_dim(MaxPMA, isl_dim_out) - 1;
|
|
|
|
LastDimAff = isl_pw_multi_aff_get_pw_aff(MaxPMA, Pos);
|
|
|
|
OneAff = isl_aff_zero_on_domain(
|
|
|
|
isl_local_space_from_space(isl_pw_aff_get_domain_space(LastDimAff)));
|
|
|
|
OneAff = isl_aff_add_constant_si(OneAff, 1);
|
|
|
|
LastDimAff = isl_pw_aff_add(LastDimAff, isl_pw_aff_from_aff(OneAff));
|
|
|
|
MaxPMA = isl_pw_multi_aff_set_pw_aff(MaxPMA, Pos, LastDimAff);
|
|
|
|
|
|
|
|
MinMaxAccesses->push_back(std::make_pair(MinPMA, MaxPMA));
|
|
|
|
|
|
|
|
isl_set_free(Set);
|
2015-05-28 21:32:11 +08:00
|
|
|
return isl_stat_ok;
|
2014-09-18 19:17:17 +08:00
|
|
|
}
|
|
|
|
|
2014-10-01 20:42:37 +08:00
|
|
|
static __isl_give isl_set *getAccessDomain(MemoryAccess *MA) {
|
|
|
|
isl_set *Domain = MA->getStatement()->getDomain();
|
|
|
|
Domain = isl_set_project_out(Domain, isl_dim_set, 0, isl_set_n_dim(Domain));
|
|
|
|
return isl_set_reset_tuple_id(Domain);
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Wrapper function to calculate minimal/maximal accesses to each array.
|
2017-01-16 23:49:04 +08:00
|
|
|
static bool calculateMinMaxAccess(Scop::AliasGroupTy AliasGroup, Scop &S,
|
2015-07-26 21:14:38 +08:00
|
|
|
Scop::MinMaxVectorTy &MinMaxAccesses) {
|
2015-07-24 01:04:54 +08:00
|
|
|
|
2017-05-19 11:45:00 +08:00
|
|
|
struct MinMaxData Data = {MinMaxAccesses, S};
|
|
|
|
Data.MinMaxAccesses.reserve(AliasGroup.size());
|
2017-01-16 23:49:04 +08:00
|
|
|
|
|
|
|
isl_union_set *Domains = S.getDomains();
|
|
|
|
isl_union_map *Accesses = isl_union_map_empty(S.getParamSpace());
|
|
|
|
|
|
|
|
for (MemoryAccess *MA : AliasGroup)
|
|
|
|
Accesses = isl_union_map_add_map(Accesses, MA->getAccessRelation());
|
|
|
|
|
2015-07-24 01:04:54 +08:00
|
|
|
Accesses = isl_union_map_intersect_domain(Accesses, Domains);
|
|
|
|
isl_union_set *Locations = isl_union_map_range(Accesses);
|
|
|
|
Locations = isl_union_set_coalesce(Locations);
|
|
|
|
Locations = isl_union_set_detect_equalities(Locations);
|
2017-05-19 11:45:00 +08:00
|
|
|
bool Valid =
|
|
|
|
(0 == isl_union_set_foreach_set(Locations, buildMinMaxAccess, &Data));
|
2015-07-24 01:04:54 +08:00
|
|
|
isl_union_set_free(Locations);
|
|
|
|
return Valid;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Helper to treat non-affine regions and basic blocks the same.
|
2015-08-31 05:13:53 +08:00
|
|
|
///
|
|
|
|
///{
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Return the block that is the representing block for @p RN.
|
2015-08-31 05:13:53 +08:00
|
|
|
static inline BasicBlock *getRegionNodeBasicBlock(RegionNode *RN) {
|
|
|
|
return RN->isSubRegion() ? RN->getNodeAs<Region>()->getEntry()
|
|
|
|
: RN->getNodeAs<BasicBlock>();
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Return the @p idx'th block that is executed after @p RN.
|
2015-09-28 17:33:22 +08:00
|
|
|
static inline BasicBlock *
|
|
|
|
getRegionNodeSuccessor(RegionNode *RN, TerminatorInst *TI, unsigned idx) {
|
2015-08-31 05:13:53 +08:00
|
|
|
if (RN->isSubRegion()) {
|
|
|
|
assert(idx == 0);
|
|
|
|
return RN->getNodeAs<Region>()->getExit();
|
|
|
|
}
|
2015-09-28 17:33:22 +08:00
|
|
|
return TI->getSuccessor(idx);
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Return the smallest loop surrounding @p RN.
|
2015-08-31 05:13:53 +08:00
|
|
|
static inline Loop *getRegionNodeLoop(RegionNode *RN, LoopInfo &LI) {
|
2017-03-08 00:17:55 +08:00
|
|
|
if (!RN->isSubRegion()) {
|
|
|
|
BasicBlock *BB = RN->getNodeAs<BasicBlock>();
|
|
|
|
Loop *L = LI.getLoopFor(BB);
|
|
|
|
|
|
|
|
// Unreachable statements are not considered to belong to a LLVM loop, as
|
|
|
|
// they are not part of an actual loop in the control flow graph.
|
|
|
|
// Nevertheless, we handle certain unreachable statements that are common
|
|
|
|
// when modeling run-time bounds checks as being part of the loop to be
|
|
|
|
// able to model them and to later eliminate the run-time bounds checks.
|
|
|
|
//
|
|
|
|
// Specifically, for basic blocks that terminate in an unreachable and
|
|
|
|
// where the immeditate predecessor is part of a loop, we assume these
|
|
|
|
// basic blocks belong to the loop the predecessor belongs to. This
|
|
|
|
// allows us to model the following code.
|
|
|
|
//
|
|
|
|
// for (i = 0; i < N; i++) {
|
|
|
|
// if (i > 1024)
|
|
|
|
// abort(); <- this abort might be translated to an
|
|
|
|
// unreachable
|
|
|
|
//
|
|
|
|
// A[i] = ...
|
|
|
|
// }
|
|
|
|
if (!L && isa<UnreachableInst>(BB->getTerminator()) && BB->getPrevNode())
|
|
|
|
L = LI.getLoopFor(BB->getPrevNode());
|
|
|
|
return L;
|
|
|
|
}
|
2015-08-31 05:13:53 +08:00
|
|
|
|
|
|
|
Region *NonAffineSubRegion = RN->getNodeAs<Region>();
|
|
|
|
Loop *L = LI.getLoopFor(NonAffineSubRegion->getEntry());
|
|
|
|
while (L && NonAffineSubRegion->contains(L))
|
|
|
|
L = L->getParentLoop();
|
|
|
|
return L;
|
|
|
|
}
|
|
|
|
|
2017-03-08 00:17:55 +08:00
|
|
|
/// Get the number of blocks in @p L.
|
|
|
|
///
|
|
|
|
/// The number of blocks in a loop are the number of basic blocks actually
|
|
|
|
/// belonging to the loop, as well as all single basic blocks that the loop
|
|
|
|
/// exits to and which terminate in an unreachable instruction. We do not
|
|
|
|
/// allow such basic blocks in the exit of a scop, hence they belong to the
|
|
|
|
/// scop and represent run-time conditions which we want to model and
|
|
|
|
/// subsequently speculate away.
|
|
|
|
///
|
|
|
|
/// @see getRegionNodeLoop for additional details.
|
|
|
|
long getNumBlocksInLoop(Loop *L) {
|
|
|
|
long NumBlocks = L->getNumBlocks();
|
|
|
|
SmallVector<llvm::BasicBlock *, 4> ExitBlocks;
|
|
|
|
L->getExitBlocks(ExitBlocks);
|
|
|
|
|
|
|
|
for (auto ExitBlock : ExitBlocks) {
|
|
|
|
if (isa<UnreachableInst>(ExitBlock->getTerminator()))
|
|
|
|
NumBlocks++;
|
|
|
|
}
|
|
|
|
return NumBlocks;
|
|
|
|
}
|
|
|
|
|
2015-09-10 23:27:46 +08:00
|
|
|
static inline unsigned getNumBlocksInRegionNode(RegionNode *RN) {
|
|
|
|
if (!RN->isSubRegion())
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
Region *R = RN->getNodeAs<Region>();
|
2016-02-01 09:55:08 +08:00
|
|
|
return std::distance(R->block_begin(), R->block_end());
|
2015-09-10 23:27:46 +08:00
|
|
|
}
|
|
|
|
|
2015-10-08 04:32:43 +08:00
|
|
|
static bool containsErrorBlock(RegionNode *RN, const Region &R, LoopInfo &LI,
|
|
|
|
const DominatorTree &DT) {
|
2015-10-02 07:48:18 +08:00
|
|
|
if (!RN->isSubRegion())
|
2015-10-08 04:32:43 +08:00
|
|
|
return isErrorBlock(*RN->getNodeAs<BasicBlock>(), R, LI, DT);
|
2015-10-02 07:48:18 +08:00
|
|
|
for (BasicBlock *BB : RN->getNodeAs<Region>()->blocks())
|
2015-10-08 04:32:43 +08:00
|
|
|
if (isErrorBlock(*BB, R, LI, DT))
|
2015-10-02 07:48:18 +08:00
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2015-08-31 05:13:53 +08:00
|
|
|
///}
|
|
|
|
|
2015-09-10 23:27:46 +08:00
|
|
|
static inline __isl_give isl_set *addDomainDimId(__isl_take isl_set *Domain,
|
|
|
|
unsigned Dim, Loop *L) {
|
2016-03-29 15:50:52 +08:00
|
|
|
Domain = isl_set_lower_bound_si(Domain, isl_dim_set, Dim, -1);
|
2015-09-10 23:27:46 +08:00
|
|
|
isl_id *DimId =
|
|
|
|
isl_id_alloc(isl_set_get_ctx(Domain), nullptr, static_cast<void *>(L));
|
|
|
|
return isl_set_set_dim_id(Domain, isl_dim_set, Dim, DimId);
|
|
|
|
}
|
|
|
|
|
2016-04-19 22:48:22 +08:00
|
|
|
__isl_give isl_set *Scop::getDomainConditions(const ScopStmt *Stmt) const {
|
2016-02-25 06:08:24 +08:00
|
|
|
return getDomainConditions(Stmt->getEntryBlock());
|
2015-09-16 06:49:04 +08:00
|
|
|
}
|
|
|
|
|
2016-04-19 22:48:22 +08:00
|
|
|
__isl_give isl_set *Scop::getDomainConditions(BasicBlock *BB) const {
|
2016-04-08 18:32:26 +08:00
|
|
|
auto DIt = DomainMap.find(BB);
|
|
|
|
if (DIt != DomainMap.end())
|
|
|
|
return isl_set_copy(DIt->getSecond());
|
|
|
|
|
|
|
|
auto &RI = *R.getRegionInfo();
|
|
|
|
auto *BBR = RI.getRegionFor(BB);
|
|
|
|
while (BBR->getEntry() == BB)
|
|
|
|
BBR = BBR->getParent();
|
|
|
|
return getDomainConditions(BBR->getEntry());
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
bool Scop::buildDomains(Region *R, DominatorTree &DT, LoopInfo &LI) {
|
2015-08-31 05:13:53 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
bool IsOnlyNonAffineRegion = isNonAffineSubRegion(R);
|
2015-08-31 21:56:32 +08:00
|
|
|
auto *EntryBB = R->getEntry();
|
2016-01-26 19:01:41 +08:00
|
|
|
auto *L = IsOnlyNonAffineRegion ? nullptr : LI.getLoopFor(EntryBB);
|
|
|
|
int LD = getRelativeLoopDepth(L);
|
2015-08-31 21:56:32 +08:00
|
|
|
auto *S = isl_set_universe(isl_space_set_alloc(getIslCtx(), 0, LD + 1));
|
2015-09-10 23:27:46 +08:00
|
|
|
|
|
|
|
while (LD-- >= 0) {
|
|
|
|
S = addDomainDimId(S, LD + 1, L);
|
|
|
|
L = L->getParentLoop();
|
|
|
|
}
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
// Initialize the invalid domain.
|
|
|
|
auto *EntryStmt = getStmtFor(EntryBB);
|
|
|
|
EntryStmt->setInvalidDomain(isl_set_empty(isl_set_get_space(S)));
|
|
|
|
|
2015-08-31 21:56:32 +08:00
|
|
|
DomainMap[EntryBB] = S;
|
2015-08-31 05:13:53 +08:00
|
|
|
|
2016-01-26 19:01:41 +08:00
|
|
|
if (IsOnlyNonAffineRegion)
|
2016-05-10 20:19:47 +08:00
|
|
|
return !containsErrorBlock(R->getNode(), *R, LI, DT);
|
2016-03-30 04:02:05 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!buildDomainsWithBranchConstraints(R, DT, LI))
|
2016-03-30 04:02:05 +08:00
|
|
|
return false;
|
2015-09-14 19:15:07 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!propagateDomainConstraints(R, DT, LI))
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2015-11-22 19:06:51 +08:00
|
|
|
|
|
|
|
// Error blocks and blocks dominated by them have been assumed to never be
|
|
|
|
// executed. Representing them in the Scop does not add any value. In fact,
|
|
|
|
// it is likely to cause issues during construction of the ScopStmts. The
|
2016-04-08 18:30:09 +08:00
|
|
|
// contents of error blocks have not been verified to be expressible and
|
2015-11-22 19:06:51 +08:00
|
|
|
// will cause problems when building up a ScopStmt for them.
|
|
|
|
// Furthermore, basic blocks dominated by error blocks may reference
|
|
|
|
// instructions in the error block which, if the error block is not modeled,
|
2016-04-08 18:30:09 +08:00
|
|
|
// can themselves not be constructed properly. To this end we will replace
|
|
|
|
// the domains of error blocks and those only reachable via error blocks
|
|
|
|
// with an empty set. Additionally, we will record for each block under which
|
2016-04-12 17:57:34 +08:00
|
|
|
// parameter combination it would be reached via an error block in its
|
2016-04-23 21:02:23 +08:00
|
|
|
// InvalidDomain. This information is needed during load hoisting.
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!propagateInvalidStmtDomains(R, DT, LI))
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2016-04-08 18:30:09 +08:00
|
|
|
|
2016-03-30 04:02:05 +08:00
|
|
|
return true;
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Adjust the dimensions of @p Dom that was constructed for @p OldL
|
2016-04-04 15:50:40 +08:00
|
|
|
/// to be compatible to domains constructed for loop @p NewL.
|
|
|
|
///
|
|
|
|
/// This function assumes @p NewL and @p OldL are equal or there is a CFG
|
|
|
|
/// edge from @p OldL to @p NewL.
|
|
|
|
static __isl_give isl_set *adjustDomainDimensions(Scop &S,
|
|
|
|
__isl_take isl_set *Dom,
|
|
|
|
Loop *OldL, Loop *NewL) {
|
|
|
|
|
|
|
|
// If the loops are the same there is nothing to do.
|
|
|
|
if (NewL == OldL)
|
|
|
|
return Dom;
|
|
|
|
|
|
|
|
int OldDepth = S.getRelativeLoopDepth(OldL);
|
|
|
|
int NewDepth = S.getRelativeLoopDepth(NewL);
|
|
|
|
// If both loops are non-affine loops there is nothing to do.
|
|
|
|
if (OldDepth == -1 && NewDepth == -1)
|
|
|
|
return Dom;
|
|
|
|
|
|
|
|
// Distinguish three cases:
|
|
|
|
// 1) The depth is the same but the loops are not.
|
|
|
|
// => One loop was left one was entered.
|
|
|
|
// 2) The depth increased from OldL to NewL.
|
|
|
|
// => One loop was entered, none was left.
|
|
|
|
// 3) The depth decreased from OldL to NewL.
|
|
|
|
// => Loops were left were difference of the depths defines how many.
|
|
|
|
if (OldDepth == NewDepth) {
|
|
|
|
assert(OldL->getParentLoop() == NewL->getParentLoop());
|
|
|
|
Dom = isl_set_project_out(Dom, isl_dim_set, NewDepth, 1);
|
|
|
|
Dom = isl_set_add_dims(Dom, isl_dim_set, 1);
|
|
|
|
Dom = addDomainDimId(Dom, NewDepth, NewL);
|
|
|
|
} else if (OldDepth < NewDepth) {
|
|
|
|
assert(OldDepth + 1 == NewDepth);
|
|
|
|
auto &R = S.getRegion();
|
|
|
|
(void)R;
|
|
|
|
assert(NewL->getParentLoop() == OldL ||
|
|
|
|
((!OldL || !R.contains(OldL)) && R.contains(NewL)));
|
|
|
|
Dom = isl_set_add_dims(Dom, isl_dim_set, 1);
|
|
|
|
Dom = addDomainDimId(Dom, NewDepth, NewL);
|
|
|
|
} else {
|
|
|
|
assert(OldDepth > NewDepth);
|
|
|
|
int Diff = OldDepth - NewDepth;
|
|
|
|
int NumDim = isl_set_n_dim(Dom);
|
|
|
|
assert(NumDim >= Diff);
|
|
|
|
Dom = isl_set_project_out(Dom, isl_dim_set, NumDim - Diff, Diff);
|
|
|
|
}
|
|
|
|
|
|
|
|
return Dom;
|
|
|
|
}
|
2016-04-04 15:57:39 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
bool Scop::propagateInvalidStmtDomains(Region *R, DominatorTree &DT,
|
|
|
|
LoopInfo &LI) {
|
2016-04-08 18:30:09 +08:00
|
|
|
ReversePostOrderTraversal<Region *> RTraversal(R);
|
|
|
|
for (auto *RN : RTraversal) {
|
|
|
|
|
|
|
|
// Recurse for affine subregions but go on for basic blocks and non-affine
|
|
|
|
// subregions.
|
|
|
|
if (RN->isSubRegion()) {
|
|
|
|
Region *SubRegion = RN->getNodeAs<Region>();
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!isNonAffineSubRegion(SubRegion)) {
|
|
|
|
propagateInvalidStmtDomains(SubRegion, DT, LI);
|
2016-04-08 18:30:09 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
bool ContainsErrorBlock = containsErrorBlock(RN, getRegion(), LI, DT);
|
|
|
|
BasicBlock *BB = getRegionNodeBasicBlock(RN);
|
2016-04-12 17:57:34 +08:00
|
|
|
ScopStmt *Stmt = getStmtFor(BB);
|
2016-04-08 18:30:09 +08:00
|
|
|
isl_set *&Domain = DomainMap[BB];
|
|
|
|
assert(Domain && "Cannot propagate a nullptr");
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
auto *InvalidDomain = Stmt->getInvalidDomain();
|
2016-04-12 17:57:34 +08:00
|
|
|
bool IsInvalidBlock =
|
2016-04-23 21:02:23 +08:00
|
|
|
ContainsErrorBlock || isl_set_is_subset(Domain, InvalidDomain);
|
2016-04-08 18:30:09 +08:00
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
if (!IsInvalidBlock) {
|
|
|
|
InvalidDomain = isl_set_intersect(InvalidDomain, isl_set_copy(Domain));
|
2016-04-08 18:30:09 +08:00
|
|
|
} else {
|
2016-04-23 21:02:23 +08:00
|
|
|
isl_set_free(InvalidDomain);
|
|
|
|
InvalidDomain = Domain;
|
2016-05-10 20:42:26 +08:00
|
|
|
isl_set *DomPar = isl_set_params(isl_set_copy(Domain));
|
|
|
|
recordAssumption(ERRORBLOCK, DomPar, BB->getTerminator()->getDebugLoc(),
|
|
|
|
AS_RESTRICTION);
|
|
|
|
Domain = nullptr;
|
2016-04-08 18:30:09 +08:00
|
|
|
}
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
if (isl_set_is_empty(InvalidDomain)) {
|
2016-04-23 22:31:17 +08:00
|
|
|
Stmt->setInvalidDomain(InvalidDomain);
|
2016-04-08 18:30:09 +08:00
|
|
|
continue;
|
2016-04-12 17:57:34 +08:00
|
|
|
}
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
auto *BBLoop = getRegionNodeLoop(RN, LI);
|
2016-04-08 18:30:09 +08:00
|
|
|
auto *TI = BB->getTerminator();
|
|
|
|
unsigned NumSuccs = RN->isSubRegion() ? 1 : TI->getNumSuccessors();
|
|
|
|
for (unsigned u = 0; u < NumSuccs; u++) {
|
|
|
|
auto *SuccBB = getRegionNodeSuccessor(RN, TI, u);
|
2016-04-12 17:57:34 +08:00
|
|
|
auto *SuccStmt = getStmtFor(SuccBB);
|
|
|
|
|
|
|
|
// Skip successors outside the SCoP.
|
|
|
|
if (!SuccStmt)
|
|
|
|
continue;
|
|
|
|
|
2016-04-25 21:34:50 +08:00
|
|
|
// Skip backedges.
|
|
|
|
if (DT.dominates(SuccBB, BB))
|
|
|
|
continue;
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
auto *SuccBBLoop = SuccStmt->getSurroundingLoop();
|
2016-04-23 21:02:23 +08:00
|
|
|
auto *AdjustedInvalidDomain = adjustDomainDimensions(
|
|
|
|
*this, isl_set_copy(InvalidDomain), BBLoop, SuccBBLoop);
|
|
|
|
auto *SuccInvalidDomain = SuccStmt->getInvalidDomain();
|
|
|
|
SuccInvalidDomain =
|
|
|
|
isl_set_union(SuccInvalidDomain, AdjustedInvalidDomain);
|
|
|
|
SuccInvalidDomain = isl_set_coalesce(SuccInvalidDomain);
|
|
|
|
unsigned NumConjucts = isl_set_n_basic_set(SuccInvalidDomain);
|
|
|
|
SuccStmt->setInvalidDomain(SuccInvalidDomain);
|
2016-04-08 18:30:09 +08:00
|
|
|
|
2016-05-02 20:25:18 +08:00
|
|
|
// Check if the maximal number of domain disjunctions was reached.
|
2016-04-08 18:30:09 +08:00
|
|
|
// In case this happens we will bail.
|
2017-02-17 03:11:33 +08:00
|
|
|
if (NumConjucts < MaxDisjunctsInDomain)
|
2016-04-08 18:30:09 +08:00
|
|
|
continue;
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
isl_set_free(InvalidDomain);
|
2016-04-08 18:30:09 +08:00
|
|
|
invalidate(COMPLEXITY, TI->getDebugLoc());
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2016-04-08 18:30:09 +08:00
|
|
|
}
|
2016-04-23 21:02:23 +08:00
|
|
|
|
|
|
|
Stmt->setInvalidDomain(InvalidDomain);
|
2016-04-08 18:30:09 +08:00
|
|
|
}
|
2016-05-10 21:06:42 +08:00
|
|
|
|
|
|
|
return true;
|
2016-04-08 18:30:09 +08:00
|
|
|
}
|
|
|
|
|
2016-04-04 15:57:39 +08:00
|
|
|
void Scop::propagateDomainConstraintsToRegionExit(
|
|
|
|
BasicBlock *BB, Loop *BBLoop,
|
2016-05-19 20:34:57 +08:00
|
|
|
SmallPtrSetImpl<BasicBlock *> &FinishedExitBlocks, LoopInfo &LI) {
|
2016-04-04 15:57:39 +08:00
|
|
|
|
|
|
|
// Check if the block @p BB is the entry of a region. If so we propagate it's
|
|
|
|
// domain to the exit block of the region. Otherwise we are done.
|
|
|
|
auto *RI = R.getRegionInfo();
|
|
|
|
auto *BBReg = RI ? RI->getRegionFor(BB) : nullptr;
|
|
|
|
auto *ExitBB = BBReg ? BBReg->getExit() : nullptr;
|
2016-05-23 20:40:48 +08:00
|
|
|
if (!BBReg || BBReg->getEntry() != BB || !contains(ExitBB))
|
2016-04-04 15:57:39 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
// Do not propagate the domain if there is a loop backedge inside the region
|
2017-01-07 01:30:34 +08:00
|
|
|
// that would prevent the exit block from being executed.
|
2016-04-04 15:57:39 +08:00
|
|
|
auto *L = BBLoop;
|
2016-05-23 20:40:48 +08:00
|
|
|
while (L && contains(L)) {
|
2016-04-04 15:57:39 +08:00
|
|
|
SmallVector<BasicBlock *, 4> LatchBBs;
|
|
|
|
BBLoop->getLoopLatches(LatchBBs);
|
|
|
|
for (auto *LatchBB : LatchBBs)
|
|
|
|
if (BB != LatchBB && BBReg->contains(LatchBB))
|
|
|
|
return;
|
|
|
|
L = L->getParentLoop();
|
|
|
|
}
|
|
|
|
|
|
|
|
auto *Domain = DomainMap[BB];
|
|
|
|
assert(Domain && "Cannot propagate a nullptr");
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
auto *ExitStmt = getStmtFor(ExitBB);
|
|
|
|
auto *ExitBBLoop = ExitStmt->getSurroundingLoop();
|
2016-04-04 15:57:39 +08:00
|
|
|
|
|
|
|
// Since the dimensions of @p BB and @p ExitBB might be different we have to
|
|
|
|
// adjust the domain before we can propagate it.
|
|
|
|
auto *AdjustedDomain =
|
|
|
|
adjustDomainDimensions(*this, isl_set_copy(Domain), BBLoop, ExitBBLoop);
|
|
|
|
auto *&ExitDomain = DomainMap[ExitBB];
|
|
|
|
|
|
|
|
// If the exit domain is not yet created we set it otherwise we "add" the
|
|
|
|
// current domain.
|
|
|
|
ExitDomain =
|
|
|
|
ExitDomain ? isl_set_union(AdjustedDomain, ExitDomain) : AdjustedDomain;
|
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
// Initialize the invalid domain.
|
|
|
|
ExitStmt->setInvalidDomain(isl_set_empty(isl_set_get_space(ExitDomain)));
|
|
|
|
|
2016-04-04 15:57:39 +08:00
|
|
|
FinishedExitBlocks.insert(ExitBB);
|
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
bool Scop::buildDomainsWithBranchConstraints(Region *R, DominatorTree &DT,
|
|
|
|
LoopInfo &LI) {
|
2015-08-31 05:13:53 +08:00
|
|
|
// To create the domain for each block in R we iterate over all blocks and
|
|
|
|
// subregions in R and propagate the conditions under which the current region
|
|
|
|
// element is executed. To this end we iterate in reverse post order over R as
|
|
|
|
// it ensures that we first visit all predecessors of a region node (either a
|
|
|
|
// basic block or a subregion) before we visit the region node itself.
|
|
|
|
// Initially, only the domain for the SCoP region entry block is set and from
|
|
|
|
// there we propagate the current domain to all successors, however we add the
|
|
|
|
// condition that the successor is actually executed next.
|
|
|
|
// As we are only interested in non-loop carried constraints here we can
|
|
|
|
// simply skip loop back edges.
|
|
|
|
|
2016-04-04 15:57:39 +08:00
|
|
|
SmallPtrSet<BasicBlock *, 8> FinishedExitBlocks;
|
2015-08-31 05:13:53 +08:00
|
|
|
ReversePostOrderTraversal<Region *> RTraversal(R);
|
|
|
|
for (auto *RN : RTraversal) {
|
|
|
|
|
|
|
|
// Recurse for affine subregions but go on for basic blocks and non-affine
|
|
|
|
// subregions.
|
|
|
|
if (RN->isSubRegion()) {
|
|
|
|
Region *SubRegion = RN->getNodeAs<Region>();
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!isNonAffineSubRegion(SubRegion)) {
|
|
|
|
if (!buildDomainsWithBranchConstraints(SubRegion, DT, LI))
|
2016-03-30 04:02:05 +08:00
|
|
|
return false;
|
2015-08-31 05:13:53 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-11-11 16:42:20 +08:00
|
|
|
if (containsErrorBlock(RN, getRegion(), LI, DT))
|
2015-11-09 04:16:39 +08:00
|
|
|
HasErrorBlock = true;
|
2015-10-02 07:48:18 +08:00
|
|
|
|
2015-08-31 05:13:53 +08:00
|
|
|
BasicBlock *BB = getRegionNodeBasicBlock(RN);
|
2015-09-11 01:51:27 +08:00
|
|
|
TerminatorInst *TI = BB->getTerminator();
|
|
|
|
|
2015-11-11 16:42:20 +08:00
|
|
|
if (isa<UnreachableInst>(TI))
|
|
|
|
continue;
|
|
|
|
|
2015-10-02 07:48:18 +08:00
|
|
|
isl_set *Domain = DomainMap.lookup(BB);
|
2016-02-27 14:59:30 +08:00
|
|
|
if (!Domain)
|
2015-09-11 01:51:27 +08:00
|
|
|
continue;
|
2016-05-19 20:33:14 +08:00
|
|
|
MaxLoopDepth = std::max(MaxLoopDepth, isl_set_n_dim(Domain));
|
2015-08-31 05:13:53 +08:00
|
|
|
|
2016-04-04 15:57:39 +08:00
|
|
|
auto *BBLoop = getRegionNodeLoop(RN, LI);
|
|
|
|
// Propagate the domain from BB directly to blocks that have a superset
|
|
|
|
// domain, at the moment only region exit nodes of regions that start in BB.
|
2016-05-19 20:34:57 +08:00
|
|
|
propagateDomainConstraintsToRegionExit(BB, BBLoop, FinishedExitBlocks, LI);
|
2016-04-04 15:57:39 +08:00
|
|
|
|
|
|
|
// If all successors of BB have been set a domain through the propagation
|
|
|
|
// above we do not need to build condition sets but can just skip this
|
|
|
|
// block. However, it is important to note that this is a local property
|
|
|
|
// with regards to the region @p R. To this end FinishedExitBlocks is a
|
|
|
|
// local variable.
|
|
|
|
auto IsFinishedRegionExit = [&FinishedExitBlocks](BasicBlock *SuccBB) {
|
|
|
|
return FinishedExitBlocks.count(SuccBB);
|
|
|
|
};
|
|
|
|
if (std::all_of(succ_begin(BB), succ_end(BB), IsFinishedRegionExit))
|
|
|
|
continue;
|
2015-08-31 05:13:53 +08:00
|
|
|
|
|
|
|
// Build the condition sets for the successor nodes of the current region
|
|
|
|
// node. If it is a non-affine subregion we will always execute the single
|
|
|
|
// exit node, hence the single entry node domain is the condition set. For
|
|
|
|
// basic blocks we use the helper function buildConditionSets.
|
2015-09-28 17:33:22 +08:00
|
|
|
SmallVector<isl_set *, 8> ConditionSets;
|
2015-08-31 05:13:53 +08:00
|
|
|
if (RN->isSubRegion())
|
|
|
|
ConditionSets.push_back(isl_set_copy(Domain));
|
2016-05-10 21:06:42 +08:00
|
|
|
else if (!buildConditionSets(*getStmtFor(BB), TI, BBLoop, Domain,
|
|
|
|
ConditionSets))
|
|
|
|
return false;
|
2015-08-31 05:13:53 +08:00
|
|
|
|
|
|
|
// Now iterate over the successors and set their initial domain based on
|
|
|
|
// their condition set. We skip back edges here and have to be careful when
|
|
|
|
// we leave a loop not to keep constraints over a dimension that doesn't
|
|
|
|
// exist anymore.
|
2015-09-28 17:33:22 +08:00
|
|
|
assert(RN->isSubRegion() || TI->getNumSuccessors() == ConditionSets.size());
|
2015-08-31 05:13:53 +08:00
|
|
|
for (unsigned u = 0, e = ConditionSets.size(); u < e; u++) {
|
|
|
|
isl_set *CondSet = ConditionSets[u];
|
2015-09-28 17:33:22 +08:00
|
|
|
BasicBlock *SuccBB = getRegionNodeSuccessor(RN, TI, u);
|
2015-08-31 05:13:53 +08:00
|
|
|
|
2016-04-19 22:49:05 +08:00
|
|
|
auto *SuccStmt = getStmtFor(SuccBB);
|
|
|
|
// Skip blocks outside the region.
|
|
|
|
if (!SuccStmt) {
|
|
|
|
isl_set_free(CondSet);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-04-04 15:57:39 +08:00
|
|
|
// If we propagate the domain of some block to "SuccBB" we do not have to
|
|
|
|
// adjust the domain.
|
|
|
|
if (FinishedExitBlocks.count(SuccBB)) {
|
|
|
|
isl_set_free(CondSet);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2015-08-31 05:13:53 +08:00
|
|
|
// Skip back edges.
|
|
|
|
if (DT.dominates(SuccBB, BB)) {
|
|
|
|
isl_set_free(CondSet);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
auto *SuccBBLoop = SuccStmt->getSurroundingLoop();
|
2016-04-04 15:50:40 +08:00
|
|
|
CondSet = adjustDomainDimensions(*this, CondSet, BBLoop, SuccBBLoop);
|
2015-08-31 05:13:53 +08:00
|
|
|
|
|
|
|
// Set the domain for the successor or merge it with an existing domain in
|
|
|
|
// case there are multiple paths (without loop back edges) to the
|
|
|
|
// successor block.
|
|
|
|
isl_set *&SuccDomain = DomainMap[SuccBB];
|
2016-03-23 06:05:32 +08:00
|
|
|
|
2016-04-23 21:02:23 +08:00
|
|
|
if (SuccDomain) {
|
2016-03-30 04:02:05 +08:00
|
|
|
SuccDomain = isl_set_coalesce(isl_set_union(SuccDomain, CondSet));
|
2016-04-23 21:02:23 +08:00
|
|
|
} else {
|
|
|
|
// Initialize the invalid domain.
|
|
|
|
SuccStmt->setInvalidDomain(isl_set_empty(isl_set_get_space(CondSet)));
|
|
|
|
SuccDomain = CondSet;
|
|
|
|
}
|
2016-03-30 04:02:05 +08:00
|
|
|
|
2016-05-02 20:25:18 +08:00
|
|
|
// Check if the maximal number of domain disjunctions was reached.
|
2016-03-30 04:02:05 +08:00
|
|
|
// In case this happens we will clean up and bail.
|
2017-02-17 03:11:33 +08:00
|
|
|
if (isl_set_n_basic_set(SuccDomain) < MaxDisjunctsInDomain)
|
2016-03-30 04:02:05 +08:00
|
|
|
continue;
|
|
|
|
|
|
|
|
invalidate(COMPLEXITY, DebugLoc());
|
|
|
|
while (++u < ConditionSets.size())
|
|
|
|
isl_set_free(ConditionSets[u]);
|
|
|
|
return false;
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
}
|
2016-03-30 04:02:05 +08:00
|
|
|
|
|
|
|
return true;
|
2015-08-31 05:13:53 +08:00
|
|
|
}
|
|
|
|
|
2016-09-01 17:03:27 +08:00
|
|
|
__isl_give isl_set *
|
|
|
|
Scop::getPredecessorDomainConstraints(BasicBlock *BB,
|
|
|
|
__isl_keep isl_set *Domain,
|
|
|
|
DominatorTree &DT, LoopInfo &LI) {
|
2016-04-04 15:57:39 +08:00
|
|
|
// If @p BB is the ScopEntry we are done
|
|
|
|
if (R.getEntry() == BB)
|
|
|
|
return isl_set_universe(isl_set_get_space(Domain));
|
|
|
|
|
|
|
|
// The region info of this function.
|
|
|
|
auto &RI = *R.getRegionInfo();
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
auto *BBLoop = getStmtFor(BB)->getSurroundingLoop();
|
2016-04-04 15:57:39 +08:00
|
|
|
|
|
|
|
// A domain to collect all predecessor domains, thus all conditions under
|
|
|
|
// which the block is executed. To this end we start with the empty domain.
|
|
|
|
isl_set *PredDom = isl_set_empty(isl_set_get_space(Domain));
|
|
|
|
|
|
|
|
// Set of regions of which the entry block domain has been propagated to BB.
|
|
|
|
// all predecessors inside any of the regions can be skipped.
|
|
|
|
SmallSet<Region *, 8> PropagatedRegions;
|
|
|
|
|
|
|
|
for (auto *PredBB : predecessors(BB)) {
|
|
|
|
// Skip backedges.
|
|
|
|
if (DT.dominates(BB, PredBB))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
// If the predecessor is in a region we used for propagation we can skip it.
|
|
|
|
auto PredBBInRegion = [PredBB](Region *PR) { return PR->contains(PredBB); };
|
|
|
|
if (std::any_of(PropagatedRegions.begin(), PropagatedRegions.end(),
|
|
|
|
PredBBInRegion)) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check if there is a valid region we can use for propagation, thus look
|
|
|
|
// for a region that contains the predecessor and has @p BB as exit block.
|
|
|
|
auto *PredR = RI.getRegionFor(PredBB);
|
|
|
|
while (PredR->getExit() != BB && !PredR->contains(BB))
|
|
|
|
PredR->getParent();
|
|
|
|
|
|
|
|
// If a valid region for propagation was found use the entry of that region
|
|
|
|
// for propagation, otherwise the PredBB directly.
|
|
|
|
if (PredR->getExit() == BB) {
|
|
|
|
PredBB = PredR->getEntry();
|
|
|
|
PropagatedRegions.insert(PredR);
|
|
|
|
}
|
|
|
|
|
2016-04-08 18:32:26 +08:00
|
|
|
auto *PredBBDom = getDomainConditions(PredBB);
|
2017-03-16 06:16:43 +08:00
|
|
|
auto *PredBBLoop = getStmtFor(PredBB)->getSurroundingLoop();
|
2016-04-04 15:57:39 +08:00
|
|
|
PredBBDom = adjustDomainDimensions(*this, PredBBDom, PredBBLoop, BBLoop);
|
|
|
|
|
|
|
|
PredDom = isl_set_union(PredDom, PredBBDom);
|
|
|
|
}
|
|
|
|
|
|
|
|
return PredDom;
|
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
bool Scop::propagateDomainConstraints(Region *R, DominatorTree &DT,
|
|
|
|
LoopInfo &LI) {
|
2015-09-10 21:00:06 +08:00
|
|
|
// Iterate over the region R and propagate the domain constrains from the
|
|
|
|
// predecessors to the current node. In contrast to the
|
|
|
|
// buildDomainsWithBranchConstraints function, this one will pull the domain
|
|
|
|
// information from the predecessors instead of pushing it to the successors.
|
|
|
|
// Additionally, we assume the domains to be already present in the domain
|
|
|
|
// map here. However, we iterate again in reverse post order so we know all
|
|
|
|
// predecessors have been visited before a block or non-affine subregion is
|
|
|
|
// visited.
|
|
|
|
|
|
|
|
ReversePostOrderTraversal<Region *> RTraversal(R);
|
|
|
|
for (auto *RN : RTraversal) {
|
|
|
|
|
|
|
|
// Recurse for affine subregions but go on for basic blocks and non-affine
|
|
|
|
// subregions.
|
|
|
|
if (RN->isSubRegion()) {
|
|
|
|
Region *SubRegion = RN->getNodeAs<Region>();
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!isNonAffineSubRegion(SubRegion)) {
|
|
|
|
if (!propagateDomainConstraints(SubRegion, DT, LI))
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2015-09-10 21:00:06 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
BasicBlock *BB = getRegionNodeBasicBlock(RN);
|
2015-10-02 07:48:18 +08:00
|
|
|
isl_set *&Domain = DomainMap[BB];
|
2016-04-06 00:18:53 +08:00
|
|
|
assert(Domain);
|
2015-10-02 07:48:18 +08:00
|
|
|
|
2015-09-10 21:00:06 +08:00
|
|
|
// Under the union of all predecessor conditions we can reach this block.
|
2016-05-19 20:34:57 +08:00
|
|
|
auto *PredDom = getPredecessorDomainConstraints(BB, Domain, DT, LI);
|
2015-09-16 06:11:49 +08:00
|
|
|
Domain = isl_set_coalesce(isl_set_intersect(Domain, PredDom));
|
2016-04-04 15:57:39 +08:00
|
|
|
Domain = isl_set_align_params(Domain, getParamSpace());
|
2015-09-11 01:51:27 +08:00
|
|
|
|
2016-04-04 15:57:39 +08:00
|
|
|
Loop *BBLoop = getRegionNodeLoop(RN, LI);
|
2016-05-23 20:40:48 +08:00
|
|
|
if (BBLoop && BBLoop->getHeader() == BB && contains(BBLoop))
|
2016-05-10 21:06:42 +08:00
|
|
|
if (!addLoopBoundsToHeaderDomain(BBLoop, LI))
|
|
|
|
return false;
|
2015-09-10 21:00:06 +08:00
|
|
|
}
|
2016-05-10 21:06:42 +08:00
|
|
|
|
|
|
|
return true;
|
2015-09-10 21:00:06 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Create a map to map from a given iteration to a subsequent iteration.
|
|
|
|
///
|
|
|
|
/// This map maps from SetSpace -> SetSpace where the dimensions @p Dim
|
|
|
|
/// is incremented by one and all other dimensions are equal, e.g.,
|
2015-09-10 21:00:06 +08:00
|
|
|
/// [i0, i1, i2, i3] -> [i0, i1, i2 + 1, i3]
|
2016-09-02 14:33:33 +08:00
|
|
|
///
|
|
|
|
/// if @p Dim is 2 and @p SetSpace has 4 dimensions.
|
2015-09-10 21:00:06 +08:00
|
|
|
static __isl_give isl_map *
|
|
|
|
createNextIterationMap(__isl_take isl_space *SetSpace, unsigned Dim) {
|
|
|
|
auto *MapSpace = isl_space_map_from_set(SetSpace);
|
|
|
|
auto *NextIterationMap = isl_map_universe(isl_space_copy(MapSpace));
|
2017-03-17 05:33:20 +08:00
|
|
|
for (unsigned u = 0; u < isl_map_dim(NextIterationMap, isl_dim_in); u++)
|
2015-09-10 21:00:06 +08:00
|
|
|
if (u != Dim)
|
|
|
|
NextIterationMap =
|
|
|
|
isl_map_equate(NextIterationMap, isl_dim_in, u, isl_dim_out, u);
|
|
|
|
auto *C = isl_constraint_alloc_equality(isl_local_space_from_space(MapSpace));
|
|
|
|
C = isl_constraint_set_constant_si(C, 1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_in, Dim, 1);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_out, Dim, -1);
|
|
|
|
NextIterationMap = isl_map_add_constraint(NextIterationMap, C);
|
|
|
|
return NextIterationMap;
|
|
|
|
}
|
|
|
|
|
2016-05-10 21:06:42 +08:00
|
|
|
bool Scop::addLoopBoundsToHeaderDomain(Loop *L, LoopInfo &LI) {
|
2015-09-21 00:15:32 +08:00
|
|
|
int LoopDepth = getRelativeLoopDepth(L);
|
|
|
|
assert(LoopDepth >= 0 && "Loop in region should have at least depth one");
|
2015-09-10 21:00:06 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
BasicBlock *HeaderBB = L->getHeader();
|
|
|
|
assert(DomainMap.count(HeaderBB));
|
|
|
|
isl_set *&HeaderBBDom = DomainMap[HeaderBB];
|
2015-09-10 21:00:06 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
isl_map *NextIterationMap =
|
|
|
|
createNextIterationMap(isl_set_get_space(HeaderBBDom), LoopDepth);
|
2015-09-10 21:00:06 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
isl_set *UnionBackedgeCondition =
|
|
|
|
isl_set_empty(isl_set_get_space(HeaderBBDom));
|
2015-09-10 21:00:06 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
SmallVector<llvm::BasicBlock *, 4> LatchBlocks;
|
|
|
|
L->getLoopLatches(LatchBlocks);
|
2015-09-10 21:00:06 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
for (BasicBlock *LatchBB : LatchBlocks) {
|
2015-10-02 07:48:18 +08:00
|
|
|
|
|
|
|
// If the latch is only reachable via error statements we skip it.
|
|
|
|
isl_set *LatchBBDom = DomainMap.lookup(LatchBB);
|
|
|
|
if (!LatchBBDom)
|
|
|
|
continue;
|
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
isl_set *BackedgeCondition = nullptr;
|
|
|
|
|
2015-09-28 17:33:22 +08:00
|
|
|
TerminatorInst *TI = LatchBB->getTerminator();
|
|
|
|
BranchInst *BI = dyn_cast<BranchInst>(TI);
|
2016-11-10 13:20:29 +08:00
|
|
|
assert(BI && "Only branch instructions allowed in loop latches");
|
|
|
|
|
|
|
|
if (BI->isUnconditional())
|
2015-09-21 00:15:32 +08:00
|
|
|
BackedgeCondition = isl_set_copy(LatchBBDom);
|
|
|
|
else {
|
2015-09-28 17:33:22 +08:00
|
|
|
SmallVector<isl_set *, 8> ConditionSets;
|
2015-09-21 00:15:32 +08:00
|
|
|
int idx = BI->getSuccessor(0) != HeaderBB;
|
2016-05-10 21:06:42 +08:00
|
|
|
if (!buildConditionSets(*getStmtFor(LatchBB), TI, L, LatchBBDom,
|
2016-11-03 23:19:41 +08:00
|
|
|
ConditionSets)) {
|
|
|
|
isl_map_free(NextIterationMap);
|
|
|
|
isl_set_free(UnionBackedgeCondition);
|
2016-05-10 21:06:42 +08:00
|
|
|
return false;
|
2016-11-03 23:19:41 +08:00
|
|
|
}
|
2015-09-20 23:00:20 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
// Free the non back edge condition set as we do not need it.
|
|
|
|
isl_set_free(ConditionSets[1 - idx]);
|
|
|
|
|
|
|
|
BackedgeCondition = ConditionSets[idx];
|
2015-09-20 23:00:20 +08:00
|
|
|
}
|
2015-09-10 21:00:06 +08:00
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
int LatchLoopDepth = getRelativeLoopDepth(LI.getLoopFor(LatchBB));
|
|
|
|
assert(LatchLoopDepth >= LoopDepth);
|
|
|
|
BackedgeCondition =
|
|
|
|
isl_set_project_out(BackedgeCondition, isl_dim_set, LoopDepth + 1,
|
|
|
|
LatchLoopDepth - LoopDepth);
|
|
|
|
UnionBackedgeCondition =
|
|
|
|
isl_set_union(UnionBackedgeCondition, BackedgeCondition);
|
2015-09-10 21:00:06 +08:00
|
|
|
}
|
2015-09-21 00:15:32 +08:00
|
|
|
|
|
|
|
isl_map *ForwardMap = isl_map_lex_le(isl_set_get_space(HeaderBBDom));
|
|
|
|
for (int i = 0; i < LoopDepth; i++)
|
|
|
|
ForwardMap = isl_map_equate(ForwardMap, isl_dim_in, i, isl_dim_out, i);
|
|
|
|
|
|
|
|
isl_set *UnionBackedgeConditionComplement =
|
|
|
|
isl_set_complement(UnionBackedgeCondition);
|
|
|
|
UnionBackedgeConditionComplement = isl_set_lower_bound_si(
|
|
|
|
UnionBackedgeConditionComplement, isl_dim_set, LoopDepth, 0);
|
|
|
|
UnionBackedgeConditionComplement =
|
|
|
|
isl_set_apply(UnionBackedgeConditionComplement, ForwardMap);
|
|
|
|
HeaderBBDom = isl_set_subtract(HeaderBBDom, UnionBackedgeConditionComplement);
|
|
|
|
HeaderBBDom = isl_set_apply(HeaderBBDom, NextIterationMap);
|
|
|
|
|
|
|
|
auto Parts = partitionSetParts(HeaderBBDom, LoopDepth);
|
|
|
|
HeaderBBDom = Parts.second;
|
|
|
|
|
2015-09-21 00:59:23 +08:00
|
|
|
// Check if there is a <nsw> tagged AddRec for this loop and if so do not add
|
|
|
|
// the bounded assumptions to the context as they are already implied by the
|
|
|
|
// <nsw> tag.
|
|
|
|
if (Affinator.hasNSWAddRecForLoop(L)) {
|
|
|
|
isl_set_free(Parts.first);
|
2016-05-10 21:06:42 +08:00
|
|
|
return true;
|
2015-09-21 00:59:23 +08:00
|
|
|
}
|
|
|
|
|
2015-09-21 00:15:32 +08:00
|
|
|
isl_set *UnboundedCtx = isl_set_params(Parts.first);
|
2016-04-12 21:27:35 +08:00
|
|
|
recordAssumption(INFINITELOOP, UnboundedCtx,
|
|
|
|
HeaderBB->getTerminator()->getDebugLoc(), AS_RESTRICTION);
|
2016-05-10 21:06:42 +08:00
|
|
|
return true;
|
2015-09-10 21:00:06 +08:00
|
|
|
}
|
|
|
|
|
2016-05-23 17:26:46 +08:00
|
|
|
MemoryAccess *Scop::lookupBasePtrAccess(MemoryAccess *MA) {
|
2017-02-09 18:11:58 +08:00
|
|
|
Value *PointerBase = MA->getOriginalBaseAddr();
|
2016-05-23 17:26:46 +08:00
|
|
|
|
2017-02-09 17:34:46 +08:00
|
|
|
auto *PointerBaseInst = dyn_cast<Instruction>(PointerBase);
|
2016-05-23 17:26:46 +08:00
|
|
|
if (!PointerBaseInst)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
auto *BasePtrStmt = getStmtFor(PointerBaseInst);
|
|
|
|
if (!BasePtrStmt)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
return BasePtrStmt->getArrayAccessOrNULLFor(PointerBaseInst);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool Scop::hasNonHoistableBasePtrInScop(MemoryAccess *MA,
|
|
|
|
__isl_keep isl_union_map *Writes) {
|
2016-05-23 18:40:54 +08:00
|
|
|
if (auto *BasePtrMA = lookupBasePtrAccess(MA)) {
|
|
|
|
auto *NHCtx = getNonHoistableCtx(BasePtrMA, Writes);
|
|
|
|
bool Hoistable = NHCtx != nullptr;
|
|
|
|
isl_set_free(NHCtx);
|
|
|
|
return !Hoistable;
|
|
|
|
}
|
2016-05-23 17:26:46 +08:00
|
|
|
|
2017-02-09 18:11:58 +08:00
|
|
|
Value *BaseAddr = MA->getOriginalBaseAddr();
|
2017-02-09 17:34:46 +08:00
|
|
|
if (auto *BasePtrInst = dyn_cast<Instruction>(BaseAddr))
|
2016-05-23 17:26:46 +08:00
|
|
|
if (!isa<LoadInst>(BasePtrInst))
|
2016-05-23 20:40:48 +08:00
|
|
|
return contains(BasePtrInst);
|
2016-05-23 17:26:46 +08:00
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-06-02 19:06:54 +08:00
|
|
|
bool Scop::buildAliasChecks(AliasAnalysis &AA) {
|
2015-08-21 02:30:08 +08:00
|
|
|
if (!PollyUseRuntimeAliasChecks)
|
2016-06-02 19:06:54 +08:00
|
|
|
return true;
|
2015-08-21 02:30:08 +08:00
|
|
|
|
2016-11-18 05:41:08 +08:00
|
|
|
if (buildAliasGroups(AA)) {
|
|
|
|
// Aliasing assumptions do not go through addAssumption but we still want to
|
|
|
|
// collect statistics so we do it here explicitly.
|
|
|
|
if (MinMaxAliasGroups.size())
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsAliasing++;
|
2016-06-02 19:06:54 +08:00
|
|
|
return true;
|
2016-11-18 05:41:08 +08:00
|
|
|
}
|
2015-08-21 02:30:08 +08:00
|
|
|
|
|
|
|
// If a problem occurs while building the alias groups we need to delete
|
|
|
|
// this SCoP and pretend it wasn't valid in the first place. To this end
|
|
|
|
// we make the assumed context infeasible.
|
2015-12-12 17:52:26 +08:00
|
|
|
invalidate(ALIASING, DebugLoc());
|
2015-08-21 02:30:08 +08:00
|
|
|
|
|
|
|
DEBUG(dbgs() << "\n\nNOTE: Run time checks for " << getNameStr()
|
|
|
|
<< " could not be created as the number of parameters involved "
|
|
|
|
"is too high. The SCoP will be "
|
|
|
|
"dismissed.\nUse:\n\t--polly-rtc-max-parameters=X\nto adjust "
|
|
|
|
"the maximal number of parameters but be advised that the "
|
|
|
|
"compile time might increase exponentially.\n\n");
|
2016-06-02 19:06:54 +08:00
|
|
|
return false;
|
2015-08-21 02:30:08 +08:00
|
|
|
}
|
|
|
|
|
2017-02-10 07:12:22 +08:00
|
|
|
std::tuple<Scop::AliasGroupVectorTy, DenseSet<const ScopArrayInfo *>>
|
2017-01-16 22:07:57 +08:00
|
|
|
Scop::buildAliasGroupsForAccesses(AliasAnalysis &AA) {
|
2014-09-18 19:17:17 +08:00
|
|
|
AliasSetTracker AST(AA);
|
|
|
|
|
|
|
|
DenseMap<Value *, MemoryAccess *> PtrToAcc;
|
2017-02-10 07:12:22 +08:00
|
|
|
DenseSet<const ScopArrayInfo *> HasWriteAccess;
|
2015-05-27 13:16:57 +08:00
|
|
|
for (ScopStmt &Stmt : *this) {
|
2014-10-07 01:43:00 +08:00
|
|
|
|
2015-05-27 13:16:57 +08:00
|
|
|
isl_set *StmtDomain = Stmt.getDomain();
|
2014-10-07 01:43:00 +08:00
|
|
|
bool StmtDomainEmpty = isl_set_is_empty(StmtDomain);
|
|
|
|
isl_set_free(StmtDomain);
|
2017-01-16 22:07:57 +08:00
|
|
|
|
|
|
|
// Statements with an empty domain will never be executed.
|
2014-10-07 01:43:00 +08:00
|
|
|
if (StmtDomainEmpty)
|
|
|
|
continue;
|
|
|
|
|
2015-05-27 13:16:57 +08:00
|
|
|
for (MemoryAccess *MA : Stmt) {
|
ScopInfo: Harmonize the different array kinds
Over time different vocabulary has been introduced to describe the different
memory objects in Polly, resulting in different - often inconsistent - naming
schemes in different parts of Polly. We now standartize this to the following
scheme:
KindArray, KindValue, KindPHI, KindExitPHI
| ------- isScalar -----------|
In most cases this naming scheme has already been used previously (this
minimizes changes and ensures we remain consistent with previous publications).
The main change is that we remove KindScalar to clearify the difference between
a scalar as a memory object of kind Value, PHI or ExitPHI and a value (former
KindScalar) which is a memory object modeling a llvm::Value.
We also move all documentation to the Kind* enum in the ScopArrayInfo class,
remove the second enum in the MemoryAccess class and update documentation to be
formulated from the perspective of the memory object, rather than the memory
access. The terms "Implicit"/"Explicit", formerly used to describe memory
accesses, have been dropped. From the perspective of memory accesses they
described the different memory kinds well - especially from the perspective of
code generation - but just from the perspective of a memory object it seems more
straightforward to talk about scalars and arrays, rather than explicit and
implicit arrays. The last comment is clearly subjective, though. A less
subjective reason to go for these terms is the historic use both in mailing list
discussions and publications.
llvm-svn: 255467
2015-12-14 03:59:01 +08:00
|
|
|
if (MA->isScalarKind())
|
2014-09-18 19:17:17 +08:00
|
|
|
continue;
|
2014-10-01 20:40:46 +08:00
|
|
|
if (!MA->isRead())
|
2017-02-10 07:12:22 +08:00
|
|
|
HasWriteAccess.insert(MA->getScopArrayInfo());
|
2016-01-28 01:09:17 +08:00
|
|
|
MemAccInst Acc(MA->getAccessInstruction());
|
2016-02-27 09:49:58 +08:00
|
|
|
if (MA->isRead() && isa<MemTransferInst>(Acc))
|
2016-10-25 21:37:43 +08:00
|
|
|
PtrToAcc[cast<MemTransferInst>(Acc)->getRawSource()] = MA;
|
2016-02-22 03:13:19 +08:00
|
|
|
else
|
|
|
|
PtrToAcc[Acc.getPointerOperand()] = MA;
|
2014-09-18 19:17:17 +08:00
|
|
|
AST.add(Acc);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-01-16 22:07:57 +08:00
|
|
|
AliasGroupVectorTy AliasGroups;
|
2014-09-18 19:17:17 +08:00
|
|
|
for (AliasSet &AS : AST) {
|
2014-10-08 10:23:48 +08:00
|
|
|
if (AS.isMustAlias() || AS.isForwardingAliasSet())
|
2014-09-18 19:17:17 +08:00
|
|
|
continue;
|
|
|
|
AliasGroupTy AG;
|
2016-02-22 00:37:25 +08:00
|
|
|
for (auto &PR : AS)
|
2014-09-18 19:17:17 +08:00
|
|
|
AG.push_back(PtrToAcc[PR.getValue()]);
|
2016-02-22 03:13:19 +08:00
|
|
|
if (AG.size() < 2)
|
|
|
|
continue;
|
2014-09-18 19:17:17 +08:00
|
|
|
AliasGroups.push_back(std::move(AG));
|
|
|
|
}
|
|
|
|
|
2017-01-16 22:07:57 +08:00
|
|
|
return std::make_tuple(AliasGroups, HasWriteAccess);
|
|
|
|
}
|
|
|
|
|
2017-01-16 22:08:00 +08:00
|
|
|
void Scop::splitAliasGroupsByDomain(AliasGroupVectorTy &AliasGroups) {
|
2014-10-01 20:42:37 +08:00
|
|
|
for (unsigned u = 0; u < AliasGroups.size(); u++) {
|
|
|
|
AliasGroupTy NewAG;
|
|
|
|
AliasGroupTy &AG = AliasGroups[u];
|
|
|
|
AliasGroupTy::iterator AGI = AG.begin();
|
|
|
|
isl_set *AGDomain = getAccessDomain(*AGI);
|
|
|
|
while (AGI != AG.end()) {
|
|
|
|
MemoryAccess *MA = *AGI;
|
|
|
|
isl_set *MADomain = getAccessDomain(MA);
|
|
|
|
if (isl_set_is_disjoint(AGDomain, MADomain)) {
|
|
|
|
NewAG.push_back(MA);
|
|
|
|
AGI = AG.erase(AGI);
|
|
|
|
isl_set_free(MADomain);
|
|
|
|
} else {
|
|
|
|
AGDomain = isl_set_union(AGDomain, MADomain);
|
|
|
|
AGI++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (NewAG.size() > 1)
|
|
|
|
AliasGroups.push_back(std::move(NewAG));
|
|
|
|
isl_set_free(AGDomain);
|
|
|
|
}
|
2017-01-16 22:08:00 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
bool Scop::buildAliasGroups(AliasAnalysis &AA) {
|
|
|
|
// To create sound alias checks we perform the following steps:
|
|
|
|
// o) We partition each group into read only and non read only accesses.
|
|
|
|
// o) For each group with more than one base pointer we then compute minimal
|
|
|
|
// and maximal accesses to each array of a group in read only and non
|
|
|
|
// read only partitions separately.
|
|
|
|
AliasGroupVectorTy AliasGroups;
|
2017-02-10 07:12:22 +08:00
|
|
|
DenseSet<const ScopArrayInfo *> HasWriteAccess;
|
2017-01-16 22:08:00 +08:00
|
|
|
|
|
|
|
std::tie(AliasGroups, HasWriteAccess) = buildAliasGroupsForAccesses(AA);
|
|
|
|
|
|
|
|
splitAliasGroupsByDomain(AliasGroups);
|
2014-10-01 20:42:37 +08:00
|
|
|
|
2014-10-01 20:40:46 +08:00
|
|
|
for (AliasGroupTy &AG : AliasGroups) {
|
2017-01-16 23:49:07 +08:00
|
|
|
bool Valid = buildAliasGroup(AG, HasWriteAccess);
|
|
|
|
if (!Valid)
|
|
|
|
return false;
|
|
|
|
}
|
2014-10-01 20:40:46 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
return true;
|
|
|
|
}
|
2014-10-01 20:42:37 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
bool Scop::buildAliasGroup(Scop::AliasGroupTy &AliasGroup,
|
2017-02-10 07:12:22 +08:00
|
|
|
DenseSet<const ScopArrayInfo *> HasWriteAccess) {
|
2017-01-16 23:49:07 +08:00
|
|
|
AliasGroupTy ReadOnlyAccesses;
|
|
|
|
AliasGroupTy ReadWriteAccesses;
|
2017-02-10 07:12:22 +08:00
|
|
|
SmallPtrSet<const ScopArrayInfo *, 4> ReadWriteArrays;
|
2017-02-19 04:51:29 +08:00
|
|
|
SmallPtrSet<const ScopArrayInfo *, 4> ReadOnlyArrays;
|
2014-10-01 20:40:46 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
auto &F = getFunction();
|
2014-10-01 20:40:46 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
if (AliasGroup.size() < 2)
|
|
|
|
return true;
|
2014-10-01 20:40:46 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
for (MemoryAccess *Access : AliasGroup) {
|
|
|
|
emitOptimizationRemarkAnalysis(
|
|
|
|
F.getContext(), DEBUG_TYPE, F,
|
|
|
|
Access->getAccessInstruction()->getDebugLoc(),
|
|
|
|
"Possibly aliasing pointer, use restrict keyword.");
|
|
|
|
|
2017-02-10 07:12:22 +08:00
|
|
|
const ScopArrayInfo *Array = Access->getScopArrayInfo();
|
|
|
|
if (HasWriteAccess.count(Array)) {
|
|
|
|
ReadWriteArrays.insert(Array);
|
2017-01-16 23:49:07 +08:00
|
|
|
ReadWriteAccesses.push_back(Access);
|
|
|
|
} else {
|
2017-02-19 04:51:29 +08:00
|
|
|
ReadOnlyArrays.insert(Array);
|
2017-01-16 23:49:07 +08:00
|
|
|
ReadOnlyAccesses.push_back(Access);
|
2016-05-23 17:26:46 +08:00
|
|
|
}
|
2017-01-16 23:49:07 +08:00
|
|
|
}
|
2016-02-25 22:06:11 +08:00
|
|
|
|
2017-01-16 23:49:09 +08:00
|
|
|
// If there are no read-only pointers, and less than two read-write pointers,
|
|
|
|
// no alias check is needed.
|
2017-02-10 07:12:22 +08:00
|
|
|
if (ReadOnlyAccesses.empty() && ReadWriteArrays.size() <= 1)
|
2017-01-16 23:49:07 +08:00
|
|
|
return true;
|
2015-07-24 01:04:54 +08:00
|
|
|
|
2017-01-16 23:49:09 +08:00
|
|
|
// If there is no read-write pointer, no alias check is needed.
|
2017-02-10 07:12:22 +08:00
|
|
|
if (ReadWriteArrays.empty())
|
2017-01-16 23:49:07 +08:00
|
|
|
return true;
|
2014-09-18 19:17:17 +08:00
|
|
|
|
2017-01-16 23:49:09 +08:00
|
|
|
// For non-affine accesses, no alias check can be generated as we cannot
|
|
|
|
// compute a sufficiently tight lower and upper bound: bail out.
|
2017-01-16 23:49:07 +08:00
|
|
|
for (MemoryAccess *MA : AliasGroup) {
|
|
|
|
if (!MA->isAffine()) {
|
|
|
|
invalidate(ALIASING, MA->getAccessInstruction()->getDebugLoc());
|
2017-01-16 23:49:04 +08:00
|
|
|
return false;
|
2017-01-16 23:49:07 +08:00
|
|
|
}
|
2017-01-16 23:49:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Ensure that for all memory accesses for which we generate alias checks,
|
|
|
|
// their base pointers are available.
|
|
|
|
for (MemoryAccess *MA : AliasGroup) {
|
2017-01-16 23:49:07 +08:00
|
|
|
if (MemoryAccess *BasePtrMA = lookupBasePtrAccess(MA))
|
|
|
|
addRequiredInvariantLoad(
|
|
|
|
cast<LoadInst>(BasePtrMA->getAccessInstruction()));
|
|
|
|
}
|
2015-07-24 01:04:54 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
MinMaxAliasGroups.emplace_back();
|
|
|
|
MinMaxVectorPairTy &pair = MinMaxAliasGroups.back();
|
|
|
|
MinMaxVectorTy &MinMaxAccessesReadWrite = pair.first;
|
|
|
|
MinMaxVectorTy &MinMaxAccessesReadOnly = pair.second;
|
2015-07-24 01:04:54 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
bool Valid;
|
2014-09-27 19:02:39 +08:00
|
|
|
|
2017-01-16 23:49:07 +08:00
|
|
|
Valid =
|
|
|
|
calculateMinMaxAccess(ReadWriteAccesses, *this, MinMaxAccessesReadWrite);
|
|
|
|
|
|
|
|
if (!Valid)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
// Bail out if the number of values we need to compare is too large.
|
|
|
|
// This is important as the number of comparisons grows quadratically with
|
|
|
|
// the number of values we need to compare.
|
2017-02-19 04:51:29 +08:00
|
|
|
if (MinMaxAccessesReadWrite.size() + ReadOnlyArrays.size() >
|
2017-01-16 23:49:07 +08:00
|
|
|
RunTimeChecksMaxArraysPerGroup)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
Valid =
|
|
|
|
calculateMinMaxAccess(ReadOnlyAccesses, *this, MinMaxAccessesReadOnly);
|
|
|
|
|
|
|
|
if (!Valid)
|
|
|
|
return false;
|
2014-09-27 19:02:39 +08:00
|
|
|
|
2015-03-28 22:50:32 +08:00
|
|
|
return true;
|
2014-09-18 19:17:17 +08:00
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Get the smallest loop that contains @p S but is not in @p S.
|
2016-05-23 20:42:38 +08:00
|
|
|
static Loop *getLoopSurroundingScop(Scop &S, LoopInfo &LI) {
|
2015-11-22 00:56:13 +08:00
|
|
|
// Start with the smallest loop containing the entry and expand that
|
|
|
|
// loop until it contains all blocks in the region. If there is a loop
|
|
|
|
// containing all blocks in the region check if it is itself contained
|
|
|
|
// and if so take the parent loop as it will be the smallest containing
|
|
|
|
// the region but not contained by it.
|
2016-05-23 20:42:38 +08:00
|
|
|
Loop *L = LI.getLoopFor(S.getEntry());
|
2015-11-22 00:56:13 +08:00
|
|
|
while (L) {
|
|
|
|
bool AllContained = true;
|
2016-05-23 20:42:38 +08:00
|
|
|
for (auto *BB : S.blocks())
|
2015-11-22 00:56:13 +08:00
|
|
|
AllContained &= L->contains(BB);
|
|
|
|
if (AllContained)
|
|
|
|
break;
|
|
|
|
L = L->getParentLoop();
|
|
|
|
}
|
|
|
|
|
2016-05-23 20:42:38 +08:00
|
|
|
return L ? (S.contains(L) ? L->getParentLoop() : L) : nullptr;
|
2015-09-10 23:27:46 +08:00
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
Scop::Scop(Region &R, ScalarEvolution &ScalarEvolution, LoopInfo &LI,
|
2016-05-23 17:07:08 +08:00
|
|
|
ScopDetection::DetectionContext &DC)
|
2017-05-15 21:43:01 +08:00
|
|
|
: SE(&ScalarEvolution), R(R), name(R.getNameStr()), IsOptimized(false),
|
2016-02-13 23:12:54 +08:00
|
|
|
HasSingleExitEdge(R.getExitingBlock()), HasErrorBlock(false),
|
2016-09-14 14:26:09 +08:00
|
|
|
MaxLoopDepth(0), CopyStmtsNum(0), DC(DC),
|
|
|
|
IslCtx(isl_ctx_alloc(), isl_ctx_free), Context(nullptr),
|
|
|
|
Affinator(this, LI), AssumedContext(nullptr), InvalidContext(nullptr),
|
|
|
|
Schedule(nullptr) {
|
2016-04-29 19:43:20 +08:00
|
|
|
if (IslOnErrorAbort)
|
|
|
|
isl_options_set_on_error(getIslCtx(), ISL_ON_ERROR_ABORT);
|
Support accesses with differently sized types to the same array
This allows code such as:
void multiple_types(char *Short, char *Float, char *Double) {
for (long i = 0; i < 100; i++) {
Short[i] = *(short *)&Short[2 * i];
Float[i] = *(float *)&Float[4 * i];
Double[i] = *(double *)&Double[8 * i];
}
}
To model such code we use as canonical element type of the modeled array the
smallest element type of all original array accesses, if type allocation sizes
are multiples of each other. Otherwise, we use a newly created iN type, where N
is the gcd of the allocation size of the types used in the accesses to this
array. Accesses with types larger as the canonical element type are modeled as
multiple accesses with the smaller type.
For example the second load access is modeled as:
{ Stmt_bb2[i0] -> MemRef_Float[o0] : 4i0 <= o0 <= 3 + 4i0 }
To support code-generating these memory accesses, we introduce a new method
getAccessAddressFunction that assigns each statement instance a single memory
location, the address we load from/store to. Currently we obtain this address by
taking the lexmin of the access function. We may consider keeping track of the
memory location more explicitly in the future.
We currently do _not_ handle multi-dimensional arrays and also keep the
restriction of not supporting accesses where the offset expression is not a
multiple of the access element type size. This patch adds tests that ensure
we correctly invalidate a scop in case these accesses are found. Both types of
accesses can be handled using the very same model, but are left to be added in
the future.
We also move the initialization of the scop-context into the constructor to
ensure it is already available when invalidating the scop.
Finally, we add this as a new item to the 2.9 release notes
Reviewers: jdoerfert, Meinersbur
Differential Revision: http://reviews.llvm.org/D16878
llvm-svn: 259784
2016-02-04 21:18:42 +08:00
|
|
|
buildContext();
|
|
|
|
}
|
2015-02-24 20:00:50 +08:00
|
|
|
|
2016-12-02 16:10:56 +08:00
|
|
|
void Scop::foldSizeConstantsToRight() {
|
|
|
|
isl_union_set *Accessed = isl_union_map_range(getAccesses());
|
|
|
|
|
|
|
|
for (auto Array : arrays()) {
|
|
|
|
if (Array->getNumberOfDimensions() <= 1)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
isl_space *Space = Array->getSpace();
|
|
|
|
|
|
|
|
Space = isl_space_align_params(Space, isl_union_set_get_space(Accessed));
|
|
|
|
|
|
|
|
if (!isl_union_set_contains(Accessed, Space)) {
|
|
|
|
isl_space_free(Space);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
isl_set *Elements = isl_union_set_extract_set(Accessed, Space);
|
|
|
|
|
|
|
|
isl_map *Transform =
|
|
|
|
isl_map_universe(isl_space_map_from_set(Array->getSpace()));
|
|
|
|
|
|
|
|
std::vector<int> Int;
|
|
|
|
|
|
|
|
int Dims = isl_set_dim(Elements, isl_dim_set);
|
|
|
|
for (int i = 0; i < Dims; i++) {
|
|
|
|
isl_set *DimOnly =
|
|
|
|
isl_set_project_out(isl_set_copy(Elements), isl_dim_set, 0, i);
|
|
|
|
DimOnly = isl_set_project_out(DimOnly, isl_dim_set, 1, Dims - i - 1);
|
|
|
|
DimOnly = isl_set_lower_bound_si(DimOnly, isl_dim_set, 0, 0);
|
|
|
|
|
|
|
|
isl_basic_set *DimHull = isl_set_affine_hull(DimOnly);
|
|
|
|
|
|
|
|
if (i == Dims - 1) {
|
|
|
|
Int.push_back(1);
|
|
|
|
Transform = isl_map_equate(Transform, isl_dim_in, i, isl_dim_out, i);
|
|
|
|
isl_basic_set_free(DimHull);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (isl_basic_set_dim(DimHull, isl_dim_div) == 1) {
|
|
|
|
isl_aff *Diff = isl_basic_set_get_div(DimHull, 0);
|
|
|
|
isl_val *Val = isl_aff_get_denominator_val(Diff);
|
|
|
|
isl_aff_free(Diff);
|
|
|
|
|
|
|
|
int ValInt = 1;
|
|
|
|
|
|
|
|
if (isl_val_is_int(Val))
|
|
|
|
ValInt = isl_val_get_num_si(Val);
|
|
|
|
isl_val_free(Val);
|
|
|
|
|
|
|
|
Int.push_back(ValInt);
|
|
|
|
|
|
|
|
isl_constraint *C = isl_constraint_alloc_equality(
|
|
|
|
isl_local_space_from_space(isl_map_get_space(Transform)));
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_out, i, ValInt);
|
|
|
|
C = isl_constraint_set_coefficient_si(C, isl_dim_in, i, -1);
|
|
|
|
Transform = isl_map_add_constraint(Transform, C);
|
|
|
|
isl_basic_set_free(DimHull);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
isl_basic_set *ZeroSet = isl_basic_set_copy(DimHull);
|
|
|
|
ZeroSet = isl_basic_set_fix_si(ZeroSet, isl_dim_set, 0, 0);
|
|
|
|
|
|
|
|
int ValInt = 1;
|
|
|
|
if (isl_basic_set_is_equal(ZeroSet, DimHull)) {
|
|
|
|
ValInt = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
Int.push_back(ValInt);
|
|
|
|
Transform = isl_map_equate(Transform, isl_dim_in, i, isl_dim_out, i);
|
|
|
|
isl_basic_set_free(DimHull);
|
|
|
|
isl_basic_set_free(ZeroSet);
|
|
|
|
}
|
|
|
|
|
|
|
|
isl_set *MappedElements = isl_map_domain(isl_map_copy(Transform));
|
|
|
|
|
|
|
|
if (!isl_set_is_subset(Elements, MappedElements)) {
|
|
|
|
isl_set_free(Elements);
|
|
|
|
isl_set_free(MappedElements);
|
|
|
|
isl_map_free(Transform);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
isl_set_free(MappedElements);
|
|
|
|
|
|
|
|
bool CanFold = true;
|
|
|
|
|
|
|
|
if (Int[0] <= 1)
|
|
|
|
CanFold = false;
|
|
|
|
|
|
|
|
unsigned NumDims = Array->getNumberOfDimensions();
|
|
|
|
for (unsigned i = 1; i < NumDims - 1; i++)
|
|
|
|
if (Int[0] != Int[i] && Int[i])
|
|
|
|
CanFold = false;
|
|
|
|
|
|
|
|
if (!CanFold) {
|
|
|
|
isl_set_free(Elements);
|
|
|
|
isl_map_free(Transform);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (auto &Access : AccessFunctions)
|
|
|
|
if (Access->getScopArrayInfo() == Array)
|
|
|
|
Access->setAccessRelation(isl_map_apply_range(
|
|
|
|
Access->getAccessRelation(), isl_map_copy(Transform)));
|
|
|
|
|
|
|
|
isl_map_free(Transform);
|
|
|
|
|
|
|
|
std::vector<const SCEV *> Sizes;
|
|
|
|
for (unsigned i = 0; i < NumDims; i++) {
|
|
|
|
auto Size = Array->getDimensionSize(i);
|
|
|
|
|
|
|
|
if (i == NumDims - 1)
|
|
|
|
Size = SE->getMulExpr(Size, SE->getConstant(Size->getType(), Int[0]));
|
|
|
|
Sizes.push_back(Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
Array->updateSizes(Sizes, false /* CheckConsistency */);
|
|
|
|
|
|
|
|
isl_set_free(Elements);
|
|
|
|
}
|
|
|
|
isl_union_set_free(Accessed);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-12-02 13:21:22 +08:00
|
|
|
void Scop::finalizeAccesses() {
|
|
|
|
updateAccessDimensionality();
|
2016-12-02 16:10:56 +08:00
|
|
|
foldSizeConstantsToRight();
|
2016-12-02 13:21:22 +08:00
|
|
|
foldAccessRelations();
|
|
|
|
assumeNoOutOfBounds();
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
Scop::~Scop() {
|
|
|
|
isl_set_free(Context);
|
2013-10-30 05:05:49 +08:00
|
|
|
isl_set_free(AssumedContext);
|
2016-03-01 21:06:28 +08:00
|
|
|
isl_set_free(InvalidContext);
|
2015-07-14 17:33:13 +08:00
|
|
|
isl_schedule_free(Schedule);
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2016-04-26 00:15:13 +08:00
|
|
|
for (auto &It : ParameterIds)
|
|
|
|
isl_id_free(It.second);
|
|
|
|
|
2015-08-31 05:13:53 +08:00
|
|
|
for (auto It : DomainMap)
|
|
|
|
isl_set_free(It.second);
|
|
|
|
|
2016-04-12 21:27:35 +08:00
|
|
|
for (auto &AS : RecordedAssumptions)
|
|
|
|
isl_set_free(AS.Set);
|
|
|
|
|
2014-09-18 19:17:17 +08:00
|
|
|
// Free the alias groups
|
2015-07-24 01:04:54 +08:00
|
|
|
for (MinMaxVectorPairTy &MinMaxAccessPair : MinMaxAliasGroups) {
|
2015-07-26 21:14:38 +08:00
|
|
|
for (MinMaxAccessTy &MMA : MinMaxAccessPair.first) {
|
2014-09-18 19:17:17 +08:00
|
|
|
isl_pw_multi_aff_free(MMA.first);
|
|
|
|
isl_pw_multi_aff_free(MMA.second);
|
|
|
|
}
|
2015-07-26 21:14:38 +08:00
|
|
|
for (MinMaxAccessTy &MMA : MinMaxAccessPair.second) {
|
2015-07-24 01:04:54 +08:00
|
|
|
isl_pw_multi_aff_free(MMA.first);
|
|
|
|
isl_pw_multi_aff_free(MMA.second);
|
|
|
|
}
|
2014-09-18 19:17:17 +08:00
|
|
|
}
|
2015-09-30 07:47:21 +08:00
|
|
|
|
2015-10-10 01:12:26 +08:00
|
|
|
for (const auto &IAClass : InvariantEquivClasses)
|
2016-07-11 20:15:10 +08:00
|
|
|
isl_set_free(IAClass.ExecutionContext);
|
2016-02-17 23:49:21 +08:00
|
|
|
|
|
|
|
// Explicitly release all Scop objects and the underlying isl objects before
|
2017-01-07 01:30:34 +08:00
|
|
|
// we release the isl context.
|
2016-02-17 23:49:21 +08:00
|
|
|
Stmts.clear();
|
2016-07-30 17:25:51 +08:00
|
|
|
ScopArrayInfoSet.clear();
|
2016-02-17 23:49:21 +08:00
|
|
|
ScopArrayInfoMap.clear();
|
2016-07-30 17:25:51 +08:00
|
|
|
ScopArrayNameMap.clear();
|
2016-08-21 19:09:19 +08:00
|
|
|
AccessFunctions.clear();
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2015-09-26 16:55:54 +08:00
|
|
|
void Scop::updateAccessDimensionality() {
|
2016-02-19 00:50:12 +08:00
|
|
|
// Check all array accesses for each base pointer and find a (virtual) element
|
|
|
|
// size for the base pointer that divides all access functions.
|
2017-02-10 07:24:54 +08:00
|
|
|
for (ScopStmt &Stmt : *this)
|
|
|
|
for (MemoryAccess *Access : Stmt) {
|
2016-02-19 00:50:12 +08:00
|
|
|
if (!Access->isArrayKind())
|
|
|
|
continue;
|
2017-02-10 07:24:54 +08:00
|
|
|
ScopArrayInfo *Array =
|
2017-02-10 07:24:57 +08:00
|
|
|
const_cast<ScopArrayInfo *>(Access->getScopArrayInfo());
|
|
|
|
|
2017-02-10 07:24:54 +08:00
|
|
|
if (Array->getNumberOfDimensions() != 1)
|
2016-02-19 00:50:12 +08:00
|
|
|
continue;
|
2017-02-10 07:24:54 +08:00
|
|
|
unsigned DivisibleSize = Array->getElemSizeInBytes();
|
|
|
|
const SCEV *Subscript = Access->getSubscript(0);
|
2016-02-19 00:50:12 +08:00
|
|
|
while (!isDivisible(Subscript, DivisibleSize, *SE))
|
|
|
|
DivisibleSize /= 2;
|
|
|
|
auto *Ty = IntegerType::get(SE->getContext(), DivisibleSize * 8);
|
2017-02-10 07:24:54 +08:00
|
|
|
Array->updateElementType(Ty);
|
2016-02-19 00:50:12 +08:00
|
|
|
}
|
|
|
|
|
2015-09-26 16:55:54 +08:00
|
|
|
for (auto &Stmt : *this)
|
|
|
|
for (auto &Access : Stmt)
|
|
|
|
Access->updateDimensionality();
|
|
|
|
}
|
|
|
|
|
2016-12-02 13:21:22 +08:00
|
|
|
void Scop::foldAccessRelations() {
|
|
|
|
for (auto &Stmt : *this)
|
|
|
|
for (auto &Access : Stmt)
|
|
|
|
Access->foldAccessRelation();
|
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::assumeNoOutOfBounds() {
|
|
|
|
for (auto &Stmt : *this)
|
|
|
|
for (auto &Access : Stmt)
|
|
|
|
Access->assumeNoOutOfBound();
|
|
|
|
}
|
|
|
|
|
2016-07-23 01:31:17 +08:00
|
|
|
void Scop::simplifySCoP(bool AfterHoisting) {
|
2015-09-30 07:47:21 +08:00
|
|
|
for (auto StmtIt = Stmts.begin(), StmtEnd = Stmts.end(); StmtIt != StmtEnd;) {
|
|
|
|
ScopStmt &Stmt = *StmtIt;
|
2015-10-02 21:53:07 +08:00
|
|
|
|
2016-05-10 20:19:47 +08:00
|
|
|
bool RemoveStmt = Stmt.isEmpty();
|
2015-11-04 00:54:49 +08:00
|
|
|
if (!RemoveStmt)
|
2016-05-10 20:42:26 +08:00
|
|
|
RemoveStmt = !DomainMap[Stmt.getEntryBlock()];
|
2015-11-04 00:54:49 +08:00
|
|
|
|
|
|
|
// Remove read only statements only after invariant loop hoisting.
|
2016-05-10 20:19:47 +08:00
|
|
|
if (!RemoveStmt && AfterHoisting) {
|
2015-11-04 00:54:49 +08:00
|
|
|
bool OnlyRead = true;
|
|
|
|
for (MemoryAccess *MA : Stmt) {
|
|
|
|
if (MA->isRead())
|
|
|
|
continue;
|
|
|
|
|
|
|
|
OnlyRead = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
RemoveStmt = OnlyRead;
|
|
|
|
}
|
2015-10-04 23:00:05 +08:00
|
|
|
|
2016-05-10 20:19:47 +08:00
|
|
|
if (!RemoveStmt) {
|
|
|
|
StmtIt++;
|
2015-09-30 07:47:21 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-05-10 20:19:47 +08:00
|
|
|
// Remove the statement because it is unnecessary.
|
|
|
|
if (Stmt.isRegionStmt())
|
|
|
|
for (BasicBlock *BB : Stmt.getRegion()->blocks())
|
|
|
|
StmtMap.erase(BB);
|
|
|
|
else
|
|
|
|
StmtMap.erase(Stmt.getBasicBlock());
|
|
|
|
|
|
|
|
StmtIt = Stmts.erase(StmtIt);
|
2015-09-30 07:47:21 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-27 20:49:11 +08:00
|
|
|
InvariantEquivClassTy *Scop::lookupInvariantEquivClass(Value *Val) {
|
2015-10-18 20:39:19 +08:00
|
|
|
LoadInst *LInst = dyn_cast<LoadInst>(Val);
|
|
|
|
if (!LInst)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
if (Value *Rep = InvEquivClassVMap.lookup(LInst))
|
|
|
|
LInst = cast<LoadInst>(Rep);
|
|
|
|
|
2016-02-08 01:30:13 +08:00
|
|
|
Type *Ty = LInst->getType();
|
2015-10-18 20:39:19 +08:00
|
|
|
const SCEV *PointerSCEV = SE->getSCEV(LInst->getPointerOperand());
|
2016-03-24 21:22:16 +08:00
|
|
|
for (auto &IAClass : InvariantEquivClasses) {
|
2016-07-11 20:27:04 +08:00
|
|
|
if (PointerSCEV != IAClass.IdentifyingPointer || Ty != IAClass.AccessType)
|
2016-03-24 21:22:16 +08:00
|
|
|
continue;
|
|
|
|
|
2016-07-11 20:15:10 +08:00
|
|
|
auto &MAs = IAClass.InvariantAccesses;
|
2016-03-24 21:22:16 +08:00
|
|
|
for (auto *MA : MAs)
|
|
|
|
if (MA->getAccessInstruction() == Val)
|
|
|
|
return &IAClass;
|
|
|
|
}
|
2015-10-18 20:39:19 +08:00
|
|
|
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
/// Check if @p MA can always be hoisted without execution context.
|
2016-04-23 22:32:34 +08:00
|
|
|
static bool canAlwaysBeHoisted(MemoryAccess *MA, bool StmtInvalidCtxIsEmpty,
|
2016-05-23 18:40:54 +08:00
|
|
|
bool MAInvalidCtxIsEmpty,
|
|
|
|
bool NonHoistableCtxIsEmpty) {
|
2016-04-23 20:59:18 +08:00
|
|
|
LoadInst *LInst = cast<LoadInst>(MA->getAccessInstruction());
|
|
|
|
const DataLayout &DL = LInst->getParent()->getModule()->getDataLayout();
|
|
|
|
// TODO: We can provide more information for better but more expensive
|
|
|
|
// results.
|
|
|
|
if (!isDereferenceableAndAlignedPointer(LInst->getPointerOperand(),
|
|
|
|
LInst->getAlignment(), DL))
|
|
|
|
return false;
|
|
|
|
|
2016-05-23 18:40:54 +08:00
|
|
|
// If the location might be overwritten we do not hoist it unconditionally.
|
|
|
|
//
|
|
|
|
// TODO: This is probably to conservative.
|
|
|
|
if (!NonHoistableCtxIsEmpty)
|
|
|
|
return false;
|
|
|
|
|
2016-04-23 20:59:18 +08:00
|
|
|
// If a dereferencable load is in a statement that is modeled precisely we can
|
|
|
|
// hoist it.
|
2016-04-23 22:32:34 +08:00
|
|
|
if (StmtInvalidCtxIsEmpty && MAInvalidCtxIsEmpty)
|
2016-04-23 20:59:18 +08:00
|
|
|
return true;
|
|
|
|
|
|
|
|
// Even if the statement is not modeled precisely we can hoist the load if it
|
2017-01-07 01:30:34 +08:00
|
|
|
// does not involve any parameters that might have been specialized by the
|
2016-04-23 20:59:18 +08:00
|
|
|
// statement domain.
|
|
|
|
for (unsigned u = 0, e = MA->getNumSubscripts(); u < e; u++)
|
|
|
|
if (!isa<SCEVConstant>(MA->getSubscript(u)))
|
|
|
|
return false;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2016-05-23 18:40:54 +08:00
|
|
|
void Scop::addInvariantLoads(ScopStmt &Stmt, InvariantAccessesTy &InvMAs) {
|
2015-10-18 20:39:19 +08:00
|
|
|
|
2016-04-22 19:38:44 +08:00
|
|
|
if (InvMAs.empty())
|
|
|
|
return;
|
|
|
|
|
2016-04-22 19:41:14 +08:00
|
|
|
auto *StmtInvalidCtx = Stmt.getInvalidContext();
|
2016-04-23 20:59:18 +08:00
|
|
|
bool StmtInvalidCtxIsEmpty = isl_set_is_empty(StmtInvalidCtx);
|
2016-04-22 19:41:14 +08:00
|
|
|
|
2016-04-08 18:30:09 +08:00
|
|
|
// Get the context under which the statement is executed but remove the error
|
|
|
|
// context under which this statement is reached.
|
2015-10-18 20:39:19 +08:00
|
|
|
isl_set *DomainCtx = isl_set_params(Stmt.getDomain());
|
2016-04-22 19:41:14 +08:00
|
|
|
DomainCtx = isl_set_subtract(DomainCtx, StmtInvalidCtx);
|
2015-10-18 20:39:19 +08:00
|
|
|
|
2017-02-17 03:11:33 +08:00
|
|
|
if (isl_set_n_basic_set(DomainCtx) >= MaxDisjunctsInDomain) {
|
2016-05-23 18:40:54 +08:00
|
|
|
auto *AccInst = InvMAs.front().MA->getAccessInstruction();
|
2016-04-22 19:41:14 +08:00
|
|
|
invalidate(COMPLEXITY, AccInst->getDebugLoc());
|
|
|
|
isl_set_free(DomainCtx);
|
2016-05-23 18:40:54 +08:00
|
|
|
for (auto &InvMA : InvMAs)
|
|
|
|
isl_set_free(InvMA.NonHoistableCtx);
|
2016-04-22 19:41:14 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2015-10-18 20:39:19 +08:00
|
|
|
// Project out all parameters that relate to loads in the statement. Otherwise
|
|
|
|
// we could have cyclic dependences on the constraints under which the
|
|
|
|
// hoisted loads are executed and we could not determine an order in which to
|
|
|
|
// pre-load them. This happens because not only lower bounds are part of the
|
|
|
|
// domain but also upper bounds.
|
2016-05-23 18:40:54 +08:00
|
|
|
for (auto &InvMA : InvMAs) {
|
|
|
|
auto *MA = InvMA.MA;
|
2015-10-18 20:39:19 +08:00
|
|
|
Instruction *AccInst = MA->getAccessInstruction();
|
|
|
|
if (SE->isSCEVable(AccInst->getType())) {
|
2015-11-08 03:45:27 +08:00
|
|
|
SetVector<Value *> Values;
|
|
|
|
for (const SCEV *Parameter : Parameters) {
|
|
|
|
Values.clear();
|
2016-04-08 18:25:58 +08:00
|
|
|
findValues(Parameter, *SE, Values);
|
2015-11-08 03:45:27 +08:00
|
|
|
if (!Values.count(AccInst))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (isl_id *ParamId = getIdForParam(Parameter)) {
|
|
|
|
int Dim = isl_set_find_dim_by_id(DomainCtx, isl_dim_param, ParamId);
|
2017-03-17 17:02:53 +08:00
|
|
|
if (Dim >= 0)
|
|
|
|
DomainCtx = isl_set_eliminate(DomainCtx, isl_dim_param, Dim, 1);
|
2015-11-08 03:45:27 +08:00
|
|
|
isl_id_free(ParamId);
|
|
|
|
}
|
2015-10-18 20:39:19 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-05-23 18:40:54 +08:00
|
|
|
for (auto &InvMA : InvMAs) {
|
|
|
|
auto *MA = InvMA.MA;
|
|
|
|
auto *NHCtx = InvMA.NonHoistableCtx;
|
|
|
|
|
2015-10-18 20:39:19 +08:00
|
|
|
// Check for another invariant access that accesses the same location as
|
|
|
|
// MA and if found consolidate them. Otherwise create a new equivalence
|
|
|
|
// class at the end of InvariantEquivClasses.
|
|
|
|
LoadInst *LInst = cast<LoadInst>(MA->getAccessInstruction());
|
2016-02-08 01:30:13 +08:00
|
|
|
Type *Ty = LInst->getType();
|
2015-10-18 20:39:19 +08:00
|
|
|
const SCEV *PointerSCEV = SE->getSCEV(LInst->getPointerOperand());
|
|
|
|
|
2016-04-23 22:32:34 +08:00
|
|
|
auto *MAInvalidCtx = MA->getInvalidContext();
|
2016-05-23 18:40:54 +08:00
|
|
|
bool NonHoistableCtxIsEmpty = isl_set_is_empty(NHCtx);
|
2016-04-23 22:32:34 +08:00
|
|
|
bool MAInvalidCtxIsEmpty = isl_set_is_empty(MAInvalidCtx);
|
|
|
|
|
2016-04-23 20:59:18 +08:00
|
|
|
isl_set *MACtx;
|
|
|
|
// Check if we know that this pointer can be speculatively accessed.
|
2016-05-23 18:40:54 +08:00
|
|
|
if (canAlwaysBeHoisted(MA, StmtInvalidCtxIsEmpty, MAInvalidCtxIsEmpty,
|
|
|
|
NonHoistableCtxIsEmpty)) {
|
2016-04-23 20:59:18 +08:00
|
|
|
MACtx = isl_set_universe(isl_set_get_space(DomainCtx));
|
2016-04-23 22:32:34 +08:00
|
|
|
isl_set_free(MAInvalidCtx);
|
2016-05-23 18:40:54 +08:00
|
|
|
isl_set_free(NHCtx);
|
2016-04-23 20:59:18 +08:00
|
|
|
} else {
|
|
|
|
MACtx = isl_set_copy(DomainCtx);
|
2016-05-23 18:40:54 +08:00
|
|
|
MACtx = isl_set_subtract(MACtx, isl_set_union(MAInvalidCtx, NHCtx));
|
2016-04-23 20:59:18 +08:00
|
|
|
MACtx = isl_set_gist_params(MACtx, getContext());
|
|
|
|
}
|
|
|
|
|
2015-10-18 20:39:19 +08:00
|
|
|
bool Consolidated = false;
|
|
|
|
for (auto &IAClass : InvariantEquivClasses) {
|
2016-07-11 20:27:04 +08:00
|
|
|
if (PointerSCEV != IAClass.IdentifyingPointer || Ty != IAClass.AccessType)
|
2015-10-18 20:39:19 +08:00
|
|
|
continue;
|
|
|
|
|
2016-03-03 20:26:58 +08:00
|
|
|
// If the pointer and the type is equal check if the access function wrt.
|
|
|
|
// to the domain is equal too. It can happen that the domain fixes
|
|
|
|
// parameter values and these can be different for distinct part of the
|
2016-03-03 20:30:19 +08:00
|
|
|
// SCoP. If this happens we cannot consolidate the loads but need to
|
2016-03-03 20:26:58 +08:00
|
|
|
// create a new invariant load equivalence class.
|
2016-07-11 20:15:10 +08:00
|
|
|
auto &MAs = IAClass.InvariantAccesses;
|
2016-03-03 20:26:58 +08:00
|
|
|
if (!MAs.empty()) {
|
|
|
|
auto *LastMA = MAs.front();
|
|
|
|
|
|
|
|
auto *AR = isl_map_range(MA->getAccessRelation());
|
|
|
|
auto *LastAR = isl_map_range(LastMA->getAccessRelation());
|
|
|
|
bool SameAR = isl_set_is_equal(AR, LastAR);
|
|
|
|
isl_set_free(AR);
|
|
|
|
isl_set_free(LastAR);
|
|
|
|
|
|
|
|
if (!SameAR)
|
|
|
|
continue;
|
|
|
|
}
|
2015-10-18 20:39:19 +08:00
|
|
|
|
|
|
|
// Add MA to the list of accesses that are in this class.
|
|
|
|
MAs.push_front(MA);
|
|
|
|
|
2016-03-03 20:26:58 +08:00
|
|
|
Consolidated = true;
|
|
|
|
|
2015-10-18 20:39:19 +08:00
|
|
|
// Unify the execution context of the class and this statement.
|
2016-07-11 20:15:10 +08:00
|
|
|
isl_set *&IAClassDomainCtx = IAClass.ExecutionContext;
|
2015-11-11 12:30:07 +08:00
|
|
|
if (IAClassDomainCtx)
|
2016-04-23 20:59:18 +08:00
|
|
|
IAClassDomainCtx =
|
|
|
|
isl_set_coalesce(isl_set_union(IAClassDomainCtx, MACtx));
|
2015-11-11 12:30:07 +08:00
|
|
|
else
|
2016-04-23 20:59:18 +08:00
|
|
|
IAClassDomainCtx = MACtx;
|
2015-10-18 20:39:19 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Consolidated)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
// If we did not consolidate MA, thus did not find an equivalence class
|
|
|
|
// for it, we create a new one.
|
2016-07-11 20:15:10 +08:00
|
|
|
InvariantEquivClasses.emplace_back(
|
|
|
|
InvariantEquivClassTy{PointerSCEV, MemoryAccessList{MA}, MACtx, Ty});
|
2015-10-18 20:39:19 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
isl_set_free(DomainCtx);
|
|
|
|
}
|
|
|
|
|
2016-05-23 18:40:54 +08:00
|
|
|
__isl_give isl_set *Scop::getNonHoistableCtx(MemoryAccess *Access,
|
|
|
|
__isl_keep isl_union_map *Writes) {
|
2015-12-14 05:00:40 +08:00
|
|
|
// TODO: Loads that are not loop carried, hence are in a statement with
|
|
|
|
// zero iterators, are by construction invariant, though we
|
|
|
|
// currently "hoist" them anyway. This is necessary because we allow
|
|
|
|
// them to be treated as parameters (e.g., in conditions) and our code
|
|
|
|
// generation would otherwise use the old value.
|
|
|
|
|
|
|
|
auto &Stmt = *Access->getStatement();
|
2016-02-25 06:08:24 +08:00
|
|
|
BasicBlock *BB = Stmt.getEntryBlock();
|
2015-12-14 05:00:40 +08:00
|
|
|
|
2016-11-18 06:11:56 +08:00
|
|
|
if (Access->isScalarKind() || Access->isWrite() || !Access->isAffine() ||
|
|
|
|
Access->isMemoryIntrinsic())
|
2016-05-23 18:40:54 +08:00
|
|
|
return nullptr;
|
2015-09-30 07:47:21 +08:00
|
|
|
|
2015-12-14 05:00:40 +08:00
|
|
|
// Skip accesses that have an invariant base pointer which is defined but
|
|
|
|
// not loaded inside the SCoP. This can happened e.g., if a readnone call
|
|
|
|
// returns a pointer that is used as a base address. However, as we want
|
|
|
|
// to hoist indirect pointers, we allow the base pointer to be defined in
|
|
|
|
// the region if it is also a memory access. Each ScopArrayInfo object
|
|
|
|
// that has a base pointer origin has a base pointer that is loaded and
|
|
|
|
// that it is invariant, thus it will be hoisted too. However, if there is
|
|
|
|
// no base pointer origin we check that the base pointer is defined
|
|
|
|
// outside the region.
|
2016-05-23 18:40:54 +08:00
|
|
|
auto *LI = cast<LoadInst>(Access->getAccessInstruction());
|
2016-05-23 17:26:46 +08:00
|
|
|
if (hasNonHoistableBasePtrInScop(Access, Writes))
|
2016-05-23 18:40:54 +08:00
|
|
|
return nullptr;
|
2015-09-30 07:47:21 +08:00
|
|
|
|
2015-12-14 05:00:40 +08:00
|
|
|
isl_map *AccessRelation = Access->getAccessRelation();
|
2016-03-24 21:19:16 +08:00
|
|
|
assert(!isl_map_is_empty(AccessRelation));
|
2015-10-19 03:49:25 +08:00
|
|
|
|
2015-12-14 05:00:40 +08:00
|
|
|
if (isl_map_involves_dims(AccessRelation, isl_dim_in, 0,
|
|
|
|
Stmt.getNumIterators())) {
|
|
|
|
isl_map_free(AccessRelation);
|
2016-05-23 18:40:54 +08:00
|
|
|
return nullptr;
|
2015-12-14 05:00:40 +08:00
|
|
|
}
|
2015-10-02 22:51:00 +08:00
|
|
|
|
2015-12-14 05:00:40 +08:00
|
|
|
AccessRelation = isl_map_intersect_domain(AccessRelation, Stmt.getDomain());
|
2017-04-28 04:08:16 +08:00
|
|
|
isl_set *SafeToLoad;
|
|
|
|
|
|
|
|
auto &DL = getFunction().getParent()->getDataLayout();
|
|
|
|
if (isSafeToLoadUnconditionally(LI->getPointerOperand(), LI->getAlignment(),
|
|
|
|
DL)) {
|
|
|
|
SafeToLoad =
|
|
|
|
isl_set_universe(isl_space_range(isl_map_get_space(AccessRelation)));
|
|
|
|
isl_map_free(AccessRelation);
|
|
|
|
} else if (BB != LI->getParent()) {
|
|
|
|
// Skip accesses in non-affine subregions as they might not be executed
|
|
|
|
// under the same condition as the entry of the non-affine subregion.
|
|
|
|
isl_map_free(AccessRelation);
|
|
|
|
return nullptr;
|
|
|
|
} else {
|
|
|
|
SafeToLoad = isl_map_range(AccessRelation);
|
|
|
|
}
|
2015-10-19 03:50:18 +08:00
|
|
|
|
2015-12-14 05:00:40 +08:00
|
|
|
isl_union_map *Written = isl_union_map_intersect_range(
|
2017-04-28 04:08:16 +08:00
|
|
|
isl_union_map_copy(Writes), isl_union_set_from_set(SafeToLoad));
|
2016-05-23 18:40:54 +08:00
|
|
|
auto *WrittenCtx = isl_union_map_params(Written);
|
|
|
|
bool IsWritten = !isl_set_is_empty(WrittenCtx);
|
|
|
|
|
|
|
|
if (!IsWritten)
|
|
|
|
return WrittenCtx;
|
|
|
|
|
|
|
|
WrittenCtx = isl_set_remove_divs(WrittenCtx);
|
2017-02-17 03:11:33 +08:00
|
|
|
bool TooComplex = isl_set_n_basic_set(WrittenCtx) >= MaxDisjunctsInDomain;
|
2016-05-23 18:40:54 +08:00
|
|
|
if (TooComplex || !isRequiredInvariantLoad(LI)) {
|
|
|
|
isl_set_free(WrittenCtx);
|
|
|
|
return nullptr;
|
|
|
|
}
|
2015-10-19 03:50:18 +08:00
|
|
|
|
2016-05-23 18:40:54 +08:00
|
|
|
addAssumption(INVARIANTLOAD, isl_set_copy(WrittenCtx), LI->getDebugLoc(),
|
|
|
|
AS_RESTRICTION);
|
|
|
|
return WrittenCtx;
|
2015-12-14 05:00:40 +08:00
|
|
|
}
|
2015-09-30 07:47:21 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
void Scop::verifyInvariantLoads() {
|
|
|
|
auto &RIL = getRequiredInvariantLoads();
|
2015-12-14 05:00:40 +08:00
|
|
|
for (LoadInst *LI : RIL) {
|
2016-05-23 20:40:48 +08:00
|
|
|
assert(LI && contains(LI));
|
2016-02-25 06:08:19 +08:00
|
|
|
ScopStmt *Stmt = getStmtFor(LI);
|
2015-12-21 15:10:39 +08:00
|
|
|
if (Stmt && Stmt->getArrayAccessOrNULLFor(LI)) {
|
2015-12-14 05:00:40 +08:00
|
|
|
invalidate(INVARIANTLOAD, LI->getDebugLoc());
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2015-09-30 07:47:21 +08:00
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
void Scop::hoistInvariantLoads() {
|
2016-02-29 15:29:42 +08:00
|
|
|
if (!PollyInvariantLoadHoisting)
|
|
|
|
return;
|
2015-09-30 07:47:21 +08:00
|
|
|
|
2016-02-29 15:29:42 +08:00
|
|
|
isl_union_map *Writes = getWrites();
|
|
|
|
for (ScopStmt &Stmt : *this) {
|
2016-05-23 18:40:54 +08:00
|
|
|
InvariantAccessesTy InvariantAccesses;
|
2016-02-29 15:29:42 +08:00
|
|
|
|
|
|
|
for (MemoryAccess *Access : Stmt)
|
2016-05-23 18:40:54 +08:00
|
|
|
if (auto *NHCtx = getNonHoistableCtx(Access, Writes))
|
|
|
|
InvariantAccesses.push_back({Access, NHCtx});
|
2016-02-29 15:29:42 +08:00
|
|
|
|
|
|
|
// Transfer the memory access from the statement to the SCoP.
|
2016-05-23 22:45:58 +08:00
|
|
|
for (auto InvMA : InvariantAccesses)
|
|
|
|
Stmt.removeMemoryAccess(InvMA.MA);
|
2016-02-29 15:29:42 +08:00
|
|
|
addInvariantLoads(Stmt, InvariantAccesses);
|
|
|
|
}
|
|
|
|
isl_union_map_free(Writes);
|
2015-09-30 07:47:21 +08:00
|
|
|
}
|
|
|
|
|
2017-05-10 18:59:58 +08:00
|
|
|
/// Find the canonical scop array info object for a set of invariant load
|
|
|
|
/// hoisted loads. The canonical array is the one that corresponds to the
|
|
|
|
/// first load in the list of accesses which is used as base pointer of a
|
|
|
|
/// scop array.
|
|
|
|
static const ScopArrayInfo *findCanonicalArray(Scop *S,
|
|
|
|
MemoryAccessList &Accesses) {
|
|
|
|
for (MemoryAccess *Access : Accesses) {
|
|
|
|
const ScopArrayInfo *CanonicalArray = S->getScopArrayInfoOrNull(
|
|
|
|
Access->getAccessInstruction(), MemoryKind::Array);
|
|
|
|
if (CanonicalArray)
|
|
|
|
return CanonicalArray;
|
|
|
|
}
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Check if @p Array severs as base array in an invariant load.
|
|
|
|
static bool isUsedForIndirectHoistedLoad(Scop *S, const ScopArrayInfo *Array) {
|
|
|
|
for (InvariantEquivClassTy &EqClass2 : S->getInvariantAccesses())
|
|
|
|
for (MemoryAccess *Access2 : EqClass2.InvariantAccesses)
|
|
|
|
if (Access2->getScopArrayInfo() == Array)
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Replace the base pointer arrays in all memory accesses referencing @p Old,
|
|
|
|
/// with a reference to @p New.
|
|
|
|
static void replaceBasePtrArrays(Scop *S, const ScopArrayInfo *Old,
|
|
|
|
const ScopArrayInfo *New) {
|
|
|
|
for (ScopStmt &Stmt : *S)
|
|
|
|
for (MemoryAccess *Access : Stmt) {
|
|
|
|
if (Access->getLatestScopArrayInfo() != Old)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
isl_id *Id = New->getBasePtrId();
|
|
|
|
isl_map *Map = Access->getAccessRelation();
|
|
|
|
Map = isl_map_set_tuple_id(Map, isl_dim_out, Id);
|
|
|
|
Access->setAccessRelation(Map);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::canonicalizeDynamicBasePtrs() {
|
|
|
|
for (InvariantEquivClassTy &EqClass : InvariantEquivClasses) {
|
|
|
|
MemoryAccessList &BasePtrAccesses = EqClass.InvariantAccesses;
|
|
|
|
|
|
|
|
const ScopArrayInfo *CanonicalBasePtrSAI =
|
|
|
|
findCanonicalArray(this, BasePtrAccesses);
|
|
|
|
|
|
|
|
if (!CanonicalBasePtrSAI)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
for (MemoryAccess *BasePtrAccess : BasePtrAccesses) {
|
|
|
|
const ScopArrayInfo *BasePtrSAI = getScopArrayInfoOrNull(
|
|
|
|
BasePtrAccess->getAccessInstruction(), MemoryKind::Array);
|
|
|
|
if (!BasePtrSAI || BasePtrSAI == CanonicalBasePtrSAI ||
|
|
|
|
!BasePtrSAI->isCompatibleWith(CanonicalBasePtrSAI))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
// we currently do not canonicalize arrays where some accesses are
|
|
|
|
// hoisted as invariant loads. If we would, we need to update the access
|
|
|
|
// function of the invariant loads as well. However, as this is not a
|
|
|
|
// very common situation, we leave this for now to avoid further
|
|
|
|
// complexity increases.
|
|
|
|
if (isUsedForIndirectHoistedLoad(this, BasePtrSAI))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
replaceBasePtrArrays(this, BasePtrSAI, CanonicalBasePtrSAI);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-01-15 04:25:44 +08:00
|
|
|
const ScopArrayInfo *
|
|
|
|
Scop::getOrCreateScopArrayInfo(Value *BasePtr, Type *ElementType,
|
|
|
|
ArrayRef<const SCEV *> Sizes, MemoryKind Kind,
|
|
|
|
const char *BaseName) {
|
2016-07-30 17:25:51 +08:00
|
|
|
assert((BasePtr || BaseName) &&
|
|
|
|
"BasePtr and BaseName can not be nullptr at the same time.");
|
|
|
|
assert(!(BasePtr && BaseName) && "BaseName is redundant.");
|
|
|
|
auto &SAI = BasePtr ? ScopArrayInfoMap[std::make_pair(BasePtr, Kind)]
|
|
|
|
: ScopArrayNameMap[BaseName];
|
2015-09-26 16:55:54 +08:00
|
|
|
if (!SAI) {
|
2016-05-23 20:38:05 +08:00
|
|
|
auto &DL = getFunction().getParent()->getDataLayout();
|
2016-02-02 21:22:54 +08:00
|
|
|
SAI.reset(new ScopArrayInfo(BasePtr, ElementType, getIslCtx(), Sizes, Kind,
|
2016-07-30 17:25:51 +08:00
|
|
|
DL, this, BaseName));
|
|
|
|
ScopArrayInfoSet.insert(SAI.get());
|
2015-09-26 16:55:54 +08:00
|
|
|
} else {
|
2016-02-15 06:31:39 +08:00
|
|
|
SAI->updateElementType(ElementType);
|
2015-11-02 19:29:32 +08:00
|
|
|
// In case of mismatching array sizes, we bail out by setting the run-time
|
|
|
|
// context to false.
|
2016-02-15 06:31:39 +08:00
|
|
|
if (!SAI->updateSizes(Sizes))
|
2015-12-12 17:52:26 +08:00
|
|
|
invalidate(DELINEARIZATION, DebugLoc());
|
2015-09-26 16:55:54 +08:00
|
|
|
}
|
2015-05-23 13:58:27 +08:00
|
|
|
return SAI.get();
|
2014-10-05 19:32:18 +08:00
|
|
|
}
|
|
|
|
|
2016-07-30 17:25:51 +08:00
|
|
|
const ScopArrayInfo *
|
|
|
|
Scop::createScopArrayInfo(Type *ElementType, const std::string &BaseName,
|
|
|
|
const std::vector<unsigned> &Sizes) {
|
|
|
|
auto *DimSizeType = Type::getInt64Ty(getSE()->getContext());
|
|
|
|
std::vector<const SCEV *> SCEVSizes;
|
|
|
|
|
|
|
|
for (auto size : Sizes)
|
2016-09-13 01:08:31 +08:00
|
|
|
if (size)
|
|
|
|
SCEVSizes.push_back(getSE()->getConstant(DimSizeType, size, false));
|
|
|
|
else
|
|
|
|
SCEVSizes.push_back(nullptr);
|
2016-07-30 17:25:51 +08:00
|
|
|
|
2017-01-15 04:25:44 +08:00
|
|
|
auto *SAI = getOrCreateScopArrayInfo(nullptr, ElementType, SCEVSizes,
|
|
|
|
MemoryKind::Array, BaseName.c_str());
|
2016-07-30 17:25:51 +08:00
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
|
2017-05-10 18:59:58 +08:00
|
|
|
const ScopArrayInfo *Scop::getScopArrayInfoOrNull(Value *BasePtr,
|
|
|
|
MemoryKind Kind) {
|
2015-11-11 01:31:31 +08:00
|
|
|
auto *SAI = ScopArrayInfoMap[std::make_pair(BasePtr, Kind)].get();
|
2017-05-10 18:59:58 +08:00
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
|
|
|
|
const ScopArrayInfo *Scop::getScopArrayInfo(Value *BasePtr, MemoryKind Kind) {
|
|
|
|
auto *SAI = getScopArrayInfoOrNull(BasePtr, Kind);
|
2014-10-05 19:32:18 +08:00
|
|
|
assert(SAI && "No ScopArrayInfo available for this base pointer");
|
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
|
2013-01-15 06:40:23 +08:00
|
|
|
std::string Scop::getContextStr() const { return stringFromIslObj(Context); }
|
2016-02-22 00:37:58 +08:00
|
|
|
|
2014-07-03 01:47:48 +08:00
|
|
|
std::string Scop::getAssumedContextStr() const {
|
2016-03-01 21:06:28 +08:00
|
|
|
assert(AssumedContext && "Assumed context not yet built");
|
2014-07-03 01:47:48 +08:00
|
|
|
return stringFromIslObj(AssumedContext);
|
|
|
|
}
|
2016-02-22 00:37:58 +08:00
|
|
|
|
2016-03-01 21:06:28 +08:00
|
|
|
std::string Scop::getInvalidContextStr() const {
|
|
|
|
return stringFromIslObj(InvalidContext);
|
2015-09-16 06:52:53 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
std::string Scop::getNameStr() const {
|
|
|
|
std::string ExitName, EntryName;
|
|
|
|
raw_string_ostream ExitStr(ExitName);
|
|
|
|
raw_string_ostream EntryStr(EntryName);
|
|
|
|
|
2014-01-09 18:42:15 +08:00
|
|
|
R.getEntry()->printAsOperand(EntryStr, false);
|
2011-04-29 14:27:02 +08:00
|
|
|
EntryStr.str();
|
|
|
|
|
|
|
|
if (R.getExit()) {
|
2014-01-09 18:42:15 +08:00
|
|
|
R.getExit()->printAsOperand(ExitStr, false);
|
2011-04-29 14:27:02 +08:00
|
|
|
ExitStr.str();
|
|
|
|
} else
|
|
|
|
ExitName = "FunctionExit";
|
|
|
|
|
|
|
|
return EntryName + "---" + ExitName;
|
|
|
|
}
|
|
|
|
|
2013-01-15 06:40:23 +08:00
|
|
|
__isl_give isl_set *Scop::getContext() const { return isl_set_copy(Context); }
|
2011-10-06 08:03:42 +08:00
|
|
|
__isl_give isl_space *Scop::getParamSpace() const {
|
2015-05-27 05:37:31 +08:00
|
|
|
return isl_set_get_space(Context);
|
2011-10-06 08:03:42 +08:00
|
|
|
}
|
|
|
|
|
2013-10-30 05:05:49 +08:00
|
|
|
__isl_give isl_set *Scop::getAssumedContext() const {
|
2016-03-01 21:06:28 +08:00
|
|
|
assert(AssumedContext && "Assumed context not yet built");
|
2013-10-30 05:05:49 +08:00
|
|
|
return isl_set_copy(AssumedContext);
|
|
|
|
}
|
|
|
|
|
2017-03-17 21:09:52 +08:00
|
|
|
bool Scop::isProfitable(bool ScalarsAreUnprofitable) const {
|
2016-05-11 00:38:09 +08:00
|
|
|
if (PollyProcessUnprofitable)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
if (isEmpty())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
unsigned OptimizableStmtsOrLoops = 0;
|
|
|
|
for (auto &Stmt : *this) {
|
|
|
|
if (Stmt.getNumIterators() == 0)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
bool ContainsArrayAccs = false;
|
|
|
|
bool ContainsScalarAccs = false;
|
|
|
|
for (auto *MA : Stmt) {
|
|
|
|
if (MA->isRead())
|
|
|
|
continue;
|
2017-03-17 21:09:52 +08:00
|
|
|
ContainsArrayAccs |= MA->isLatestArrayKind();
|
|
|
|
ContainsScalarAccs |= MA->isLatestScalarKind();
|
2016-05-11 00:38:09 +08:00
|
|
|
}
|
|
|
|
|
2017-03-17 21:09:52 +08:00
|
|
|
if (!ScalarsAreUnprofitable || (ContainsArrayAccs && !ContainsScalarAccs))
|
2016-05-11 00:38:09 +08:00
|
|
|
OptimizableStmtsOrLoops += Stmt.getNumIterators();
|
|
|
|
}
|
|
|
|
|
|
|
|
return OptimizableStmtsOrLoops > 1;
|
|
|
|
}
|
|
|
|
|
2015-08-21 02:06:30 +08:00
|
|
|
bool Scop::hasFeasibleRuntimeContext() const {
|
2016-03-01 21:06:28 +08:00
|
|
|
auto *PositiveContext = getAssumedContext();
|
2016-04-23 21:00:27 +08:00
|
|
|
auto *NegativeContext = getInvalidContext();
|
2016-03-01 21:06:28 +08:00
|
|
|
PositiveContext = addNonEmptyDomainConstraints(PositiveContext);
|
2016-04-23 21:00:27 +08:00
|
|
|
bool IsFeasible = !(isl_set_is_empty(PositiveContext) ||
|
|
|
|
isl_set_is_subset(PositiveContext, NegativeContext));
|
2016-03-01 21:06:28 +08:00
|
|
|
isl_set_free(PositiveContext);
|
2016-04-23 21:00:27 +08:00
|
|
|
if (!IsFeasible) {
|
|
|
|
isl_set_free(NegativeContext);
|
2016-03-01 21:06:28 +08:00
|
|
|
return false;
|
2016-04-23 21:00:27 +08:00
|
|
|
}
|
2016-03-01 21:06:28 +08:00
|
|
|
|
|
|
|
auto *DomainContext = isl_union_set_params(getDomains());
|
|
|
|
IsFeasible = !isl_set_is_subset(DomainContext, NegativeContext);
|
2016-04-13 01:54:29 +08:00
|
|
|
IsFeasible &= !isl_set_is_subset(Context, NegativeContext);
|
2016-03-01 21:06:28 +08:00
|
|
|
isl_set_free(NegativeContext);
|
|
|
|
isl_set_free(DomainContext);
|
|
|
|
|
2015-08-20 13:58:56 +08:00
|
|
|
return IsFeasible;
|
|
|
|
}
|
|
|
|
|
2015-11-12 10:33:38 +08:00
|
|
|
static std::string toString(AssumptionKind Kind) {
|
|
|
|
switch (Kind) {
|
|
|
|
case ALIASING:
|
|
|
|
return "No-aliasing";
|
|
|
|
case INBOUNDS:
|
|
|
|
return "Inbounds";
|
|
|
|
case WRAPPING:
|
|
|
|
return "No-overflows";
|
Model zext-extend instructions
A zero-extended value can be interpreted as a piecewise defined signed
value. If the value was non-negative it stays the same, otherwise it
is the sum of the original value and 2^n where n is the bit-width of
the original (or operand) type. Examples:
zext i8 127 to i32 -> { [127] }
zext i8 -1 to i32 -> { [256 + (-1)] } = { [255] }
zext i8 %v to i32 -> [v] -> { [v] | v >= 0; [256 + v] | v < 0 }
However, LLVM/Scalar Evolution uses zero-extend (potentially lead by a
truncate) to represent some forms of modulo computation. The left-hand side
of the condition in the code below would result in the SCEV
"zext i1 <false, +, true>for.body" which is just another description
of the C expression "i & 1 != 0" or, equivalently, "i % 2 != 0".
for (i = 0; i < N; i++)
if (i & 1 != 0 /* == i % 2 */)
/* do something */
If we do not make the modulo explicit but only use the mechanism described
above we will get the very restrictive assumption "N < 3", because for all
values of N >= 3 the SCEVAddRecExpr operand of the zero-extend would wrap.
Alternatively, we can make the modulo in the operand explicit in the
resulting piecewise function and thereby avoid the assumption on N. For the
example this would result in the following piecewise affine function:
{ [i0] -> [(1)] : 2*floor((-1 + i0)/2) = -1 + i0;
[i0] -> [(0)] : 2*floor((i0)/2) = i0 }
To this end we can first determine if the (immediate) operand of the
zero-extend can wrap and, in case it might, we will use explicit modulo
semantic to compute the result instead of emitting non-wrapping assumptions.
Note that operands with large bit-widths are less likely to be negative
because it would result in a very large access offset or loop bound after the
zero-extend. To this end one can optimistically assume the operand to be
positive and avoid the piecewise definition if the bit-width is bigger than
some threshold (here MaxZextSmallBitWidth).
We choose to go with a hybrid solution of all modeling techniques described
above. For small bit-widths (up to MaxZextSmallBitWidth) we will model the
wrapping explicitly and use a piecewise defined function. However, if the
bit-width is bigger than MaxZextSmallBitWidth we will employ overflow
assumptions and assume the "former negative" piece will not exist.
llvm-svn: 267408
2016-04-25 22:01:36 +08:00
|
|
|
case UNSIGNED:
|
|
|
|
return "Signed-unsigned";
|
2016-03-27 00:17:00 +08:00
|
|
|
case COMPLEXITY:
|
|
|
|
return "Low complexity";
|
2016-05-11 00:38:09 +08:00
|
|
|
case PROFITABLE:
|
|
|
|
return "Profitable";
|
2015-11-12 10:33:38 +08:00
|
|
|
case ERRORBLOCK:
|
|
|
|
return "No-error";
|
|
|
|
case INFINITELOOP:
|
|
|
|
return "Finite loop";
|
|
|
|
case INVARIANTLOAD:
|
|
|
|
return "Invariant load";
|
|
|
|
case DELINEARIZATION:
|
|
|
|
return "Delinearization";
|
|
|
|
}
|
|
|
|
llvm_unreachable("Unknown AssumptionKind!");
|
|
|
|
}
|
|
|
|
|
2016-06-06 20:16:10 +08:00
|
|
|
bool Scop::isEffectiveAssumption(__isl_keep isl_set *Set, AssumptionSign Sign) {
|
|
|
|
if (Sign == AS_ASSUMPTION) {
|
|
|
|
if (isl_set_is_subset(Context, Set))
|
|
|
|
return false;
|
2015-11-12 10:33:38 +08:00
|
|
|
|
2016-06-06 20:16:10 +08:00
|
|
|
if (isl_set_is_subset(AssumedContext, Set))
|
|
|
|
return false;
|
|
|
|
} else {
|
|
|
|
if (isl_set_is_disjoint(Set, Context))
|
|
|
|
return false;
|
2016-03-01 21:06:28 +08:00
|
|
|
|
2016-06-06 20:16:10 +08:00
|
|
|
if (isl_set_is_subset(Set, InvalidContext))
|
|
|
|
return false;
|
2016-03-01 21:06:28 +08:00
|
|
|
}
|
2016-06-06 20:16:10 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool Scop::trackAssumption(AssumptionKind Kind, __isl_keep isl_set *Set,
|
|
|
|
DebugLoc Loc, AssumptionSign Sign) {
|
|
|
|
if (PollyRemarksMinimal && !isEffectiveAssumption(Set, Sign))
|
|
|
|
return false;
|
2015-11-12 10:33:38 +08:00
|
|
|
|
2016-11-18 06:08:40 +08:00
|
|
|
// Do never emit trivial assumptions as they only clutter the output.
|
|
|
|
if (!PollyRemarksMinimal) {
|
|
|
|
isl_set *Univ = nullptr;
|
|
|
|
if (Sign == AS_ASSUMPTION)
|
|
|
|
Univ = isl_set_universe(isl_set_get_space(Set));
|
|
|
|
|
|
|
|
bool IsTrivial = (Sign == AS_RESTRICTION && isl_set_is_empty(Set)) ||
|
|
|
|
(Sign == AS_ASSUMPTION && isl_set_is_equal(Univ, Set));
|
|
|
|
isl_set_free(Univ);
|
|
|
|
|
|
|
|
if (IsTrivial)
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-11-18 05:41:08 +08:00
|
|
|
switch (Kind) {
|
|
|
|
case ALIASING:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsAliasing++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case INBOUNDS:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsInbounds++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case WRAPPING:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsWrapping++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case UNSIGNED:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsUnsigned++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case COMPLEXITY:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsComplexity++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case PROFITABLE:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsUnprofitable++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case ERRORBLOCK:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsErrorBlock++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case INFINITELOOP:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsInfiniteLoop++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case INVARIANTLOAD:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsInvariantLoad++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
case DELINEARIZATION:
|
2016-11-18 22:37:08 +08:00
|
|
|
AssumptionsDelinearization++;
|
2016-11-18 05:41:08 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2016-05-23 20:38:05 +08:00
|
|
|
auto &F = getFunction();
|
2016-03-01 21:06:28 +08:00
|
|
|
auto Suffix = Sign == AS_ASSUMPTION ? " assumption:\t" : " restriction:\t";
|
|
|
|
std::string Msg = toString(Kind) + Suffix + stringFromIslObj(Set);
|
2015-11-12 10:33:38 +08:00
|
|
|
emitOptimizationRemarkAnalysis(F.getContext(), DEBUG_TYPE, F, Loc, Msg);
|
2016-03-01 21:06:28 +08:00
|
|
|
return true;
|
2015-11-12 10:33:38 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::addAssumption(AssumptionKind Kind, __isl_take isl_set *Set,
|
2016-03-01 21:06:28 +08:00
|
|
|
DebugLoc Loc, AssumptionSign Sign) {
|
2016-04-12 21:27:35 +08:00
|
|
|
// Simplify the assumptions/restrictions first.
|
|
|
|
Set = isl_set_gist_params(Set, getContext());
|
|
|
|
|
2016-03-01 21:06:28 +08:00
|
|
|
if (!trackAssumption(Kind, Set, Loc, Sign)) {
|
|
|
|
isl_set_free(Set);
|
|
|
|
return;
|
2015-11-12 00:22:36 +08:00
|
|
|
}
|
|
|
|
|
2016-03-01 21:06:28 +08:00
|
|
|
if (Sign == AS_ASSUMPTION) {
|
|
|
|
AssumedContext = isl_set_intersect(AssumedContext, Set);
|
|
|
|
AssumedContext = isl_set_coalesce(AssumedContext);
|
|
|
|
} else {
|
|
|
|
InvalidContext = isl_set_union(InvalidContext, Set);
|
|
|
|
InvalidContext = isl_set_coalesce(InvalidContext);
|
|
|
|
}
|
2014-07-03 01:47:48 +08:00
|
|
|
}
|
|
|
|
|
2016-04-12 21:27:35 +08:00
|
|
|
void Scop::recordAssumption(AssumptionKind Kind, __isl_take isl_set *Set,
|
2016-04-12 21:28:39 +08:00
|
|
|
DebugLoc Loc, AssumptionSign Sign, BasicBlock *BB) {
|
2016-11-10 19:44:10 +08:00
|
|
|
assert((isl_set_is_params(Set) || BB) &&
|
|
|
|
"Assumptions without a basic block must be parameter sets");
|
2016-04-12 21:28:39 +08:00
|
|
|
RecordedAssumptions.push_back({Kind, Sign, Set, Loc, BB});
|
2016-04-12 21:27:35 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::addRecordedAssumptions() {
|
|
|
|
while (!RecordedAssumptions.empty()) {
|
|
|
|
const Assumption &AS = RecordedAssumptions.pop_back_val();
|
2016-04-12 21:28:39 +08:00
|
|
|
|
2016-04-28 22:32:58 +08:00
|
|
|
if (!AS.BB) {
|
|
|
|
addAssumption(AS.Kind, AS.Set, AS.Loc, AS.Sign);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-05-10 20:42:26 +08:00
|
|
|
// If the domain was deleted the assumptions are void.
|
|
|
|
isl_set *Dom = getDomainConditions(AS.BB);
|
|
|
|
if (!Dom) {
|
|
|
|
isl_set_free(AS.Set);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-04-12 21:28:39 +08:00
|
|
|
// If a basic block was given use its domain to simplify the assumption.
|
2016-04-28 22:32:58 +08:00
|
|
|
// In case of restrictions we know they only have to hold on the domain,
|
|
|
|
// thus we can intersect them with the domain of the block. However, for
|
|
|
|
// assumptions the domain has to imply them, thus:
|
|
|
|
// _ _____
|
|
|
|
// Dom => S <==> A v B <==> A - B
|
|
|
|
//
|
2017-01-07 01:30:34 +08:00
|
|
|
// To avoid the complement we will register A - B as a restriction not an
|
2016-04-28 22:32:58 +08:00
|
|
|
// assumption.
|
|
|
|
isl_set *S = AS.Set;
|
|
|
|
if (AS.Sign == AS_RESTRICTION)
|
|
|
|
S = isl_set_params(isl_set_intersect(S, Dom));
|
|
|
|
else /* (AS.Sign == AS_ASSUMPTION) */
|
|
|
|
S = isl_set_params(isl_set_subtract(Dom, S));
|
2016-04-12 21:28:39 +08:00
|
|
|
|
2016-04-28 22:32:58 +08:00
|
|
|
addAssumption(AS.Kind, S, AS.Loc, AS_RESTRICTION);
|
2016-04-12 21:27:35 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-12-12 17:52:26 +08:00
|
|
|
void Scop::invalidate(AssumptionKind Kind, DebugLoc Loc) {
|
2016-03-01 21:06:28 +08:00
|
|
|
addAssumption(Kind, isl_set_empty(getParamSpace()), Loc, AS_ASSUMPTION);
|
2015-12-12 17:52:26 +08:00
|
|
|
}
|
|
|
|
|
2016-03-01 21:06:28 +08:00
|
|
|
__isl_give isl_set *Scop::getInvalidContext() const {
|
|
|
|
return isl_set_copy(InvalidContext);
|
2015-09-16 06:52:53 +08:00
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
void Scop::printContext(raw_ostream &OS) const {
|
|
|
|
OS << "Context:\n";
|
2016-03-01 21:06:28 +08:00
|
|
|
OS.indent(4) << Context << "\n";
|
2011-11-08 23:41:28 +08:00
|
|
|
|
2014-07-03 01:47:48 +08:00
|
|
|
OS.indent(4) << "Assumed Context:\n";
|
2016-03-01 21:06:28 +08:00
|
|
|
OS.indent(4) << AssumedContext << "\n";
|
2015-09-16 06:52:53 +08:00
|
|
|
|
2016-03-01 21:06:28 +08:00
|
|
|
OS.indent(4) << "Invalid Context:\n";
|
|
|
|
OS.indent(4) << InvalidContext << "\n";
|
2015-09-16 06:52:53 +08:00
|
|
|
|
2016-04-26 00:15:13 +08:00
|
|
|
unsigned Dim = 0;
|
|
|
|
for (const SCEV *Parameter : Parameters)
|
|
|
|
OS.indent(4) << "p" << Dim++ << ": " << *Parameter << "\n";
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2014-09-18 19:17:17 +08:00
|
|
|
void Scop::printAliasAssumptions(raw_ostream &OS) const {
|
2015-07-25 20:31:03 +08:00
|
|
|
int noOfGroups = 0;
|
|
|
|
for (const MinMaxVectorPairTy &Pair : MinMaxAliasGroups) {
|
2015-07-26 21:14:38 +08:00
|
|
|
if (Pair.second.size() == 0)
|
2015-07-24 01:04:54 +08:00
|
|
|
noOfGroups += 1;
|
|
|
|
else
|
2015-07-26 21:14:38 +08:00
|
|
|
noOfGroups += Pair.second.size();
|
2015-07-24 01:04:54 +08:00
|
|
|
}
|
|
|
|
|
2015-07-25 20:31:03 +08:00
|
|
|
OS.indent(4) << "Alias Groups (" << noOfGroups << "):\n";
|
2014-09-18 19:17:17 +08:00
|
|
|
if (MinMaxAliasGroups.empty()) {
|
|
|
|
OS.indent(8) << "n/a\n";
|
|
|
|
return;
|
|
|
|
}
|
2015-07-24 01:04:54 +08:00
|
|
|
|
2015-07-25 20:31:03 +08:00
|
|
|
for (const MinMaxVectorPairTy &Pair : MinMaxAliasGroups) {
|
2015-07-24 01:04:54 +08:00
|
|
|
|
|
|
|
// If the group has no read only accesses print the write accesses.
|
2015-07-26 21:14:38 +08:00
|
|
|
if (Pair.second.empty()) {
|
2015-07-24 01:04:54 +08:00
|
|
|
OS.indent(8) << "[[";
|
2015-07-26 21:14:38 +08:00
|
|
|
for (const MinMaxAccessTy &MMANonReadOnly : Pair.first) {
|
2015-07-25 20:31:03 +08:00
|
|
|
OS << " <" << MMANonReadOnly.first << ", " << MMANonReadOnly.second
|
|
|
|
<< ">";
|
2015-07-24 01:04:54 +08:00
|
|
|
}
|
|
|
|
OS << " ]]\n";
|
|
|
|
}
|
|
|
|
|
2015-07-26 21:14:38 +08:00
|
|
|
for (const MinMaxAccessTy &MMAReadOnly : Pair.second) {
|
2015-07-24 01:04:54 +08:00
|
|
|
OS.indent(8) << "[[";
|
2015-07-25 20:31:03 +08:00
|
|
|
OS << " <" << MMAReadOnly.first << ", " << MMAReadOnly.second << ">";
|
2015-07-26 21:14:38 +08:00
|
|
|
for (const MinMaxAccessTy &MMANonReadOnly : Pair.first) {
|
2015-07-25 20:31:03 +08:00
|
|
|
OS << " <" << MMANonReadOnly.first << ", " << MMANonReadOnly.second
|
|
|
|
<< ">";
|
2015-07-24 01:04:54 +08:00
|
|
|
}
|
|
|
|
OS << " ]]\n";
|
|
|
|
}
|
2014-09-18 19:17:17 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
void Scop::printStatements(raw_ostream &OS) const {
|
|
|
|
OS << "Statements {\n";
|
|
|
|
|
2015-05-27 13:16:57 +08:00
|
|
|
for (const ScopStmt &Stmt : *this)
|
|
|
|
OS.indent(4) << Stmt;
|
2011-04-29 14:27:02 +08:00
|
|
|
|
|
|
|
OS.indent(4) << "}\n";
|
|
|
|
}
|
|
|
|
|
2015-05-20 16:05:31 +08:00
|
|
|
void Scop::printArrayInfo(raw_ostream &OS) const {
|
|
|
|
OS << "Arrays {\n";
|
|
|
|
|
2015-05-23 13:58:27 +08:00
|
|
|
for (auto &Array : arrays())
|
2016-07-30 17:25:51 +08:00
|
|
|
Array->print(OS);
|
2015-05-20 16:05:31 +08:00
|
|
|
|
|
|
|
OS.indent(4) << "}\n";
|
2015-08-12 23:27:16 +08:00
|
|
|
|
|
|
|
OS.indent(4) << "Arrays (Bounds as pw_affs) {\n";
|
|
|
|
|
|
|
|
for (auto &Array : arrays())
|
2016-07-30 17:25:51 +08:00
|
|
|
Array->print(OS, /* SizeAsPwAff */ true);
|
2015-08-12 23:27:16 +08:00
|
|
|
|
|
|
|
OS.indent(4) << "}\n";
|
2015-05-20 16:05:31 +08:00
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
void Scop::print(raw_ostream &OS) const {
|
2016-05-23 20:38:05 +08:00
|
|
|
OS.indent(4) << "Function: " << getFunction().getName() << "\n";
|
2014-03-19 02:05:38 +08:00
|
|
|
OS.indent(4) << "Region: " << getNameStr() << "\n";
|
2015-01-14 02:31:55 +08:00
|
|
|
OS.indent(4) << "Max Loop Depth: " << getMaxLoopDepth() << "\n";
|
2015-09-30 07:47:21 +08:00
|
|
|
OS.indent(4) << "Invariant Accesses: {\n";
|
2015-10-10 01:12:26 +08:00
|
|
|
for (const auto &IAClass : InvariantEquivClasses) {
|
2016-07-11 20:15:10 +08:00
|
|
|
const auto &MAs = IAClass.InvariantAccesses;
|
2015-10-18 20:39:19 +08:00
|
|
|
if (MAs.empty()) {
|
2016-07-11 20:15:10 +08:00
|
|
|
OS.indent(12) << "Class Pointer: " << *IAClass.IdentifyingPointer << "\n";
|
2015-10-10 01:12:26 +08:00
|
|
|
} else {
|
2015-10-18 20:39:19 +08:00
|
|
|
MAs.front()->print(OS);
|
2016-07-11 20:15:10 +08:00
|
|
|
OS.indent(12) << "Execution Context: " << IAClass.ExecutionContext
|
|
|
|
<< "\n";
|
2015-10-10 01:12:26 +08:00
|
|
|
}
|
2015-09-30 07:47:21 +08:00
|
|
|
}
|
|
|
|
OS.indent(4) << "}\n";
|
2011-04-29 14:27:02 +08:00
|
|
|
printContext(OS.indent(4));
|
2015-05-20 16:05:31 +08:00
|
|
|
printArrayInfo(OS.indent(4));
|
2014-09-18 19:17:17 +08:00
|
|
|
printAliasAssumptions(OS);
|
2011-04-29 14:27:02 +08:00
|
|
|
printStatements(OS.indent(4));
|
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::dump() const { print(dbgs()); }
|
|
|
|
|
2016-02-17 23:49:21 +08:00
|
|
|
isl_ctx *Scop::getIslCtx() const { return IslCtx.get(); }
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2016-04-29 18:44:41 +08:00
|
|
|
__isl_give PWACtx Scop::getPwAff(const SCEV *E, BasicBlock *BB,
|
|
|
|
bool NonNegative) {
|
2016-03-27 00:17:00 +08:00
|
|
|
// First try to use the SCEVAffinator to generate a piecewise defined
|
|
|
|
// affine function from @p E in the context of @p BB. If that tasks becomes to
|
|
|
|
// complex the affinator might return a nullptr. In such a case we invalidate
|
|
|
|
// the SCoP and return a dummy value. This way we do not need to add error
|
2017-01-07 01:30:34 +08:00
|
|
|
// handling code to all users of this function.
|
2016-04-23 22:31:17 +08:00
|
|
|
auto PWAC = Affinator.getPwAff(E, BB);
|
2016-04-29 18:44:41 +08:00
|
|
|
if (PWAC.first) {
|
2016-05-10 19:45:46 +08:00
|
|
|
// TODO: We could use a heuristic and either use:
|
|
|
|
// SCEVAffinator::takeNonNegativeAssumption
|
|
|
|
// or
|
|
|
|
// SCEVAffinator::interpretAsUnsigned
|
|
|
|
// to deal with unsigned or "NonNegative" SCEVs.
|
2016-04-29 18:44:41 +08:00
|
|
|
if (NonNegative)
|
|
|
|
Affinator.takeNonNegativeAssumption(PWAC);
|
2016-04-23 22:31:17 +08:00
|
|
|
return PWAC;
|
2016-04-29 18:44:41 +08:00
|
|
|
}
|
2016-03-27 00:17:00 +08:00
|
|
|
|
|
|
|
auto DL = BB ? BB->getTerminator()->getDebugLoc() : DebugLoc();
|
|
|
|
invalidate(COMPLEXITY, DL);
|
|
|
|
return Affinator.getPwAff(SE->getZero(E->getType()), BB);
|
2015-08-12 18:19:50 +08:00
|
|
|
}
|
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
__isl_give isl_union_set *Scop::getDomains() const {
|
2017-03-17 17:02:50 +08:00
|
|
|
isl_space *EmptySpace = isl_space_params_alloc(getIslCtx(), 0);
|
|
|
|
isl_union_set *Domain = isl_union_set_empty(EmptySpace);
|
2012-02-14 22:02:40 +08:00
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
for (const ScopStmt &Stmt : *this)
|
2015-05-27 13:16:57 +08:00
|
|
|
Domain = isl_union_set_add_set(Domain, Stmt.getDomain());
|
2012-02-14 22:02:40 +08:00
|
|
|
|
|
|
|
return Domain;
|
|
|
|
}
|
|
|
|
|
2016-04-23 22:31:17 +08:00
|
|
|
__isl_give isl_pw_aff *Scop::getPwAffOnly(const SCEV *E, BasicBlock *BB) {
|
|
|
|
PWACtx PWAC = getPwAff(E, BB);
|
|
|
|
isl_set_free(PWAC.second);
|
|
|
|
return PWAC.first;
|
|
|
|
}
|
|
|
|
|
2015-11-12 22:07:09 +08:00
|
|
|
__isl_give isl_union_map *
|
|
|
|
Scop::getAccessesOfType(std::function<bool(MemoryAccess &)> Predicate) {
|
|
|
|
isl_union_map *Accesses = isl_union_map_empty(getParamSpace());
|
2014-07-11 15:12:10 +08:00
|
|
|
|
2015-05-27 13:16:57 +08:00
|
|
|
for (ScopStmt &Stmt : *this) {
|
|
|
|
for (MemoryAccess *MA : Stmt) {
|
2015-11-12 22:07:09 +08:00
|
|
|
if (!Predicate(*MA))
|
2014-07-11 15:12:10 +08:00
|
|
|
continue;
|
|
|
|
|
2015-05-27 13:16:57 +08:00
|
|
|
isl_set *Domain = Stmt.getDomain();
|
2014-07-11 15:12:10 +08:00
|
|
|
isl_map *AccessDomain = MA->getAccessRelation();
|
|
|
|
AccessDomain = isl_map_intersect_domain(AccessDomain, Domain);
|
2015-11-12 22:07:09 +08:00
|
|
|
Accesses = isl_union_map_add_map(Accesses, AccessDomain);
|
2014-07-11 15:12:10 +08:00
|
|
|
}
|
|
|
|
}
|
2015-11-12 22:07:09 +08:00
|
|
|
return isl_union_map_coalesce(Accesses);
|
2014-07-11 15:12:10 +08:00
|
|
|
}
|
|
|
|
|
2015-11-12 22:07:09 +08:00
|
|
|
__isl_give isl_union_map *Scop::getMustWrites() {
|
|
|
|
return getAccessesOfType([](MemoryAccess &MA) { return MA.isMustWrite(); });
|
|
|
|
}
|
2014-07-11 15:12:10 +08:00
|
|
|
|
2015-11-12 22:07:09 +08:00
|
|
|
__isl_give isl_union_map *Scop::getMayWrites() {
|
|
|
|
return getAccessesOfType([](MemoryAccess &MA) { return MA.isMayWrite(); });
|
2014-07-11 15:12:10 +08:00
|
|
|
}
|
|
|
|
|
2014-02-21 05:43:54 +08:00
|
|
|
__isl_give isl_union_map *Scop::getWrites() {
|
2015-11-12 22:07:09 +08:00
|
|
|
return getAccessesOfType([](MemoryAccess &MA) { return MA.isWrite(); });
|
2014-02-21 05:43:54 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
__isl_give isl_union_map *Scop::getReads() {
|
2015-11-12 22:07:09 +08:00
|
|
|
return getAccessesOfType([](MemoryAccess &MA) { return MA.isRead(); });
|
2014-02-21 05:43:54 +08:00
|
|
|
}
|
|
|
|
|
2015-11-12 22:07:13 +08:00
|
|
|
__isl_give isl_union_map *Scop::getAccesses() {
|
|
|
|
return getAccessesOfType([](MemoryAccess &MA) { return true; });
|
|
|
|
}
|
|
|
|
|
2016-09-14 14:26:09 +08:00
|
|
|
// Check whether @p Node is an extension node.
|
|
|
|
//
|
|
|
|
// @return true if @p Node is an extension node.
|
|
|
|
isl_bool isNotExtNode(__isl_keep isl_schedule_node *Node, void *User) {
|
|
|
|
if (isl_schedule_node_get_type(Node) == isl_schedule_node_extension)
|
|
|
|
return isl_bool_error;
|
|
|
|
else
|
|
|
|
return isl_bool_true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool Scop::containsExtensionNode(__isl_keep isl_schedule *Schedule) {
|
|
|
|
return isl_schedule_foreach_schedule_node_top_down(Schedule, isNotExtNode,
|
|
|
|
nullptr) == isl_stat_error;
|
|
|
|
}
|
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
__isl_give isl_union_map *Scop::getSchedule() const {
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *Tree = getScheduleTree();
|
2016-09-14 14:26:09 +08:00
|
|
|
if (containsExtensionNode(Tree)) {
|
|
|
|
isl_schedule_free(Tree);
|
|
|
|
return nullptr;
|
|
|
|
}
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *S = isl_schedule_get_map(Tree);
|
2015-07-14 17:33:13 +08:00
|
|
|
isl_schedule_free(Tree);
|
|
|
|
return S;
|
|
|
|
}
|
2014-02-21 05:43:54 +08:00
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
__isl_give isl_schedule *Scop::getScheduleTree() const {
|
|
|
|
return isl_schedule_intersect_domain(isl_schedule_copy(Schedule),
|
|
|
|
getDomains());
|
|
|
|
}
|
2014-06-28 16:59:38 +08:00
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
void Scop::setSchedule(__isl_take isl_union_map *NewSchedule) {
|
|
|
|
auto *S = isl_schedule_from_domain(getDomains());
|
|
|
|
S = isl_schedule_insert_partial_schedule(
|
|
|
|
S, isl_multi_union_pw_aff_from_union_map(NewSchedule));
|
|
|
|
isl_schedule_free(Schedule);
|
|
|
|
Schedule = S;
|
|
|
|
}
|
|
|
|
|
|
|
|
void Scop::setScheduleTree(__isl_take isl_schedule *NewSchedule) {
|
|
|
|
isl_schedule_free(Schedule);
|
|
|
|
Schedule = NewSchedule;
|
2014-02-21 05:43:54 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
bool Scop::restrictDomains(__isl_take isl_union_set *Domain) {
|
|
|
|
bool Changed = false;
|
2015-05-27 13:16:57 +08:00
|
|
|
for (ScopStmt &Stmt : *this) {
|
|
|
|
isl_union_set *StmtDomain = isl_union_set_from_set(Stmt.getDomain());
|
2014-02-21 05:43:54 +08:00
|
|
|
isl_union_set *NewStmtDomain = isl_union_set_intersect(
|
|
|
|
isl_union_set_copy(StmtDomain), isl_union_set_copy(Domain));
|
|
|
|
|
|
|
|
if (isl_union_set_is_subset(StmtDomain, NewStmtDomain)) {
|
|
|
|
isl_union_set_free(StmtDomain);
|
|
|
|
isl_union_set_free(NewStmtDomain);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
Changed = true;
|
|
|
|
|
|
|
|
isl_union_set_free(StmtDomain);
|
|
|
|
NewStmtDomain = isl_union_set_coalesce(NewStmtDomain);
|
|
|
|
|
|
|
|
if (isl_union_set_is_empty(NewStmtDomain)) {
|
2015-05-27 13:16:57 +08:00
|
|
|
Stmt.restrictDomain(isl_set_empty(Stmt.getDomainSpace()));
|
2014-02-21 05:43:54 +08:00
|
|
|
isl_union_set_free(NewStmtDomain);
|
|
|
|
} else
|
2015-05-27 13:16:57 +08:00
|
|
|
Stmt.restrictDomain(isl_set_from_union_set(NewStmtDomain));
|
2014-02-21 05:43:54 +08:00
|
|
|
}
|
|
|
|
isl_union_set_free(Domain);
|
|
|
|
return Changed;
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
ScalarEvolution *Scop::getSE() const { return SE; }
|
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
struct MapToDimensionDataTy {
|
|
|
|
int N;
|
|
|
|
isl_union_pw_multi_aff *Res;
|
|
|
|
};
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
// Create a function that maps the elements of 'Set' to its N-th dimension and
|
|
|
|
// add it to User->Res.
|
2015-07-14 17:33:13 +08:00
|
|
|
//
|
2015-12-22 06:45:53 +08:00
|
|
|
// @param Set The input set.
|
|
|
|
// @param User->N The dimension to map to.
|
|
|
|
// @param User->Res The isl_union_pw_multi_aff to which to add the result.
|
2015-07-14 17:33:13 +08:00
|
|
|
//
|
2015-12-22 06:45:53 +08:00
|
|
|
// @returns isl_stat_ok if no error occured, othewise isl_stat_error.
|
2015-07-14 17:33:13 +08:00
|
|
|
static isl_stat mapToDimension_AddSet(__isl_take isl_set *Set, void *User) {
|
|
|
|
struct MapToDimensionDataTy *Data = (struct MapToDimensionDataTy *)User;
|
|
|
|
int Dim;
|
|
|
|
isl_space *Space;
|
|
|
|
isl_pw_multi_aff *PMA;
|
|
|
|
|
|
|
|
Dim = isl_set_dim(Set, isl_dim_set);
|
|
|
|
Space = isl_set_get_space(Set);
|
|
|
|
PMA = isl_pw_multi_aff_project_out_map(Space, isl_dim_set, Data->N,
|
|
|
|
Dim - Data->N);
|
|
|
|
if (Data->N > 1)
|
|
|
|
PMA = isl_pw_multi_aff_drop_dims(PMA, isl_dim_out, 0, Data->N - 1);
|
|
|
|
Data->Res = isl_union_pw_multi_aff_add_pw_multi_aff(Data->Res, PMA);
|
|
|
|
|
|
|
|
isl_set_free(Set);
|
|
|
|
|
|
|
|
return isl_stat_ok;
|
|
|
|
}
|
|
|
|
|
2016-09-02 14:33:33 +08:00
|
|
|
// Create an isl_multi_union_aff that defines an identity mapping from the
|
|
|
|
// elements of USet to their N-th dimension.
|
2015-12-22 06:45:53 +08:00
|
|
|
//
|
|
|
|
// # Example:
|
|
|
|
//
|
|
|
|
// Domain: { A[i,j]; B[i,j,k] }
|
|
|
|
// N: 1
|
2015-07-14 17:33:13 +08:00
|
|
|
//
|
2015-12-22 06:45:53 +08:00
|
|
|
// Resulting Mapping: { {A[i,j] -> [(j)]; B[i,j,k] -> [(j)] }
|
|
|
|
//
|
|
|
|
// @param USet A union set describing the elements for which to generate a
|
|
|
|
// mapping.
|
2015-07-14 17:33:13 +08:00
|
|
|
// @param N The dimension to map to.
|
2015-12-22 06:45:53 +08:00
|
|
|
// @returns A mapping from USet to its N-th dimension.
|
2015-07-14 17:33:13 +08:00
|
|
|
static __isl_give isl_multi_union_pw_aff *
|
2015-12-22 06:45:53 +08:00
|
|
|
mapToDimension(__isl_take isl_union_set *USet, int N) {
|
|
|
|
assert(N >= 0);
|
2015-12-22 07:01:53 +08:00
|
|
|
assert(USet);
|
2015-12-22 06:45:53 +08:00
|
|
|
assert(!isl_union_set_is_empty(USet));
|
2015-09-10 23:27:46 +08:00
|
|
|
|
2015-07-14 17:33:13 +08:00
|
|
|
struct MapToDimensionDataTy Data;
|
|
|
|
|
2015-12-22 06:45:53 +08:00
|
|
|
auto *Space = isl_union_set_get_space(USet);
|
|
|
|
auto *PwAff = isl_union_pw_multi_aff_empty(Space);
|
2015-07-14 17:33:13 +08:00
|
|
|
|
2015-12-22 06:45:53 +08:00
|
|
|
Data = {N, PwAff};
|
|
|
|
|
|
|
|
auto Res = isl_union_set_foreach_set(USet, &mapToDimension_AddSet, &Data);
|
2016-01-20 23:41:30 +08:00
|
|
|
(void)Res;
|
|
|
|
|
2015-12-22 06:45:53 +08:00
|
|
|
assert(Res == isl_stat_ok);
|
|
|
|
|
|
|
|
isl_union_set_free(USet);
|
2015-07-14 17:33:13 +08:00
|
|
|
return isl_multi_union_pw_aff_from_union_pw_multi_aff(Data.Res);
|
|
|
|
}
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
void Scop::addScopStmt(BasicBlock *BB, Loop *SurroundingLoop) {
|
2016-11-22 04:09:40 +08:00
|
|
|
assert(BB && "Unexpected nullptr!");
|
2017-03-16 06:16:43 +08:00
|
|
|
Stmts.emplace_back(*this, *BB, SurroundingLoop);
|
2016-11-22 04:09:40 +08:00
|
|
|
auto *Stmt = &Stmts.back();
|
|
|
|
StmtMap[BB] = Stmt;
|
|
|
|
}
|
|
|
|
|
2017-03-16 06:16:43 +08:00
|
|
|
void Scop::addScopStmt(Region *R, Loop *SurroundingLoop) {
|
2016-11-22 04:09:40 +08:00
|
|
|
assert(R && "Unexpected nullptr!");
|
2017-03-16 06:16:43 +08:00
|
|
|
Stmts.emplace_back(*this, *R, SurroundingLoop);
|
2016-11-22 04:09:40 +08:00
|
|
|
auto *Stmt = &Stmts.back();
|
|
|
|
for (BasicBlock *BB : R->blocks())
|
2015-07-14 17:33:13 +08:00
|
|
|
StmtMap[BB] = Stmt;
|
|
|
|
}
|
|
|
|
|
2016-09-14 14:26:09 +08:00
|
|
|
ScopStmt *Scop::addScopStmt(__isl_take isl_map *SourceRel,
|
|
|
|
__isl_take isl_map *TargetRel,
|
|
|
|
__isl_take isl_set *Domain) {
|
2016-11-09 12:24:49 +08:00
|
|
|
#ifndef NDEBUG
|
2016-11-06 05:02:43 +08:00
|
|
|
isl_set *SourceDomain = isl_map_domain(isl_map_copy(SourceRel));
|
|
|
|
isl_set *TargetDomain = isl_map_domain(isl_map_copy(TargetRel));
|
|
|
|
assert(isl_set_is_subset(Domain, TargetDomain) &&
|
|
|
|
"Target access not defined for complete statement domain");
|
|
|
|
assert(isl_set_is_subset(Domain, SourceDomain) &&
|
|
|
|
"Source access not defined for complete statement domain");
|
|
|
|
isl_set_free(SourceDomain);
|
|
|
|
isl_set_free(TargetDomain);
|
2016-11-09 12:24:49 +08:00
|
|
|
#endif
|
2016-09-14 14:26:09 +08:00
|
|
|
Stmts.emplace_back(*this, SourceRel, TargetRel, Domain);
|
|
|
|
CopyStmtsNum++;
|
|
|
|
return &(Stmts.back());
|
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
void Scop::buildSchedule(LoopInfo &LI) {
|
2016-05-23 20:42:38 +08:00
|
|
|
Loop *L = getLoopSurroundingScop(*this, LI);
|
2016-02-01 19:54:13 +08:00
|
|
|
LoopStackTy LoopStack({LoopStackElementTy(L, nullptr, 0)});
|
2016-05-19 20:34:57 +08:00
|
|
|
buildSchedule(getRegion().getNode(), LoopStack, LI);
|
2016-04-04 03:36:52 +08:00
|
|
|
assert(LoopStack.size() == 1 && LoopStack.back().L == L);
|
|
|
|
Schedule = LoopStack[0].Schedule;
|
2016-01-06 20:59:23 +08:00
|
|
|
}
|
|
|
|
|
2016-02-01 19:54:13 +08:00
|
|
|
/// To generate a schedule for the elements in a Region we traverse the Region
|
|
|
|
/// in reverse-post-order and add the contained RegionNodes in traversal order
|
|
|
|
/// to the schedule of the loop that is currently at the top of the LoopStack.
|
|
|
|
/// For loop-free codes, this results in a correct sequential ordering.
|
|
|
|
///
|
|
|
|
/// Example:
|
|
|
|
/// bb1(0)
|
|
|
|
/// / \.
|
|
|
|
/// bb2(1) bb3(2)
|
|
|
|
/// \ / \.
|
|
|
|
/// bb4(3) bb5(4)
|
|
|
|
/// \ /
|
|
|
|
/// bb6(5)
|
|
|
|
///
|
|
|
|
/// Including loops requires additional processing. Whenever a loop header is
|
|
|
|
/// encountered, the corresponding loop is added to the @p LoopStack. Starting
|
|
|
|
/// from an empty schedule, we first process all RegionNodes that are within
|
|
|
|
/// this loop and complete the sequential schedule at this loop-level before
|
|
|
|
/// processing about any other nodes. To implement this
|
|
|
|
/// loop-nodes-first-processing, the reverse post-order traversal is
|
|
|
|
/// insufficient. Hence, we additionally check if the traversal yields
|
|
|
|
/// sub-regions or blocks that are outside the last loop on the @p LoopStack.
|
|
|
|
/// These region-nodes are then queue and only traverse after the all nodes
|
|
|
|
/// within the current loop have been processed.
|
2016-05-19 20:34:57 +08:00
|
|
|
void Scop::buildSchedule(Region *R, LoopStackTy &LoopStack, LoopInfo &LI) {
|
2016-05-23 20:42:38 +08:00
|
|
|
Loop *OuterScopLoop = getLoopSurroundingScop(*this, LI);
|
2016-02-01 19:54:13 +08:00
|
|
|
|
|
|
|
ReversePostOrderTraversal<Region *> RTraversal(R);
|
|
|
|
std::deque<RegionNode *> WorkList(RTraversal.begin(), RTraversal.end());
|
|
|
|
std::deque<RegionNode *> DelayList;
|
|
|
|
bool LastRNWaiting = false;
|
|
|
|
|
|
|
|
// Iterate over the region @p R in reverse post-order but queue
|
|
|
|
// sub-regions/blocks iff they are not part of the last encountered but not
|
|
|
|
// completely traversed loop. The variable LastRNWaiting is a flag to indicate
|
|
|
|
// that we queued the last sub-region/block from the reverse post-order
|
|
|
|
// iterator. If it is set we have to explore the next sub-region/block from
|
|
|
|
// the iterator (if any) to guarantee progress. If it is not set we first try
|
|
|
|
// the next queued sub-region/blocks.
|
|
|
|
while (!WorkList.empty() || !DelayList.empty()) {
|
|
|
|
RegionNode *RN;
|
|
|
|
|
|
|
|
if ((LastRNWaiting && !WorkList.empty()) || DelayList.size() == 0) {
|
|
|
|
RN = WorkList.front();
|
|
|
|
WorkList.pop_front();
|
|
|
|
LastRNWaiting = false;
|
|
|
|
} else {
|
|
|
|
RN = DelayList.front();
|
|
|
|
DelayList.pop_front();
|
|
|
|
}
|
|
|
|
|
|
|
|
Loop *L = getRegionNodeLoop(RN, LI);
|
2016-05-23 20:40:48 +08:00
|
|
|
if (!contains(L))
|
2016-02-01 19:54:13 +08:00
|
|
|
L = OuterScopLoop;
|
|
|
|
|
2016-04-04 03:36:52 +08:00
|
|
|
Loop *LastLoop = LoopStack.back().L;
|
2016-02-01 19:54:13 +08:00
|
|
|
if (LastLoop != L) {
|
2016-04-04 07:09:06 +08:00
|
|
|
if (LastLoop && !LastLoop->contains(L)) {
|
2016-02-01 19:54:13 +08:00
|
|
|
LastRNWaiting = true;
|
|
|
|
DelayList.push_back(RN);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
LoopStack.push_back({L, nullptr, 0});
|
|
|
|
}
|
2016-05-19 20:34:57 +08:00
|
|
|
buildSchedule(RN, LoopStack, LI);
|
2016-02-01 19:54:13 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-05-19 20:34:57 +08:00
|
|
|
void Scop::buildSchedule(RegionNode *RN, LoopStackTy &LoopStack, LoopInfo &LI) {
|
2016-01-06 20:59:23 +08:00
|
|
|
|
2016-01-06 23:30:06 +08:00
|
|
|
if (RN->isSubRegion()) {
|
|
|
|
auto *LocalRegion = RN->getNodeAs<Region>();
|
2016-05-19 20:34:57 +08:00
|
|
|
if (!isNonAffineSubRegion(LocalRegion)) {
|
|
|
|
buildSchedule(LocalRegion, LoopStack, LI);
|
2016-01-06 23:30:06 +08:00
|
|
|
return;
|
2015-09-10 23:27:46 +08:00
|
|
|
}
|
2016-01-06 23:30:06 +08:00
|
|
|
}
|
2015-02-24 20:00:50 +08:00
|
|
|
|
2016-02-01 19:54:13 +08:00
|
|
|
auto &LoopData = LoopStack.back();
|
|
|
|
LoopData.NumBlocksProcessed += getNumBlocksInRegionNode(RN);
|
2015-07-14 17:33:13 +08:00
|
|
|
|
2016-02-25 06:08:19 +08:00
|
|
|
if (auto *Stmt = getStmtFor(RN)) {
|
2016-01-06 23:30:06 +08:00
|
|
|
auto *UDomain = isl_union_set_from_set(Stmt->getDomain());
|
|
|
|
auto *StmtSchedule = isl_schedule_from_domain(UDomain);
|
2016-02-01 19:54:13 +08:00
|
|
|
LoopData.Schedule = combineInSequence(LoopData.Schedule, StmtSchedule);
|
2016-01-06 23:30:06 +08:00
|
|
|
}
|
|
|
|
|
2016-02-01 19:54:13 +08:00
|
|
|
// Check if we just processed the last node in this loop. If we did, finalize
|
|
|
|
// the loop by:
|
|
|
|
//
|
|
|
|
// - adding new schedule dimensions
|
|
|
|
// - folding the resulting schedule into the parent loop schedule
|
|
|
|
// - dropping the loop schedule from the LoopStack.
|
|
|
|
//
|
|
|
|
// Then continue to check surrounding loops, which might also have been
|
|
|
|
// completed by this node.
|
|
|
|
while (LoopData.L &&
|
2017-03-08 00:17:55 +08:00
|
|
|
LoopData.NumBlocksProcessed == getNumBlocksInLoop(LoopData.L)) {
|
2016-02-22 00:37:25 +08:00
|
|
|
auto *Schedule = LoopData.Schedule;
|
2016-02-01 19:54:13 +08:00
|
|
|
auto NumBlocksProcessed = LoopData.NumBlocksProcessed;
|
|
|
|
|
|
|
|
LoopStack.pop_back();
|
|
|
|
auto &NextLoopData = LoopStack.back();
|
|
|
|
|
|
|
|
if (Schedule) {
|
|
|
|
auto *Domain = isl_schedule_get_domain(Schedule);
|
|
|
|
auto *MUPA = mapToDimension(Domain, LoopStack.size());
|
|
|
|
Schedule = isl_schedule_insert_partial_schedule(Schedule, MUPA);
|
|
|
|
NextLoopData.Schedule =
|
|
|
|
combineInSequence(NextLoopData.Schedule, Schedule);
|
2016-01-06 23:30:06 +08:00
|
|
|
}
|
2015-12-22 07:01:53 +08:00
|
|
|
|
2016-02-01 19:54:13 +08:00
|
|
|
NextLoopData.NumBlocksProcessed += NumBlocksProcessed;
|
|
|
|
LoopData = NextLoopData;
|
2015-07-14 17:33:13 +08:00
|
|
|
}
|
2011-04-29 14:27:02 +08:00
|
|
|
}
|
|
|
|
|
2016-02-25 06:08:19 +08:00
|
|
|
ScopStmt *Scop::getStmtFor(BasicBlock *BB) const {
|
2015-05-27 14:51:34 +08:00
|
|
|
auto StmtMapIt = StmtMap.find(BB);
|
2014-11-01 07:13:39 +08:00
|
|
|
if (StmtMapIt == StmtMap.end())
|
|
|
|
return nullptr;
|
|
|
|
return StmtMapIt->second;
|
|
|
|
}
|
|
|
|
|
2016-02-25 06:08:19 +08:00
|
|
|
ScopStmt *Scop::getStmtFor(RegionNode *RN) const {
|
|
|
|
if (RN->isSubRegion())
|
|
|
|
return getStmtFor(RN->getNodeAs<Region>());
|
|
|
|
return getStmtFor(RN->getNodeAs<BasicBlock>());
|
|
|
|
}
|
|
|
|
|
|
|
|
ScopStmt *Scop::getStmtFor(Region *R) const {
|
|
|
|
ScopStmt *Stmt = getStmtFor(R->getEntry());
|
|
|
|
assert(!Stmt || Stmt->getRegion() == R);
|
|
|
|
return Stmt;
|
2015-12-14 03:21:45 +08:00
|
|
|
}
|
|
|
|
|
2015-08-31 05:13:53 +08:00
|
|
|
int Scop::getRelativeLoopDepth(const Loop *L) const {
|
|
|
|
Loop *OuterLoop =
|
|
|
|
L ? R.outermostLoopInRegion(const_cast<Loop *>(L)) : nullptr;
|
|
|
|
if (!OuterLoop)
|
|
|
|
return -1;
|
2015-08-27 14:53:52 +08:00
|
|
|
return L->getLoopDepth() - OuterLoop->getLoopDepth();
|
|
|
|
}
|
|
|
|
|
2016-07-30 17:25:51 +08:00
|
|
|
ScopArrayInfo *Scop::getArrayInfoByName(const std::string BaseName) {
|
|
|
|
for (auto &SAI : arrays()) {
|
|
|
|
if (SAI->getName() == BaseName)
|
|
|
|
return SAI;
|
|
|
|
}
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2016-05-31 17:41:04 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
void ScopInfoRegionPass::getAnalysisUsage(AnalysisUsage &AU) const {
|
|
|
|
AU.addRequired<LoopInfoWrapperPass>();
|
|
|
|
AU.addRequired<RegionInfoPass>();
|
|
|
|
AU.addRequired<DominatorTreeWrapperPass>();
|
|
|
|
AU.addRequiredTransitive<ScalarEvolutionWrapperPass>();
|
2017-05-12 22:37:29 +08:00
|
|
|
AU.addRequiredTransitive<ScopDetectionWrapperPass>();
|
2016-05-31 17:41:04 +08:00
|
|
|
AU.addRequired<AAResultsWrapperPass>();
|
2017-03-17 21:56:53 +08:00
|
|
|
AU.addRequired<AssumptionCacheTracker>();
|
2016-05-31 17:41:04 +08:00
|
|
|
AU.setPreservesAll();
|
|
|
|
}
|
|
|
|
|
2017-02-17 16:12:36 +08:00
|
|
|
void updateLoopCountStatistic(ScopDetection::LoopStats Stats) {
|
|
|
|
NumLoopsInScop += Stats.NumLoops;
|
|
|
|
MaxNumLoopsInScop =
|
|
|
|
std::max(MaxNumLoopsInScop.getValue(), (unsigned)Stats.NumLoops);
|
|
|
|
|
|
|
|
if (Stats.MaxDepth == 1)
|
|
|
|
NumScopsDepthOne++;
|
|
|
|
else if (Stats.MaxDepth == 2)
|
|
|
|
NumScopsDepthTwo++;
|
|
|
|
else if (Stats.MaxDepth == 3)
|
|
|
|
NumScopsDepthThree++;
|
|
|
|
else if (Stats.MaxDepth == 4)
|
|
|
|
NumScopsDepthFour++;
|
|
|
|
else if (Stats.MaxDepth == 5)
|
|
|
|
NumScopsDepthFive++;
|
|
|
|
else
|
|
|
|
NumScopsDepthLarger++;
|
|
|
|
}
|
|
|
|
|
2016-05-31 17:41:04 +08:00
|
|
|
bool ScopInfoRegionPass::runOnRegion(Region *R, RGPassManager &RGM) {
|
2017-05-12 22:37:29 +08:00
|
|
|
auto &SD = getAnalysis<ScopDetectionWrapperPass>().getSD();
|
2016-05-31 17:41:04 +08:00
|
|
|
|
|
|
|
if (!SD.isMaxRegionInScop(*R))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
Function *F = R->getEntry()->getParent();
|
|
|
|
auto &SE = getAnalysis<ScalarEvolutionWrapperPass>().getSE();
|
|
|
|
auto &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
|
|
|
|
auto &AA = getAnalysis<AAResultsWrapperPass>().getAAResults();
|
|
|
|
auto const &DL = F->getParent()->getDataLayout();
|
|
|
|
auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
|
2017-03-17 21:56:53 +08:00
|
|
|
auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(*F);
|
2016-05-31 17:41:04 +08:00
|
|
|
|
2017-03-17 21:56:53 +08:00
|
|
|
ScopBuilder SB(R, AC, AA, DL, DT, LI, SD, SE);
|
2016-06-27 17:25:40 +08:00
|
|
|
S = SB.getScop(); // take ownership of scop object
|
2017-02-17 16:12:36 +08:00
|
|
|
|
|
|
|
if (S) {
|
|
|
|
ScopDetection::LoopStats Stats =
|
|
|
|
ScopDetection::countBeneficialLoops(&S->getRegion(), SE, LI, 0);
|
|
|
|
updateLoopCountStatistic(Stats);
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:27:02 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-05-31 17:41:04 +08:00
|
|
|
void ScopInfoRegionPass::print(raw_ostream &OS, const Module *) const {
|
2016-06-27 17:25:40 +08:00
|
|
|
if (S)
|
|
|
|
S->print(OS);
|
|
|
|
else
|
|
|
|
OS << "Invalid Scop!\n";
|
2016-05-31 17:41:04 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
char ScopInfoRegionPass::ID = 0;
|
2011-04-29 14:27:02 +08:00
|
|
|
|
2016-05-31 17:41:04 +08:00
|
|
|
Pass *polly::createScopInfoRegionPassPass() { return new ScopInfoRegionPass(); }
|
2013-03-23 09:05:07 +08:00
|
|
|
|
2016-05-31 17:41:04 +08:00
|
|
|
INITIALIZE_PASS_BEGIN(ScopInfoRegionPass, "polly-scops",
|
2011-10-08 08:30:40 +08:00
|
|
|
"Polly - Create polyhedral description of Scops", false,
|
2013-03-23 09:05:07 +08:00
|
|
|
false);
|
2015-09-10 06:13:56 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass);
|
2017-03-17 21:56:53 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker);
|
2015-01-17 22:16:56 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass);
|
2014-07-20 02:40:17 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(RegionInfoPass);
|
2015-08-17 18:57:08 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass);
|
2017-05-12 22:37:29 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(ScopDetectionWrapperPass);
|
2015-08-31 05:13:53 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass);
|
2016-05-31 17:41:04 +08:00
|
|
|
INITIALIZE_PASS_END(ScopInfoRegionPass, "polly-scops",
|
2011-10-08 08:30:40 +08:00
|
|
|
"Polly - Create polyhedral description of Scops", false,
|
|
|
|
false)
|
2016-06-27 17:32:30 +08:00
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
2017-05-15 20:55:14 +08:00
|
|
|
ScopInfo::ScopInfo(const DataLayout &DL, ScopDetection &SD, ScalarEvolution &SE,
|
|
|
|
LoopInfo &LI, AliasAnalysis &AA, DominatorTree &DT,
|
|
|
|
AssumptionCache &AC) {
|
|
|
|
/// Create polyhedral descripton of scops for all the valid regions of a
|
|
|
|
/// function.
|
|
|
|
for (auto &It : SD) {
|
|
|
|
Region *R = const_cast<Region *>(It);
|
|
|
|
if (!SD.isMaxRegionInScop(*R))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
ScopBuilder SB(R, AC, AA, DL, DT, LI, SD, SE);
|
|
|
|
std::unique_ptr<Scop> S = SB.getScop();
|
|
|
|
if (!S)
|
|
|
|
continue;
|
|
|
|
bool Inserted = RegionToScopMap.insert({R, std::move(S)}).second;
|
|
|
|
assert(Inserted && "Building Scop for the same region twice!");
|
|
|
|
(void)Inserted;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
AnalysisKey ScopInfoAnalysis::Key;
|
|
|
|
|
|
|
|
ScopInfoAnalysis::Result ScopInfoAnalysis::run(Function &F,
|
|
|
|
FunctionAnalysisManager &FAM) {
|
|
|
|
auto &SD = FAM.getResult<ScopAnalysis>(F);
|
|
|
|
auto &SE = FAM.getResult<ScalarEvolutionAnalysis>(F);
|
|
|
|
auto &LI = FAM.getResult<LoopAnalysis>(F);
|
|
|
|
auto &AA = FAM.getResult<AAManager>(F);
|
|
|
|
auto &DT = FAM.getResult<DominatorTreeAnalysis>(F);
|
|
|
|
auto &AC = FAM.getResult<AssumptionAnalysis>(F);
|
|
|
|
auto &DL = F.getParent()->getDataLayout();
|
|
|
|
return {DL, SD, SE, LI, AA, DT, AC};
|
|
|
|
}
|
|
|
|
|
|
|
|
PreservedAnalyses ScopInfoPrinterPass::run(Function &F,
|
|
|
|
FunctionAnalysisManager &FAM) {
|
|
|
|
auto &SI = FAM.getResult<ScopInfoAnalysis>(F);
|
|
|
|
for (auto &It : SI) {
|
|
|
|
if (It.second)
|
|
|
|
It.second->print(Stream);
|
|
|
|
else
|
|
|
|
Stream << "Invalid Scop!\n";
|
|
|
|
}
|
|
|
|
return PreservedAnalyses::all();
|
|
|
|
}
|
|
|
|
|
2016-06-27 17:32:30 +08:00
|
|
|
void ScopInfoWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {
|
|
|
|
AU.addRequired<LoopInfoWrapperPass>();
|
|
|
|
AU.addRequired<RegionInfoPass>();
|
|
|
|
AU.addRequired<DominatorTreeWrapperPass>();
|
|
|
|
AU.addRequiredTransitive<ScalarEvolutionWrapperPass>();
|
2017-05-12 22:37:29 +08:00
|
|
|
AU.addRequiredTransitive<ScopDetectionWrapperPass>();
|
2016-06-27 17:32:30 +08:00
|
|
|
AU.addRequired<AAResultsWrapperPass>();
|
2017-03-17 21:56:53 +08:00
|
|
|
AU.addRequired<AssumptionCacheTracker>();
|
2016-06-27 17:32:30 +08:00
|
|
|
AU.setPreservesAll();
|
|
|
|
}
|
|
|
|
|
|
|
|
bool ScopInfoWrapperPass::runOnFunction(Function &F) {
|
2017-05-12 22:37:29 +08:00
|
|
|
auto &SD = getAnalysis<ScopDetectionWrapperPass>().getSD();
|
2016-06-27 17:32:30 +08:00
|
|
|
auto &SE = getAnalysis<ScalarEvolutionWrapperPass>().getSE();
|
|
|
|
auto &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
|
|
|
|
auto &AA = getAnalysis<AAResultsWrapperPass>().getAAResults();
|
|
|
|
auto const &DL = F.getParent()->getDataLayout();
|
|
|
|
auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
|
2017-03-17 21:56:53 +08:00
|
|
|
auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
|
2016-06-27 17:32:30 +08:00
|
|
|
|
2017-05-15 20:55:14 +08:00
|
|
|
Result.reset(new ScopInfo{DL, SD, SE, LI, AA, DT, AC});
|
2016-06-27 17:32:30 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ScopInfoWrapperPass::print(raw_ostream &OS, const Module *) const {
|
2017-05-15 20:55:14 +08:00
|
|
|
for (auto &It : *Result) {
|
2016-06-27 17:32:30 +08:00
|
|
|
if (It.second)
|
|
|
|
It.second->print(OS);
|
|
|
|
else
|
|
|
|
OS << "Invalid Scop!\n";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
char ScopInfoWrapperPass::ID = 0;
|
|
|
|
|
|
|
|
Pass *polly::createScopInfoWrapperPassPass() {
|
|
|
|
return new ScopInfoWrapperPass();
|
|
|
|
}
|
|
|
|
|
|
|
|
INITIALIZE_PASS_BEGIN(
|
|
|
|
ScopInfoWrapperPass, "polly-function-scops",
|
|
|
|
"Polly - Create polyhedral description of all Scops of a function", false,
|
|
|
|
false);
|
|
|
|
INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass);
|
2017-03-17 21:56:53 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker);
|
2016-06-27 17:32:30 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass);
|
|
|
|
INITIALIZE_PASS_DEPENDENCY(RegionInfoPass);
|
|
|
|
INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass);
|
2017-05-12 22:37:29 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(ScopDetectionWrapperPass);
|
2016-06-27 17:32:30 +08:00
|
|
|
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass);
|
|
|
|
INITIALIZE_PASS_END(
|
|
|
|
ScopInfoWrapperPass, "polly-function-scops",
|
|
|
|
"Polly - Create polyhedral description of all Scops of a function", false,
|
|
|
|
false)
|