forked from OSchip/llvm-project
3783 lines
141 KiB
C++
3783 lines
141 KiB
C++
//===- llvm/unittest/IR/OpenMPIRBuilderTest.cpp - OpenMPIRBuilder tests ---===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/Frontend/OpenMP/OMPConstants.h"
|
|
#include "llvm/Frontend/OpenMP/OMPIRBuilder.h"
|
|
#include "llvm/IR/BasicBlock.h"
|
|
#include "llvm/IR/DIBuilder.h"
|
|
#include "llvm/IR/Function.h"
|
|
#include "llvm/IR/InstIterator.h"
|
|
#include "llvm/IR/LLVMContext.h"
|
|
#include "llvm/IR/Module.h"
|
|
#include "llvm/IR/Verifier.h"
|
|
#include "llvm/Passes/PassBuilder.h"
|
|
#include "llvm/Transforms/Utils/BasicBlockUtils.h"
|
|
#include "gtest/gtest.h"
|
|
|
|
using namespace llvm;
|
|
using namespace omp;
|
|
|
|
namespace {
|
|
|
|
/// Create an instruction that uses the values in \p Values. We use "printf"
|
|
/// just because it is often used for this purpose in test code, but it is never
|
|
/// executed here.
|
|
static CallInst *createPrintfCall(IRBuilder<> &Builder, StringRef FormatStr,
|
|
ArrayRef<Value *> Values) {
|
|
Module *M = Builder.GetInsertBlock()->getParent()->getParent();
|
|
|
|
GlobalVariable *GV = Builder.CreateGlobalString(FormatStr, "", 0, M);
|
|
Constant *Zero = ConstantInt::get(Type::getInt32Ty(M->getContext()), 0);
|
|
Constant *Indices[] = {Zero, Zero};
|
|
Constant *FormatStrConst =
|
|
ConstantExpr::getInBoundsGetElementPtr(GV->getValueType(), GV, Indices);
|
|
|
|
Function *PrintfDecl = M->getFunction("printf");
|
|
if (!PrintfDecl) {
|
|
GlobalValue::LinkageTypes Linkage = Function::ExternalLinkage;
|
|
FunctionType *Ty = FunctionType::get(Builder.getInt32Ty(), true);
|
|
PrintfDecl = Function::Create(Ty, Linkage, "printf", M);
|
|
}
|
|
|
|
SmallVector<Value *, 4> Args;
|
|
Args.push_back(FormatStrConst);
|
|
Args.append(Values.begin(), Values.end());
|
|
return Builder.CreateCall(PrintfDecl, Args);
|
|
}
|
|
|
|
/// Verify that blocks in \p RefOrder are corresponds to the depth-first visit
|
|
/// order the control flow of \p F.
|
|
///
|
|
/// This is an easy way to verify the branching structure of the CFG without
|
|
/// checking every branch instruction individually. For the CFG of a
|
|
/// CanonicalLoopInfo, the Cond BB's terminating branch's first edge is entering
|
|
/// the body, i.e. the DFS order corresponds to the execution order with one
|
|
/// loop iteration.
|
|
static testing::AssertionResult
|
|
verifyDFSOrder(Function *F, ArrayRef<BasicBlock *> RefOrder) {
|
|
ArrayRef<BasicBlock *>::iterator It = RefOrder.begin();
|
|
ArrayRef<BasicBlock *>::iterator E = RefOrder.end();
|
|
|
|
df_iterator_default_set<BasicBlock *, 16> Visited;
|
|
auto DFS = llvm::depth_first_ext(&F->getEntryBlock(), Visited);
|
|
|
|
BasicBlock *Prev = nullptr;
|
|
for (BasicBlock *BB : DFS) {
|
|
if (It != E && BB == *It) {
|
|
Prev = *It;
|
|
++It;
|
|
}
|
|
}
|
|
|
|
if (It == E)
|
|
return testing::AssertionSuccess();
|
|
if (!Prev)
|
|
return testing::AssertionFailure()
|
|
<< "Did not find " << (*It)->getName() << " in control flow";
|
|
return testing::AssertionFailure()
|
|
<< "Expected " << Prev->getName() << " before " << (*It)->getName()
|
|
<< " in control flow";
|
|
}
|
|
|
|
/// Verify that blocks in \p RefOrder are in the same relative order in the
|
|
/// linked lists of blocks in \p F. The linked list may contain additional
|
|
/// blocks in-between.
|
|
///
|
|
/// While the order in the linked list is not relevant for semantics, keeping
|
|
/// the order roughly in execution order makes its printout easier to read.
|
|
static testing::AssertionResult
|
|
verifyListOrder(Function *F, ArrayRef<BasicBlock *> RefOrder) {
|
|
ArrayRef<BasicBlock *>::iterator It = RefOrder.begin();
|
|
ArrayRef<BasicBlock *>::iterator E = RefOrder.end();
|
|
|
|
BasicBlock *Prev = nullptr;
|
|
for (BasicBlock &BB : *F) {
|
|
if (It != E && &BB == *It) {
|
|
Prev = *It;
|
|
++It;
|
|
}
|
|
}
|
|
|
|
if (It == E)
|
|
return testing::AssertionSuccess();
|
|
if (!Prev)
|
|
return testing::AssertionFailure() << "Did not find " << (*It)->getName()
|
|
<< " in function " << F->getName();
|
|
return testing::AssertionFailure()
|
|
<< "Expected " << Prev->getName() << " before " << (*It)->getName()
|
|
<< " in function " << F->getName();
|
|
}
|
|
|
|
class OpenMPIRBuilderTest : public testing::Test {
|
|
protected:
|
|
void SetUp() override {
|
|
M.reset(new Module("MyModule", Ctx));
|
|
FunctionType *FTy =
|
|
FunctionType::get(Type::getVoidTy(Ctx), {Type::getInt32Ty(Ctx)},
|
|
/*isVarArg=*/false);
|
|
F = Function::Create(FTy, Function::ExternalLinkage, "", M.get());
|
|
BB = BasicBlock::Create(Ctx, "", F);
|
|
|
|
DIBuilder DIB(*M);
|
|
auto File = DIB.createFile("test.dbg", "/src", llvm::None,
|
|
Optional<StringRef>("/src/test.dbg"));
|
|
auto CU =
|
|
DIB.createCompileUnit(dwarf::DW_LANG_C, File, "llvm-C", true, "", 0);
|
|
auto Type = DIB.createSubroutineType(DIB.getOrCreateTypeArray(None));
|
|
auto SP = DIB.createFunction(
|
|
CU, "foo", "", File, 1, Type, 1, DINode::FlagZero,
|
|
DISubprogram::SPFlagDefinition | DISubprogram::SPFlagOptimized);
|
|
F->setSubprogram(SP);
|
|
auto Scope = DIB.createLexicalBlockFile(SP, File, 0);
|
|
DIB.finalize();
|
|
DL = DILocation::get(Ctx, 3, 7, Scope);
|
|
}
|
|
|
|
void TearDown() override {
|
|
BB = nullptr;
|
|
M.reset();
|
|
}
|
|
|
|
/// Create a function with a simple loop that calls printf using the logical
|
|
/// loop counter for use with tests that need a CanonicalLoopInfo object.
|
|
CanonicalLoopInfo *buildSingleLoopFunction(DebugLoc DL,
|
|
OpenMPIRBuilder &OMPBuilder,
|
|
Instruction **Call = nullptr,
|
|
BasicBlock **BodyCode = nullptr) {
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
Value *TripCount = F->getArg(0);
|
|
|
|
auto LoopBodyGenCB = [&](OpenMPIRBuilder::InsertPointTy CodeGenIP,
|
|
llvm::Value *LC) {
|
|
Builder.restoreIP(CodeGenIP);
|
|
if (BodyCode)
|
|
*BodyCode = Builder.GetInsertBlock();
|
|
|
|
// Add something that consumes the induction variable to the body.
|
|
CallInst *CallInst = createPrintfCall(Builder, "%d\\n", {LC});
|
|
if (Call)
|
|
*Call = CallInst;
|
|
};
|
|
CanonicalLoopInfo *Loop =
|
|
OMPBuilder.createCanonicalLoop(Loc, LoopBodyGenCB, TripCount);
|
|
|
|
// Finalize the function.
|
|
Builder.restoreIP(Loop->getAfterIP());
|
|
Builder.CreateRetVoid();
|
|
|
|
return Loop;
|
|
}
|
|
|
|
LLVMContext Ctx;
|
|
std::unique_ptr<Module> M;
|
|
Function *F;
|
|
BasicBlock *BB;
|
|
DebugLoc DL;
|
|
};
|
|
|
|
class OpenMPIRBuilderTestWithParams
|
|
: public OpenMPIRBuilderTest,
|
|
public ::testing::WithParamInterface<omp::OMPScheduleType> {};
|
|
|
|
// Returns the value stored in the given allocation. Returns null if the given
|
|
// value is not a result of an InstTy instruction, if no value is stored or if
|
|
// there is more than one store.
|
|
template <typename InstTy> static Value *findStoredValue(Value *AllocaValue) {
|
|
Instruction *Inst = dyn_cast<InstTy>(AllocaValue);
|
|
if (!Inst)
|
|
return nullptr;
|
|
StoreInst *Store = nullptr;
|
|
for (Use &U : Inst->uses()) {
|
|
if (auto *CandidateStore = dyn_cast<StoreInst>(U.getUser())) {
|
|
EXPECT_EQ(Store, nullptr);
|
|
Store = CandidateStore;
|
|
}
|
|
}
|
|
if (!Store)
|
|
return nullptr;
|
|
return Store->getValueOperand();
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateBarrier) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OMPBuilder.createBarrier({IRBuilder<>::InsertPoint()}, OMPD_for);
|
|
EXPECT_TRUE(M->global_empty());
|
|
EXPECT_EQ(M->size(), 1U);
|
|
EXPECT_EQ(F->size(), 1U);
|
|
EXPECT_EQ(BB->size(), 0U);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP()});
|
|
OMPBuilder.createBarrier(Loc, OMPD_for);
|
|
EXPECT_FALSE(M->global_empty());
|
|
EXPECT_EQ(M->size(), 3U);
|
|
EXPECT_EQ(F->size(), 1U);
|
|
EXPECT_EQ(BB->size(), 2U);
|
|
|
|
CallInst *GTID = dyn_cast<CallInst>(&BB->front());
|
|
EXPECT_NE(GTID, nullptr);
|
|
EXPECT_EQ(GTID->arg_size(), 1U);
|
|
EXPECT_EQ(GTID->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
CallInst *Barrier = dyn_cast<CallInst>(GTID->getNextNode());
|
|
EXPECT_NE(Barrier, nullptr);
|
|
EXPECT_EQ(Barrier->arg_size(), 2U);
|
|
EXPECT_EQ(Barrier->getCalledFunction()->getName(), "__kmpc_barrier");
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
EXPECT_EQ(cast<CallInst>(Barrier)->getArgOperand(1), GTID);
|
|
|
|
Builder.CreateUnreachable();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateCancel) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
|
|
BasicBlock *CBB = BasicBlock::Create(Ctx, "", F);
|
|
new UnreachableInst(Ctx, CBB);
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
ASSERT_NE(IP.getBlock(), nullptr);
|
|
ASSERT_EQ(IP.getBlock()->end(), IP.getPoint());
|
|
BranchInst::Create(CBB, IP.getBlock());
|
|
};
|
|
OMPBuilder.pushFinalizationCB({FiniCB, OMPD_parallel, true});
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP()});
|
|
auto NewIP = OMPBuilder.createCancel(Loc, nullptr, OMPD_parallel);
|
|
Builder.restoreIP(NewIP);
|
|
EXPECT_FALSE(M->global_empty());
|
|
EXPECT_EQ(M->size(), 4U);
|
|
EXPECT_EQ(F->size(), 4U);
|
|
EXPECT_EQ(BB->size(), 4U);
|
|
|
|
CallInst *GTID = dyn_cast<CallInst>(&BB->front());
|
|
EXPECT_NE(GTID, nullptr);
|
|
EXPECT_EQ(GTID->arg_size(), 1U);
|
|
EXPECT_EQ(GTID->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
CallInst *Cancel = dyn_cast<CallInst>(GTID->getNextNode());
|
|
EXPECT_NE(Cancel, nullptr);
|
|
EXPECT_EQ(Cancel->arg_size(), 3U);
|
|
EXPECT_EQ(Cancel->getCalledFunction()->getName(), "__kmpc_cancel");
|
|
EXPECT_FALSE(Cancel->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(Cancel->getCalledFunction()->doesNotFreeMemory());
|
|
EXPECT_EQ(Cancel->getNumUses(), 1U);
|
|
Instruction *CancelBBTI = Cancel->getParent()->getTerminator();
|
|
EXPECT_EQ(CancelBBTI->getNumSuccessors(), 2U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(0), NewIP.getBlock());
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(1)->size(), 3U);
|
|
CallInst *GTID1 = dyn_cast<CallInst>(&CancelBBTI->getSuccessor(1)->front());
|
|
EXPECT_NE(GTID1, nullptr);
|
|
EXPECT_EQ(GTID1->arg_size(), 1U);
|
|
EXPECT_EQ(GTID1->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID1->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID1->getCalledFunction()->doesNotFreeMemory());
|
|
CallInst *Barrier = dyn_cast<CallInst>(GTID1->getNextNode());
|
|
EXPECT_NE(Barrier, nullptr);
|
|
EXPECT_EQ(Barrier->arg_size(), 2U);
|
|
EXPECT_EQ(Barrier->getCalledFunction()->getName(), "__kmpc_cancel_barrier");
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotFreeMemory());
|
|
EXPECT_EQ(Barrier->getNumUses(), 0U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(1)->getTerminator()->getNumSuccessors(),
|
|
1U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(1)->getTerminator()->getSuccessor(0),
|
|
CBB);
|
|
|
|
EXPECT_EQ(cast<CallInst>(Cancel)->getArgOperand(1), GTID);
|
|
|
|
OMPBuilder.popFinalizationCB();
|
|
|
|
Builder.CreateUnreachable();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateCancelIfCond) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
|
|
BasicBlock *CBB = BasicBlock::Create(Ctx, "", F);
|
|
new UnreachableInst(Ctx, CBB);
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
ASSERT_NE(IP.getBlock(), nullptr);
|
|
ASSERT_EQ(IP.getBlock()->end(), IP.getPoint());
|
|
BranchInst::Create(CBB, IP.getBlock());
|
|
};
|
|
OMPBuilder.pushFinalizationCB({FiniCB, OMPD_parallel, true});
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP()});
|
|
auto NewIP = OMPBuilder.createCancel(Loc, Builder.getTrue(), OMPD_parallel);
|
|
Builder.restoreIP(NewIP);
|
|
EXPECT_FALSE(M->global_empty());
|
|
EXPECT_EQ(M->size(), 4U);
|
|
EXPECT_EQ(F->size(), 7U);
|
|
EXPECT_EQ(BB->size(), 1U);
|
|
ASSERT_TRUE(isa<BranchInst>(BB->getTerminator()));
|
|
ASSERT_EQ(BB->getTerminator()->getNumSuccessors(), 2U);
|
|
BB = BB->getTerminator()->getSuccessor(0);
|
|
EXPECT_EQ(BB->size(), 4U);
|
|
|
|
|
|
CallInst *GTID = dyn_cast<CallInst>(&BB->front());
|
|
EXPECT_NE(GTID, nullptr);
|
|
EXPECT_EQ(GTID->arg_size(), 1U);
|
|
EXPECT_EQ(GTID->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
CallInst *Cancel = dyn_cast<CallInst>(GTID->getNextNode());
|
|
EXPECT_NE(Cancel, nullptr);
|
|
EXPECT_EQ(Cancel->arg_size(), 3U);
|
|
EXPECT_EQ(Cancel->getCalledFunction()->getName(), "__kmpc_cancel");
|
|
EXPECT_FALSE(Cancel->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(Cancel->getCalledFunction()->doesNotFreeMemory());
|
|
EXPECT_EQ(Cancel->getNumUses(), 1U);
|
|
Instruction *CancelBBTI = Cancel->getParent()->getTerminator();
|
|
EXPECT_EQ(CancelBBTI->getNumSuccessors(), 2U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(0)->size(), 1U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(0)->getUniqueSuccessor(), NewIP.getBlock());
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(1)->size(), 3U);
|
|
CallInst *GTID1 = dyn_cast<CallInst>(&CancelBBTI->getSuccessor(1)->front());
|
|
EXPECT_NE(GTID1, nullptr);
|
|
EXPECT_EQ(GTID1->arg_size(), 1U);
|
|
EXPECT_EQ(GTID1->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID1->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID1->getCalledFunction()->doesNotFreeMemory());
|
|
CallInst *Barrier = dyn_cast<CallInst>(GTID1->getNextNode());
|
|
EXPECT_NE(Barrier, nullptr);
|
|
EXPECT_EQ(Barrier->arg_size(), 2U);
|
|
EXPECT_EQ(Barrier->getCalledFunction()->getName(), "__kmpc_cancel_barrier");
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotFreeMemory());
|
|
EXPECT_EQ(Barrier->getNumUses(), 0U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(1)->getTerminator()->getNumSuccessors(),
|
|
1U);
|
|
EXPECT_EQ(CancelBBTI->getSuccessor(1)->getTerminator()->getSuccessor(0),
|
|
CBB);
|
|
|
|
EXPECT_EQ(cast<CallInst>(Cancel)->getArgOperand(1), GTID);
|
|
|
|
OMPBuilder.popFinalizationCB();
|
|
|
|
Builder.CreateUnreachable();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateCancelBarrier) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
|
|
BasicBlock *CBB = BasicBlock::Create(Ctx, "", F);
|
|
new UnreachableInst(Ctx, CBB);
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
ASSERT_NE(IP.getBlock(), nullptr);
|
|
ASSERT_EQ(IP.getBlock()->end(), IP.getPoint());
|
|
BranchInst::Create(CBB, IP.getBlock());
|
|
};
|
|
OMPBuilder.pushFinalizationCB({FiniCB, OMPD_parallel, true});
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP()});
|
|
auto NewIP = OMPBuilder.createBarrier(Loc, OMPD_for);
|
|
Builder.restoreIP(NewIP);
|
|
EXPECT_FALSE(M->global_empty());
|
|
EXPECT_EQ(M->size(), 3U);
|
|
EXPECT_EQ(F->size(), 4U);
|
|
EXPECT_EQ(BB->size(), 4U);
|
|
|
|
CallInst *GTID = dyn_cast<CallInst>(&BB->front());
|
|
EXPECT_NE(GTID, nullptr);
|
|
EXPECT_EQ(GTID->arg_size(), 1U);
|
|
EXPECT_EQ(GTID->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
CallInst *Barrier = dyn_cast<CallInst>(GTID->getNextNode());
|
|
EXPECT_NE(Barrier, nullptr);
|
|
EXPECT_EQ(Barrier->arg_size(), 2U);
|
|
EXPECT_EQ(Barrier->getCalledFunction()->getName(), "__kmpc_cancel_barrier");
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(Barrier->getCalledFunction()->doesNotFreeMemory());
|
|
EXPECT_EQ(Barrier->getNumUses(), 1U);
|
|
Instruction *BarrierBBTI = Barrier->getParent()->getTerminator();
|
|
EXPECT_EQ(BarrierBBTI->getNumSuccessors(), 2U);
|
|
EXPECT_EQ(BarrierBBTI->getSuccessor(0), NewIP.getBlock());
|
|
EXPECT_EQ(BarrierBBTI->getSuccessor(1)->size(), 1U);
|
|
EXPECT_EQ(BarrierBBTI->getSuccessor(1)->getTerminator()->getNumSuccessors(),
|
|
1U);
|
|
EXPECT_EQ(BarrierBBTI->getSuccessor(1)->getTerminator()->getSuccessor(0),
|
|
CBB);
|
|
|
|
EXPECT_EQ(cast<CallInst>(Barrier)->getArgOperand(1), GTID);
|
|
|
|
OMPBuilder.popFinalizationCB();
|
|
|
|
Builder.CreateUnreachable();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, DbgLoc) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
OMPBuilder.createBarrier(Loc, OMPD_for);
|
|
CallInst *GTID = dyn_cast<CallInst>(&BB->front());
|
|
CallInst *Barrier = dyn_cast<CallInst>(GTID->getNextNode());
|
|
EXPECT_EQ(GTID->getDebugLoc(), DL);
|
|
EXPECT_EQ(Barrier->getDebugLoc(), DL);
|
|
EXPECT_TRUE(isa<GlobalVariable>(Barrier->getOperand(0)));
|
|
if (!isa<GlobalVariable>(Barrier->getOperand(0)))
|
|
return;
|
|
GlobalVariable *Ident = cast<GlobalVariable>(Barrier->getOperand(0));
|
|
EXPECT_TRUE(Ident->hasInitializer());
|
|
if (!Ident->hasInitializer())
|
|
return;
|
|
Constant *Initializer = Ident->getInitializer();
|
|
EXPECT_TRUE(
|
|
isa<GlobalVariable>(Initializer->getOperand(4)->stripPointerCasts()));
|
|
GlobalVariable *SrcStrGlob =
|
|
cast<GlobalVariable>(Initializer->getOperand(4)->stripPointerCasts());
|
|
if (!SrcStrGlob)
|
|
return;
|
|
EXPECT_TRUE(isa<ConstantDataArray>(SrcStrGlob->getInitializer()));
|
|
ConstantDataArray *SrcSrc =
|
|
dyn_cast<ConstantDataArray>(SrcStrGlob->getInitializer());
|
|
if (!SrcSrc)
|
|
return;
|
|
EXPECT_EQ(SrcSrc->getAsCString(), ";/src/test.dbg;foo;3;7;;");
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, ParallelSimple) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI = nullptr;
|
|
|
|
unsigned NumBodiesGenerated = 0;
|
|
unsigned NumPrivatizedVars = 0;
|
|
unsigned NumFinalizationPoints = 0;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumBodiesGenerated;
|
|
|
|
Builder.restoreIP(AllocaIP);
|
|
PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
Value *PrivLoad = Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI,
|
|
"local.use");
|
|
Value *Cmp = Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
Instruction *ThenTerm, *ElseTerm;
|
|
SplitBlockAndInsertIfThenElse(Cmp, CodeGenIP.getBlock()->getTerminator(),
|
|
&ThenTerm, &ElseTerm);
|
|
|
|
Builder.SetInsertPoint(ThenTerm);
|
|
Builder.CreateBr(&ContinuationIP);
|
|
ThenTerm->eraseFromParent();
|
|
};
|
|
|
|
auto PrivCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
Value &Orig, Value &Inner,
|
|
Value *&ReplacementValue) -> InsertPointTy {
|
|
++NumPrivatizedVars;
|
|
|
|
if (!isa<AllocaInst>(Orig)) {
|
|
EXPECT_EQ(&Orig, F->arg_begin());
|
|
ReplacementValue = &Inner;
|
|
return CodeGenIP;
|
|
}
|
|
|
|
// Since the original value is an allocation, it has a pointer type and
|
|
// therefore no additional wrapping should happen.
|
|
EXPECT_EQ(&Orig, &Inner);
|
|
|
|
// Trivial copy (=firstprivate).
|
|
Builder.restoreIP(AllocaIP);
|
|
Type *VTy = Inner.getType()->getPointerElementType();
|
|
Value *V = Builder.CreateLoad(VTy, &Inner, Orig.getName() + ".reload");
|
|
ReplacementValue = Builder.CreateAlloca(VTy, 0, Orig.getName() + ".copy");
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(V, ReplacementValue);
|
|
return CodeGenIP;
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy CodeGenIP) { ++NumFinalizationPoints; };
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
IRBuilder<>::InsertPoint AfterIP =
|
|
OMPBuilder.createParallel(Loc, AllocaIP, BodyGenCB, PrivCB, FiniCB,
|
|
nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
EXPECT_EQ(NumBodiesGenerated, 1U);
|
|
EXPECT_EQ(NumPrivatizedVars, 1U);
|
|
EXPECT_EQ(NumFinalizationPoints, 1U);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_NE(PrivAI, nullptr);
|
|
Function *OutlinedFn = PrivAI->getFunction();
|
|
EXPECT_NE(F, OutlinedFn);
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
EXPECT_TRUE(OutlinedFn->hasFnAttribute(Attribute::NoUnwind));
|
|
EXPECT_TRUE(OutlinedFn->hasFnAttribute(Attribute::NoRecurse));
|
|
EXPECT_TRUE(OutlinedFn->hasParamAttribute(0, Attribute::NoAlias));
|
|
EXPECT_TRUE(OutlinedFn->hasParamAttribute(1, Attribute::NoAlias));
|
|
|
|
EXPECT_TRUE(OutlinedFn->hasInternalLinkage());
|
|
EXPECT_EQ(OutlinedFn->arg_size(), 3U);
|
|
|
|
EXPECT_EQ(&OutlinedFn->getEntryBlock(), PrivAI->getParent());
|
|
EXPECT_EQ(OutlinedFn->getNumUses(), 1U);
|
|
User *Usr = OutlinedFn->user_back();
|
|
ASSERT_TRUE(isa<ConstantExpr>(Usr));
|
|
CallInst *ForkCI = dyn_cast<CallInst>(Usr->user_back());
|
|
ASSERT_NE(ForkCI, nullptr);
|
|
|
|
EXPECT_EQ(ForkCI->getCalledFunction()->getName(), "__kmpc_fork_call");
|
|
EXPECT_EQ(ForkCI->arg_size(), 4U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(ForkCI->getArgOperand(0)));
|
|
EXPECT_EQ(ForkCI->getArgOperand(1),
|
|
ConstantInt::get(Type::getInt32Ty(Ctx), 1U));
|
|
EXPECT_EQ(ForkCI->getArgOperand(2), Usr);
|
|
EXPECT_EQ(findStoredValue<AllocaInst>(ForkCI->getArgOperand(3)),
|
|
F->arg_begin());
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, ParallelNested) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
unsigned NumInnerBodiesGenerated = 0;
|
|
unsigned NumOuterBodiesGenerated = 0;
|
|
unsigned NumFinalizationPoints = 0;
|
|
|
|
auto InnerBodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumInnerBodiesGenerated;
|
|
};
|
|
|
|
auto PrivCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
Value &Orig, Value &Inner,
|
|
Value *&ReplacementValue) -> InsertPointTy {
|
|
// Trivial copy (=firstprivate).
|
|
Builder.restoreIP(AllocaIP);
|
|
Type *VTy = Inner.getType()->getPointerElementType();
|
|
Value *V = Builder.CreateLoad(VTy, &Inner, Orig.getName() + ".reload");
|
|
ReplacementValue = Builder.CreateAlloca(VTy, 0, Orig.getName() + ".copy");
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(V, ReplacementValue);
|
|
return CodeGenIP;
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy CodeGenIP) { ++NumFinalizationPoints; };
|
|
|
|
auto OuterBodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumOuterBodiesGenerated;
|
|
Builder.restoreIP(CodeGenIP);
|
|
BasicBlock *CGBB = CodeGenIP.getBlock();
|
|
BasicBlock *NewBB = SplitBlock(CGBB, &*CodeGenIP.getPoint());
|
|
CGBB->getTerminator()->eraseFromParent();
|
|
;
|
|
|
|
IRBuilder<>::InsertPoint AfterIP = OMPBuilder.createParallel(
|
|
InsertPointTy(CGBB, CGBB->end()), AllocaIP, InnerBodyGenCB, PrivCB,
|
|
FiniCB, nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateBr(NewBB);
|
|
};
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
IRBuilder<>::InsertPoint AfterIP =
|
|
OMPBuilder.createParallel(Loc, AllocaIP, OuterBodyGenCB, PrivCB, FiniCB,
|
|
nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
|
|
EXPECT_EQ(NumInnerBodiesGenerated, 1U);
|
|
EXPECT_EQ(NumOuterBodiesGenerated, 1U);
|
|
EXPECT_EQ(NumFinalizationPoints, 2U);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_EQ(M->size(), 5U);
|
|
for (Function &OutlinedFn : *M) {
|
|
if (F == &OutlinedFn || OutlinedFn.isDeclaration())
|
|
continue;
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
EXPECT_TRUE(OutlinedFn.hasFnAttribute(Attribute::NoUnwind));
|
|
EXPECT_TRUE(OutlinedFn.hasFnAttribute(Attribute::NoRecurse));
|
|
EXPECT_TRUE(OutlinedFn.hasParamAttribute(0, Attribute::NoAlias));
|
|
EXPECT_TRUE(OutlinedFn.hasParamAttribute(1, Attribute::NoAlias));
|
|
|
|
EXPECT_TRUE(OutlinedFn.hasInternalLinkage());
|
|
EXPECT_EQ(OutlinedFn.arg_size(), 2U);
|
|
|
|
EXPECT_EQ(OutlinedFn.getNumUses(), 1U);
|
|
User *Usr = OutlinedFn.user_back();
|
|
ASSERT_TRUE(isa<ConstantExpr>(Usr));
|
|
CallInst *ForkCI = dyn_cast<CallInst>(Usr->user_back());
|
|
ASSERT_NE(ForkCI, nullptr);
|
|
|
|
EXPECT_EQ(ForkCI->getCalledFunction()->getName(), "__kmpc_fork_call");
|
|
EXPECT_EQ(ForkCI->arg_size(), 3U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(ForkCI->getArgOperand(0)));
|
|
EXPECT_EQ(ForkCI->getArgOperand(1),
|
|
ConstantInt::get(Type::getInt32Ty(Ctx), 0U));
|
|
EXPECT_EQ(ForkCI->getArgOperand(2), Usr);
|
|
}
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, ParallelNested2Inner) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
unsigned NumInnerBodiesGenerated = 0;
|
|
unsigned NumOuterBodiesGenerated = 0;
|
|
unsigned NumFinalizationPoints = 0;
|
|
|
|
auto InnerBodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumInnerBodiesGenerated;
|
|
};
|
|
|
|
auto PrivCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
Value &Orig, Value &Inner,
|
|
Value *&ReplacementValue) -> InsertPointTy {
|
|
// Trivial copy (=firstprivate).
|
|
Builder.restoreIP(AllocaIP);
|
|
Type *VTy = Inner.getType()->getPointerElementType();
|
|
Value *V = Builder.CreateLoad(VTy, &Inner, Orig.getName() + ".reload");
|
|
ReplacementValue = Builder.CreateAlloca(VTy, 0, Orig.getName() + ".copy");
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(V, ReplacementValue);
|
|
return CodeGenIP;
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy CodeGenIP) { ++NumFinalizationPoints; };
|
|
|
|
auto OuterBodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumOuterBodiesGenerated;
|
|
Builder.restoreIP(CodeGenIP);
|
|
BasicBlock *CGBB = CodeGenIP.getBlock();
|
|
BasicBlock *NewBB1 = SplitBlock(CGBB, &*CodeGenIP.getPoint());
|
|
BasicBlock *NewBB2 = SplitBlock(NewBB1, &*NewBB1->getFirstInsertionPt());
|
|
CGBB->getTerminator()->eraseFromParent();
|
|
;
|
|
NewBB1->getTerminator()->eraseFromParent();
|
|
;
|
|
|
|
IRBuilder<>::InsertPoint AfterIP1 = OMPBuilder.createParallel(
|
|
InsertPointTy(CGBB, CGBB->end()), AllocaIP, InnerBodyGenCB, PrivCB,
|
|
FiniCB, nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
|
|
Builder.restoreIP(AfterIP1);
|
|
Builder.CreateBr(NewBB1);
|
|
|
|
IRBuilder<>::InsertPoint AfterIP2 = OMPBuilder.createParallel(
|
|
InsertPointTy(NewBB1, NewBB1->end()), AllocaIP, InnerBodyGenCB, PrivCB,
|
|
FiniCB, nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
|
|
Builder.restoreIP(AfterIP2);
|
|
Builder.CreateBr(NewBB2);
|
|
};
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
IRBuilder<>::InsertPoint AfterIP =
|
|
OMPBuilder.createParallel(Loc, AllocaIP, OuterBodyGenCB, PrivCB, FiniCB,
|
|
nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
|
|
EXPECT_EQ(NumInnerBodiesGenerated, 2U);
|
|
EXPECT_EQ(NumOuterBodiesGenerated, 1U);
|
|
EXPECT_EQ(NumFinalizationPoints, 3U);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_EQ(M->size(), 6U);
|
|
for (Function &OutlinedFn : *M) {
|
|
if (F == &OutlinedFn || OutlinedFn.isDeclaration())
|
|
continue;
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
EXPECT_TRUE(OutlinedFn.hasFnAttribute(Attribute::NoUnwind));
|
|
EXPECT_TRUE(OutlinedFn.hasFnAttribute(Attribute::NoRecurse));
|
|
EXPECT_TRUE(OutlinedFn.hasParamAttribute(0, Attribute::NoAlias));
|
|
EXPECT_TRUE(OutlinedFn.hasParamAttribute(1, Attribute::NoAlias));
|
|
|
|
EXPECT_TRUE(OutlinedFn.hasInternalLinkage());
|
|
EXPECT_EQ(OutlinedFn.arg_size(), 2U);
|
|
|
|
unsigned NumAllocas = 0;
|
|
for (Instruction &I : instructions(OutlinedFn))
|
|
NumAllocas += isa<AllocaInst>(I);
|
|
EXPECT_EQ(NumAllocas, 1U);
|
|
|
|
EXPECT_EQ(OutlinedFn.getNumUses(), 1U);
|
|
User *Usr = OutlinedFn.user_back();
|
|
ASSERT_TRUE(isa<ConstantExpr>(Usr));
|
|
CallInst *ForkCI = dyn_cast<CallInst>(Usr->user_back());
|
|
ASSERT_NE(ForkCI, nullptr);
|
|
|
|
EXPECT_EQ(ForkCI->getCalledFunction()->getName(), "__kmpc_fork_call");
|
|
EXPECT_EQ(ForkCI->arg_size(), 3U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(ForkCI->getArgOperand(0)));
|
|
EXPECT_EQ(ForkCI->getArgOperand(1),
|
|
ConstantInt::get(Type::getInt32Ty(Ctx), 0U));
|
|
EXPECT_EQ(ForkCI->getArgOperand(2), Usr);
|
|
}
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, ParallelIfCond) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI = nullptr;
|
|
|
|
unsigned NumBodiesGenerated = 0;
|
|
unsigned NumPrivatizedVars = 0;
|
|
unsigned NumFinalizationPoints = 0;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumBodiesGenerated;
|
|
|
|
Builder.restoreIP(AllocaIP);
|
|
PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
Value *PrivLoad = Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI,
|
|
"local.use");
|
|
Value *Cmp = Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
Instruction *ThenTerm, *ElseTerm;
|
|
SplitBlockAndInsertIfThenElse(Cmp, CodeGenIP.getBlock()->getTerminator(),
|
|
&ThenTerm, &ElseTerm);
|
|
|
|
Builder.SetInsertPoint(ThenTerm);
|
|
Builder.CreateBr(&ContinuationIP);
|
|
ThenTerm->eraseFromParent();
|
|
};
|
|
|
|
auto PrivCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
Value &Orig, Value &Inner,
|
|
Value *&ReplacementValue) -> InsertPointTy {
|
|
++NumPrivatizedVars;
|
|
|
|
if (!isa<AllocaInst>(Orig)) {
|
|
EXPECT_EQ(&Orig, F->arg_begin());
|
|
ReplacementValue = &Inner;
|
|
return CodeGenIP;
|
|
}
|
|
|
|
// Since the original value is an allocation, it has a pointer type and
|
|
// therefore no additional wrapping should happen.
|
|
EXPECT_EQ(&Orig, &Inner);
|
|
|
|
// Trivial copy (=firstprivate).
|
|
Builder.restoreIP(AllocaIP);
|
|
Type *VTy = Inner.getType()->getPointerElementType();
|
|
Value *V = Builder.CreateLoad(VTy, &Inner, Orig.getName() + ".reload");
|
|
ReplacementValue = Builder.CreateAlloca(VTy, 0, Orig.getName() + ".copy");
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(V, ReplacementValue);
|
|
return CodeGenIP;
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy CodeGenIP) {
|
|
++NumFinalizationPoints;
|
|
// No destructors.
|
|
};
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
IRBuilder<>::InsertPoint AfterIP =
|
|
OMPBuilder.createParallel(Loc, AllocaIP, BodyGenCB, PrivCB, FiniCB,
|
|
Builder.CreateIsNotNull(F->arg_begin()),
|
|
nullptr, OMP_PROC_BIND_default, false);
|
|
|
|
EXPECT_EQ(NumBodiesGenerated, 1U);
|
|
EXPECT_EQ(NumPrivatizedVars, 1U);
|
|
EXPECT_EQ(NumFinalizationPoints, 1U);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_NE(PrivAI, nullptr);
|
|
Function *OutlinedFn = PrivAI->getFunction();
|
|
EXPECT_NE(F, OutlinedFn);
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_TRUE(OutlinedFn->hasInternalLinkage());
|
|
EXPECT_EQ(OutlinedFn->arg_size(), 3U);
|
|
|
|
EXPECT_EQ(&OutlinedFn->getEntryBlock(), PrivAI->getParent());
|
|
ASSERT_EQ(OutlinedFn->getNumUses(), 2U);
|
|
|
|
CallInst *DirectCI = nullptr;
|
|
CallInst *ForkCI = nullptr;
|
|
for (User *Usr : OutlinedFn->users()) {
|
|
if (isa<CallInst>(Usr)) {
|
|
ASSERT_EQ(DirectCI, nullptr);
|
|
DirectCI = cast<CallInst>(Usr);
|
|
} else {
|
|
ASSERT_TRUE(isa<ConstantExpr>(Usr));
|
|
ASSERT_EQ(Usr->getNumUses(), 1U);
|
|
ASSERT_TRUE(isa<CallInst>(Usr->user_back()));
|
|
ForkCI = cast<CallInst>(Usr->user_back());
|
|
}
|
|
}
|
|
|
|
EXPECT_EQ(ForkCI->getCalledFunction()->getName(), "__kmpc_fork_call");
|
|
EXPECT_EQ(ForkCI->arg_size(), 4U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(ForkCI->getArgOperand(0)));
|
|
EXPECT_EQ(ForkCI->getArgOperand(1),
|
|
ConstantInt::get(Type::getInt32Ty(Ctx), 1));
|
|
Value *StoredForkArg = findStoredValue<AllocaInst>(ForkCI->getArgOperand(3));
|
|
EXPECT_EQ(StoredForkArg, F->arg_begin());
|
|
|
|
EXPECT_EQ(DirectCI->getCalledFunction(), OutlinedFn);
|
|
EXPECT_EQ(DirectCI->arg_size(), 3U);
|
|
EXPECT_TRUE(isa<AllocaInst>(DirectCI->getArgOperand(0)));
|
|
EXPECT_TRUE(isa<AllocaInst>(DirectCI->getArgOperand(1)));
|
|
Value *StoredDirectArg =
|
|
findStoredValue<AllocaInst>(DirectCI->getArgOperand(2));
|
|
EXPECT_EQ(StoredDirectArg, F->arg_begin());
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, ParallelCancelBarrier) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
unsigned NumBodiesGenerated = 0;
|
|
unsigned NumPrivatizedVars = 0;
|
|
unsigned NumFinalizationPoints = 0;
|
|
|
|
CallInst *CheckedBarrier = nullptr;
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationIP) {
|
|
++NumBodiesGenerated;
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
// Create three barriers, two cancel barriers but only one checked.
|
|
Function *CBFn, *BFn;
|
|
|
|
Builder.restoreIP(
|
|
OMPBuilder.createBarrier(Builder.saveIP(), OMPD_parallel));
|
|
|
|
CBFn = M->getFunction("__kmpc_cancel_barrier");
|
|
BFn = M->getFunction("__kmpc_barrier");
|
|
ASSERT_NE(CBFn, nullptr);
|
|
ASSERT_EQ(BFn, nullptr);
|
|
ASSERT_EQ(CBFn->getNumUses(), 1U);
|
|
ASSERT_TRUE(isa<CallInst>(CBFn->user_back()));
|
|
ASSERT_EQ(CBFn->user_back()->getNumUses(), 1U);
|
|
CheckedBarrier = cast<CallInst>(CBFn->user_back());
|
|
|
|
Builder.restoreIP(
|
|
OMPBuilder.createBarrier(Builder.saveIP(), OMPD_parallel, true));
|
|
CBFn = M->getFunction("__kmpc_cancel_barrier");
|
|
BFn = M->getFunction("__kmpc_barrier");
|
|
ASSERT_NE(CBFn, nullptr);
|
|
ASSERT_NE(BFn, nullptr);
|
|
ASSERT_EQ(CBFn->getNumUses(), 1U);
|
|
ASSERT_EQ(BFn->getNumUses(), 1U);
|
|
ASSERT_TRUE(isa<CallInst>(BFn->user_back()));
|
|
ASSERT_EQ(BFn->user_back()->getNumUses(), 0U);
|
|
|
|
Builder.restoreIP(OMPBuilder.createBarrier(Builder.saveIP(), OMPD_parallel,
|
|
false, false));
|
|
ASSERT_EQ(CBFn->getNumUses(), 2U);
|
|
ASSERT_EQ(BFn->getNumUses(), 1U);
|
|
ASSERT_TRUE(CBFn->user_back() != CheckedBarrier);
|
|
ASSERT_TRUE(isa<CallInst>(CBFn->user_back()));
|
|
ASSERT_EQ(CBFn->user_back()->getNumUses(), 0U);
|
|
};
|
|
|
|
auto PrivCB = [&](InsertPointTy, InsertPointTy, Value &V, Value &,
|
|
Value *&) -> InsertPointTy {
|
|
++NumPrivatizedVars;
|
|
llvm_unreachable("No privatization callback call expected!");
|
|
};
|
|
|
|
FunctionType *FakeDestructorTy =
|
|
FunctionType::get(Type::getVoidTy(Ctx), {Type::getInt32Ty(Ctx)},
|
|
/*isVarArg=*/false);
|
|
auto *FakeDestructor = Function::Create(
|
|
FakeDestructorTy, Function::ExternalLinkage, "fakeDestructor", M.get());
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
++NumFinalizationPoints;
|
|
Builder.restoreIP(IP);
|
|
Builder.CreateCall(FakeDestructor,
|
|
{Builder.getInt32(NumFinalizationPoints)});
|
|
};
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
IRBuilder<>::InsertPoint AfterIP =
|
|
OMPBuilder.createParallel(Loc, AllocaIP, BodyGenCB, PrivCB, FiniCB,
|
|
Builder.CreateIsNotNull(F->arg_begin()),
|
|
nullptr, OMP_PROC_BIND_default, true);
|
|
|
|
EXPECT_EQ(NumBodiesGenerated, 1U);
|
|
EXPECT_EQ(NumPrivatizedVars, 0U);
|
|
EXPECT_EQ(NumFinalizationPoints, 2U);
|
|
EXPECT_EQ(FakeDestructor->getNumUses(), 2U);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
BasicBlock *ExitBB = nullptr;
|
|
for (const User *Usr : FakeDestructor->users()) {
|
|
const CallInst *CI = dyn_cast<CallInst>(Usr);
|
|
ASSERT_EQ(CI->getCalledFunction(), FakeDestructor);
|
|
ASSERT_TRUE(isa<BranchInst>(CI->getNextNode()));
|
|
ASSERT_EQ(CI->getNextNode()->getNumSuccessors(), 1U);
|
|
if (ExitBB)
|
|
ASSERT_EQ(CI->getNextNode()->getSuccessor(0), ExitBB);
|
|
else
|
|
ExitBB = CI->getNextNode()->getSuccessor(0);
|
|
ASSERT_EQ(ExitBB->size(), 1U);
|
|
if (!isa<ReturnInst>(ExitBB->front())) {
|
|
ASSERT_TRUE(isa<BranchInst>(ExitBB->front()));
|
|
ASSERT_EQ(cast<BranchInst>(ExitBB->front()).getNumSuccessors(), 1U);
|
|
ASSERT_TRUE(isa<ReturnInst>(
|
|
cast<BranchInst>(ExitBB->front()).getSuccessor(0)->front()));
|
|
}
|
|
}
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, ParallelForwardAsPointers) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
|
|
Type *I32Ty = Type::getInt32Ty(M->getContext());
|
|
Type *I32PtrTy = Type::getInt32PtrTy(M->getContext());
|
|
Type *StructTy = StructType::get(I32Ty, I32PtrTy);
|
|
Type *StructPtrTy = StructTy->getPointerTo();
|
|
Type *VoidTy = Type::getVoidTy(M->getContext());
|
|
FunctionCallee RetI32Func = M->getOrInsertFunction("ret_i32", I32Ty);
|
|
FunctionCallee TakeI32Func =
|
|
M->getOrInsertFunction("take_i32", VoidTy, I32Ty);
|
|
FunctionCallee RetI32PtrFunc = M->getOrInsertFunction("ret_i32ptr", I32PtrTy);
|
|
FunctionCallee TakeI32PtrFunc =
|
|
M->getOrInsertFunction("take_i32ptr", VoidTy, I32PtrTy);
|
|
FunctionCallee RetStructFunc = M->getOrInsertFunction("ret_struct", StructTy);
|
|
FunctionCallee TakeStructFunc =
|
|
M->getOrInsertFunction("take_struct", VoidTy, StructTy);
|
|
FunctionCallee RetStructPtrFunc =
|
|
M->getOrInsertFunction("ret_structptr", StructPtrTy);
|
|
FunctionCallee TakeStructPtrFunc =
|
|
M->getOrInsertFunction("take_structPtr", VoidTy, StructPtrTy);
|
|
Value *I32Val = Builder.CreateCall(RetI32Func);
|
|
Value *I32PtrVal = Builder.CreateCall(RetI32PtrFunc);
|
|
Value *StructVal = Builder.CreateCall(RetStructFunc);
|
|
Value *StructPtrVal = Builder.CreateCall(RetStructPtrFunc);
|
|
|
|
Instruction *Internal;
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationBB) {
|
|
IRBuilder<>::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(CodeGenIP);
|
|
Internal = Builder.CreateCall(TakeI32Func, I32Val);
|
|
Builder.CreateCall(TakeI32PtrFunc, I32PtrVal);
|
|
Builder.CreateCall(TakeStructFunc, StructVal);
|
|
Builder.CreateCall(TakeStructPtrFunc, StructPtrVal);
|
|
};
|
|
auto PrivCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP, Value &,
|
|
Value &Inner, Value *&ReplacementValue) {
|
|
ReplacementValue = &Inner;
|
|
return CodeGenIP;
|
|
};
|
|
auto FiniCB = [](InsertPointTy) {};
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
IRBuilder<>::InsertPoint AfterIP =
|
|
OMPBuilder.createParallel(Loc, AllocaIP, BodyGenCB, PrivCB, FiniCB,
|
|
nullptr, nullptr, OMP_PROC_BIND_default, false);
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
Function *OutlinedFn = Internal->getFunction();
|
|
|
|
Type *Arg2Type = OutlinedFn->getArg(2)->getType();
|
|
EXPECT_TRUE(Arg2Type->isPointerTy());
|
|
EXPECT_EQ(Arg2Type->getPointerElementType(), I32Ty);
|
|
|
|
// Arguments that need to be passed through pointers and reloaded will get
|
|
// used earlier in the functions and therefore will appear first in the
|
|
// argument list after outlining.
|
|
Type *Arg3Type = OutlinedFn->getArg(3)->getType();
|
|
EXPECT_TRUE(Arg3Type->isPointerTy());
|
|
EXPECT_EQ(Arg3Type->getPointerElementType(), StructTy);
|
|
|
|
Type *Arg4Type = OutlinedFn->getArg(4)->getType();
|
|
EXPECT_EQ(Arg4Type, I32PtrTy);
|
|
|
|
Type *Arg5Type = OutlinedFn->getArg(5)->getType();
|
|
EXPECT_EQ(Arg5Type, StructPtrTy);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CanonicalLoopSimple) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
Value *TripCount = F->getArg(0);
|
|
|
|
unsigned NumBodiesGenerated = 0;
|
|
auto LoopBodyGenCB = [&](InsertPointTy CodeGenIP, llvm::Value *LC) {
|
|
NumBodiesGenerated += 1;
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
Value *Cmp = Builder.CreateICmpEQ(LC, TripCount);
|
|
Instruction *ThenTerm, *ElseTerm;
|
|
SplitBlockAndInsertIfThenElse(Cmp, CodeGenIP.getBlock()->getTerminator(),
|
|
&ThenTerm, &ElseTerm);
|
|
};
|
|
|
|
CanonicalLoopInfo *Loop =
|
|
OMPBuilder.createCanonicalLoop(Loc, LoopBodyGenCB, TripCount);
|
|
|
|
Builder.restoreIP(Loop->getAfterIP());
|
|
ReturnInst *RetInst = Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
|
|
Loop->assertOK();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_EQ(NumBodiesGenerated, 1U);
|
|
|
|
// Verify control flow structure (in addition to Loop->assertOK()).
|
|
EXPECT_EQ(Loop->getPreheader()->getSinglePredecessor(), &F->getEntryBlock());
|
|
EXPECT_EQ(Loop->getAfter(), Builder.GetInsertBlock());
|
|
|
|
Instruction *IndVar = Loop->getIndVar();
|
|
EXPECT_TRUE(isa<PHINode>(IndVar));
|
|
EXPECT_EQ(IndVar->getType(), TripCount->getType());
|
|
EXPECT_EQ(IndVar->getParent(), Loop->getHeader());
|
|
|
|
EXPECT_EQ(Loop->getTripCount(), TripCount);
|
|
|
|
BasicBlock *Body = Loop->getBody();
|
|
Instruction *CmpInst = &Body->getInstList().front();
|
|
EXPECT_TRUE(isa<ICmpInst>(CmpInst));
|
|
EXPECT_EQ(CmpInst->getOperand(0), IndVar);
|
|
|
|
BasicBlock *LatchPred = Loop->getLatch()->getSinglePredecessor();
|
|
EXPECT_TRUE(llvm::all_of(successors(Body), [=](BasicBlock *SuccBB) {
|
|
return SuccBB->getSingleSuccessor() == LatchPred;
|
|
}));
|
|
|
|
EXPECT_EQ(&Loop->getAfter()->front(), RetInst);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CanonicalLoopBounds) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
IRBuilder<> Builder(BB);
|
|
|
|
// Check the trip count is computed correctly. We generate the canonical loop
|
|
// but rely on the IRBuilder's constant folder to compute the final result
|
|
// since all inputs are constant. To verify overflow situations, limit the
|
|
// trip count / loop counter widths to 16 bits.
|
|
auto EvalTripCount = [&](int64_t Start, int64_t Stop, int64_t Step,
|
|
bool IsSigned, bool InclusiveStop) -> int64_t {
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
Type *LCTy = Type::getInt16Ty(Ctx);
|
|
Value *StartVal = ConstantInt::get(LCTy, Start);
|
|
Value *StopVal = ConstantInt::get(LCTy, Stop);
|
|
Value *StepVal = ConstantInt::get(LCTy, Step);
|
|
auto LoopBodyGenCB = [&](InsertPointTy CodeGenIP, llvm::Value *LC) {};
|
|
CanonicalLoopInfo *Loop =
|
|
OMPBuilder.createCanonicalLoop(Loc, LoopBodyGenCB, StartVal, StopVal,
|
|
StepVal, IsSigned, InclusiveStop);
|
|
Loop->assertOK();
|
|
Builder.restoreIP(Loop->getAfterIP());
|
|
Value *TripCount = Loop->getTripCount();
|
|
return cast<ConstantInt>(TripCount)->getValue().getZExtValue();
|
|
};
|
|
|
|
EXPECT_EQ(EvalTripCount(0, 0, 1, false, false), 0);
|
|
EXPECT_EQ(EvalTripCount(0, 1, 2, false, false), 1);
|
|
EXPECT_EQ(EvalTripCount(0, 42, 1, false, false), 42);
|
|
EXPECT_EQ(EvalTripCount(0, 42, 2, false, false), 21);
|
|
EXPECT_EQ(EvalTripCount(21, 42, 1, false, false), 21);
|
|
EXPECT_EQ(EvalTripCount(0, 5, 5, false, false), 1);
|
|
EXPECT_EQ(EvalTripCount(0, 9, 5, false, false), 2);
|
|
EXPECT_EQ(EvalTripCount(0, 11, 5, false, false), 3);
|
|
EXPECT_EQ(EvalTripCount(0, 0xFFFF, 1, false, false), 0xFFFF);
|
|
EXPECT_EQ(EvalTripCount(0xFFFF, 0, 1, false, false), 0);
|
|
EXPECT_EQ(EvalTripCount(0xFFFE, 0xFFFF, 1, false, false), 1);
|
|
EXPECT_EQ(EvalTripCount(0, 0xFFFF, 0x100, false, false), 0x100);
|
|
EXPECT_EQ(EvalTripCount(0, 0xFFFF, 0xFFFF, false, false), 1);
|
|
|
|
EXPECT_EQ(EvalTripCount(0, 6, 5, false, false), 2);
|
|
EXPECT_EQ(EvalTripCount(0, 0xFFFF, 0xFFFE, false, false), 2);
|
|
EXPECT_EQ(EvalTripCount(0, 0, 1, false, true), 1);
|
|
EXPECT_EQ(EvalTripCount(0, 0, 0xFFFF, false, true), 1);
|
|
EXPECT_EQ(EvalTripCount(0, 0xFFFE, 1, false, true), 0xFFFF);
|
|
EXPECT_EQ(EvalTripCount(0, 0xFFFE, 2, false, true), 0x8000);
|
|
|
|
EXPECT_EQ(EvalTripCount(0, 0, -1, true, false), 0);
|
|
EXPECT_EQ(EvalTripCount(0, 1, -1, true, true), 0);
|
|
EXPECT_EQ(EvalTripCount(20, 5, -5, true, false), 3);
|
|
EXPECT_EQ(EvalTripCount(20, 5, -5, true, true), 4);
|
|
EXPECT_EQ(EvalTripCount(-4, -2, 2, true, false), 1);
|
|
EXPECT_EQ(EvalTripCount(-4, -3, 2, true, false), 1);
|
|
EXPECT_EQ(EvalTripCount(-4, -2, 2, true, true), 2);
|
|
|
|
EXPECT_EQ(EvalTripCount(INT16_MIN, 0, 1, true, false), 0x8000);
|
|
EXPECT_EQ(EvalTripCount(INT16_MIN, 0, 1, true, true), 0x8001);
|
|
EXPECT_EQ(EvalTripCount(INT16_MIN, 0x7FFF, 1, true, false), 0xFFFF);
|
|
EXPECT_EQ(EvalTripCount(INT16_MIN + 1, 0x7FFF, 1, true, true), 0xFFFF);
|
|
EXPECT_EQ(EvalTripCount(INT16_MIN, 0, 0x7FFF, true, false), 2);
|
|
EXPECT_EQ(EvalTripCount(0x7FFF, 0, -1, true, false), 0x7FFF);
|
|
EXPECT_EQ(EvalTripCount(0, INT16_MIN, -1, true, false), 0x8000);
|
|
EXPECT_EQ(EvalTripCount(0, INT16_MIN, -16, true, false), 0x800);
|
|
EXPECT_EQ(EvalTripCount(0x7FFF, INT16_MIN, -1, true, false), 0xFFFF);
|
|
EXPECT_EQ(EvalTripCount(0x7FFF, 1, INT16_MIN, true, false), 1);
|
|
EXPECT_EQ(EvalTripCount(0x7FFF, -1, INT16_MIN, true, true), 2);
|
|
|
|
// Finalize the function and verify it.
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CollapseNestedLoops) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
Type *LCTy = F->getArg(0)->getType();
|
|
Constant *One = ConstantInt::get(LCTy, 1);
|
|
Constant *Two = ConstantInt::get(LCTy, 2);
|
|
Value *OuterTripCount =
|
|
Builder.CreateAdd(F->getArg(0), Two, "tripcount.outer");
|
|
Value *InnerTripCount =
|
|
Builder.CreateAdd(F->getArg(0), One, "tripcount.inner");
|
|
|
|
// Fix an insertion point for ComputeIP.
|
|
BasicBlock *LoopNextEnter =
|
|
BasicBlock::Create(M->getContext(), "loopnest.enter", F,
|
|
Builder.GetInsertBlock()->getNextNode());
|
|
BranchInst *EnterBr = Builder.CreateBr(LoopNextEnter);
|
|
InsertPointTy ComputeIP{EnterBr->getParent(), EnterBr->getIterator()};
|
|
|
|
Builder.SetInsertPoint(LoopNextEnter);
|
|
OpenMPIRBuilder::LocationDescription OuterLoc(Builder.saveIP(), DL);
|
|
|
|
CanonicalLoopInfo *InnerLoop = nullptr;
|
|
CallInst *InbetweenLead = nullptr;
|
|
CallInst *InbetweenTrail = nullptr;
|
|
CallInst *Call = nullptr;
|
|
auto OuterLoopBodyGenCB = [&](InsertPointTy OuterCodeGenIP, Value *OuterLC) {
|
|
Builder.restoreIP(OuterCodeGenIP);
|
|
InbetweenLead =
|
|
createPrintfCall(Builder, "In-between lead i=%d\\n", {OuterLC});
|
|
|
|
auto InnerLoopBodyGenCB = [&](InsertPointTy InnerCodeGenIP,
|
|
Value *InnerLC) {
|
|
Builder.restoreIP(InnerCodeGenIP);
|
|
Call = createPrintfCall(Builder, "body i=%d j=%d\\n", {OuterLC, InnerLC});
|
|
};
|
|
InnerLoop = OMPBuilder.createCanonicalLoop(
|
|
Builder.saveIP(), InnerLoopBodyGenCB, InnerTripCount, "inner");
|
|
|
|
Builder.restoreIP(InnerLoop->getAfterIP());
|
|
InbetweenTrail =
|
|
createPrintfCall(Builder, "In-between trail i=%d\\n", {OuterLC});
|
|
};
|
|
CanonicalLoopInfo *OuterLoop = OMPBuilder.createCanonicalLoop(
|
|
OuterLoc, OuterLoopBodyGenCB, OuterTripCount, "outer");
|
|
|
|
// Finish the function.
|
|
Builder.restoreIP(OuterLoop->getAfterIP());
|
|
Builder.CreateRetVoid();
|
|
|
|
CanonicalLoopInfo *Collapsed =
|
|
OMPBuilder.collapseLoops(DL, {OuterLoop, InnerLoop}, ComputeIP);
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
// Verify control flow and BB order.
|
|
BasicBlock *RefOrder[] = {
|
|
Collapsed->getPreheader(), Collapsed->getHeader(),
|
|
Collapsed->getCond(), Collapsed->getBody(),
|
|
InbetweenLead->getParent(), Call->getParent(),
|
|
InbetweenTrail->getParent(), Collapsed->getLatch(),
|
|
Collapsed->getExit(), Collapsed->getAfter(),
|
|
};
|
|
EXPECT_TRUE(verifyDFSOrder(F, RefOrder));
|
|
EXPECT_TRUE(verifyListOrder(F, RefOrder));
|
|
|
|
// Verify the total trip count.
|
|
auto *TripCount = cast<MulOperator>(Collapsed->getTripCount());
|
|
EXPECT_EQ(TripCount->getOperand(0), OuterTripCount);
|
|
EXPECT_EQ(TripCount->getOperand(1), InnerTripCount);
|
|
|
|
// Verify the changed indvar.
|
|
auto *OuterIV = cast<BinaryOperator>(Call->getOperand(1));
|
|
EXPECT_EQ(OuterIV->getOpcode(), Instruction::UDiv);
|
|
EXPECT_EQ(OuterIV->getParent(), Collapsed->getBody());
|
|
EXPECT_EQ(OuterIV->getOperand(1), InnerTripCount);
|
|
EXPECT_EQ(OuterIV->getOperand(0), Collapsed->getIndVar());
|
|
|
|
auto *InnerIV = cast<BinaryOperator>(Call->getOperand(2));
|
|
EXPECT_EQ(InnerIV->getOpcode(), Instruction::URem);
|
|
EXPECT_EQ(InnerIV->getParent(), Collapsed->getBody());
|
|
EXPECT_EQ(InnerIV->getOperand(0), Collapsed->getIndVar());
|
|
EXPECT_EQ(InnerIV->getOperand(1), InnerTripCount);
|
|
|
|
EXPECT_EQ(InbetweenLead->getOperand(1), OuterIV);
|
|
EXPECT_EQ(InbetweenTrail->getOperand(1), OuterIV);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, TileSingleLoop) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
Instruction *Call;
|
|
BasicBlock *BodyCode;
|
|
CanonicalLoopInfo *Loop =
|
|
buildSingleLoopFunction(DL, OMPBuilder, &Call, &BodyCode);
|
|
|
|
Instruction *OrigIndVar = Loop->getIndVar();
|
|
EXPECT_EQ(Call->getOperand(1), OrigIndVar);
|
|
|
|
// Tile the loop.
|
|
Constant *TileSize = ConstantInt::get(Loop->getIndVarType(), APInt(32, 7));
|
|
std::vector<CanonicalLoopInfo *> GenLoops =
|
|
OMPBuilder.tileLoops(DL, {Loop}, {TileSize});
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_EQ(GenLoops.size(), 2u);
|
|
CanonicalLoopInfo *Floor = GenLoops[0];
|
|
CanonicalLoopInfo *Tile = GenLoops[1];
|
|
|
|
BasicBlock *RefOrder[] = {
|
|
Floor->getPreheader(), Floor->getHeader(), Floor->getCond(),
|
|
Floor->getBody(), Tile->getPreheader(), Tile->getHeader(),
|
|
Tile->getCond(), Tile->getBody(), BodyCode,
|
|
Tile->getLatch(), Tile->getExit(), Tile->getAfter(),
|
|
Floor->getLatch(), Floor->getExit(), Floor->getAfter(),
|
|
};
|
|
EXPECT_TRUE(verifyDFSOrder(F, RefOrder));
|
|
EXPECT_TRUE(verifyListOrder(F, RefOrder));
|
|
|
|
// Check the induction variable.
|
|
EXPECT_EQ(Call->getParent(), BodyCode);
|
|
auto *Shift = cast<AddOperator>(Call->getOperand(1));
|
|
EXPECT_EQ(cast<Instruction>(Shift)->getParent(), Tile->getBody());
|
|
EXPECT_EQ(Shift->getOperand(1), Tile->getIndVar());
|
|
auto *Scale = cast<MulOperator>(Shift->getOperand(0));
|
|
EXPECT_EQ(cast<Instruction>(Scale)->getParent(), Tile->getBody());
|
|
EXPECT_EQ(Scale->getOperand(0), TileSize);
|
|
EXPECT_EQ(Scale->getOperand(1), Floor->getIndVar());
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, TileNestedLoops) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
Value *TripCount = F->getArg(0);
|
|
Type *LCTy = TripCount->getType();
|
|
|
|
BasicBlock *BodyCode = nullptr;
|
|
CanonicalLoopInfo *InnerLoop = nullptr;
|
|
auto OuterLoopBodyGenCB = [&](InsertPointTy OuterCodeGenIP,
|
|
llvm::Value *OuterLC) {
|
|
auto InnerLoopBodyGenCB = [&](InsertPointTy InnerCodeGenIP,
|
|
llvm::Value *InnerLC) {
|
|
Builder.restoreIP(InnerCodeGenIP);
|
|
BodyCode = Builder.GetInsertBlock();
|
|
|
|
// Add something that consumes the induction variables to the body.
|
|
createPrintfCall(Builder, "i=%d j=%d\\n", {OuterLC, InnerLC});
|
|
};
|
|
InnerLoop = OMPBuilder.createCanonicalLoop(
|
|
OuterCodeGenIP, InnerLoopBodyGenCB, TripCount, "inner");
|
|
};
|
|
CanonicalLoopInfo *OuterLoop = OMPBuilder.createCanonicalLoop(
|
|
Loc, OuterLoopBodyGenCB, TripCount, "outer");
|
|
|
|
// Finalize the function.
|
|
Builder.restoreIP(OuterLoop->getAfterIP());
|
|
Builder.CreateRetVoid();
|
|
|
|
// Tile to loop nest.
|
|
Constant *OuterTileSize = ConstantInt::get(LCTy, APInt(32, 11));
|
|
Constant *InnerTileSize = ConstantInt::get(LCTy, APInt(32, 7));
|
|
std::vector<CanonicalLoopInfo *> GenLoops = OMPBuilder.tileLoops(
|
|
DL, {OuterLoop, InnerLoop}, {OuterTileSize, InnerTileSize});
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_EQ(GenLoops.size(), 4u);
|
|
CanonicalLoopInfo *Floor1 = GenLoops[0];
|
|
CanonicalLoopInfo *Floor2 = GenLoops[1];
|
|
CanonicalLoopInfo *Tile1 = GenLoops[2];
|
|
CanonicalLoopInfo *Tile2 = GenLoops[3];
|
|
|
|
BasicBlock *RefOrder[] = {
|
|
Floor1->getPreheader(),
|
|
Floor1->getHeader(),
|
|
Floor1->getCond(),
|
|
Floor1->getBody(),
|
|
Floor2->getPreheader(),
|
|
Floor2->getHeader(),
|
|
Floor2->getCond(),
|
|
Floor2->getBody(),
|
|
Tile1->getPreheader(),
|
|
Tile1->getHeader(),
|
|
Tile1->getCond(),
|
|
Tile1->getBody(),
|
|
Tile2->getPreheader(),
|
|
Tile2->getHeader(),
|
|
Tile2->getCond(),
|
|
Tile2->getBody(),
|
|
BodyCode,
|
|
Tile2->getLatch(),
|
|
Tile2->getExit(),
|
|
Tile2->getAfter(),
|
|
Tile1->getLatch(),
|
|
Tile1->getExit(),
|
|
Tile1->getAfter(),
|
|
Floor2->getLatch(),
|
|
Floor2->getExit(),
|
|
Floor2->getAfter(),
|
|
Floor1->getLatch(),
|
|
Floor1->getExit(),
|
|
Floor1->getAfter(),
|
|
};
|
|
EXPECT_TRUE(verifyDFSOrder(F, RefOrder));
|
|
EXPECT_TRUE(verifyListOrder(F, RefOrder));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, TileNestedLoopsWithBounds) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
|
|
IRBuilder<> Builder(BB);
|
|
Value *TripCount = F->getArg(0);
|
|
Type *LCTy = TripCount->getType();
|
|
|
|
Value *OuterStartVal = ConstantInt::get(LCTy, 2);
|
|
Value *OuterStopVal = TripCount;
|
|
Value *OuterStep = ConstantInt::get(LCTy, 5);
|
|
Value *InnerStartVal = ConstantInt::get(LCTy, 13);
|
|
Value *InnerStopVal = TripCount;
|
|
Value *InnerStep = ConstantInt::get(LCTy, 3);
|
|
|
|
// Fix an insertion point for ComputeIP.
|
|
BasicBlock *LoopNextEnter =
|
|
BasicBlock::Create(M->getContext(), "loopnest.enter", F,
|
|
Builder.GetInsertBlock()->getNextNode());
|
|
BranchInst *EnterBr = Builder.CreateBr(LoopNextEnter);
|
|
InsertPointTy ComputeIP{EnterBr->getParent(), EnterBr->getIterator()};
|
|
|
|
InsertPointTy LoopIP{LoopNextEnter, LoopNextEnter->begin()};
|
|
OpenMPIRBuilder::LocationDescription Loc({LoopIP, DL});
|
|
|
|
BasicBlock *BodyCode = nullptr;
|
|
CanonicalLoopInfo *InnerLoop = nullptr;
|
|
CallInst *Call = nullptr;
|
|
auto OuterLoopBodyGenCB = [&](InsertPointTy OuterCodeGenIP,
|
|
llvm::Value *OuterLC) {
|
|
auto InnerLoopBodyGenCB = [&](InsertPointTy InnerCodeGenIP,
|
|
llvm::Value *InnerLC) {
|
|
Builder.restoreIP(InnerCodeGenIP);
|
|
BodyCode = Builder.GetInsertBlock();
|
|
|
|
// Add something that consumes the induction variable to the body.
|
|
Call = createPrintfCall(Builder, "i=%d j=%d\\n", {OuterLC, InnerLC});
|
|
};
|
|
InnerLoop = OMPBuilder.createCanonicalLoop(
|
|
OuterCodeGenIP, InnerLoopBodyGenCB, InnerStartVal, InnerStopVal,
|
|
InnerStep, false, false, ComputeIP, "inner");
|
|
};
|
|
CanonicalLoopInfo *OuterLoop = OMPBuilder.createCanonicalLoop(
|
|
Loc, OuterLoopBodyGenCB, OuterStartVal, OuterStopVal, OuterStep, false,
|
|
false, ComputeIP, "outer");
|
|
|
|
// Finalize the function
|
|
Builder.restoreIP(OuterLoop->getAfterIP());
|
|
Builder.CreateRetVoid();
|
|
|
|
// Tile the loop nest.
|
|
Constant *TileSize0 = ConstantInt::get(LCTy, APInt(32, 11));
|
|
Constant *TileSize1 = ConstantInt::get(LCTy, APInt(32, 7));
|
|
std::vector<CanonicalLoopInfo *> GenLoops =
|
|
OMPBuilder.tileLoops(DL, {OuterLoop, InnerLoop}, {TileSize0, TileSize1});
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_EQ(GenLoops.size(), 4u);
|
|
CanonicalLoopInfo *Floor0 = GenLoops[0];
|
|
CanonicalLoopInfo *Floor1 = GenLoops[1];
|
|
CanonicalLoopInfo *Tile0 = GenLoops[2];
|
|
CanonicalLoopInfo *Tile1 = GenLoops[3];
|
|
|
|
BasicBlock *RefOrder[] = {
|
|
Floor0->getPreheader(),
|
|
Floor0->getHeader(),
|
|
Floor0->getCond(),
|
|
Floor0->getBody(),
|
|
Floor1->getPreheader(),
|
|
Floor1->getHeader(),
|
|
Floor1->getCond(),
|
|
Floor1->getBody(),
|
|
Tile0->getPreheader(),
|
|
Tile0->getHeader(),
|
|
Tile0->getCond(),
|
|
Tile0->getBody(),
|
|
Tile1->getPreheader(),
|
|
Tile1->getHeader(),
|
|
Tile1->getCond(),
|
|
Tile1->getBody(),
|
|
BodyCode,
|
|
Tile1->getLatch(),
|
|
Tile1->getExit(),
|
|
Tile1->getAfter(),
|
|
Tile0->getLatch(),
|
|
Tile0->getExit(),
|
|
Tile0->getAfter(),
|
|
Floor1->getLatch(),
|
|
Floor1->getExit(),
|
|
Floor1->getAfter(),
|
|
Floor0->getLatch(),
|
|
Floor0->getExit(),
|
|
Floor0->getAfter(),
|
|
};
|
|
EXPECT_TRUE(verifyDFSOrder(F, RefOrder));
|
|
EXPECT_TRUE(verifyListOrder(F, RefOrder));
|
|
|
|
EXPECT_EQ(Call->getParent(), BodyCode);
|
|
|
|
auto *RangeShift0 = cast<AddOperator>(Call->getOperand(1));
|
|
EXPECT_EQ(RangeShift0->getOperand(1), OuterStartVal);
|
|
auto *RangeScale0 = cast<MulOperator>(RangeShift0->getOperand(0));
|
|
EXPECT_EQ(RangeScale0->getOperand(1), OuterStep);
|
|
auto *TileShift0 = cast<AddOperator>(RangeScale0->getOperand(0));
|
|
EXPECT_EQ(cast<Instruction>(TileShift0)->getParent(), Tile1->getBody());
|
|
EXPECT_EQ(TileShift0->getOperand(1), Tile0->getIndVar());
|
|
auto *TileScale0 = cast<MulOperator>(TileShift0->getOperand(0));
|
|
EXPECT_EQ(cast<Instruction>(TileScale0)->getParent(), Tile1->getBody());
|
|
EXPECT_EQ(TileScale0->getOperand(0), TileSize0);
|
|
EXPECT_EQ(TileScale0->getOperand(1), Floor0->getIndVar());
|
|
|
|
auto *RangeShift1 = cast<AddOperator>(Call->getOperand(2));
|
|
EXPECT_EQ(cast<Instruction>(RangeShift1)->getParent(), BodyCode);
|
|
EXPECT_EQ(RangeShift1->getOperand(1), InnerStartVal);
|
|
auto *RangeScale1 = cast<MulOperator>(RangeShift1->getOperand(0));
|
|
EXPECT_EQ(cast<Instruction>(RangeScale1)->getParent(), BodyCode);
|
|
EXPECT_EQ(RangeScale1->getOperand(1), InnerStep);
|
|
auto *TileShift1 = cast<AddOperator>(RangeScale1->getOperand(0));
|
|
EXPECT_EQ(cast<Instruction>(TileShift1)->getParent(), Tile1->getBody());
|
|
EXPECT_EQ(TileShift1->getOperand(1), Tile1->getIndVar());
|
|
auto *TileScale1 = cast<MulOperator>(TileShift1->getOperand(0));
|
|
EXPECT_EQ(cast<Instruction>(TileScale1)->getParent(), Tile1->getBody());
|
|
EXPECT_EQ(TileScale1->getOperand(0), TileSize1);
|
|
EXPECT_EQ(TileScale1->getOperand(1), Floor1->getIndVar());
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, TileSingleLoopCounts) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
IRBuilder<> Builder(BB);
|
|
|
|
// Create a loop, tile it, and extract its trip count. All input values are
|
|
// constant and IRBuilder evaluates all-constant arithmetic inplace, such that
|
|
// the floor trip count itself will be a ConstantInt. Unfortunately we cannot
|
|
// do the same for the tile loop.
|
|
auto GetFloorCount = [&](int64_t Start, int64_t Stop, int64_t Step,
|
|
bool IsSigned, bool InclusiveStop,
|
|
int64_t TileSize) -> uint64_t {
|
|
OpenMPIRBuilder::LocationDescription Loc(Builder.saveIP(), DL);
|
|
Type *LCTy = Type::getInt16Ty(Ctx);
|
|
Value *StartVal = ConstantInt::get(LCTy, Start);
|
|
Value *StopVal = ConstantInt::get(LCTy, Stop);
|
|
Value *StepVal = ConstantInt::get(LCTy, Step);
|
|
|
|
// Generate a loop.
|
|
auto LoopBodyGenCB = [&](InsertPointTy CodeGenIP, llvm::Value *LC) {};
|
|
CanonicalLoopInfo *Loop =
|
|
OMPBuilder.createCanonicalLoop(Loc, LoopBodyGenCB, StartVal, StopVal,
|
|
StepVal, IsSigned, InclusiveStop);
|
|
InsertPointTy AfterIP = Loop->getAfterIP();
|
|
|
|
// Tile the loop.
|
|
Value *TileSizeVal = ConstantInt::get(LCTy, TileSize);
|
|
std::vector<CanonicalLoopInfo *> GenLoops =
|
|
OMPBuilder.tileLoops(Loc.DL, {Loop}, {TileSizeVal});
|
|
|
|
// Set the insertion pointer to after loop, where the next loop will be
|
|
// emitted.
|
|
Builder.restoreIP(AfterIP);
|
|
|
|
// Extract the trip count.
|
|
CanonicalLoopInfo *FloorLoop = GenLoops[0];
|
|
Value *FloorTripCount = FloorLoop->getTripCount();
|
|
return cast<ConstantInt>(FloorTripCount)->getValue().getZExtValue();
|
|
};
|
|
|
|
// Empty iteration domain.
|
|
EXPECT_EQ(GetFloorCount(0, 0, 1, false, false, 7), 0u);
|
|
EXPECT_EQ(GetFloorCount(0, -1, 1, false, true, 7), 0u);
|
|
EXPECT_EQ(GetFloorCount(-1, -1, -1, true, false, 7), 0u);
|
|
EXPECT_EQ(GetFloorCount(-1, 0, -1, true, true, 7), 0u);
|
|
EXPECT_EQ(GetFloorCount(-1, -1, 3, true, false, 7), 0u);
|
|
|
|
// Only complete tiles.
|
|
EXPECT_EQ(GetFloorCount(0, 14, 1, false, false, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(0, 14, 1, false, false, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(1, 15, 1, false, false, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(0, -14, -1, true, false, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(-1, -14, -1, true, true, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(0, 3 * 7 * 2, 3, false, false, 7), 2u);
|
|
|
|
// Only a partial tile.
|
|
EXPECT_EQ(GetFloorCount(0, 1, 1, false, false, 7), 1u);
|
|
EXPECT_EQ(GetFloorCount(0, 6, 1, false, false, 7), 1u);
|
|
EXPECT_EQ(GetFloorCount(-1, 1, 3, true, false, 7), 1u);
|
|
EXPECT_EQ(GetFloorCount(-1, -2, -1, true, false, 7), 1u);
|
|
EXPECT_EQ(GetFloorCount(0, 2, 3, false, false, 7), 1u);
|
|
|
|
// Complete and partial tiles.
|
|
EXPECT_EQ(GetFloorCount(0, 13, 1, false, false, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(0, 15, 1, false, false, 7), 3u);
|
|
EXPECT_EQ(GetFloorCount(-1, -14, -1, true, false, 7), 2u);
|
|
EXPECT_EQ(GetFloorCount(0, 3 * 7 * 5 - 1, 3, false, false, 7), 5u);
|
|
EXPECT_EQ(GetFloorCount(-1, -3 * 7 * 5, -3, true, false, 7), 5u);
|
|
|
|
// Close to 16-bit integer range.
|
|
EXPECT_EQ(GetFloorCount(0, 0xFFFF, 1, false, false, 1), 0xFFFFu);
|
|
EXPECT_EQ(GetFloorCount(0, 0xFFFF, 1, false, false, 7), 0xFFFFu / 7 + 1);
|
|
EXPECT_EQ(GetFloorCount(0, 0xFFFE, 1, false, true, 7), 0xFFFFu / 7 + 1);
|
|
EXPECT_EQ(GetFloorCount(-0x8000, 0x7FFF, 1, true, false, 7), 0xFFFFu / 7 + 1);
|
|
EXPECT_EQ(GetFloorCount(-0x7FFF, 0x7FFF, 1, true, true, 7), 0xFFFFu / 7 + 1);
|
|
EXPECT_EQ(GetFloorCount(0, 0xFFFE, 1, false, false, 0xFFFF), 1u);
|
|
EXPECT_EQ(GetFloorCount(-0x8000, 0x7FFF, 1, true, false, 0xFFFF), 1u);
|
|
|
|
// Finalize the function.
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, UnrollLoopFull) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
|
|
CanonicalLoopInfo *CLI = buildSingleLoopFunction(DL, OMPBuilder);
|
|
|
|
// Unroll the loop.
|
|
OMPBuilder.unrollLoopFull(DL, CLI);
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
PassBuilder PB;
|
|
FunctionAnalysisManager FAM;
|
|
PB.registerFunctionAnalyses(FAM);
|
|
LoopInfo &LI = FAM.getResult<LoopAnalysis>(*F);
|
|
|
|
const std::vector<Loop *> &TopLvl = LI.getTopLevelLoops();
|
|
EXPECT_EQ(TopLvl.size(), 1u);
|
|
|
|
Loop *L = TopLvl.front();
|
|
EXPECT_TRUE(getBooleanLoopAttribute(L, "llvm.loop.unroll.enable"));
|
|
EXPECT_TRUE(getBooleanLoopAttribute(L, "llvm.loop.unroll.full"));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, UnrollLoopPartial) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
CanonicalLoopInfo *CLI = buildSingleLoopFunction(DL, OMPBuilder);
|
|
|
|
// Unroll the loop.
|
|
CanonicalLoopInfo *UnrolledLoop = nullptr;
|
|
OMPBuilder.unrollLoopPartial(DL, CLI, 5, &UnrolledLoop);
|
|
ASSERT_NE(UnrolledLoop, nullptr);
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
UnrolledLoop->assertOK();
|
|
|
|
PassBuilder PB;
|
|
FunctionAnalysisManager FAM;
|
|
PB.registerFunctionAnalyses(FAM);
|
|
LoopInfo &LI = FAM.getResult<LoopAnalysis>(*F);
|
|
|
|
const std::vector<Loop *> &TopLvl = LI.getTopLevelLoops();
|
|
EXPECT_EQ(TopLvl.size(), 1u);
|
|
Loop *Outer = TopLvl.front();
|
|
EXPECT_EQ(Outer->getHeader(), UnrolledLoop->getHeader());
|
|
EXPECT_EQ(Outer->getLoopLatch(), UnrolledLoop->getLatch());
|
|
EXPECT_EQ(Outer->getExitingBlock(), UnrolledLoop->getCond());
|
|
EXPECT_EQ(Outer->getExitBlock(), UnrolledLoop->getExit());
|
|
|
|
EXPECT_EQ(Outer->getSubLoops().size(), 1u);
|
|
Loop *Inner = Outer->getSubLoops().front();
|
|
|
|
EXPECT_TRUE(getBooleanLoopAttribute(Inner, "llvm.loop.unroll.enable"));
|
|
EXPECT_EQ(getIntLoopAttribute(Inner, "llvm.loop.unroll.count"), 5);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, UnrollLoopHeuristic) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
|
|
CanonicalLoopInfo *CLI = buildSingleLoopFunction(DL, OMPBuilder);
|
|
|
|
// Unroll the loop.
|
|
OMPBuilder.unrollLoopHeuristic(DL, CLI);
|
|
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
PassBuilder PB;
|
|
FunctionAnalysisManager FAM;
|
|
PB.registerFunctionAnalyses(FAM);
|
|
LoopInfo &LI = FAM.getResult<LoopAnalysis>(*F);
|
|
|
|
const std::vector<Loop *> &TopLvl = LI.getTopLevelLoops();
|
|
EXPECT_EQ(TopLvl.size(), 1u);
|
|
|
|
Loop *L = TopLvl.front();
|
|
EXPECT_TRUE(getBooleanLoopAttribute(L, "llvm.loop.unroll.enable"));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, StaticWorkShareLoop) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
Type *LCTy = Type::getInt32Ty(Ctx);
|
|
Value *StartVal = ConstantInt::get(LCTy, 10);
|
|
Value *StopVal = ConstantInt::get(LCTy, 52);
|
|
Value *StepVal = ConstantInt::get(LCTy, 2);
|
|
auto LoopBodyGen = [&](InsertPointTy, llvm::Value *) {};
|
|
|
|
CanonicalLoopInfo *CLI = OMPBuilder.createCanonicalLoop(
|
|
Loc, LoopBodyGen, StartVal, StopVal, StepVal,
|
|
/*IsSigned=*/false, /*InclusiveStop=*/false);
|
|
BasicBlock *Preheader = CLI->getPreheader();
|
|
BasicBlock *Body = CLI->getBody();
|
|
Value *IV = CLI->getIndVar();
|
|
BasicBlock *ExitBlock = CLI->getExit();
|
|
|
|
Builder.SetInsertPoint(BB, BB->getFirstInsertionPt());
|
|
InsertPointTy AllocaIP = Builder.saveIP();
|
|
|
|
OMPBuilder.applyStaticWorkshareLoop(DL, CLI, AllocaIP, /*NeedsBarrier=*/true);
|
|
|
|
BasicBlock *Cond = Body->getSinglePredecessor();
|
|
Instruction *Cmp = &*Cond->begin();
|
|
Value *TripCount = Cmp->getOperand(1);
|
|
|
|
auto AllocaIter = BB->begin();
|
|
ASSERT_GE(std::distance(BB->begin(), BB->end()), 4);
|
|
AllocaInst *PLastIter = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
AllocaInst *PLowerBound = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
AllocaInst *PUpperBound = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
AllocaInst *PStride = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
EXPECT_NE(PLastIter, nullptr);
|
|
EXPECT_NE(PLowerBound, nullptr);
|
|
EXPECT_NE(PUpperBound, nullptr);
|
|
EXPECT_NE(PStride, nullptr);
|
|
|
|
auto PreheaderIter = Preheader->begin();
|
|
ASSERT_GE(std::distance(Preheader->begin(), Preheader->end()), 7);
|
|
StoreInst *LowerBoundStore = dyn_cast<StoreInst>(&*(PreheaderIter++));
|
|
StoreInst *UpperBoundStore = dyn_cast<StoreInst>(&*(PreheaderIter++));
|
|
StoreInst *StrideStore = dyn_cast<StoreInst>(&*(PreheaderIter++));
|
|
ASSERT_NE(LowerBoundStore, nullptr);
|
|
ASSERT_NE(UpperBoundStore, nullptr);
|
|
ASSERT_NE(StrideStore, nullptr);
|
|
|
|
auto *OrigLowerBound =
|
|
dyn_cast<ConstantInt>(LowerBoundStore->getValueOperand());
|
|
auto *OrigUpperBound =
|
|
dyn_cast<ConstantInt>(UpperBoundStore->getValueOperand());
|
|
auto *OrigStride = dyn_cast<ConstantInt>(StrideStore->getValueOperand());
|
|
ASSERT_NE(OrigLowerBound, nullptr);
|
|
ASSERT_NE(OrigUpperBound, nullptr);
|
|
ASSERT_NE(OrigStride, nullptr);
|
|
EXPECT_EQ(OrigLowerBound->getValue(), 0);
|
|
EXPECT_EQ(OrigUpperBound->getValue(), 20);
|
|
EXPECT_EQ(OrigStride->getValue(), 1);
|
|
|
|
// Check that the loop IV is updated to account for the lower bound returned
|
|
// by the OpenMP runtime call.
|
|
BinaryOperator *Add = dyn_cast<BinaryOperator>(&Body->front());
|
|
EXPECT_EQ(Add->getOperand(0), IV);
|
|
auto *LoadedLowerBound = dyn_cast<LoadInst>(Add->getOperand(1));
|
|
ASSERT_NE(LoadedLowerBound, nullptr);
|
|
EXPECT_EQ(LoadedLowerBound->getPointerOperand(), PLowerBound);
|
|
|
|
// Check that the trip count is updated to account for the lower and upper
|
|
// bounds return by the OpenMP runtime call.
|
|
auto *AddOne = dyn_cast<Instruction>(TripCount);
|
|
ASSERT_NE(AddOne, nullptr);
|
|
ASSERT_TRUE(AddOne->isBinaryOp());
|
|
auto *One = dyn_cast<ConstantInt>(AddOne->getOperand(1));
|
|
ASSERT_NE(One, nullptr);
|
|
EXPECT_EQ(One->getValue(), 1);
|
|
auto *Difference = dyn_cast<Instruction>(AddOne->getOperand(0));
|
|
ASSERT_NE(Difference, nullptr);
|
|
ASSERT_TRUE(Difference->isBinaryOp());
|
|
EXPECT_EQ(Difference->getOperand(1), LoadedLowerBound);
|
|
auto *LoadedUpperBound = dyn_cast<LoadInst>(Difference->getOperand(0));
|
|
ASSERT_NE(LoadedUpperBound, nullptr);
|
|
EXPECT_EQ(LoadedUpperBound->getPointerOperand(), PUpperBound);
|
|
|
|
// The original loop iterator should only be used in the condition, in the
|
|
// increment and in the statement that adds the lower bound to it.
|
|
EXPECT_EQ(std::distance(IV->use_begin(), IV->use_end()), 3);
|
|
|
|
// The exit block should contain the "fini" call and the barrier call,
|
|
// plus the call to obtain the thread ID.
|
|
size_t NumCallsInExitBlock =
|
|
count_if(*ExitBlock, [](Instruction &I) { return isa<CallInst>(I); });
|
|
EXPECT_EQ(NumCallsInExitBlock, 3u);
|
|
}
|
|
|
|
TEST_P(OpenMPIRBuilderTestWithParams, DynamicWorkShareLoop) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
omp::OMPScheduleType SchedType = GetParam();
|
|
uint32_t ChunkSize = 1;
|
|
switch (SchedType & ~omp::OMPScheduleType::ModifierMask) {
|
|
case omp::OMPScheduleType::DynamicChunked:
|
|
case omp::OMPScheduleType::GuidedChunked:
|
|
ChunkSize = 7;
|
|
break;
|
|
case omp::OMPScheduleType::Auto:
|
|
case omp::OMPScheduleType::Runtime:
|
|
ChunkSize = 1;
|
|
break;
|
|
default:
|
|
assert(0 && "unknown type for this test");
|
|
break;
|
|
}
|
|
|
|
Type *LCTy = Type::getInt32Ty(Ctx);
|
|
Value *StartVal = ConstantInt::get(LCTy, 10);
|
|
Value *StopVal = ConstantInt::get(LCTy, 52);
|
|
Value *StepVal = ConstantInt::get(LCTy, 2);
|
|
Value *ChunkVal = ConstantInt::get(LCTy, ChunkSize);
|
|
auto LoopBodyGen = [&](InsertPointTy, llvm::Value *) {};
|
|
|
|
CanonicalLoopInfo *CLI = OMPBuilder.createCanonicalLoop(
|
|
Loc, LoopBodyGen, StartVal, StopVal, StepVal,
|
|
/*IsSigned=*/false, /*InclusiveStop=*/false);
|
|
|
|
Builder.SetInsertPoint(BB, BB->getFirstInsertionPt());
|
|
InsertPointTy AllocaIP = Builder.saveIP();
|
|
|
|
// Collect all the info from CLI, as it isn't usable after the call to
|
|
// createDynamicWorkshareLoop.
|
|
InsertPointTy AfterIP = CLI->getAfterIP();
|
|
BasicBlock *Preheader = CLI->getPreheader();
|
|
BasicBlock *ExitBlock = CLI->getExit();
|
|
Value *IV = CLI->getIndVar();
|
|
|
|
InsertPointTy EndIP =
|
|
OMPBuilder.applyDynamicWorkshareLoop(DL, CLI, AllocaIP, SchedType,
|
|
/*NeedsBarrier=*/true, ChunkVal);
|
|
// The returned value should be the "after" point.
|
|
ASSERT_EQ(EndIP.getBlock(), AfterIP.getBlock());
|
|
ASSERT_EQ(EndIP.getPoint(), AfterIP.getPoint());
|
|
|
|
auto AllocaIter = BB->begin();
|
|
ASSERT_GE(std::distance(BB->begin(), BB->end()), 4);
|
|
AllocaInst *PLastIter = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
AllocaInst *PLowerBound = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
AllocaInst *PUpperBound = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
AllocaInst *PStride = dyn_cast<AllocaInst>(&*(AllocaIter++));
|
|
EXPECT_NE(PLastIter, nullptr);
|
|
EXPECT_NE(PLowerBound, nullptr);
|
|
EXPECT_NE(PUpperBound, nullptr);
|
|
EXPECT_NE(PStride, nullptr);
|
|
|
|
auto PreheaderIter = Preheader->begin();
|
|
ASSERT_GE(std::distance(Preheader->begin(), Preheader->end()), 6);
|
|
StoreInst *LowerBoundStore = dyn_cast<StoreInst>(&*(PreheaderIter++));
|
|
StoreInst *UpperBoundStore = dyn_cast<StoreInst>(&*(PreheaderIter++));
|
|
StoreInst *StrideStore = dyn_cast<StoreInst>(&*(PreheaderIter++));
|
|
ASSERT_NE(LowerBoundStore, nullptr);
|
|
ASSERT_NE(UpperBoundStore, nullptr);
|
|
ASSERT_NE(StrideStore, nullptr);
|
|
|
|
CallInst *ThreadIdCall = dyn_cast<CallInst>(&*(PreheaderIter++));
|
|
ASSERT_NE(ThreadIdCall, nullptr);
|
|
EXPECT_EQ(ThreadIdCall->getCalledFunction()->getName(),
|
|
"__kmpc_global_thread_num");
|
|
|
|
CallInst *InitCall = dyn_cast<CallInst>(&*PreheaderIter);
|
|
|
|
ASSERT_NE(InitCall, nullptr);
|
|
EXPECT_EQ(InitCall->getCalledFunction()->getName(),
|
|
"__kmpc_dispatch_init_4u");
|
|
EXPECT_EQ(InitCall->arg_size(), 7U);
|
|
EXPECT_EQ(InitCall->getArgOperand(6), ConstantInt::get(LCTy, ChunkSize));
|
|
ConstantInt *SchedVal = cast<ConstantInt>(InitCall->getArgOperand(2));
|
|
EXPECT_EQ(SchedVal->getValue(), static_cast<uint64_t>(SchedType));
|
|
|
|
ConstantInt *OrigLowerBound =
|
|
dyn_cast<ConstantInt>(LowerBoundStore->getValueOperand());
|
|
ConstantInt *OrigUpperBound =
|
|
dyn_cast<ConstantInt>(UpperBoundStore->getValueOperand());
|
|
ConstantInt *OrigStride =
|
|
dyn_cast<ConstantInt>(StrideStore->getValueOperand());
|
|
ASSERT_NE(OrigLowerBound, nullptr);
|
|
ASSERT_NE(OrigUpperBound, nullptr);
|
|
ASSERT_NE(OrigStride, nullptr);
|
|
EXPECT_EQ(OrigLowerBound->getValue(), 1);
|
|
EXPECT_EQ(OrigUpperBound->getValue(), 21);
|
|
EXPECT_EQ(OrigStride->getValue(), 1);
|
|
|
|
// The original loop iterator should only be used in the condition, in the
|
|
// increment and in the statement that adds the lower bound to it.
|
|
EXPECT_EQ(std::distance(IV->use_begin(), IV->use_end()), 3);
|
|
|
|
// The exit block should contain the barrier call, plus the call to obtain
|
|
// the thread ID.
|
|
size_t NumCallsInExitBlock =
|
|
count_if(*ExitBlock, [](Instruction &I) { return isa<CallInst>(I); });
|
|
EXPECT_EQ(NumCallsInExitBlock, 2u);
|
|
|
|
// Add a termination to our block and check that it is internally consistent.
|
|
Builder.restoreIP(EndIP);
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
INSTANTIATE_TEST_SUITE_P(
|
|
OpenMPWSLoopSchedulingTypes, OpenMPIRBuilderTestWithParams,
|
|
::testing::Values(omp::OMPScheduleType::DynamicChunked,
|
|
omp::OMPScheduleType::GuidedChunked,
|
|
omp::OMPScheduleType::Auto, omp::OMPScheduleType::Runtime,
|
|
omp::OMPScheduleType::DynamicChunked |
|
|
omp::OMPScheduleType::ModifierMonotonic,
|
|
omp::OMPScheduleType::DynamicChunked |
|
|
omp::OMPScheduleType::ModifierNonmonotonic,
|
|
omp::OMPScheduleType::GuidedChunked |
|
|
omp::OMPScheduleType::ModifierMonotonic,
|
|
omp::OMPScheduleType::GuidedChunked |
|
|
omp::OMPScheduleType::ModifierNonmonotonic,
|
|
omp::OMPScheduleType::Auto |
|
|
omp::OMPScheduleType::ModifierMonotonic,
|
|
omp::OMPScheduleType::Runtime |
|
|
omp::OMPScheduleType::ModifierMonotonic));
|
|
|
|
TEST_F(OpenMPIRBuilderTest, MasterDirective) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI = nullptr;
|
|
|
|
BasicBlock *EntryBB = nullptr;
|
|
BasicBlock *ExitBB = nullptr;
|
|
BasicBlock *ThenBB = nullptr;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
if (AllocaIP.isSet())
|
|
Builder.restoreIP(AllocaIP);
|
|
else
|
|
Builder.SetInsertPoint(&*(F->getEntryBlock().getFirstInsertionPt()));
|
|
PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
|
|
llvm::BasicBlock *CodeGenIPBB = CodeGenIP.getBlock();
|
|
llvm::Instruction *CodeGenIPInst = &*CodeGenIP.getPoint();
|
|
EXPECT_EQ(CodeGenIPBB->getTerminator(), CodeGenIPInst);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
// collect some info for checks later
|
|
ExitBB = FiniBB.getUniqueSuccessor();
|
|
ThenBB = Builder.GetInsertBlock();
|
|
EntryBB = ThenBB->getUniquePredecessor();
|
|
|
|
// simple instructions for body
|
|
Value *PrivLoad = Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI,
|
|
"local.use");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
Builder.restoreIP(OMPBuilder.createMaster(Builder, BodyGenCB, FiniCB));
|
|
Value *EntryBBTI = EntryBB->getTerminator();
|
|
EXPECT_NE(EntryBBTI, nullptr);
|
|
EXPECT_TRUE(isa<BranchInst>(EntryBBTI));
|
|
BranchInst *EntryBr = cast<BranchInst>(EntryBB->getTerminator());
|
|
EXPECT_TRUE(EntryBr->isConditional());
|
|
EXPECT_EQ(EntryBr->getSuccessor(0), ThenBB);
|
|
EXPECT_EQ(ThenBB->getUniqueSuccessor(), ExitBB);
|
|
EXPECT_EQ(EntryBr->getSuccessor(1), ExitBB);
|
|
|
|
CmpInst *CondInst = cast<CmpInst>(EntryBr->getCondition());
|
|
EXPECT_TRUE(isa<CallInst>(CondInst->getOperand(0)));
|
|
|
|
CallInst *MasterEntryCI = cast<CallInst>(CondInst->getOperand(0));
|
|
EXPECT_EQ(MasterEntryCI->arg_size(), 2U);
|
|
EXPECT_EQ(MasterEntryCI->getCalledFunction()->getName(), "__kmpc_master");
|
|
EXPECT_TRUE(isa<GlobalVariable>(MasterEntryCI->getArgOperand(0)));
|
|
|
|
CallInst *MasterEndCI = nullptr;
|
|
for (auto &FI : *ThenBB) {
|
|
Instruction *cur = &FI;
|
|
if (isa<CallInst>(cur)) {
|
|
MasterEndCI = cast<CallInst>(cur);
|
|
if (MasterEndCI->getCalledFunction()->getName() == "__kmpc_end_master")
|
|
break;
|
|
MasterEndCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(MasterEndCI, nullptr);
|
|
EXPECT_EQ(MasterEndCI->arg_size(), 2U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(MasterEndCI->getArgOperand(0)));
|
|
EXPECT_EQ(MasterEndCI->getArgOperand(1), MasterEntryCI->getArgOperand(1));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, MaskedDirective) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI = nullptr;
|
|
|
|
BasicBlock *EntryBB = nullptr;
|
|
BasicBlock *ExitBB = nullptr;
|
|
BasicBlock *ThenBB = nullptr;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
if (AllocaIP.isSet())
|
|
Builder.restoreIP(AllocaIP);
|
|
else
|
|
Builder.SetInsertPoint(&*(F->getEntryBlock().getFirstInsertionPt()));
|
|
PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
|
|
llvm::BasicBlock *CodeGenIPBB = CodeGenIP.getBlock();
|
|
llvm::Instruction *CodeGenIPInst = &*CodeGenIP.getPoint();
|
|
EXPECT_EQ(CodeGenIPBB->getTerminator(), CodeGenIPInst);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
// collect some info for checks later
|
|
ExitBB = FiniBB.getUniqueSuccessor();
|
|
ThenBB = Builder.GetInsertBlock();
|
|
EntryBB = ThenBB->getUniquePredecessor();
|
|
|
|
// simple instructions for body
|
|
Value *PrivLoad =
|
|
Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI, "local.use");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
Constant *Filter = ConstantInt::get(Type::getInt32Ty(M->getContext()), 0);
|
|
Builder.restoreIP(
|
|
OMPBuilder.createMasked(Builder, BodyGenCB, FiniCB, Filter));
|
|
Value *EntryBBTI = EntryBB->getTerminator();
|
|
EXPECT_NE(EntryBBTI, nullptr);
|
|
EXPECT_TRUE(isa<BranchInst>(EntryBBTI));
|
|
BranchInst *EntryBr = cast<BranchInst>(EntryBB->getTerminator());
|
|
EXPECT_TRUE(EntryBr->isConditional());
|
|
EXPECT_EQ(EntryBr->getSuccessor(0), ThenBB);
|
|
EXPECT_EQ(ThenBB->getUniqueSuccessor(), ExitBB);
|
|
EXPECT_EQ(EntryBr->getSuccessor(1), ExitBB);
|
|
|
|
CmpInst *CondInst = cast<CmpInst>(EntryBr->getCondition());
|
|
EXPECT_TRUE(isa<CallInst>(CondInst->getOperand(0)));
|
|
|
|
CallInst *MaskedEntryCI = cast<CallInst>(CondInst->getOperand(0));
|
|
EXPECT_EQ(MaskedEntryCI->arg_size(), 3U);
|
|
EXPECT_EQ(MaskedEntryCI->getCalledFunction()->getName(), "__kmpc_masked");
|
|
EXPECT_TRUE(isa<GlobalVariable>(MaskedEntryCI->getArgOperand(0)));
|
|
|
|
CallInst *MaskedEndCI = nullptr;
|
|
for (auto &FI : *ThenBB) {
|
|
Instruction *cur = &FI;
|
|
if (isa<CallInst>(cur)) {
|
|
MaskedEndCI = cast<CallInst>(cur);
|
|
if (MaskedEndCI->getCalledFunction()->getName() == "__kmpc_end_masked")
|
|
break;
|
|
MaskedEndCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(MaskedEndCI, nullptr);
|
|
EXPECT_EQ(MaskedEndCI->arg_size(), 2U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(MaskedEndCI->getArgOperand(0)));
|
|
EXPECT_EQ(MaskedEndCI->getArgOperand(1), MaskedEntryCI->getArgOperand(1));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CriticalDirective) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
|
|
BasicBlock *EntryBB = nullptr;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
// collect some info for checks later
|
|
EntryBB = FiniBB.getUniquePredecessor();
|
|
|
|
// actual start for bodyCB
|
|
llvm::BasicBlock *CodeGenIPBB = CodeGenIP.getBlock();
|
|
llvm::Instruction *CodeGenIPInst = &*CodeGenIP.getPoint();
|
|
EXPECT_EQ(CodeGenIPBB->getTerminator(), CodeGenIPInst);
|
|
EXPECT_EQ(EntryBB, CodeGenIPBB);
|
|
|
|
// body begin
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
Value *PrivLoad = Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI,
|
|
"local.use");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
Builder.restoreIP(OMPBuilder.createCritical(Builder, BodyGenCB, FiniCB,
|
|
"testCRT", nullptr));
|
|
|
|
Value *EntryBBTI = EntryBB->getTerminator();
|
|
EXPECT_EQ(EntryBBTI, nullptr);
|
|
|
|
CallInst *CriticalEntryCI = nullptr;
|
|
for (auto &EI : *EntryBB) {
|
|
Instruction *cur = &EI;
|
|
if (isa<CallInst>(cur)) {
|
|
CriticalEntryCI = cast<CallInst>(cur);
|
|
if (CriticalEntryCI->getCalledFunction()->getName() == "__kmpc_critical")
|
|
break;
|
|
CriticalEntryCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(CriticalEntryCI, nullptr);
|
|
EXPECT_EQ(CriticalEntryCI->arg_size(), 3U);
|
|
EXPECT_EQ(CriticalEntryCI->getCalledFunction()->getName(), "__kmpc_critical");
|
|
EXPECT_TRUE(isa<GlobalVariable>(CriticalEntryCI->getArgOperand(0)));
|
|
|
|
CallInst *CriticalEndCI = nullptr;
|
|
for (auto &FI : *EntryBB) {
|
|
Instruction *cur = &FI;
|
|
if (isa<CallInst>(cur)) {
|
|
CriticalEndCI = cast<CallInst>(cur);
|
|
if (CriticalEndCI->getCalledFunction()->getName() ==
|
|
"__kmpc_end_critical")
|
|
break;
|
|
CriticalEndCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(CriticalEndCI, nullptr);
|
|
EXPECT_EQ(CriticalEndCI->arg_size(), 3U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(CriticalEndCI->getArgOperand(0)));
|
|
EXPECT_EQ(CriticalEndCI->getArgOperand(1), CriticalEntryCI->getArgOperand(1));
|
|
PointerType *CriticalNamePtrTy =
|
|
PointerType::getUnqual(ArrayType::get(Type::getInt32Ty(Ctx), 8));
|
|
EXPECT_EQ(CriticalEndCI->getArgOperand(2), CriticalEntryCI->getArgOperand(2));
|
|
EXPECT_EQ(CriticalEndCI->getArgOperand(2)->getType(), CriticalNamePtrTy);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OrderedDirectiveDependSource) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
LLVMContext &Ctx = M->getContext();
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
InsertPointTy AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
|
|
unsigned NumLoops = 2;
|
|
SmallVector<Value *, 2> StoreValues;
|
|
Type *LCTy = Type::getInt64Ty(Ctx);
|
|
StoreValues.emplace_back(ConstantInt::get(LCTy, 1));
|
|
StoreValues.emplace_back(ConstantInt::get(LCTy, 2));
|
|
|
|
// Test for "#omp ordered depend(source)"
|
|
Builder.restoreIP(OMPBuilder.createOrderedDepend(Builder, AllocaIP, NumLoops,
|
|
StoreValues, ".cnt.addr",
|
|
/*IsDependSource=*/true));
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
AllocaInst *AllocInst = dyn_cast<AllocaInst>(&BB->front());
|
|
ASSERT_NE(AllocInst, nullptr);
|
|
ArrayType *ArrType = dyn_cast<ArrayType>(AllocInst->getAllocatedType());
|
|
EXPECT_EQ(ArrType->getNumElements(), NumLoops);
|
|
EXPECT_TRUE(
|
|
AllocInst->getAllocatedType()->getArrayElementType()->isIntegerTy(64));
|
|
|
|
Instruction *IterInst = dyn_cast<Instruction>(AllocInst);
|
|
for (unsigned Iter = 0; Iter < NumLoops; Iter++) {
|
|
GetElementPtrInst *DependAddrGEPIter =
|
|
dyn_cast<GetElementPtrInst>(IterInst->getNextNode());
|
|
ASSERT_NE(DependAddrGEPIter, nullptr);
|
|
EXPECT_EQ(DependAddrGEPIter->getPointerOperand(), AllocInst);
|
|
EXPECT_EQ(DependAddrGEPIter->getNumIndices(), (unsigned)2);
|
|
auto *FirstIdx = dyn_cast<ConstantInt>(DependAddrGEPIter->getOperand(1));
|
|
auto *SecondIdx = dyn_cast<ConstantInt>(DependAddrGEPIter->getOperand(2));
|
|
ASSERT_NE(FirstIdx, nullptr);
|
|
ASSERT_NE(SecondIdx, nullptr);
|
|
EXPECT_EQ(FirstIdx->getValue(), 0);
|
|
EXPECT_EQ(SecondIdx->getValue(), Iter);
|
|
StoreInst *StoreValue =
|
|
dyn_cast<StoreInst>(DependAddrGEPIter->getNextNode());
|
|
ASSERT_NE(StoreValue, nullptr);
|
|
EXPECT_EQ(StoreValue->getValueOperand(), StoreValues[Iter]);
|
|
EXPECT_EQ(StoreValue->getPointerOperand(), DependAddrGEPIter);
|
|
IterInst = dyn_cast<Instruction>(StoreValue);
|
|
}
|
|
|
|
GetElementPtrInst *DependBaseAddrGEP =
|
|
dyn_cast<GetElementPtrInst>(IterInst->getNextNode());
|
|
ASSERT_NE(DependBaseAddrGEP, nullptr);
|
|
EXPECT_EQ(DependBaseAddrGEP->getPointerOperand(), AllocInst);
|
|
EXPECT_EQ(DependBaseAddrGEP->getNumIndices(), (unsigned)2);
|
|
auto *FirstIdx = dyn_cast<ConstantInt>(DependBaseAddrGEP->getOperand(1));
|
|
auto *SecondIdx = dyn_cast<ConstantInt>(DependBaseAddrGEP->getOperand(2));
|
|
ASSERT_NE(FirstIdx, nullptr);
|
|
ASSERT_NE(SecondIdx, nullptr);
|
|
EXPECT_EQ(FirstIdx->getValue(), 0);
|
|
EXPECT_EQ(SecondIdx->getValue(), 0);
|
|
|
|
CallInst *GTID = dyn_cast<CallInst>(DependBaseAddrGEP->getNextNode());
|
|
ASSERT_NE(GTID, nullptr);
|
|
EXPECT_EQ(GTID->arg_size(), 1U);
|
|
EXPECT_EQ(GTID->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
CallInst *Depend = dyn_cast<CallInst>(GTID->getNextNode());
|
|
ASSERT_NE(Depend, nullptr);
|
|
EXPECT_EQ(Depend->arg_size(), 3U);
|
|
EXPECT_EQ(Depend->getCalledFunction()->getName(), "__kmpc_doacross_post");
|
|
EXPECT_TRUE(isa<GlobalVariable>(Depend->getArgOperand(0)));
|
|
EXPECT_EQ(Depend->getArgOperand(1), GTID);
|
|
EXPECT_EQ(Depend->getArgOperand(2), DependBaseAddrGEP);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OrderedDirectiveDependSink) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
LLVMContext &Ctx = M->getContext();
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
InsertPointTy AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
|
|
unsigned NumLoops = 2;
|
|
SmallVector<Value *, 2> StoreValues;
|
|
Type *LCTy = Type::getInt64Ty(Ctx);
|
|
StoreValues.emplace_back(ConstantInt::get(LCTy, 1));
|
|
StoreValues.emplace_back(ConstantInt::get(LCTy, 2));
|
|
|
|
// Test for "#omp ordered depend(sink: vec)"
|
|
Builder.restoreIP(OMPBuilder.createOrderedDepend(Builder, AllocaIP, NumLoops,
|
|
StoreValues, ".cnt.addr",
|
|
/*IsDependSource=*/false));
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
AllocaInst *AllocInst = dyn_cast<AllocaInst>(&BB->front());
|
|
ASSERT_NE(AllocInst, nullptr);
|
|
ArrayType *ArrType = dyn_cast<ArrayType>(AllocInst->getAllocatedType());
|
|
EXPECT_EQ(ArrType->getNumElements(), NumLoops);
|
|
EXPECT_TRUE(
|
|
AllocInst->getAllocatedType()->getArrayElementType()->isIntegerTy(64));
|
|
|
|
Instruction *IterInst = dyn_cast<Instruction>(AllocInst);
|
|
for (unsigned Iter = 0; Iter < NumLoops; Iter++) {
|
|
GetElementPtrInst *DependAddrGEPIter =
|
|
dyn_cast<GetElementPtrInst>(IterInst->getNextNode());
|
|
ASSERT_NE(DependAddrGEPIter, nullptr);
|
|
EXPECT_EQ(DependAddrGEPIter->getPointerOperand(), AllocInst);
|
|
EXPECT_EQ(DependAddrGEPIter->getNumIndices(), (unsigned)2);
|
|
auto *FirstIdx = dyn_cast<ConstantInt>(DependAddrGEPIter->getOperand(1));
|
|
auto *SecondIdx = dyn_cast<ConstantInt>(DependAddrGEPIter->getOperand(2));
|
|
ASSERT_NE(FirstIdx, nullptr);
|
|
ASSERT_NE(SecondIdx, nullptr);
|
|
EXPECT_EQ(FirstIdx->getValue(), 0);
|
|
EXPECT_EQ(SecondIdx->getValue(), Iter);
|
|
StoreInst *StoreValue =
|
|
dyn_cast<StoreInst>(DependAddrGEPIter->getNextNode());
|
|
ASSERT_NE(StoreValue, nullptr);
|
|
EXPECT_EQ(StoreValue->getValueOperand(), StoreValues[Iter]);
|
|
EXPECT_EQ(StoreValue->getPointerOperand(), DependAddrGEPIter);
|
|
IterInst = dyn_cast<Instruction>(StoreValue);
|
|
}
|
|
|
|
GetElementPtrInst *DependBaseAddrGEP =
|
|
dyn_cast<GetElementPtrInst>(IterInst->getNextNode());
|
|
ASSERT_NE(DependBaseAddrGEP, nullptr);
|
|
EXPECT_EQ(DependBaseAddrGEP->getPointerOperand(), AllocInst);
|
|
EXPECT_EQ(DependBaseAddrGEP->getNumIndices(), (unsigned)2);
|
|
auto *FirstIdx = dyn_cast<ConstantInt>(DependBaseAddrGEP->getOperand(1));
|
|
auto *SecondIdx = dyn_cast<ConstantInt>(DependBaseAddrGEP->getOperand(2));
|
|
ASSERT_NE(FirstIdx, nullptr);
|
|
ASSERT_NE(SecondIdx, nullptr);
|
|
EXPECT_EQ(FirstIdx->getValue(), 0);
|
|
EXPECT_EQ(SecondIdx->getValue(), 0);
|
|
|
|
CallInst *GTID = dyn_cast<CallInst>(DependBaseAddrGEP->getNextNode());
|
|
ASSERT_NE(GTID, nullptr);
|
|
EXPECT_EQ(GTID->arg_size(), 1U);
|
|
EXPECT_EQ(GTID->getCalledFunction()->getName(), "__kmpc_global_thread_num");
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotAccessMemory());
|
|
EXPECT_FALSE(GTID->getCalledFunction()->doesNotFreeMemory());
|
|
|
|
CallInst *Depend = dyn_cast<CallInst>(GTID->getNextNode());
|
|
ASSERT_NE(Depend, nullptr);
|
|
EXPECT_EQ(Depend->arg_size(), 3U);
|
|
EXPECT_EQ(Depend->getCalledFunction()->getName(), "__kmpc_doacross_wait");
|
|
EXPECT_TRUE(isa<GlobalVariable>(Depend->getArgOperand(0)));
|
|
EXPECT_EQ(Depend->getArgOperand(1), GTID);
|
|
EXPECT_EQ(Depend->getArgOperand(2), DependBaseAddrGEP);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OrderedDirectiveThreads) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI =
|
|
Builder.CreateAlloca(F->arg_begin()->getType(), nullptr, "priv.inst");
|
|
|
|
BasicBlock *EntryBB = nullptr;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
EntryBB = FiniBB.getUniquePredecessor();
|
|
|
|
llvm::BasicBlock *CodeGenIPBB = CodeGenIP.getBlock();
|
|
llvm::Instruction *CodeGenIPInst = &*CodeGenIP.getPoint();
|
|
EXPECT_EQ(CodeGenIPBB->getTerminator(), CodeGenIPInst);
|
|
EXPECT_EQ(EntryBB, CodeGenIPBB);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
Value *PrivLoad =
|
|
Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI, "local.use");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
// Test for "#omp ordered [threads]"
|
|
Builder.restoreIP(
|
|
OMPBuilder.createOrderedThreadsSimd(Builder, BodyGenCB, FiniCB, true));
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_NE(EntryBB->getTerminator(), nullptr);
|
|
|
|
CallInst *OrderedEntryCI = nullptr;
|
|
for (auto &EI : *EntryBB) {
|
|
Instruction *Cur = &EI;
|
|
if (isa<CallInst>(Cur)) {
|
|
OrderedEntryCI = cast<CallInst>(Cur);
|
|
if (OrderedEntryCI->getCalledFunction()->getName() == "__kmpc_ordered")
|
|
break;
|
|
OrderedEntryCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(OrderedEntryCI, nullptr);
|
|
EXPECT_EQ(OrderedEntryCI->arg_size(), 2U);
|
|
EXPECT_EQ(OrderedEntryCI->getCalledFunction()->getName(), "__kmpc_ordered");
|
|
EXPECT_TRUE(isa<GlobalVariable>(OrderedEntryCI->getArgOperand(0)));
|
|
|
|
CallInst *OrderedEndCI = nullptr;
|
|
for (auto &FI : *EntryBB) {
|
|
Instruction *Cur = &FI;
|
|
if (isa<CallInst>(Cur)) {
|
|
OrderedEndCI = cast<CallInst>(Cur);
|
|
if (OrderedEndCI->getCalledFunction()->getName() == "__kmpc_end_ordered")
|
|
break;
|
|
OrderedEndCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(OrderedEndCI, nullptr);
|
|
EXPECT_EQ(OrderedEndCI->arg_size(), 2U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(OrderedEndCI->getArgOperand(0)));
|
|
EXPECT_EQ(OrderedEndCI->getArgOperand(1), OrderedEntryCI->getArgOperand(1));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OrderedDirectiveSimd) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI =
|
|
Builder.CreateAlloca(F->arg_begin()->getType(), nullptr, "priv.inst");
|
|
|
|
BasicBlock *EntryBB = nullptr;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
EntryBB = FiniBB.getUniquePredecessor();
|
|
|
|
llvm::BasicBlock *CodeGenIPBB = CodeGenIP.getBlock();
|
|
llvm::Instruction *CodeGenIPInst = &*CodeGenIP.getPoint();
|
|
EXPECT_EQ(CodeGenIPBB->getTerminator(), CodeGenIPInst);
|
|
EXPECT_EQ(EntryBB, CodeGenIPBB);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
Value *PrivLoad =
|
|
Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI, "local.use");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
// Test for "#omp ordered simd"
|
|
Builder.restoreIP(
|
|
OMPBuilder.createOrderedThreadsSimd(Builder, BodyGenCB, FiniCB, false));
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
|
|
EXPECT_NE(EntryBB->getTerminator(), nullptr);
|
|
|
|
CallInst *OrderedEntryCI = nullptr;
|
|
for (auto &EI : *EntryBB) {
|
|
Instruction *Cur = &EI;
|
|
if (isa<CallInst>(Cur)) {
|
|
OrderedEntryCI = cast<CallInst>(Cur);
|
|
if (OrderedEntryCI->getCalledFunction()->getName() == "__kmpc_ordered")
|
|
break;
|
|
OrderedEntryCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_EQ(OrderedEntryCI, nullptr);
|
|
|
|
CallInst *OrderedEndCI = nullptr;
|
|
for (auto &FI : *EntryBB) {
|
|
Instruction *Cur = &FI;
|
|
if (isa<CallInst>(Cur)) {
|
|
OrderedEndCI = cast<CallInst>(Cur);
|
|
if (OrderedEndCI->getCalledFunction()->getName() == "__kmpc_end_ordered")
|
|
break;
|
|
OrderedEndCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_EQ(OrderedEndCI, nullptr);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CopyinBlocks) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
IntegerType* Int32 = Type::getInt32Ty(M->getContext());
|
|
AllocaInst* MasterAddress = Builder.CreateAlloca(Int32->getPointerTo());
|
|
AllocaInst* PrivAddress = Builder.CreateAlloca(Int32->getPointerTo());
|
|
|
|
BasicBlock *EntryBB = BB;
|
|
|
|
OMPBuilder.createCopyinClauseBlocks(Builder.saveIP(), MasterAddress,
|
|
PrivAddress, Int32, /*BranchtoEnd*/ true);
|
|
|
|
BranchInst* EntryBr = dyn_cast_or_null<BranchInst>(EntryBB->getTerminator());
|
|
|
|
EXPECT_NE(EntryBr, nullptr);
|
|
EXPECT_TRUE(EntryBr->isConditional());
|
|
|
|
BasicBlock* NotMasterBB = EntryBr->getSuccessor(0);
|
|
BasicBlock* CopyinEnd = EntryBr->getSuccessor(1);
|
|
CmpInst* CMP = dyn_cast_or_null<CmpInst>(EntryBr->getCondition());
|
|
|
|
EXPECT_NE(CMP, nullptr);
|
|
EXPECT_NE(NotMasterBB, nullptr);
|
|
EXPECT_NE(CopyinEnd, nullptr);
|
|
|
|
BranchInst* NotMasterBr = dyn_cast_or_null<BranchInst>(NotMasterBB->getTerminator());
|
|
EXPECT_NE(NotMasterBr, nullptr);
|
|
EXPECT_FALSE(NotMasterBr->isConditional());
|
|
EXPECT_EQ(CopyinEnd,NotMasterBr->getSuccessor(0));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, SingleDirective) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
AllocaInst *PrivAI = nullptr;
|
|
|
|
BasicBlock *EntryBB = nullptr;
|
|
BasicBlock *ExitBB = nullptr;
|
|
BasicBlock *ThenBB = nullptr;
|
|
|
|
auto BodyGenCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
if (AllocaIP.isSet())
|
|
Builder.restoreIP(AllocaIP);
|
|
else
|
|
Builder.SetInsertPoint(&*(F->getEntryBlock().getFirstInsertionPt()));
|
|
PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
|
|
llvm::BasicBlock *CodeGenIPBB = CodeGenIP.getBlock();
|
|
llvm::Instruction *CodeGenIPInst = &*CodeGenIP.getPoint();
|
|
EXPECT_EQ(CodeGenIPBB->getTerminator(), CodeGenIPInst);
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
// collect some info for checks later
|
|
ExitBB = FiniBB.getUniqueSuccessor();
|
|
ThenBB = Builder.GetInsertBlock();
|
|
EntryBB = ThenBB->getUniquePredecessor();
|
|
|
|
// simple instructions for body
|
|
Value *PrivLoad = Builder.CreateLoad(PrivAI->getAllocatedType(), PrivAI,
|
|
"local.use");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
};
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
Builder.restoreIP(
|
|
OMPBuilder.createSingle(Builder, BodyGenCB, FiniCB, /*DidIt*/ nullptr));
|
|
Value *EntryBBTI = EntryBB->getTerminator();
|
|
EXPECT_NE(EntryBBTI, nullptr);
|
|
EXPECT_TRUE(isa<BranchInst>(EntryBBTI));
|
|
BranchInst *EntryBr = cast<BranchInst>(EntryBB->getTerminator());
|
|
EXPECT_TRUE(EntryBr->isConditional());
|
|
EXPECT_EQ(EntryBr->getSuccessor(0), ThenBB);
|
|
EXPECT_EQ(ThenBB->getUniqueSuccessor(), ExitBB);
|
|
EXPECT_EQ(EntryBr->getSuccessor(1), ExitBB);
|
|
|
|
CmpInst *CondInst = cast<CmpInst>(EntryBr->getCondition());
|
|
EXPECT_TRUE(isa<CallInst>(CondInst->getOperand(0)));
|
|
|
|
CallInst *SingleEntryCI = cast<CallInst>(CondInst->getOperand(0));
|
|
EXPECT_EQ(SingleEntryCI->arg_size(), 2U);
|
|
EXPECT_EQ(SingleEntryCI->getCalledFunction()->getName(), "__kmpc_single");
|
|
EXPECT_TRUE(isa<GlobalVariable>(SingleEntryCI->getArgOperand(0)));
|
|
|
|
CallInst *SingleEndCI = nullptr;
|
|
for (auto &FI : *ThenBB) {
|
|
Instruction *cur = &FI;
|
|
if (isa<CallInst>(cur)) {
|
|
SingleEndCI = cast<CallInst>(cur);
|
|
if (SingleEndCI->getCalledFunction()->getName() == "__kmpc_end_single")
|
|
break;
|
|
SingleEndCI = nullptr;
|
|
}
|
|
}
|
|
EXPECT_NE(SingleEndCI, nullptr);
|
|
EXPECT_EQ(SingleEndCI->arg_size(), 2U);
|
|
EXPECT_TRUE(isa<GlobalVariable>(SingleEndCI->getArgOperand(0)));
|
|
EXPECT_EQ(SingleEndCI->getArgOperand(1), SingleEntryCI->getArgOperand(1));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OMPAtomicReadFlt) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
Type *Float32 = Type::getFloatTy(M->getContext());
|
|
AllocaInst *XVal = Builder.CreateAlloca(Float32);
|
|
XVal->setName("AtomicVar");
|
|
AllocaInst *VVal = Builder.CreateAlloca(Float32);
|
|
VVal->setName("AtomicRead");
|
|
AtomicOrdering AO = AtomicOrdering::Monotonic;
|
|
OpenMPIRBuilder::AtomicOpValue X = {XVal, false, false};
|
|
OpenMPIRBuilder::AtomicOpValue V = {VVal, false, false};
|
|
|
|
Builder.restoreIP(OMPBuilder.createAtomicRead(Loc, X, V, AO));
|
|
|
|
IntegerType *IntCastTy =
|
|
IntegerType::get(M->getContext(), Float32->getScalarSizeInBits());
|
|
|
|
BitCastInst *CastFrmFlt = cast<BitCastInst>(VVal->getNextNode());
|
|
EXPECT_EQ(CastFrmFlt->getSrcTy(), Float32->getPointerTo());
|
|
EXPECT_EQ(CastFrmFlt->getDestTy(), IntCastTy->getPointerTo());
|
|
EXPECT_EQ(CastFrmFlt->getOperand(0), XVal);
|
|
|
|
LoadInst *AtomicLoad = cast<LoadInst>(CastFrmFlt->getNextNode());
|
|
EXPECT_TRUE(AtomicLoad->isAtomic());
|
|
EXPECT_EQ(AtomicLoad->getPointerOperand(), CastFrmFlt);
|
|
|
|
BitCastInst *CastToFlt = cast<BitCastInst>(AtomicLoad->getNextNode());
|
|
EXPECT_EQ(CastToFlt->getSrcTy(), IntCastTy);
|
|
EXPECT_EQ(CastToFlt->getDestTy(), Float32);
|
|
EXPECT_EQ(CastToFlt->getOperand(0), AtomicLoad);
|
|
|
|
StoreInst *StoreofAtomic = cast<StoreInst>(CastToFlt->getNextNode());
|
|
EXPECT_EQ(StoreofAtomic->getValueOperand(), CastToFlt);
|
|
EXPECT_EQ(StoreofAtomic->getPointerOperand(), VVal);
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OMPAtomicReadInt) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
IntegerType *Int32 = Type::getInt32Ty(M->getContext());
|
|
AllocaInst *XVal = Builder.CreateAlloca(Int32);
|
|
XVal->setName("AtomicVar");
|
|
AllocaInst *VVal = Builder.CreateAlloca(Int32);
|
|
VVal->setName("AtomicRead");
|
|
AtomicOrdering AO = AtomicOrdering::Monotonic;
|
|
OpenMPIRBuilder::AtomicOpValue X = {XVal, false, false};
|
|
OpenMPIRBuilder::AtomicOpValue V = {VVal, false, false};
|
|
|
|
BasicBlock *EntryBB = BB;
|
|
|
|
Builder.restoreIP(OMPBuilder.createAtomicRead(Loc, X, V, AO));
|
|
LoadInst *AtomicLoad = nullptr;
|
|
StoreInst *StoreofAtomic = nullptr;
|
|
|
|
for (Instruction &Cur : *EntryBB) {
|
|
if (isa<LoadInst>(Cur)) {
|
|
AtomicLoad = cast<LoadInst>(&Cur);
|
|
if (AtomicLoad->getPointerOperand() == XVal)
|
|
continue;
|
|
AtomicLoad = nullptr;
|
|
} else if (isa<StoreInst>(Cur)) {
|
|
StoreofAtomic = cast<StoreInst>(&Cur);
|
|
if (StoreofAtomic->getPointerOperand() == VVal)
|
|
continue;
|
|
StoreofAtomic = nullptr;
|
|
}
|
|
}
|
|
|
|
EXPECT_NE(AtomicLoad, nullptr);
|
|
EXPECT_TRUE(AtomicLoad->isAtomic());
|
|
|
|
EXPECT_NE(StoreofAtomic, nullptr);
|
|
EXPECT_EQ(StoreofAtomic->getValueOperand(), AtomicLoad);
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OMPAtomicWriteFlt) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
LLVMContext &Ctx = M->getContext();
|
|
Type *Float32 = Type::getFloatTy(Ctx);
|
|
AllocaInst *XVal = Builder.CreateAlloca(Float32);
|
|
XVal->setName("AtomicVar");
|
|
OpenMPIRBuilder::AtomicOpValue X = {XVal, false, false};
|
|
AtomicOrdering AO = AtomicOrdering::Monotonic;
|
|
Constant *ValToWrite = ConstantFP::get(Float32, 1.0);
|
|
|
|
Builder.restoreIP(OMPBuilder.createAtomicWrite(Loc, X, ValToWrite, AO));
|
|
|
|
IntegerType *IntCastTy =
|
|
IntegerType::get(M->getContext(), Float32->getScalarSizeInBits());
|
|
|
|
BitCastInst *CastFrmFlt = cast<BitCastInst>(XVal->getNextNode());
|
|
EXPECT_EQ(CastFrmFlt->getSrcTy(), Float32->getPointerTo());
|
|
EXPECT_EQ(CastFrmFlt->getDestTy(), IntCastTy->getPointerTo());
|
|
EXPECT_EQ(CastFrmFlt->getOperand(0), XVal);
|
|
|
|
Value *ExprCast = Builder.CreateBitCast(ValToWrite, IntCastTy);
|
|
|
|
StoreInst *StoreofAtomic = cast<StoreInst>(CastFrmFlt->getNextNode());
|
|
EXPECT_EQ(StoreofAtomic->getValueOperand(), ExprCast);
|
|
EXPECT_EQ(StoreofAtomic->getPointerOperand(), CastFrmFlt);
|
|
EXPECT_TRUE(StoreofAtomic->isAtomic());
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OMPAtomicWriteInt) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
LLVMContext &Ctx = M->getContext();
|
|
IntegerType *Int32 = Type::getInt32Ty(Ctx);
|
|
AllocaInst *XVal = Builder.CreateAlloca(Int32);
|
|
XVal->setName("AtomicVar");
|
|
OpenMPIRBuilder::AtomicOpValue X = {XVal, false, false};
|
|
AtomicOrdering AO = AtomicOrdering::Monotonic;
|
|
ConstantInt *ValToWrite = ConstantInt::get(Type::getInt32Ty(Ctx), 1U);
|
|
|
|
BasicBlock *EntryBB = BB;
|
|
|
|
Builder.restoreIP(OMPBuilder.createAtomicWrite(Loc, X, ValToWrite, AO));
|
|
|
|
StoreInst *StoreofAtomic = nullptr;
|
|
|
|
for (Instruction &Cur : *EntryBB) {
|
|
if (isa<StoreInst>(Cur)) {
|
|
StoreofAtomic = cast<StoreInst>(&Cur);
|
|
if (StoreofAtomic->getPointerOperand() == XVal)
|
|
continue;
|
|
StoreofAtomic = nullptr;
|
|
}
|
|
}
|
|
|
|
EXPECT_NE(StoreofAtomic, nullptr);
|
|
EXPECT_TRUE(StoreofAtomic->isAtomic());
|
|
EXPECT_EQ(StoreofAtomic->getValueOperand(), ValToWrite);
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OMPAtomicUpdate) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
IntegerType *Int32 = Type::getInt32Ty(M->getContext());
|
|
AllocaInst *XVal = Builder.CreateAlloca(Int32);
|
|
XVal->setName("AtomicVar");
|
|
Builder.CreateStore(ConstantInt::get(Type::getInt32Ty(Ctx), 0U), XVal);
|
|
OpenMPIRBuilder::AtomicOpValue X = {XVal, false, false};
|
|
AtomicOrdering AO = AtomicOrdering::Monotonic;
|
|
ConstantInt *ConstVal = ConstantInt::get(Type::getInt32Ty(Ctx), 1U);
|
|
Value *Expr = nullptr;
|
|
AtomicRMWInst::BinOp RMWOp = AtomicRMWInst::Sub;
|
|
bool IsXLHSInRHSPart = false;
|
|
|
|
BasicBlock *EntryBB = BB;
|
|
Instruction *AllocIP = EntryBB->getFirstNonPHI();
|
|
Value *Sub = nullptr;
|
|
|
|
auto UpdateOp = [&](Value *Atomic, IRBuilder<> &IRB) {
|
|
Sub = IRB.CreateSub(ConstVal, Atomic);
|
|
return Sub;
|
|
};
|
|
Builder.restoreIP(OMPBuilder.createAtomicUpdate(
|
|
Builder, AllocIP, X, Expr, AO, RMWOp, UpdateOp, IsXLHSInRHSPart));
|
|
BasicBlock *ContBB = EntryBB->getSingleSuccessor();
|
|
BranchInst *ContTI = dyn_cast<BranchInst>(ContBB->getTerminator());
|
|
EXPECT_NE(ContTI, nullptr);
|
|
BasicBlock *EndBB = ContTI->getSuccessor(0);
|
|
EXPECT_TRUE(ContTI->isConditional());
|
|
EXPECT_EQ(ContTI->getSuccessor(1), ContBB);
|
|
EXPECT_NE(EndBB, nullptr);
|
|
|
|
PHINode *Phi = dyn_cast<PHINode>(&ContBB->front());
|
|
EXPECT_NE(Phi, nullptr);
|
|
EXPECT_EQ(Phi->getNumIncomingValues(), 2U);
|
|
EXPECT_EQ(Phi->getIncomingBlock(0), EntryBB);
|
|
EXPECT_EQ(Phi->getIncomingBlock(1), ContBB);
|
|
|
|
EXPECT_EQ(Sub->getNumUses(), 1U);
|
|
StoreInst *St = dyn_cast<StoreInst>(Sub->user_back());
|
|
AllocaInst *UpdateTemp = dyn_cast<AllocaInst>(St->getPointerOperand());
|
|
|
|
ExtractValueInst *ExVI1 =
|
|
dyn_cast<ExtractValueInst>(Phi->getIncomingValueForBlock(ContBB));
|
|
EXPECT_NE(ExVI1, nullptr);
|
|
AtomicCmpXchgInst *CmpExchg =
|
|
dyn_cast<AtomicCmpXchgInst>(ExVI1->getAggregateOperand());
|
|
EXPECT_NE(CmpExchg, nullptr);
|
|
EXPECT_EQ(CmpExchg->getPointerOperand(), XVal);
|
|
EXPECT_EQ(CmpExchg->getCompareOperand(), Phi);
|
|
EXPECT_EQ(CmpExchg->getSuccessOrdering(), AtomicOrdering::Monotonic);
|
|
|
|
LoadInst *Ld = dyn_cast<LoadInst>(CmpExchg->getNewValOperand());
|
|
EXPECT_NE(Ld, nullptr);
|
|
EXPECT_EQ(UpdateTemp, Ld->getPointerOperand());
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, OMPAtomicCapture) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
LLVMContext &Ctx = M->getContext();
|
|
IntegerType *Int32 = Type::getInt32Ty(Ctx);
|
|
AllocaInst *XVal = Builder.CreateAlloca(Int32);
|
|
XVal->setName("AtomicVar");
|
|
AllocaInst *VVal = Builder.CreateAlloca(Int32);
|
|
VVal->setName("AtomicCapTar");
|
|
StoreInst *Init =
|
|
Builder.CreateStore(ConstantInt::get(Type::getInt32Ty(Ctx), 0U), XVal);
|
|
|
|
OpenMPIRBuilder::AtomicOpValue X = {XVal, false, false};
|
|
OpenMPIRBuilder::AtomicOpValue V = {VVal, false, false};
|
|
AtomicOrdering AO = AtomicOrdering::Monotonic;
|
|
ConstantInt *Expr = ConstantInt::get(Type::getInt32Ty(Ctx), 1U);
|
|
AtomicRMWInst::BinOp RMWOp = AtomicRMWInst::Add;
|
|
bool IsXLHSInRHSPart = true;
|
|
bool IsPostfixUpdate = true;
|
|
bool UpdateExpr = true;
|
|
|
|
BasicBlock *EntryBB = BB;
|
|
Instruction *AllocIP = EntryBB->getFirstNonPHI();
|
|
|
|
// integer update - not used
|
|
auto UpdateOp = [&](Value *Atomic, IRBuilder<> &IRB) { return nullptr; };
|
|
|
|
Builder.restoreIP(OMPBuilder.createAtomicCapture(
|
|
Builder, AllocIP, X, V, Expr, AO, RMWOp, UpdateOp, UpdateExpr,
|
|
IsPostfixUpdate, IsXLHSInRHSPart));
|
|
EXPECT_EQ(EntryBB->getParent()->size(), 1U);
|
|
AtomicRMWInst *ARWM = dyn_cast<AtomicRMWInst>(Init->getNextNode());
|
|
EXPECT_NE(ARWM, nullptr);
|
|
EXPECT_EQ(ARWM->getPointerOperand(), XVal);
|
|
EXPECT_EQ(ARWM->getOperation(), RMWOp);
|
|
StoreInst *St = dyn_cast<StoreInst>(ARWM->user_back());
|
|
EXPECT_NE(St, nullptr);
|
|
EXPECT_EQ(St->getPointerOperand(), VVal);
|
|
|
|
Builder.CreateRetVoid();
|
|
OMPBuilder.finalize();
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
}
|
|
|
|
/// Returns the single instruction of InstTy type in BB that uses the value V.
|
|
/// If there is more than one such instruction, returns null.
|
|
template <typename InstTy>
|
|
static InstTy *findSingleUserInBlock(Value *V, BasicBlock *BB) {
|
|
InstTy *Result = nullptr;
|
|
for (User *U : V->users()) {
|
|
auto *Inst = dyn_cast<InstTy>(U);
|
|
if (!Inst || Inst->getParent() != BB)
|
|
continue;
|
|
if (Result)
|
|
return nullptr;
|
|
Result = Inst;
|
|
}
|
|
return Result;
|
|
}
|
|
|
|
/// Returns true if BB contains a simple binary reduction that loads a value
|
|
/// from Accum, performs some binary operation with it, and stores it back to
|
|
/// Accum.
|
|
static bool isSimpleBinaryReduction(Value *Accum, BasicBlock *BB,
|
|
Instruction::BinaryOps *OpCode = nullptr) {
|
|
StoreInst *Store = findSingleUserInBlock<StoreInst>(Accum, BB);
|
|
if (!Store)
|
|
return false;
|
|
auto *Stored = dyn_cast<BinaryOperator>(Store->getOperand(0));
|
|
if (!Stored)
|
|
return false;
|
|
if (OpCode && *OpCode != Stored->getOpcode())
|
|
return false;
|
|
auto *Load = dyn_cast<LoadInst>(Stored->getOperand(0));
|
|
return Load && Load->getOperand(0) == Accum;
|
|
}
|
|
|
|
/// Returns true if BB contains a binary reduction that reduces V using a binary
|
|
/// operator into an accumulator that is a function argument.
|
|
static bool isValueReducedToFuncArg(Value *V, BasicBlock *BB) {
|
|
auto *ReductionOp = findSingleUserInBlock<BinaryOperator>(V, BB);
|
|
if (!ReductionOp)
|
|
return false;
|
|
|
|
auto *GlobalLoad = dyn_cast<LoadInst>(ReductionOp->getOperand(0));
|
|
if (!GlobalLoad)
|
|
return false;
|
|
|
|
auto *Store = findSingleUserInBlock<StoreInst>(ReductionOp, BB);
|
|
if (!Store)
|
|
return false;
|
|
|
|
return Store->getPointerOperand() == GlobalLoad->getPointerOperand() &&
|
|
isa<Argument>(GlobalLoad->getPointerOperand());
|
|
}
|
|
|
|
/// Finds among users of Ptr a pair of GEP instructions with indices [0, 0] and
|
|
/// [0, 1], respectively, and assigns results of these instructions to Zero and
|
|
/// One. Returns true on success, false on failure or if such instructions are
|
|
/// not unique among the users of Ptr.
|
|
static bool findGEPZeroOne(Value *Ptr, Value *&Zero, Value *&One) {
|
|
Zero = nullptr;
|
|
One = nullptr;
|
|
for (User *U : Ptr->users()) {
|
|
if (auto *GEP = dyn_cast<GetElementPtrInst>(U)) {
|
|
if (GEP->getNumIndices() != 2)
|
|
continue;
|
|
auto *FirstIdx = dyn_cast<ConstantInt>(GEP->getOperand(1));
|
|
auto *SecondIdx = dyn_cast<ConstantInt>(GEP->getOperand(2));
|
|
EXPECT_NE(FirstIdx, nullptr);
|
|
EXPECT_NE(SecondIdx, nullptr);
|
|
|
|
EXPECT_TRUE(FirstIdx->isZero());
|
|
if (SecondIdx->isZero()) {
|
|
if (Zero)
|
|
return false;
|
|
Zero = GEP;
|
|
} else if (SecondIdx->isOne()) {
|
|
if (One)
|
|
return false;
|
|
One = GEP;
|
|
} else {
|
|
return false;
|
|
}
|
|
}
|
|
}
|
|
return Zero != nullptr && One != nullptr;
|
|
}
|
|
|
|
static OpenMPIRBuilder::InsertPointTy
|
|
sumReduction(OpenMPIRBuilder::InsertPointTy IP, Value *LHS, Value *RHS,
|
|
Value *&Result) {
|
|
IRBuilder<> Builder(IP.getBlock(), IP.getPoint());
|
|
Result = Builder.CreateFAdd(LHS, RHS, "red.add");
|
|
return Builder.saveIP();
|
|
}
|
|
|
|
static OpenMPIRBuilder::InsertPointTy
|
|
sumAtomicReduction(OpenMPIRBuilder::InsertPointTy IP, Value *LHS, Value *RHS) {
|
|
IRBuilder<> Builder(IP.getBlock(), IP.getPoint());
|
|
Value *Partial = Builder.CreateLoad(RHS->getType()->getPointerElementType(),
|
|
RHS, "red.partial");
|
|
Builder.CreateAtomicRMW(AtomicRMWInst::FAdd, LHS, Partial, None,
|
|
AtomicOrdering::Monotonic);
|
|
return Builder.saveIP();
|
|
}
|
|
|
|
static OpenMPIRBuilder::InsertPointTy
|
|
xorReduction(OpenMPIRBuilder::InsertPointTy IP, Value *LHS, Value *RHS,
|
|
Value *&Result) {
|
|
IRBuilder<> Builder(IP.getBlock(), IP.getPoint());
|
|
Result = Builder.CreateXor(LHS, RHS, "red.xor");
|
|
return Builder.saveIP();
|
|
}
|
|
|
|
static OpenMPIRBuilder::InsertPointTy
|
|
xorAtomicReduction(OpenMPIRBuilder::InsertPointTy IP, Value *LHS, Value *RHS) {
|
|
IRBuilder<> Builder(IP.getBlock(), IP.getPoint());
|
|
Value *Partial = Builder.CreateLoad(RHS->getType()->getPointerElementType(),
|
|
RHS, "red.partial");
|
|
Builder.CreateAtomicRMW(AtomicRMWInst::Xor, LHS, Partial, None,
|
|
AtomicOrdering::Monotonic);
|
|
return Builder.saveIP();
|
|
}
|
|
|
|
/// Populate Calls with call instructions calling the function with the given
|
|
/// FnID from the given function F.
|
|
static void findCalls(Function *F, omp::RuntimeFunction FnID,
|
|
OpenMPIRBuilder &OMPBuilder,
|
|
SmallVectorImpl<CallInst *> &Calls) {
|
|
Function *Fn = OMPBuilder.getOrCreateRuntimeFunctionPtr(FnID);
|
|
for (BasicBlock &BB : *F) {
|
|
for (Instruction &I : BB) {
|
|
auto *Call = dyn_cast<CallInst>(&I);
|
|
if (Call && Call->getCalledFunction() == Fn)
|
|
Calls.push_back(Call);
|
|
}
|
|
}
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateReductions) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
// Create variables to be reduced.
|
|
InsertPointTy OuterAllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
Value *SumReduced;
|
|
Value *XorReduced;
|
|
{
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(OuterAllocaIP);
|
|
SumReduced = Builder.CreateAlloca(Builder.getFloatTy());
|
|
XorReduced = Builder.CreateAlloca(Builder.getInt32Ty());
|
|
}
|
|
|
|
// Store initial values of reductions into global variables.
|
|
Builder.CreateStore(ConstantFP::get(Builder.getFloatTy(), 0.0), SumReduced);
|
|
Builder.CreateStore(Builder.getInt32(1), XorReduced);
|
|
|
|
// The loop body computes two reductions:
|
|
// sum of (float) thread-id;
|
|
// xor of thread-id;
|
|
// and store the result in global variables.
|
|
InsertPointTy BodyIP, BodyAllocaIP;
|
|
auto BodyGenCB = [&](InsertPointTy InnerAllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationBB) {
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
Constant *SrcLocStr = OMPBuilder.getOrCreateSrcLocStr(Loc);
|
|
Value *Ident = OMPBuilder.getOrCreateIdent(SrcLocStr);
|
|
Value *TID = OMPBuilder.getOrCreateThreadID(Ident);
|
|
Value *SumLocal =
|
|
Builder.CreateUIToFP(TID, Builder.getFloatTy(), "sum.local");
|
|
Value *SumPartial =
|
|
Builder.CreateLoad(SumReduced->getType()->getPointerElementType(),
|
|
SumReduced, "sum.partial");
|
|
Value *XorPartial =
|
|
Builder.CreateLoad(XorReduced->getType()->getPointerElementType(),
|
|
XorReduced, "xor.partial");
|
|
Value *Sum = Builder.CreateFAdd(SumPartial, SumLocal, "sum");
|
|
Value *Xor = Builder.CreateXor(XorPartial, TID, "xor");
|
|
Builder.CreateStore(Sum, SumReduced);
|
|
Builder.CreateStore(Xor, XorReduced);
|
|
|
|
BodyIP = Builder.saveIP();
|
|
BodyAllocaIP = InnerAllocaIP;
|
|
};
|
|
|
|
// Privatization for reduction creates local copies of reduction variables and
|
|
// initializes them to reduction-neutral values.
|
|
Value *SumPrivatized;
|
|
Value *XorPrivatized;
|
|
auto PrivCB = [&](InsertPointTy InnerAllocaIP, InsertPointTy CodeGenIP,
|
|
Value &Original, Value &Inner, Value *&ReplVal) {
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(InnerAllocaIP);
|
|
if (&Original == SumReduced) {
|
|
SumPrivatized = Builder.CreateAlloca(Builder.getFloatTy());
|
|
ReplVal = SumPrivatized;
|
|
} else if (&Original == XorReduced) {
|
|
XorPrivatized = Builder.CreateAlloca(Builder.getInt32Ty());
|
|
ReplVal = XorPrivatized;
|
|
} else {
|
|
ReplVal = &Inner;
|
|
return CodeGenIP;
|
|
}
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
if (&Original == SumReduced)
|
|
Builder.CreateStore(ConstantFP::get(Builder.getFloatTy(), 0.0),
|
|
SumPrivatized);
|
|
else if (&Original == XorReduced)
|
|
Builder.CreateStore(Builder.getInt32(0), XorPrivatized);
|
|
|
|
return Builder.saveIP();
|
|
};
|
|
|
|
// Do nothing in finalization.
|
|
auto FiniCB = [&](InsertPointTy CodeGenIP) { return CodeGenIP; };
|
|
|
|
InsertPointTy AfterIP =
|
|
OMPBuilder.createParallel(Loc, OuterAllocaIP, BodyGenCB, PrivCB, FiniCB,
|
|
/* IfCondition */ nullptr,
|
|
/* NumThreads */ nullptr, OMP_PROC_BIND_default,
|
|
/* IsCancellable */ false);
|
|
Builder.restoreIP(AfterIP);
|
|
|
|
OpenMPIRBuilder::ReductionInfo ReductionInfos[] = {
|
|
{SumReduced, SumPrivatized, sumReduction, sumAtomicReduction},
|
|
{XorReduced, XorPrivatized, xorReduction, xorAtomicReduction}};
|
|
|
|
OMPBuilder.createReductions(BodyIP, BodyAllocaIP, ReductionInfos);
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
|
|
OMPBuilder.finalize(F);
|
|
|
|
// The IR must be valid.
|
|
EXPECT_FALSE(verifyModule(*M));
|
|
|
|
// Outlining must have happened.
|
|
SmallVector<CallInst *> ForkCalls;
|
|
findCalls(F, omp::RuntimeFunction::OMPRTL___kmpc_fork_call, OMPBuilder,
|
|
ForkCalls);
|
|
ASSERT_EQ(ForkCalls.size(), 1u);
|
|
Value *CalleeVal = cast<Constant>(ForkCalls[0]->getOperand(2))->getOperand(0);
|
|
Function *Outlined = dyn_cast<Function>(CalleeVal);
|
|
EXPECT_NE(Outlined, nullptr);
|
|
|
|
// Check that the lock variable was created with the expected name.
|
|
GlobalVariable *LockVar =
|
|
M->getGlobalVariable(".gomp_critical_user_.reduction.var");
|
|
EXPECT_NE(LockVar, nullptr);
|
|
|
|
// Find the allocation of a local array that will be used to call the runtime
|
|
// reduciton function.
|
|
BasicBlock &AllocBlock = Outlined->getEntryBlock();
|
|
Value *LocalArray = nullptr;
|
|
for (Instruction &I : AllocBlock) {
|
|
if (AllocaInst *Alloc = dyn_cast<AllocaInst>(&I)) {
|
|
if (!Alloc->getAllocatedType()->isArrayTy() ||
|
|
!Alloc->getAllocatedType()->getArrayElementType()->isPointerTy())
|
|
continue;
|
|
LocalArray = Alloc;
|
|
break;
|
|
}
|
|
}
|
|
ASSERT_NE(LocalArray, nullptr);
|
|
|
|
// Find the call to the runtime reduction function.
|
|
BasicBlock *BB = AllocBlock.getUniqueSuccessor();
|
|
Value *LocalArrayPtr = nullptr;
|
|
Value *ReductionFnVal = nullptr;
|
|
Value *SwitchArg = nullptr;
|
|
for (Instruction &I : *BB) {
|
|
if (CallInst *Call = dyn_cast<CallInst>(&I)) {
|
|
if (Call->getCalledFunction() !=
|
|
OMPBuilder.getOrCreateRuntimeFunctionPtr(
|
|
RuntimeFunction::OMPRTL___kmpc_reduce))
|
|
continue;
|
|
LocalArrayPtr = Call->getOperand(4);
|
|
ReductionFnVal = Call->getOperand(5);
|
|
SwitchArg = Call;
|
|
break;
|
|
}
|
|
}
|
|
|
|
// Check that the local array is passed to the function.
|
|
ASSERT_NE(LocalArrayPtr, nullptr);
|
|
BitCastInst *BitCast = dyn_cast<BitCastInst>(LocalArrayPtr);
|
|
ASSERT_NE(BitCast, nullptr);
|
|
EXPECT_EQ(BitCast->getOperand(0), LocalArray);
|
|
|
|
// Find the GEP instructions preceding stores to the local array.
|
|
Value *FirstArrayElemPtr = nullptr;
|
|
Value *SecondArrayElemPtr = nullptr;
|
|
EXPECT_EQ(LocalArray->getNumUses(), 3u);
|
|
ASSERT_TRUE(
|
|
findGEPZeroOne(LocalArray, FirstArrayElemPtr, SecondArrayElemPtr));
|
|
|
|
// Check that the values stored into the local array are privatized reduction
|
|
// variables.
|
|
auto *FirstStored = dyn_cast_or_null<BitCastInst>(
|
|
findStoredValue<GetElementPtrInst>(FirstArrayElemPtr));
|
|
auto *SecondStored = dyn_cast_or_null<BitCastInst>(
|
|
findStoredValue<GetElementPtrInst>(SecondArrayElemPtr));
|
|
ASSERT_NE(FirstStored, nullptr);
|
|
ASSERT_NE(SecondStored, nullptr);
|
|
Value *FirstPrivatized = FirstStored->getOperand(0);
|
|
Value *SecondPrivatized = SecondStored->getOperand(0);
|
|
EXPECT_TRUE(
|
|
isSimpleBinaryReduction(FirstPrivatized, FirstStored->getParent()));
|
|
EXPECT_TRUE(
|
|
isSimpleBinaryReduction(SecondPrivatized, SecondStored->getParent()));
|
|
|
|
// Check that the result of the runtime reduction call is used for further
|
|
// dispatch.
|
|
ASSERT_EQ(SwitchArg->getNumUses(), 1u);
|
|
SwitchInst *Switch = dyn_cast<SwitchInst>(*SwitchArg->user_begin());
|
|
ASSERT_NE(Switch, nullptr);
|
|
EXPECT_EQ(Switch->getNumSuccessors(), 3u);
|
|
BasicBlock *NonAtomicBB = Switch->case_begin()->getCaseSuccessor();
|
|
BasicBlock *AtomicBB = std::next(Switch->case_begin())->getCaseSuccessor();
|
|
|
|
// Non-atomic block contains reductions to the global reduction variable,
|
|
// which is passed into the outlined function as an argument.
|
|
Value *FirstLoad =
|
|
findSingleUserInBlock<LoadInst>(FirstPrivatized, NonAtomicBB);
|
|
Value *SecondLoad =
|
|
findSingleUserInBlock<LoadInst>(SecondPrivatized, NonAtomicBB);
|
|
EXPECT_TRUE(isValueReducedToFuncArg(FirstLoad, NonAtomicBB));
|
|
EXPECT_TRUE(isValueReducedToFuncArg(SecondLoad, NonAtomicBB));
|
|
|
|
// Atomic block also constains reductions to the global reduction variable.
|
|
FirstLoad = findSingleUserInBlock<LoadInst>(FirstPrivatized, AtomicBB);
|
|
SecondLoad = findSingleUserInBlock<LoadInst>(SecondPrivatized, AtomicBB);
|
|
auto *FirstAtomic = findSingleUserInBlock<AtomicRMWInst>(FirstLoad, AtomicBB);
|
|
auto *SecondAtomic =
|
|
findSingleUserInBlock<AtomicRMWInst>(SecondLoad, AtomicBB);
|
|
ASSERT_NE(FirstAtomic, nullptr);
|
|
EXPECT_TRUE(isa<Argument>(FirstAtomic->getPointerOperand()));
|
|
ASSERT_NE(SecondAtomic, nullptr);
|
|
EXPECT_TRUE(isa<Argument>(SecondAtomic->getPointerOperand()));
|
|
|
|
// Check that the separate reduction function also performs (non-atomic)
|
|
// reductions after extracting reduction variables from its arguments.
|
|
Function *ReductionFn = cast<Function>(ReductionFnVal);
|
|
BasicBlock *FnReductionBB = &ReductionFn->getEntryBlock();
|
|
auto *Bitcast =
|
|
findSingleUserInBlock<BitCastInst>(ReductionFn->getArg(0), FnReductionBB);
|
|
Value *FirstLHSPtr;
|
|
Value *SecondLHSPtr;
|
|
ASSERT_TRUE(findGEPZeroOne(Bitcast, FirstLHSPtr, SecondLHSPtr));
|
|
Value *Opaque = findSingleUserInBlock<LoadInst>(FirstLHSPtr, FnReductionBB);
|
|
ASSERT_NE(Opaque, nullptr);
|
|
Bitcast = findSingleUserInBlock<BitCastInst>(Opaque, FnReductionBB);
|
|
ASSERT_NE(Bitcast, nullptr);
|
|
EXPECT_TRUE(isSimpleBinaryReduction(Bitcast, FnReductionBB));
|
|
Opaque = findSingleUserInBlock<LoadInst>(SecondLHSPtr, FnReductionBB);
|
|
ASSERT_NE(Opaque, nullptr);
|
|
Bitcast = findSingleUserInBlock<BitCastInst>(Opaque, FnReductionBB);
|
|
ASSERT_NE(Bitcast, nullptr);
|
|
EXPECT_TRUE(isSimpleBinaryReduction(Bitcast, FnReductionBB));
|
|
|
|
Bitcast =
|
|
findSingleUserInBlock<BitCastInst>(ReductionFn->getArg(1), FnReductionBB);
|
|
Value *FirstRHS;
|
|
Value *SecondRHS;
|
|
EXPECT_TRUE(findGEPZeroOne(Bitcast, FirstRHS, SecondRHS));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateTwoReductions) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
// Create variables to be reduced.
|
|
InsertPointTy OuterAllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
Value *SumReduced;
|
|
Value *XorReduced;
|
|
{
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(OuterAllocaIP);
|
|
SumReduced = Builder.CreateAlloca(Builder.getFloatTy());
|
|
XorReduced = Builder.CreateAlloca(Builder.getInt32Ty());
|
|
}
|
|
|
|
// Store initial values of reductions into global variables.
|
|
Builder.CreateStore(ConstantFP::get(Builder.getFloatTy(), 0.0), SumReduced);
|
|
Builder.CreateStore(Builder.getInt32(1), XorReduced);
|
|
|
|
InsertPointTy FirstBodyIP, FirstBodyAllocaIP;
|
|
auto FirstBodyGenCB = [&](InsertPointTy InnerAllocaIP,
|
|
InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationBB) {
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
Constant *SrcLocStr = OMPBuilder.getOrCreateSrcLocStr(Loc);
|
|
Value *Ident = OMPBuilder.getOrCreateIdent(SrcLocStr);
|
|
Value *TID = OMPBuilder.getOrCreateThreadID(Ident);
|
|
Value *SumLocal =
|
|
Builder.CreateUIToFP(TID, Builder.getFloatTy(), "sum.local");
|
|
Value *SumPartial =
|
|
Builder.CreateLoad(SumReduced->getType()->getPointerElementType(),
|
|
SumReduced, "sum.partial");
|
|
Value *Sum = Builder.CreateFAdd(SumPartial, SumLocal, "sum");
|
|
Builder.CreateStore(Sum, SumReduced);
|
|
|
|
FirstBodyIP = Builder.saveIP();
|
|
FirstBodyAllocaIP = InnerAllocaIP;
|
|
};
|
|
|
|
InsertPointTy SecondBodyIP, SecondBodyAllocaIP;
|
|
auto SecondBodyGenCB = [&](InsertPointTy InnerAllocaIP,
|
|
InsertPointTy CodeGenIP,
|
|
BasicBlock &ContinuationBB) {
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(CodeGenIP);
|
|
|
|
Constant *SrcLocStr = OMPBuilder.getOrCreateSrcLocStr(Loc);
|
|
Value *Ident = OMPBuilder.getOrCreateIdent(SrcLocStr);
|
|
Value *TID = OMPBuilder.getOrCreateThreadID(Ident);
|
|
Value *XorPartial =
|
|
Builder.CreateLoad(XorReduced->getType()->getPointerElementType(),
|
|
XorReduced, "xor.partial");
|
|
Value *Xor = Builder.CreateXor(XorPartial, TID, "xor");
|
|
Builder.CreateStore(Xor, XorReduced);
|
|
|
|
SecondBodyIP = Builder.saveIP();
|
|
SecondBodyAllocaIP = InnerAllocaIP;
|
|
};
|
|
|
|
// Privatization for reduction creates local copies of reduction variables and
|
|
// initializes them to reduction-neutral values. The same privatization
|
|
// callback is used for both loops, with dispatch based on the value being
|
|
// privatized.
|
|
Value *SumPrivatized;
|
|
Value *XorPrivatized;
|
|
auto PrivCB = [&](InsertPointTy InnerAllocaIP, InsertPointTy CodeGenIP,
|
|
Value &Original, Value &Inner, Value *&ReplVal) {
|
|
IRBuilderBase::InsertPointGuard Guard(Builder);
|
|
Builder.restoreIP(InnerAllocaIP);
|
|
if (&Original == SumReduced) {
|
|
SumPrivatized = Builder.CreateAlloca(Builder.getFloatTy());
|
|
ReplVal = SumPrivatized;
|
|
} else if (&Original == XorReduced) {
|
|
XorPrivatized = Builder.CreateAlloca(Builder.getInt32Ty());
|
|
ReplVal = XorPrivatized;
|
|
} else {
|
|
ReplVal = &Inner;
|
|
return CodeGenIP;
|
|
}
|
|
|
|
Builder.restoreIP(CodeGenIP);
|
|
if (&Original == SumReduced)
|
|
Builder.CreateStore(ConstantFP::get(Builder.getFloatTy(), 0.0),
|
|
SumPrivatized);
|
|
else if (&Original == XorReduced)
|
|
Builder.CreateStore(Builder.getInt32(0), XorPrivatized);
|
|
|
|
return Builder.saveIP();
|
|
};
|
|
|
|
// Do nothing in finalization.
|
|
auto FiniCB = [&](InsertPointTy CodeGenIP) { return CodeGenIP; };
|
|
|
|
Builder.restoreIP(
|
|
OMPBuilder.createParallel(Loc, OuterAllocaIP, FirstBodyGenCB, PrivCB,
|
|
FiniCB, /* IfCondition */ nullptr,
|
|
/* NumThreads */ nullptr, OMP_PROC_BIND_default,
|
|
/* IsCancellable */ false));
|
|
InsertPointTy AfterIP = OMPBuilder.createParallel(
|
|
{Builder.saveIP(), DL}, OuterAllocaIP, SecondBodyGenCB, PrivCB, FiniCB,
|
|
/* IfCondition */ nullptr,
|
|
/* NumThreads */ nullptr, OMP_PROC_BIND_default,
|
|
/* IsCancellable */ false);
|
|
|
|
OMPBuilder.createReductions(
|
|
FirstBodyIP, FirstBodyAllocaIP,
|
|
{{SumReduced, SumPrivatized, sumReduction, sumAtomicReduction}});
|
|
OMPBuilder.createReductions(
|
|
SecondBodyIP, SecondBodyAllocaIP,
|
|
{{XorReduced, XorPrivatized, xorReduction, xorAtomicReduction}});
|
|
|
|
Builder.restoreIP(AfterIP);
|
|
Builder.CreateRetVoid();
|
|
|
|
OMPBuilder.finalize(F);
|
|
|
|
// The IR must be valid.
|
|
EXPECT_FALSE(verifyModule(*M));
|
|
|
|
// Two different outlined functions must have been created.
|
|
SmallVector<CallInst *> ForkCalls;
|
|
findCalls(F, omp::RuntimeFunction::OMPRTL___kmpc_fork_call, OMPBuilder,
|
|
ForkCalls);
|
|
ASSERT_EQ(ForkCalls.size(), 2u);
|
|
Value *CalleeVal = cast<Constant>(ForkCalls[0]->getOperand(2))->getOperand(0);
|
|
Function *FirstCallee = cast<Function>(CalleeVal);
|
|
CalleeVal = cast<Constant>(ForkCalls[1]->getOperand(2))->getOperand(0);
|
|
Function *SecondCallee = cast<Function>(CalleeVal);
|
|
EXPECT_NE(FirstCallee, SecondCallee);
|
|
|
|
// Two different reduction functions must have been created.
|
|
SmallVector<CallInst *> ReduceCalls;
|
|
findCalls(FirstCallee, omp::RuntimeFunction::OMPRTL___kmpc_reduce, OMPBuilder,
|
|
ReduceCalls);
|
|
ASSERT_EQ(ReduceCalls.size(), 1u);
|
|
auto *AddReduction = cast<Function>(ReduceCalls[0]->getOperand(5));
|
|
ReduceCalls.clear();
|
|
findCalls(SecondCallee, omp::RuntimeFunction::OMPRTL___kmpc_reduce,
|
|
OMPBuilder, ReduceCalls);
|
|
auto *XorReduction = cast<Function>(ReduceCalls[0]->getOperand(5));
|
|
EXPECT_NE(AddReduction, XorReduction);
|
|
|
|
// Each reduction function does its own kind of reduction.
|
|
BasicBlock *FnReductionBB = &AddReduction->getEntryBlock();
|
|
auto *Bitcast = findSingleUserInBlock<BitCastInst>(AddReduction->getArg(0),
|
|
FnReductionBB);
|
|
ASSERT_NE(Bitcast, nullptr);
|
|
Value *FirstLHSPtr =
|
|
findSingleUserInBlock<GetElementPtrInst>(Bitcast, FnReductionBB);
|
|
ASSERT_NE(FirstLHSPtr, nullptr);
|
|
Value *Opaque = findSingleUserInBlock<LoadInst>(FirstLHSPtr, FnReductionBB);
|
|
ASSERT_NE(Opaque, nullptr);
|
|
Bitcast = findSingleUserInBlock<BitCastInst>(Opaque, FnReductionBB);
|
|
ASSERT_NE(Bitcast, nullptr);
|
|
Instruction::BinaryOps Opcode = Instruction::FAdd;
|
|
EXPECT_TRUE(isSimpleBinaryReduction(Bitcast, FnReductionBB, &Opcode));
|
|
|
|
FnReductionBB = &XorReduction->getEntryBlock();
|
|
Bitcast = findSingleUserInBlock<BitCastInst>(XorReduction->getArg(0),
|
|
FnReductionBB);
|
|
ASSERT_NE(Bitcast, nullptr);
|
|
Value *SecondLHSPtr =
|
|
findSingleUserInBlock<GetElementPtrInst>(Bitcast, FnReductionBB);
|
|
ASSERT_NE(FirstLHSPtr, nullptr);
|
|
Opaque = findSingleUserInBlock<LoadInst>(SecondLHSPtr, FnReductionBB);
|
|
ASSERT_NE(Opaque, nullptr);
|
|
Bitcast = findSingleUserInBlock<BitCastInst>(Opaque, FnReductionBB);
|
|
ASSERT_NE(Bitcast, nullptr);
|
|
Opcode = Instruction::Xor;
|
|
EXPECT_TRUE(isSimpleBinaryReduction(Bitcast, FnReductionBB, &Opcode));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateSections) {
|
|
using InsertPointTy = OpenMPIRBuilder::InsertPointTy;
|
|
using BodyGenCallbackTy = llvm::OpenMPIRBuilder::StorableBodyGenCallbackTy;
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
llvm::SmallVector<BodyGenCallbackTy, 4> SectionCBVector;
|
|
llvm::SmallVector<BasicBlock *, 4> CaseBBs;
|
|
|
|
BasicBlock *SwitchBB = nullptr;
|
|
BasicBlock *ForExitBB = nullptr;
|
|
BasicBlock *ForIncBB = nullptr;
|
|
AllocaInst *PrivAI = nullptr;
|
|
SwitchInst *Switch = nullptr;
|
|
|
|
unsigned NumBodiesGenerated = 0;
|
|
unsigned NumFiniCBCalls = 0;
|
|
PrivAI = Builder.CreateAlloca(F->arg_begin()->getType());
|
|
|
|
auto FiniCB = [&](InsertPointTy IP) {
|
|
++NumFiniCBCalls;
|
|
BasicBlock *IPBB = IP.getBlock();
|
|
EXPECT_NE(IPBB->end(), IP.getPoint());
|
|
};
|
|
|
|
auto SectionCB = [&](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
BasicBlock &FiniBB) {
|
|
++NumBodiesGenerated;
|
|
CaseBBs.push_back(CodeGenIP.getBlock());
|
|
SwitchBB = CodeGenIP.getBlock()->getSinglePredecessor();
|
|
Builder.restoreIP(CodeGenIP);
|
|
Builder.CreateStore(F->arg_begin(), PrivAI);
|
|
Value *PrivLoad =
|
|
Builder.CreateLoad(F->arg_begin()->getType(), PrivAI, "local.alloca");
|
|
Builder.CreateICmpNE(F->arg_begin(), PrivLoad);
|
|
Builder.CreateBr(&FiniBB);
|
|
ForIncBB =
|
|
CodeGenIP.getBlock()->getSinglePredecessor()->getSingleSuccessor();
|
|
};
|
|
auto PrivCB = [](InsertPointTy AllocaIP, InsertPointTy CodeGenIP,
|
|
llvm::Value &, llvm::Value &Val, llvm::Value *&ReplVal) {
|
|
// TODO: Privatization not implemented yet
|
|
return CodeGenIP;
|
|
};
|
|
|
|
SectionCBVector.push_back(SectionCB);
|
|
SectionCBVector.push_back(SectionCB);
|
|
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
Builder.restoreIP(OMPBuilder.createSections(Loc, AllocaIP, SectionCBVector,
|
|
PrivCB, FiniCB, false, false));
|
|
Builder.CreateRetVoid(); // Required at the end of the function
|
|
|
|
// Switch BB's predecessor is loop condition BB, whose successor at index 1 is
|
|
// loop's exit BB
|
|
ForExitBB =
|
|
SwitchBB->getSinglePredecessor()->getTerminator()->getSuccessor(1);
|
|
EXPECT_NE(ForExitBB, nullptr);
|
|
|
|
EXPECT_NE(PrivAI, nullptr);
|
|
Function *OutlinedFn = PrivAI->getFunction();
|
|
EXPECT_EQ(F, OutlinedFn);
|
|
EXPECT_FALSE(verifyModule(*M, &errs()));
|
|
EXPECT_EQ(OutlinedFn->arg_size(), 1U);
|
|
EXPECT_EQ(OutlinedFn->getBasicBlockList().size(), size_t(11));
|
|
|
|
BasicBlock *LoopPreheaderBB =
|
|
OutlinedFn->getEntryBlock().getSingleSuccessor();
|
|
// loop variables are 5 - lower bound, upper bound, stride, islastiter, and
|
|
// iterator/counter
|
|
bool FoundForInit = false;
|
|
for (Instruction &Inst : *LoopPreheaderBB) {
|
|
if (isa<CallInst>(Inst)) {
|
|
if (cast<CallInst>(&Inst)->getCalledFunction()->getName() ==
|
|
"__kmpc_for_static_init_4u") {
|
|
FoundForInit = true;
|
|
}
|
|
}
|
|
}
|
|
EXPECT_EQ(FoundForInit, true);
|
|
|
|
bool FoundForExit = false;
|
|
bool FoundBarrier = false;
|
|
for (Instruction &Inst : *ForExitBB) {
|
|
if (isa<CallInst>(Inst)) {
|
|
if (cast<CallInst>(&Inst)->getCalledFunction()->getName() ==
|
|
"__kmpc_for_static_fini") {
|
|
FoundForExit = true;
|
|
}
|
|
if (cast<CallInst>(&Inst)->getCalledFunction()->getName() ==
|
|
"__kmpc_barrier") {
|
|
FoundBarrier = true;
|
|
}
|
|
if (FoundForExit && FoundBarrier)
|
|
break;
|
|
}
|
|
}
|
|
EXPECT_EQ(FoundForExit, true);
|
|
EXPECT_EQ(FoundBarrier, true);
|
|
|
|
EXPECT_NE(SwitchBB, nullptr);
|
|
EXPECT_NE(SwitchBB->getTerminator(), nullptr);
|
|
EXPECT_EQ(isa<SwitchInst>(SwitchBB->getTerminator()), true);
|
|
Switch = cast<SwitchInst>(SwitchBB->getTerminator());
|
|
EXPECT_EQ(Switch->getNumCases(), 2U);
|
|
EXPECT_NE(ForIncBB, nullptr);
|
|
EXPECT_EQ(Switch->getSuccessor(0), ForIncBB);
|
|
|
|
EXPECT_EQ(CaseBBs.size(), 2U);
|
|
for (auto *&CaseBB : CaseBBs) {
|
|
EXPECT_EQ(CaseBB->getParent(), OutlinedFn);
|
|
EXPECT_EQ(CaseBB->getSingleSuccessor(), ForExitBB);
|
|
}
|
|
|
|
ASSERT_EQ(NumBodiesGenerated, 2U);
|
|
ASSERT_EQ(NumFiniCBCalls, 1U);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateOffloadMaptypes) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
SmallVector<uint64_t> Mappings = {0, 1};
|
|
GlobalVariable *OffloadMaptypesGlobal =
|
|
OMPBuilder.createOffloadMaptypes(Mappings, "offload_maptypes");
|
|
EXPECT_FALSE(M->global_empty());
|
|
EXPECT_EQ(OffloadMaptypesGlobal->getName(), "offload_maptypes");
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->isConstant());
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->hasGlobalUnnamedAddr());
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->hasPrivateLinkage());
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->hasInitializer());
|
|
Constant *Initializer = OffloadMaptypesGlobal->getInitializer();
|
|
EXPECT_TRUE(isa<ConstantDataArray>(Initializer));
|
|
ConstantDataArray *MappingInit = dyn_cast<ConstantDataArray>(Initializer);
|
|
EXPECT_EQ(MappingInit->getNumElements(), Mappings.size());
|
|
EXPECT_TRUE(MappingInit->getType()->getElementType()->isIntegerTy(64));
|
|
Constant *CA = ConstantDataArray::get(Builder.getContext(), Mappings);
|
|
EXPECT_EQ(MappingInit, CA);
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateOffloadMapnames) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
|
|
IRBuilder<> Builder(BB);
|
|
|
|
Constant *Cst1 = OMPBuilder.getOrCreateSrcLocStr("array1", "file1", 2, 5);
|
|
Constant *Cst2 = OMPBuilder.getOrCreateSrcLocStr("array2", "file1", 3, 5);
|
|
SmallVector<llvm::Constant *> Names = {Cst1, Cst2};
|
|
|
|
GlobalVariable *OffloadMaptypesGlobal =
|
|
OMPBuilder.createOffloadMapnames(Names, "offload_mapnames");
|
|
EXPECT_FALSE(M->global_empty());
|
|
EXPECT_EQ(OffloadMaptypesGlobal->getName(), "offload_mapnames");
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->isConstant());
|
|
EXPECT_FALSE(OffloadMaptypesGlobal->hasGlobalUnnamedAddr());
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->hasPrivateLinkage());
|
|
EXPECT_TRUE(OffloadMaptypesGlobal->hasInitializer());
|
|
Constant *Initializer = OffloadMaptypesGlobal->getInitializer();
|
|
EXPECT_TRUE(isa<Constant>(Initializer->getOperand(0)->stripPointerCasts()));
|
|
EXPECT_TRUE(isa<Constant>(Initializer->getOperand(1)->stripPointerCasts()));
|
|
|
|
GlobalVariable *Name1Gbl =
|
|
cast<GlobalVariable>(Initializer->getOperand(0)->stripPointerCasts());
|
|
EXPECT_TRUE(isa<ConstantDataArray>(Name1Gbl->getInitializer()));
|
|
ConstantDataArray *Name1GblCA =
|
|
dyn_cast<ConstantDataArray>(Name1Gbl->getInitializer());
|
|
EXPECT_EQ(Name1GblCA->getAsCString(), ";file1;array1;2;5;;");
|
|
|
|
GlobalVariable *Name2Gbl =
|
|
cast<GlobalVariable>(Initializer->getOperand(1)->stripPointerCasts());
|
|
EXPECT_TRUE(isa<ConstantDataArray>(Name2Gbl->getInitializer()));
|
|
ConstantDataArray *Name2GblCA =
|
|
dyn_cast<ConstantDataArray>(Name2Gbl->getInitializer());
|
|
EXPECT_EQ(Name2GblCA->getAsCString(), ";file1;array2;3;5;;");
|
|
|
|
EXPECT_TRUE(Initializer->getType()->getArrayElementType()->isPointerTy());
|
|
EXPECT_EQ(Initializer->getType()->getArrayNumElements(), Names.size());
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, CreateMapperAllocas) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
unsigned TotalNbOperand = 2;
|
|
|
|
OpenMPIRBuilder::MapperAllocas MapperAllocas;
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
OMPBuilder.createMapperAllocas(Loc, AllocaIP, TotalNbOperand, MapperAllocas);
|
|
EXPECT_NE(MapperAllocas.ArgsBase, nullptr);
|
|
EXPECT_NE(MapperAllocas.Args, nullptr);
|
|
EXPECT_NE(MapperAllocas.ArgSizes, nullptr);
|
|
EXPECT_TRUE(MapperAllocas.ArgsBase->getAllocatedType()->isArrayTy());
|
|
ArrayType *ArrType =
|
|
dyn_cast<ArrayType>(MapperAllocas.ArgsBase->getAllocatedType());
|
|
EXPECT_EQ(ArrType->getNumElements(), TotalNbOperand);
|
|
EXPECT_TRUE(MapperAllocas.ArgsBase->getAllocatedType()
|
|
->getArrayElementType()
|
|
->isPointerTy());
|
|
EXPECT_TRUE(MapperAllocas.ArgsBase->getAllocatedType()
|
|
->getArrayElementType()
|
|
->getPointerElementType()
|
|
->isIntegerTy(8));
|
|
|
|
EXPECT_TRUE(MapperAllocas.Args->getAllocatedType()->isArrayTy());
|
|
ArrType = dyn_cast<ArrayType>(MapperAllocas.Args->getAllocatedType());
|
|
EXPECT_EQ(ArrType->getNumElements(), TotalNbOperand);
|
|
EXPECT_TRUE(MapperAllocas.Args->getAllocatedType()
|
|
->getArrayElementType()
|
|
->isPointerTy());
|
|
EXPECT_TRUE(MapperAllocas.Args->getAllocatedType()
|
|
->getArrayElementType()
|
|
->getPointerElementType()
|
|
->isIntegerTy(8));
|
|
|
|
EXPECT_TRUE(MapperAllocas.ArgSizes->getAllocatedType()->isArrayTy());
|
|
ArrType = dyn_cast<ArrayType>(MapperAllocas.ArgSizes->getAllocatedType());
|
|
EXPECT_EQ(ArrType->getNumElements(), TotalNbOperand);
|
|
EXPECT_TRUE(MapperAllocas.ArgSizes->getAllocatedType()
|
|
->getArrayElementType()
|
|
->isIntegerTy(64));
|
|
}
|
|
|
|
TEST_F(OpenMPIRBuilderTest, EmitMapperCall) {
|
|
OpenMPIRBuilder OMPBuilder(*M);
|
|
OMPBuilder.initialize();
|
|
F->setName("func");
|
|
IRBuilder<> Builder(BB);
|
|
LLVMContext &Ctx = M->getContext();
|
|
|
|
OpenMPIRBuilder::LocationDescription Loc({Builder.saveIP(), DL});
|
|
|
|
unsigned TotalNbOperand = 2;
|
|
|
|
OpenMPIRBuilder::MapperAllocas MapperAllocas;
|
|
IRBuilder<>::InsertPoint AllocaIP(&F->getEntryBlock(),
|
|
F->getEntryBlock().getFirstInsertionPt());
|
|
OMPBuilder.createMapperAllocas(Loc, AllocaIP, TotalNbOperand, MapperAllocas);
|
|
|
|
auto *BeginMapperFunc = OMPBuilder.getOrCreateRuntimeFunctionPtr(
|
|
omp::OMPRTL___tgt_target_data_begin_mapper);
|
|
|
|
SmallVector<uint64_t> Flags = {0, 2};
|
|
|
|
Constant *SrcLocCst = OMPBuilder.getOrCreateSrcLocStr("", "file1", 2, 5);
|
|
Value *SrcLocInfo = OMPBuilder.getOrCreateIdent(SrcLocCst);
|
|
|
|
Constant *Cst1 = OMPBuilder.getOrCreateSrcLocStr("array1", "file1", 2, 5);
|
|
Constant *Cst2 = OMPBuilder.getOrCreateSrcLocStr("array2", "file1", 3, 5);
|
|
SmallVector<llvm::Constant *> Names = {Cst1, Cst2};
|
|
|
|
GlobalVariable *Maptypes =
|
|
OMPBuilder.createOffloadMaptypes(Flags, ".offload_maptypes");
|
|
Value *MaptypesArg = Builder.CreateConstInBoundsGEP2_32(
|
|
ArrayType::get(Type::getInt64Ty(Ctx), TotalNbOperand), Maptypes,
|
|
/*Idx0=*/0, /*Idx1=*/0);
|
|
|
|
GlobalVariable *Mapnames =
|
|
OMPBuilder.createOffloadMapnames(Names, ".offload_mapnames");
|
|
Value *MapnamesArg = Builder.CreateConstInBoundsGEP2_32(
|
|
ArrayType::get(Type::getInt8PtrTy(Ctx), TotalNbOperand), Mapnames,
|
|
/*Idx0=*/0, /*Idx1=*/0);
|
|
|
|
OMPBuilder.emitMapperCall(Builder.saveIP(), BeginMapperFunc, SrcLocInfo,
|
|
MaptypesArg, MapnamesArg, MapperAllocas, -1,
|
|
TotalNbOperand);
|
|
|
|
CallInst *MapperCall = dyn_cast<CallInst>(&BB->back());
|
|
EXPECT_NE(MapperCall, nullptr);
|
|
EXPECT_EQ(MapperCall->arg_size(), 9U);
|
|
EXPECT_EQ(MapperCall->getCalledFunction()->getName(),
|
|
"__tgt_target_data_begin_mapper");
|
|
EXPECT_EQ(MapperCall->getOperand(0), SrcLocInfo);
|
|
EXPECT_TRUE(MapperCall->getOperand(1)->getType()->isIntegerTy(64));
|
|
EXPECT_TRUE(MapperCall->getOperand(2)->getType()->isIntegerTy(32));
|
|
|
|
EXPECT_EQ(MapperCall->getOperand(6), MaptypesArg);
|
|
EXPECT_EQ(MapperCall->getOperand(7), MapnamesArg);
|
|
EXPECT_TRUE(MapperCall->getOperand(8)->getType()->isPointerTy());
|
|
}
|
|
|
|
} // namespace
|