Add IRBuilder::CreateVectorSplat and use it to simplify code.

llvm-svn: 171349
This commit is contained in:
Benjamin Kramer 2013-01-01 19:55:16 +00:00
parent c003a4521b
commit 614b5e85b9
3 changed files with 18 additions and 24 deletions

View File

@ -1367,6 +1367,22 @@ public:
ConstantExpr::getSizeOf(ArgType->getElementType()),
Name);
}
/// CreateVectorSplat - Return a vector value that contains \arg V broadcasted
/// to \p NumElts elements.
Value *CreateVectorSplat(unsigned NumElts, Value *V, const Twine &Name = "") {
assert(NumElts > 0 && "Cannot splat to an empty vector!");
// First insert it into an undef vector so we can shuffle it.
Type *I32Ty = getInt32Ty();
Value *Undef = UndefValue::get(VectorType::get(V->getType(), NumElts));
V = CreateInsertElement(Undef, V, ConstantInt::get(I32Ty, 0),
Name + ".splatinsert");
// Shuffle the value across the desired number of elements.
Value *Zeros = ConstantAggregateZero::get(VectorType::get(I32Ty, NumElts));
return CreateShuffleVector(V, Undef, Zeros, Name + ".splat");
}
};
}

View File

@ -2660,18 +2660,7 @@ private:
/// \brief Compute a vector splat for a given element value.
Value *getVectorSplat(IRBuilder<> &IRB, Value *V, unsigned NumElements) {
assert(NumElements > 0 && "Cannot splat to an empty vector.");
// First insert it into a one-element vector so we can shuffle it. It is
// really silly that LLVM's IR requires this in order to form a splat.
Value *Undef = UndefValue::get(VectorType::get(V->getType(), 1));
V = IRB.CreateInsertElement(Undef, V, IRB.getInt32(0),
getName(".splatinsert"));
// Shuffle the value across the desired number of elements.
SmallVector<Constant*, 8> Mask(NumElements, IRB.getInt32(0));
V = IRB.CreateShuffleVector(V, Undef, ConstantVector::get(Mask),
getName(".splat"));
V = IRB.CreateVectorSplat(NumElements, V, NamePrefix);
DEBUG(dbgs() << " splat: " << *V << "\n");
return V;
}

View File

@ -150,11 +150,6 @@ LoopVectorizationLegality::RuntimePointerCheck::insert(ScalarEvolution *SE,
}
Value *InnerLoopVectorizer::getBroadcastInstrs(Value *V) {
// Create the types.
LLVMContext &C = V->getContext();
Type *VTy = VectorType::get(V->getType(), VF);
Type *I32 = IntegerType::getInt32Ty(C);
// Save the current insertion location.
Instruction *Loc = Builder.GetInsertPoint();
@ -167,14 +162,8 @@ Value *InnerLoopVectorizer::getBroadcastInstrs(Value *V) {
if (Invariant)
Builder.SetInsertPoint(LoopVectorPreHeader->getTerminator());
Constant *Zero = ConstantInt::get(I32, 0);
Value *Zeros = ConstantAggregateZero::get(VectorType::get(I32, VF));
Value *UndefVal = UndefValue::get(VTy);
// Insert the value into a new vector.
Value *SingleElem = Builder.CreateInsertElement(UndefVal, V, Zero);
// Broadcast the scalar into all locations in the vector.
Value *Shuf = Builder.CreateShuffleVector(SingleElem, UndefVal, Zeros,
"broadcast");
Value *Shuf = Builder.CreateVectorSplat(VF, V, "broadcast");
// Restore the builder insertion point.
if (Invariant)