mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-28 06:32:09 +00:00
LoopVectorize: Keep the IRBuilder on the stack.
No functionality change. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@166274 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
0d3c8d5d16
commit
17f68c52d2
@ -67,11 +67,7 @@ public:
|
|||||||
SingleBlockLoopVectorizer(Loop *OrigLoop, ScalarEvolution *Se, LoopInfo *Li,
|
SingleBlockLoopVectorizer(Loop *OrigLoop, ScalarEvolution *Se, LoopInfo *Li,
|
||||||
LPPassManager *Lpm, unsigned VecWidth):
|
LPPassManager *Lpm, unsigned VecWidth):
|
||||||
Orig(OrigLoop), SE(Se), LI(Li), LPM(Lpm), VF(VecWidth),
|
Orig(OrigLoop), SE(Se), LI(Li), LPM(Lpm), VF(VecWidth),
|
||||||
Builder(0), Induction(0), OldInduction(0) { }
|
Builder(Se->getContext()), Induction(0), OldInduction(0) { }
|
||||||
|
|
||||||
~SingleBlockLoopVectorizer() {
|
|
||||||
delete Builder;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Perform the actual loop widening (vectorization).
|
// Perform the actual loop widening (vectorization).
|
||||||
void vectorize() {
|
void vectorize() {
|
||||||
@ -81,7 +77,7 @@ public:
|
|||||||
vectorizeLoop();
|
vectorizeLoop();
|
||||||
// register the new loop.
|
// register the new loop.
|
||||||
cleanup();
|
cleanup();
|
||||||
}
|
}
|
||||||
|
|
||||||
private:
|
private:
|
||||||
/// Create an empty loop, based on the loop ranges of the old loop.
|
/// Create an empty loop, based on the loop ranges of the old loop.
|
||||||
@ -131,7 +127,7 @@ private:
|
|||||||
unsigned VF;
|
unsigned VF;
|
||||||
|
|
||||||
// The builder that we use
|
// The builder that we use
|
||||||
IRBuilder<> *Builder;
|
IRBuilder<> Builder;
|
||||||
|
|
||||||
// --- Vectorization state ---
|
// --- Vectorization state ---
|
||||||
|
|
||||||
@ -241,10 +237,10 @@ Value *SingleBlockLoopVectorizer::getBroadcastInstrs(Value *V) {
|
|||||||
Value *Zeros = ConstantAggregateZero::get(VectorType::get(I32, VF));
|
Value *Zeros = ConstantAggregateZero::get(VectorType::get(I32, VF));
|
||||||
Value *UndefVal = UndefValue::get(VTy);
|
Value *UndefVal = UndefValue::get(VTy);
|
||||||
// Insert the value into a new vector.
|
// Insert the value into a new vector.
|
||||||
Value *SingleElem = Builder->CreateInsertElement(UndefVal, V, Zero);
|
Value *SingleElem = Builder.CreateInsertElement(UndefVal, V, Zero);
|
||||||
// Broadcast the scalar into all locations in the vector.
|
// Broadcast the scalar into all locations in the vector.
|
||||||
Value *Shuf = Builder->CreateShuffleVector(SingleElem, UndefVal, Zeros,
|
Value *Shuf = Builder.CreateShuffleVector(SingleElem, UndefVal, Zeros,
|
||||||
"broadcast");
|
"broadcast");
|
||||||
// We are accessing the induction variable. Make sure to promote the
|
// We are accessing the induction variable. Make sure to promote the
|
||||||
// index for each consecutive SIMD lane. This adds 0,1,2 ... to all lanes.
|
// index for each consecutive SIMD lane. This adds 0,1,2 ... to all lanes.
|
||||||
if (V == Induction)
|
if (V == Induction)
|
||||||
@ -269,7 +265,7 @@ Value *SingleBlockLoopVectorizer::getConsecutiveVector(Value* Val) {
|
|||||||
// Add the consecutive indices to the vector value.
|
// Add the consecutive indices to the vector value.
|
||||||
Constant *Cv = ConstantVector::get(Indices);
|
Constant *Cv = ConstantVector::get(Indices);
|
||||||
assert(Cv->getType() == Val->getType() && "Invalid consecutive vec");
|
assert(Cv->getType() == Val->getType() && "Invalid consecutive vec");
|
||||||
return Builder->CreateAdd(Val, Cv, "induction");
|
return Builder.CreateAdd(Val, Cv, "induction");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@ -304,7 +300,7 @@ Value *SingleBlockLoopVectorizer::getVectorValue(Value *V) {
|
|||||||
// If we saved a vectorized copy of V, use it.
|
// If we saved a vectorized copy of V, use it.
|
||||||
ValueMap::iterator it = WidenMap.find(V);
|
ValueMap::iterator it = WidenMap.find(V);
|
||||||
if (it != WidenMap.end())
|
if (it != WidenMap.end())
|
||||||
return it->second;
|
return it->second;
|
||||||
|
|
||||||
// Broadcast V and save the value for future uses.
|
// Broadcast V and save the value for future uses.
|
||||||
Value *B = getBroadcastInstrs(V);
|
Value *B = getBroadcastInstrs(V);
|
||||||
@ -364,18 +360,18 @@ void SingleBlockLoopVectorizer::scalarizeInstruction(Instruction *Instr) {
|
|||||||
Value *Op = Params[op];
|
Value *Op = Params[op];
|
||||||
// Param is a vector. Need to extract the right lane.
|
// Param is a vector. Need to extract the right lane.
|
||||||
if (Op->getType()->isVectorTy())
|
if (Op->getType()->isVectorTy())
|
||||||
Op = Builder->CreateExtractElement(Op, Builder->getInt32(i));
|
Op = Builder.CreateExtractElement(Op, Builder.getInt32(i));
|
||||||
Cloned->setOperand(op, Op);
|
Cloned->setOperand(op, Op);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Place the cloned scalar in the new loop.
|
// Place the cloned scalar in the new loop.
|
||||||
Builder->Insert(Cloned);
|
Builder.Insert(Cloned);
|
||||||
|
|
||||||
// If the original scalar returns a value we need to place it in a vector
|
// If the original scalar returns a value we need to place it in a vector
|
||||||
// so that future users will be able to use it.
|
// so that future users will be able to use it.
|
||||||
if (!IsVoidRetTy)
|
if (!IsVoidRetTy)
|
||||||
VecResults = Builder->CreateInsertElement(VecResults, Cloned,
|
VecResults = Builder.CreateInsertElement(VecResults, Cloned,
|
||||||
Builder->getInt32(i));
|
Builder.getInt32(i));
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!IsVoidRetTy)
|
if (!IsVoidRetTy)
|
||||||
@ -421,15 +417,15 @@ void SingleBlockLoopVectorizer::createEmptyLoop() {
|
|||||||
assert(BypassBlock && "Invalid loop structure");
|
assert(BypassBlock && "Invalid loop structure");
|
||||||
|
|
||||||
BasicBlock *VectorPH =
|
BasicBlock *VectorPH =
|
||||||
BypassBlock->splitBasicBlock(BypassBlock->getTerminator(), "vector.ph");
|
BypassBlock->splitBasicBlock(BypassBlock->getTerminator(), "vector.ph");
|
||||||
BasicBlock *VecBody = VectorPH->splitBasicBlock(VectorPH->getTerminator(),
|
BasicBlock *VecBody = VectorPH->splitBasicBlock(VectorPH->getTerminator(),
|
||||||
"vector.body");
|
"vector.body");
|
||||||
|
|
||||||
BasicBlock *MiddleBlock = VecBody->splitBasicBlock(VecBody->getTerminator(),
|
BasicBlock *MiddleBlock = VecBody->splitBasicBlock(VecBody->getTerminator(),
|
||||||
"middle.block");
|
"middle.block");
|
||||||
BasicBlock *ScalarPH =
|
BasicBlock *ScalarPH =
|
||||||
MiddleBlock->splitBasicBlock(MiddleBlock->getTerminator(),
|
MiddleBlock->splitBasicBlock(MiddleBlock->getTerminator(),
|
||||||
"scalar.preheader");
|
"scalar.preheader");
|
||||||
|
|
||||||
// Find the induction variable.
|
// Find the induction variable.
|
||||||
BasicBlock *OldBasicBlock = Orig->getHeader();
|
BasicBlock *OldBasicBlock = Orig->getHeader();
|
||||||
@ -439,11 +435,10 @@ void SingleBlockLoopVectorizer::createEmptyLoop() {
|
|||||||
|
|
||||||
// Use this IR builder to create the loop instructions (Phi, Br, Cmp)
|
// Use this IR builder to create the loop instructions (Phi, Br, Cmp)
|
||||||
// inside the loop.
|
// inside the loop.
|
||||||
Builder = new IRBuilder<>(VecBody);
|
Builder.SetInsertPoint(VecBody->getFirstInsertionPt());
|
||||||
Builder->SetInsertPoint(VecBody->getFirstInsertionPt());
|
|
||||||
|
|
||||||
// Generate the induction variable.
|
// Generate the induction variable.
|
||||||
Induction = Builder->CreatePHI(IdxTy, 2, "index");
|
Induction = Builder.CreatePHI(IdxTy, 2, "index");
|
||||||
Constant *Zero = ConstantInt::get(IdxTy, 0);
|
Constant *Zero = ConstantInt::get(IdxTy, 0);
|
||||||
Constant *Step = ConstantInt::get(IdxTy, VF);
|
Constant *Step = ConstantInt::get(IdxTy, VF);
|
||||||
|
|
||||||
@ -494,12 +489,12 @@ void SingleBlockLoopVectorizer::createEmptyLoop() {
|
|||||||
MiddleBlock->getTerminator()->eraseFromParent();
|
MiddleBlock->getTerminator()->eraseFromParent();
|
||||||
|
|
||||||
// Create i+1 and fill the PHINode.
|
// Create i+1 and fill the PHINode.
|
||||||
Value *NextIdx = Builder->CreateAdd(Induction, Step, "index.next");
|
Value *NextIdx = Builder.CreateAdd(Induction, Step, "index.next");
|
||||||
Induction->addIncoming(Zero, VectorPH);
|
Induction->addIncoming(Zero, VectorPH);
|
||||||
Induction->addIncoming(NextIdx, VecBody);
|
Induction->addIncoming(NextIdx, VecBody);
|
||||||
// Create the compare.
|
// Create the compare.
|
||||||
Value *ICmp = Builder->CreateICmpEQ(NextIdx, CountRoundDown);
|
Value *ICmp = Builder.CreateICmpEQ(NextIdx, CountRoundDown);
|
||||||
Builder->CreateCondBr(ICmp, MiddleBlock, VecBody);
|
Builder.CreateCondBr(ICmp, MiddleBlock, VecBody);
|
||||||
|
|
||||||
// Now we have two terminators. Remove the old one from the block.
|
// Now we have two terminators. Remove the old one from the block.
|
||||||
VecBody->getTerminator()->eraseFromParent();
|
VecBody->getTerminator()->eraseFromParent();
|
||||||
@ -509,7 +504,7 @@ void SingleBlockLoopVectorizer::createEmptyLoop() {
|
|||||||
OldInduction->setIncomingValue(BlockIdx, CountRoundDown);
|
OldInduction->setIncomingValue(BlockIdx, CountRoundDown);
|
||||||
|
|
||||||
// Get ready to start creating new instructions into the vectorized body.
|
// Get ready to start creating new instructions into the vectorized body.
|
||||||
Builder->SetInsertPoint(VecBody->getFirstInsertionPt());
|
Builder.SetInsertPoint(VecBody->getFirstInsertionPt());
|
||||||
|
|
||||||
// Register the new loop.
|
// Register the new loop.
|
||||||
Loop* Lp = new Loop();
|
Loop* Lp = new Loop();
|
||||||
@ -562,7 +557,7 @@ void SingleBlockLoopVectorizer::vectorizeLoop() {
|
|||||||
Value *A = getVectorValue(Inst->getOperand(0));
|
Value *A = getVectorValue(Inst->getOperand(0));
|
||||||
Value *B = getVectorValue(Inst->getOperand(1));
|
Value *B = getVectorValue(Inst->getOperand(1));
|
||||||
// Use this vector value for all users of the original instruction.
|
// Use this vector value for all users of the original instruction.
|
||||||
WidenMap[Inst] = Builder->CreateBinOp(BinOp->getOpcode(), A, B);
|
WidenMap[Inst] = Builder.CreateBinOp(BinOp->getOpcode(), A, B);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case Instruction::Select: {
|
case Instruction::Select: {
|
||||||
@ -570,7 +565,7 @@ void SingleBlockLoopVectorizer::vectorizeLoop() {
|
|||||||
Value *A = getVectorValue(Inst->getOperand(0));
|
Value *A = getVectorValue(Inst->getOperand(0));
|
||||||
Value *B = getVectorValue(Inst->getOperand(1));
|
Value *B = getVectorValue(Inst->getOperand(1));
|
||||||
Value *C = getVectorValue(Inst->getOperand(2));
|
Value *C = getVectorValue(Inst->getOperand(2));
|
||||||
WidenMap[Inst] = Builder->CreateSelect(A, B, C);
|
WidenMap[Inst] = Builder.CreateSelect(A, B, C);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -582,9 +577,9 @@ void SingleBlockLoopVectorizer::vectorizeLoop() {
|
|||||||
Value *A = getVectorValue(Inst->getOperand(0));
|
Value *A = getVectorValue(Inst->getOperand(0));
|
||||||
Value *B = getVectorValue(Inst->getOperand(1));
|
Value *B = getVectorValue(Inst->getOperand(1));
|
||||||
if (FCmp)
|
if (FCmp)
|
||||||
WidenMap[Inst] = Builder->CreateFCmp(Cmp->getPredicate(), A, B);
|
WidenMap[Inst] = Builder.CreateFCmp(Cmp->getPredicate(), A, B);
|
||||||
else
|
else
|
||||||
WidenMap[Inst] = Builder->CreateICmp(Cmp->getPredicate(), A, B);
|
WidenMap[Inst] = Builder.CreateICmp(Cmp->getPredicate(), A, B);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -605,10 +600,10 @@ void SingleBlockLoopVectorizer::vectorizeLoop() {
|
|||||||
GetElementPtrInst *Gep2 = cast<GetElementPtrInst>(Gep->clone());
|
GetElementPtrInst *Gep2 = cast<GetElementPtrInst>(Gep->clone());
|
||||||
unsigned NumOperands = Gep->getNumOperands();
|
unsigned NumOperands = Gep->getNumOperands();
|
||||||
Gep2->setOperand(NumOperands - 1, Induction);
|
Gep2->setOperand(NumOperands - 1, Induction);
|
||||||
Ptr = Builder->Insert(Gep2);
|
Ptr = Builder.Insert(Gep2);
|
||||||
Ptr = Builder->CreateBitCast(Ptr, StTy->getPointerTo());
|
Ptr = Builder.CreateBitCast(Ptr, StTy->getPointerTo());
|
||||||
Value *Val = getVectorValue(SI->getValueOperand());
|
Value *Val = getVectorValue(SI->getValueOperand());
|
||||||
Builder->CreateStore(Val, Ptr)->setAlignment(Alignment);
|
Builder.CreateStore(Val, Ptr)->setAlignment(Alignment);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case Instruction::Load: {
|
case Instruction::Load: {
|
||||||
@ -629,9 +624,9 @@ void SingleBlockLoopVectorizer::vectorizeLoop() {
|
|||||||
GetElementPtrInst *Gep2 = cast<GetElementPtrInst>(Gep->clone());
|
GetElementPtrInst *Gep2 = cast<GetElementPtrInst>(Gep->clone());
|
||||||
unsigned NumOperands = Gep->getNumOperands();
|
unsigned NumOperands = Gep->getNumOperands();
|
||||||
Gep2->setOperand(NumOperands - 1, Induction);
|
Gep2->setOperand(NumOperands - 1, Induction);
|
||||||
Ptr = Builder->Insert(Gep2);
|
Ptr = Builder.Insert(Gep2);
|
||||||
Ptr = Builder->CreateBitCast(Ptr, RetTy->getPointerTo());
|
Ptr = Builder.CreateBitCast(Ptr, RetTy->getPointerTo());
|
||||||
LI = Builder->CreateLoad(Ptr);
|
LI = Builder.CreateLoad(Ptr);
|
||||||
LI->setAlignment(Alignment);
|
LI->setAlignment(Alignment);
|
||||||
// Use this vector value for all users of the load.
|
// Use this vector value for all users of the load.
|
||||||
WidenMap[Inst] = LI;
|
WidenMap[Inst] = LI;
|
||||||
@ -653,7 +648,7 @@ void SingleBlockLoopVectorizer::vectorizeLoop() {
|
|||||||
CastInst *CI = dyn_cast<CastInst>(Inst);
|
CastInst *CI = dyn_cast<CastInst>(Inst);
|
||||||
Value *A = getVectorValue(Inst->getOperand(0));
|
Value *A = getVectorValue(Inst->getOperand(0));
|
||||||
Type *DestTy = VectorType::get(CI->getType()->getScalarType(), VF);
|
Type *DestTy = VectorType::get(CI->getType()->getScalarType(), VF);
|
||||||
WidenMap[Inst] = Builder->CreateCast(CI->getOpcode(), A, DestTy);
|
WidenMap[Inst] = Builder.CreateCast(CI->getOpcode(), A, DestTy);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -815,8 +810,8 @@ bool LoopVectorizationLegality::canVectorizeBlock(BasicBlock &BB) {
|
|||||||
} // next instr.
|
} // next instr.
|
||||||
|
|
||||||
if (NumPhis != 1) {
|
if (NumPhis != 1) {
|
||||||
DEBUG(dbgs() << "LV: Did not find a Phi node.\n");
|
DEBUG(dbgs() << "LV: Did not find a Phi node.\n");
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Check that the underlying objects of the reads and writes are either
|
// Check that the underlying objects of the reads and writes are either
|
||||||
|
Loading…
x
Reference in New Issue
Block a user