mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-15 07:34:33 +00:00
[InstCombine] Don't fold a GEP into itself through a PHI node
This can only occur (I think) through the back-edge of the loop. However, folding a GEP into itself means that the value of the previous iteration needs to be stored in the meantime, thus requiring an additional register variable to be live, but not actually achieving anything (the gep still needs to be executed once per loop iteration). The attached test case is derived from: typedef unsigned uint32; typedef unsigned char uint8; inline uint8 *f(uint32 value, uint8 *target) { while (value >= 0x80) { value >>= 7; ++target; } ++target; return target; } uint8 *g(uint32 b, uint8 *target) { target = f(b, f(42, target)); return target; } What happens is that the GEP stored in incptr2 is folded into itself through the loop's back-edge and the phi-node stored in loopptr, effectively incrementing the ptr by "2" in each iteration instead of "1". In this case, it is actually increasing the number of GEPs required as the GEP before the loop can't be folded away anymore. For comparison: With this patch: define i8* @test4(i32 %value, i8* %buffer) { entry: %cmp = icmp ugt i32 %value, 127 br i1 %cmp, label %loop.header, label %exit loop.header: ; preds = %entry br label %loop.body loop.body: ; preds = %loop.body, %loop.header %buffer.pn = phi i8* [ %buffer, %loop.header ], [ %loopptr, %loop.body ] %newval = phi i32 [ %value, %loop.header ], [ %shr, %loop.body ] %loopptr = getelementptr inbounds i8, i8* %buffer.pn, i64 1 %shr = lshr i32 %newval, 7 %cmp2 = icmp ugt i32 %newval, 16383 br i1 %cmp2, label %loop.body, label %loop.exit loop.exit: ; preds = %loop.body br label %exit exit: ; preds = %loop.exit, %entry %0 = phi i8* [ %loopptr, %loop.exit ], [ %buffer, %entry ] %incptr3 = getelementptr inbounds i8, i8* %0, i64 2 ret i8* %incptr3 } Without this patch: define i8* @test4(i32 %value, i8* %buffer) { entry: %incptr = getelementptr inbounds i8, i8* %buffer, i64 1 %cmp = icmp ugt i32 %value, 127 br i1 %cmp, label %loop.header, label %exit loop.header: ; preds = %entry br label %loop.body loop.body: ; preds = %loop.body, %loop.header %0 = phi i8* [ %buffer, %loop.header ], [ %loopptr, %loop.body ] %loopptr = phi i8* [ %incptr, %loop.header ], [ %incptr2, %loop.body ] %newval = phi i32 [ %value, %loop.header ], [ %shr, %loop.body ] %shr = lshr i32 %newval, 7 %incptr2 = getelementptr inbounds i8, i8* %0, i64 2 %cmp2 = icmp ugt i32 %newval, 16383 br i1 %cmp2, label %loop.body, label %loop.exit loop.exit: ; preds = %loop.body br label %exit exit: ; preds = %loop.exit, %entry %ptr2 = phi i8* [ %incptr2, %loop.exit ], [ %incptr, %entry ] %incptr3 = getelementptr inbounds i8, i8* %ptr2, i64 1 ret i8* %incptr3 } Review: http://reviews.llvm.org/D8245 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@232718 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
12f0d20753
commit
3baea2951d
@ -1333,6 +1333,15 @@ Instruction *InstCombiner::visitGetElementPtrInst(GetElementPtrInst &GEP) {
|
|||||||
if (!Op1)
|
if (!Op1)
|
||||||
return nullptr;
|
return nullptr;
|
||||||
|
|
||||||
|
// Don't fold a GEP into itself through a PHI node. This can only happen
|
||||||
|
// through the back-edge of a loop. Folding a GEP into itself means that
|
||||||
|
// the value of the previous iteration needs to be stored in the meantime,
|
||||||
|
// thus requiring an additional register variable to be live, but not
|
||||||
|
// actually achieving anything (the GEP still needs to be executed once per
|
||||||
|
// loop iteration).
|
||||||
|
if (Op1 == &GEP)
|
||||||
|
return nullptr;
|
||||||
|
|
||||||
signed DI = -1;
|
signed DI = -1;
|
||||||
|
|
||||||
for (auto I = PN->op_begin()+1, E = PN->op_end(); I !=E; ++I) {
|
for (auto I = PN->op_begin()+1, E = PN->op_end(); I !=E; ++I) {
|
||||||
@ -1340,6 +1349,10 @@ Instruction *InstCombiner::visitGetElementPtrInst(GetElementPtrInst &GEP) {
|
|||||||
if (!Op2 || Op1->getNumOperands() != Op2->getNumOperands())
|
if (!Op2 || Op1->getNumOperands() != Op2->getNumOperands())
|
||||||
return nullptr;
|
return nullptr;
|
||||||
|
|
||||||
|
// As for Op1 above, don't try to fold a GEP into itself.
|
||||||
|
if (Op2 == &GEP)
|
||||||
|
return nullptr;
|
||||||
|
|
||||||
// Keep track of the type as we walk the GEP.
|
// Keep track of the type as we walk the GEP.
|
||||||
Type *CurTy = Op1->getOperand(0)->getType()->getScalarType();
|
Type *CurTy = Op1->getOperand(0)->getType()->getScalarType();
|
||||||
|
|
||||||
|
@ -98,3 +98,39 @@ bb5:
|
|||||||
@_ZTIi = external constant i8*
|
@_ZTIi = external constant i8*
|
||||||
declare i32 @__gxx_personality_v0(...)
|
declare i32 @__gxx_personality_v0(...)
|
||||||
declare i32 @foo1(i32)
|
declare i32 @foo1(i32)
|
||||||
|
|
||||||
|
|
||||||
|
; Check that instcombine doesn't fold GEPs into themselves through a loop
|
||||||
|
; back-edge.
|
||||||
|
|
||||||
|
define i8* @test4(i32 %value, i8* %buffer) {
|
||||||
|
entry:
|
||||||
|
%incptr = getelementptr inbounds i8, i8* %buffer, i64 1
|
||||||
|
%cmp = icmp ugt i32 %value, 127
|
||||||
|
br i1 %cmp, label %loop.header, label %exit
|
||||||
|
|
||||||
|
loop.header:
|
||||||
|
br label %loop.body
|
||||||
|
|
||||||
|
loop.body:
|
||||||
|
%loopptr = phi i8* [ %incptr, %loop.header ], [ %incptr2, %loop.body ]
|
||||||
|
%newval = phi i32 [ %value, %loop.header ], [ %shr, %loop.body ]
|
||||||
|
%shr = lshr i32 %newval, 7
|
||||||
|
%incptr2 = getelementptr inbounds i8, i8* %loopptr, i64 1
|
||||||
|
%cmp2 = icmp ugt i32 %shr, 127
|
||||||
|
br i1 %cmp2, label %loop.body, label %loop.exit
|
||||||
|
|
||||||
|
loop.exit:
|
||||||
|
%exitptr = phi i8* [ %incptr2, %loop.body ]
|
||||||
|
br label %exit
|
||||||
|
|
||||||
|
exit:
|
||||||
|
%ptr2 = phi i8* [ %exitptr, %loop.exit ], [ %incptr, %entry ]
|
||||||
|
%incptr3 = getelementptr inbounds i8, i8* %ptr2, i64 1
|
||||||
|
ret i8* %incptr3
|
||||||
|
|
||||||
|
; CHECK-LABEL: @test4(
|
||||||
|
; CHECK: loop.body:
|
||||||
|
; CHECK: getelementptr{{.*}}i64 1
|
||||||
|
; CHECK: exit:
|
||||||
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user