mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-02-21 06:30:16 +00:00
Enable code placement optimization pass for ARM.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@114746 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
c451051157
commit
fff606d7b2
@@ -76,11 +76,6 @@ ARMInterworking("arm-interworking", cl::Hidden,
|
|||||||
cl::desc("Enable / disable ARM interworking (for debugging only)"),
|
cl::desc("Enable / disable ARM interworking (for debugging only)"),
|
||||||
cl::init(true));
|
cl::init(true));
|
||||||
|
|
||||||
static cl::opt<bool>
|
|
||||||
EnableARMCodePlacement("arm-code-placement", cl::Hidden,
|
|
||||||
cl::desc("Enable code placement pass for ARM"),
|
|
||||||
cl::init(false));
|
|
||||||
|
|
||||||
void ARMTargetLowering::addTypeForNEON(EVT VT, EVT PromotedLdStVT,
|
void ARMTargetLowering::addTypeForNEON(EVT VT, EVT PromotedLdStVT,
|
||||||
EVT PromotedBitwiseVT) {
|
EVT PromotedBitwiseVT) {
|
||||||
if (VT != PromotedLdStVT) {
|
if (VT != PromotedLdStVT) {
|
||||||
@@ -550,8 +545,7 @@ ARMTargetLowering::ARMTargetLowering(TargetMachine &TM)
|
|||||||
// are at least 4 bytes aligned.
|
// are at least 4 bytes aligned.
|
||||||
setMinStackArgumentAlignment(4);
|
setMinStackArgumentAlignment(4);
|
||||||
|
|
||||||
if (EnableARMCodePlacement)
|
benefitFromCodePlacementOpt = true;
|
||||||
benefitFromCodePlacementOpt = true;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
std::pair<const TargetRegisterClass*, uint8_t>
|
std::pair<const TargetRegisterClass*, uint8_t>
|
||||||
|
@@ -18,13 +18,13 @@ tailrecurse: ; preds = %sw.bb, %entry
|
|||||||
%0 = ptrtoint i8* %tmp2 to i32
|
%0 = ptrtoint i8* %tmp2 to i32
|
||||||
|
|
||||||
; CHECK: ands r12, r12, #3
|
; CHECK: ands r12, r12, #3
|
||||||
; CHECK-NEXT: beq LBB0_4
|
; CHECK-NEXT: beq LBB0_2
|
||||||
|
|
||||||
; T2: movs r5, #3
|
; T2: movs r5, #3
|
||||||
; T2-NEXT: mov r6, r4
|
; T2-NEXT: mov r6, r4
|
||||||
; T2-NEXT: ands r6, r5
|
; T2-NEXT: ands r6, r5
|
||||||
; T2-NEXT: tst r4, r5
|
; T2-NEXT: tst r4, r5
|
||||||
; T2-NEXT: beq LBB0_5
|
; T2-NEXT: beq LBB0_3
|
||||||
|
|
||||||
%and = and i32 %0, 3
|
%and = and i32 %0, 3
|
||||||
%tst = icmp eq i32 %and, 0
|
%tst = icmp eq i32 %and, 0
|
||||||
|
@@ -5,8 +5,9 @@
|
|||||||
%struct.list_data_s = type { i16, i16 }
|
%struct.list_data_s = type { i16, i16 }
|
||||||
%struct.list_head = type { %struct.list_head*, %struct.list_data_s* }
|
%struct.list_head = type { %struct.list_head*, %struct.list_data_s* }
|
||||||
|
|
||||||
define arm_apcscc %struct.list_head* @t(%struct.list_head* %list) nounwind {
|
define arm_apcscc %struct.list_head* @t1(%struct.list_head* %list) nounwind {
|
||||||
entry:
|
entry:
|
||||||
|
; CHECK: t1:
|
||||||
%0 = icmp eq %struct.list_head* %list, null
|
%0 = icmp eq %struct.list_head* %list, null
|
||||||
br i1 %0, label %bb2, label %bb
|
br i1 %0, label %bb2, label %bb
|
||||||
|
|
||||||
@@ -27,3 +28,51 @@ bb2:
|
|||||||
%next.0.lcssa = phi %struct.list_head* [ null, %entry ], [ %list_addr.05, %bb ]
|
%next.0.lcssa = phi %struct.list_head* [ null, %entry ], [ %list_addr.05, %bb ]
|
||||||
ret %struct.list_head* %next.0.lcssa
|
ret %struct.list_head* %next.0.lcssa
|
||||||
}
|
}
|
||||||
|
|
||||||
|
; Optimize loop entry, eliminate intra loop branches
|
||||||
|
; rdar://8117827
|
||||||
|
define i32 @t2(i32 %passes, i32* nocapture %src, i32 %size) nounwind readonly {
|
||||||
|
entry:
|
||||||
|
; CHECK: t2:
|
||||||
|
; CHECK: beq LBB1_5
|
||||||
|
%0 = icmp eq i32 %passes, 0 ; <i1> [#uses=1]
|
||||||
|
br i1 %0, label %bb5, label %bb.nph15
|
||||||
|
|
||||||
|
; CHECK: LBB1_2
|
||||||
|
bb1: ; preds = %bb2.preheader, %bb1
|
||||||
|
; CHECK: LBB1_3:
|
||||||
|
; CHECK: bne LBB1_3
|
||||||
|
%indvar = phi i32 [ %indvar.next, %bb1 ], [ 0, %bb2.preheader ] ; <i32> [#uses=2]
|
||||||
|
%sum.08 = phi i32 [ %2, %bb1 ], [ %sum.110, %bb2.preheader ] ; <i32> [#uses=1]
|
||||||
|
%tmp17 = sub i32 %i.07, %indvar ; <i32> [#uses=1]
|
||||||
|
%scevgep = getelementptr i32* %src, i32 %tmp17 ; <i32*> [#uses=1]
|
||||||
|
%1 = load i32* %scevgep, align 4 ; <i32> [#uses=1]
|
||||||
|
%2 = add nsw i32 %1, %sum.08 ; <i32> [#uses=2]
|
||||||
|
%indvar.next = add i32 %indvar, 1 ; <i32> [#uses=2]
|
||||||
|
%exitcond = icmp eq i32 %indvar.next, %size ; <i1> [#uses=1]
|
||||||
|
br i1 %exitcond, label %bb3, label %bb1
|
||||||
|
|
||||||
|
bb3: ; preds = %bb1, %bb2.preheader
|
||||||
|
; CHECK: LBB1_4
|
||||||
|
; CHECK: bne LBB1_2
|
||||||
|
; CHECK-NOT: b LBB1_
|
||||||
|
; CHECK: ldmia sp!
|
||||||
|
%sum.0.lcssa = phi i32 [ %sum.110, %bb2.preheader ], [ %2, %bb1 ] ; <i32> [#uses=2]
|
||||||
|
%3 = add i32 %pass.011, 1 ; <i32> [#uses=2]
|
||||||
|
%exitcond18 = icmp eq i32 %3, %passes ; <i1> [#uses=1]
|
||||||
|
br i1 %exitcond18, label %bb5, label %bb2.preheader
|
||||||
|
|
||||||
|
bb.nph15: ; preds = %entry
|
||||||
|
%i.07 = add i32 %size, -1 ; <i32> [#uses=2]
|
||||||
|
%4 = icmp sgt i32 %i.07, -1 ; <i1> [#uses=1]
|
||||||
|
br label %bb2.preheader
|
||||||
|
|
||||||
|
bb2.preheader: ; preds = %bb3, %bb.nph15
|
||||||
|
%pass.011 = phi i32 [ 0, %bb.nph15 ], [ %3, %bb3 ] ; <i32> [#uses=1]
|
||||||
|
%sum.110 = phi i32 [ 0, %bb.nph15 ], [ %sum.0.lcssa, %bb3 ] ; <i32> [#uses=2]
|
||||||
|
br i1 %4, label %bb1, label %bb3
|
||||||
|
|
||||||
|
bb5: ; preds = %bb3, %entry
|
||||||
|
%sum.1.lcssa = phi i32 [ 0, %entry ], [ %sum.0.lcssa, %bb3 ] ; <i32> [#uses=1]
|
||||||
|
ret i32 %sum.1.lcssa
|
||||||
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user