mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-11-02 07:11:49 +00:00
Teach LoopVectorize about address space sizes
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@188980 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
9d3c398d61
commit
978de6b56a
@ -2667,7 +2667,8 @@ bool LoopVectorizationLegality::canVectorize() {
|
|||||||
|
|
||||||
static Type *convertPointerToIntegerType(DataLayout &DL, Type *Ty) {
|
static Type *convertPointerToIntegerType(DataLayout &DL, Type *Ty) {
|
||||||
if (Ty->isPointerTy())
|
if (Ty->isPointerTy())
|
||||||
return DL.getIntPtrType(Ty->getContext());
|
return DL.getIntPtrType(Ty);
|
||||||
|
|
||||||
return Ty;
|
return Ty;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -4,10 +4,10 @@
|
|||||||
; return std::accumulate(A, A + n, 0);
|
; return std::accumulate(A, A + n, 0);
|
||||||
; }
|
; }
|
||||||
|
|
||||||
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
|
target datalayout = "e-p:64:64:64-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-n8:16:32:64-S128"
|
||||||
target triple = "x86_64-apple-macosx10.8.0"
|
|
||||||
|
|
||||||
;CHECK-LABEL: @sum_array(
|
;CHECK-LABEL: @sum_array(
|
||||||
|
;CHECK: phi i64
|
||||||
;CHECK: phi <4 x i32>
|
;CHECK: phi <4 x i32>
|
||||||
;CHECK: load <4 x i32>
|
;CHECK: load <4 x i32>
|
||||||
;CHECK: add nsw <4 x i32>
|
;CHECK: add nsw <4 x i32>
|
||||||
@ -31,3 +31,30 @@ _ZSt10accumulateIPiiET0_T_S2_S1_.exit: ; preds = %.lr.ph.i, %0
|
|||||||
%.01.lcssa.i = phi i32 [ 0, %0 ], [ %5, %.lr.ph.i ]
|
%.01.lcssa.i = phi i32 [ 0, %0 ], [ %5, %.lr.ph.i ]
|
||||||
ret i32 %.01.lcssa.i
|
ret i32 %.01.lcssa.i
|
||||||
}
|
}
|
||||||
|
|
||||||
|
; Same, but use a pointer with a different size.
|
||||||
|
;CHECK-LABEL: @sum_array_as1(
|
||||||
|
;CHECK: phi i16
|
||||||
|
;CHECK: phi <4 x i32>
|
||||||
|
;CHECK: load <4 x i32>
|
||||||
|
;CHECK: add nsw <4 x i32>
|
||||||
|
;CHECK: ret i32
|
||||||
|
define i32 @sum_array_as1(i32 addrspace(1)* %A, i32 %n) nounwind uwtable readonly noinline ssp {
|
||||||
|
%1 = sext i32 %n to i64
|
||||||
|
%2 = getelementptr inbounds i32 addrspace(1)* %A, i64 %1
|
||||||
|
%3 = icmp eq i32 %n, 0
|
||||||
|
br i1 %3, label %_ZSt10accumulateIPiiET0_T_S2_S1_.exit, label %.lr.ph.i
|
||||||
|
|
||||||
|
.lr.ph.i: ; preds = %0, %.lr.ph.i
|
||||||
|
%.03.i = phi i32 addrspace(1)* [ %6, %.lr.ph.i ], [ %A, %0 ]
|
||||||
|
%.012.i = phi i32 [ %5, %.lr.ph.i ], [ 0, %0 ]
|
||||||
|
%4 = load i32 addrspace(1)* %.03.i, align 4
|
||||||
|
%5 = add nsw i32 %4, %.012.i
|
||||||
|
%6 = getelementptr inbounds i32 addrspace(1)* %.03.i, i64 1
|
||||||
|
%7 = icmp eq i32 addrspace(1)* %6, %2
|
||||||
|
br i1 %7, label %_ZSt10accumulateIPiiET0_T_S2_S1_.exit, label %.lr.ph.i
|
||||||
|
|
||||||
|
_ZSt10accumulateIPiiET0_T_S2_S1_.exit: ; preds = %.lr.ph.i, %0
|
||||||
|
%.01.lcssa.i = phi i32 [ 0, %0 ], [ %5, %.lr.ph.i ]
|
||||||
|
ret i32 %.01.lcssa.i
|
||||||
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user