mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-16 11:30:51 +00:00
34288d885e
Now that we can fully specify extload legality, we can declare them legal for the PMOVSX/PMOVZX instructions. This for instance enables a DAGCombine to fire on code such as (and (<zextload-equivalent> ...), <redundant mask>) to turn it into: (zextload ...) as seen in the testcase changes. There is one regression, in widen_load-2.ll: we're no longer able to do store-to-load forwarding with illegal extload memory types. This will be addressed separately. Differential Revision: http://reviews.llvm.org/D6533 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@226676 91177308-0d34-0410-b5e6-96231b3b80d8
136 lines
3.0 KiB
LLVM
136 lines
3.0 KiB
LLVM
; RUN: llc < %s -mtriple=i686-linux -mcpu=corei7 | FileCheck %s
|
|
; RUN: opt -instsimplify -disable-output < %s
|
|
|
|
;CHECK: SHUFF0
|
|
define <8 x i32*> @SHUFF0(<4 x i32*> %ptrv) nounwind {
|
|
entry:
|
|
%G = shufflevector <4 x i32*> %ptrv, <4 x i32*> %ptrv, <8 x i32> <i32 2, i32 7, i32 1, i32 2, i32 4, i32 5, i32 1, i32 1>
|
|
;CHECK: pshufd
|
|
ret <8 x i32*> %G
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: SHUFF1
|
|
define <4 x i32*> @SHUFF1(<4 x i32*> %ptrv) nounwind {
|
|
entry:
|
|
%G = shufflevector <4 x i32*> %ptrv, <4 x i32*> %ptrv, <4 x i32> <i32 2, i32 7, i32 7, i32 2>
|
|
;CHECK: pshufd
|
|
ret <4 x i32*> %G
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: SHUFF3
|
|
define <4 x i8*> @SHUFF3(<4 x i8*> %ptrv) nounwind {
|
|
entry:
|
|
%G = shufflevector <4 x i8*> %ptrv, <4 x i8*> undef, <4 x i32> <i32 2, i32 7, i32 1, i32 2>
|
|
;CHECK: pshufd
|
|
ret <4 x i8*> %G
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: LOAD0
|
|
define <4 x i8*> @LOAD0(<4 x i8*>* %p) nounwind {
|
|
entry:
|
|
%G = load <4 x i8*>* %p
|
|
;CHECK: movaps
|
|
ret <4 x i8*> %G
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: LOAD1
|
|
define <4 x i8*> @LOAD1(<4 x i8*>* %p) nounwind {
|
|
entry:
|
|
%G = load <4 x i8*>* %p
|
|
;CHECK: movdqa
|
|
;CHECK: pshufd
|
|
;CHECK: movdqa
|
|
%T = shufflevector <4 x i8*> %G, <4 x i8*> %G, <4 x i32> <i32 7, i32 1, i32 4, i32 3>
|
|
store <4 x i8*> %T, <4 x i8*>* %p
|
|
ret <4 x i8*> %G
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: LOAD2
|
|
define <4 x i8*> @LOAD2(<4 x i8*>* %p) nounwind {
|
|
entry:
|
|
%I = alloca <4 x i8*>
|
|
;CHECK: sub
|
|
%G = load <4 x i8*>* %p
|
|
;CHECK: movaps
|
|
store <4 x i8*> %G, <4 x i8*>* %I
|
|
;CHECK: movaps
|
|
%Z = load <4 x i8*>* %I
|
|
ret <4 x i8*> %Z
|
|
;CHECK: add
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: INT2PTR0
|
|
define <4 x i32> @INT2PTR0(<4 x i8*>* %p) nounwind {
|
|
entry:
|
|
%G = load <4 x i8*>* %p
|
|
;CHECK: movl
|
|
;CHECK: movaps
|
|
%K = ptrtoint <4 x i8*> %G to <4 x i32>
|
|
;CHECK: ret
|
|
ret <4 x i32> %K
|
|
}
|
|
|
|
;CHECK: INT2PTR1
|
|
define <4 x i32*> @INT2PTR1(<4 x i8>* %p) nounwind {
|
|
entry:
|
|
%G = load <4 x i8>* %p
|
|
;CHECK: movl
|
|
;CHECK: pmovzxbd (%
|
|
%K = inttoptr <4 x i8> %G to <4 x i32*>
|
|
;CHECK: ret
|
|
ret <4 x i32*> %K
|
|
}
|
|
|
|
;CHECK: BITCAST0
|
|
define <4 x i32*> @BITCAST0(<4 x i8*>* %p) nounwind {
|
|
entry:
|
|
%G = load <4 x i8*>* %p
|
|
;CHECK: movl
|
|
%T = bitcast <4 x i8*> %G to <4 x i32*>
|
|
;CHECK: movaps
|
|
;CHECK: ret
|
|
ret <4 x i32*> %T
|
|
}
|
|
|
|
;CHECK: BITCAST1
|
|
define <2 x i32*> @BITCAST1(<2 x i8*>* %p) nounwind {
|
|
entry:
|
|
%G = load <2 x i8*>* %p
|
|
;CHECK: movl
|
|
;CHECK: pmovzxdq
|
|
%T = bitcast <2 x i8*> %G to <2 x i32*>
|
|
;CHECK: ret
|
|
ret <2 x i32*> %T
|
|
}
|
|
|
|
;CHECK: ICMP0
|
|
define <4 x i32> @ICMP0(<4 x i8*>* %p0, <4 x i8*>* %p1) nounwind {
|
|
entry:
|
|
%g0 = load <4 x i8*>* %p0
|
|
%g1 = load <4 x i8*>* %p1
|
|
%k = icmp sgt <4 x i8*> %g0, %g1
|
|
;CHECK: pcmpgtd
|
|
%j = select <4 x i1> %k, <4 x i32> <i32 0, i32 1, i32 2, i32 4>, <4 x i32> <i32 9, i32 8, i32 7, i32 6>
|
|
ret <4 x i32> %j
|
|
;CHECK: ret
|
|
}
|
|
|
|
;CHECK: ICMP1
|
|
define <4 x i32> @ICMP1(<4 x i8*>* %p0, <4 x i8*>* %p1) nounwind {
|
|
entry:
|
|
%g0 = load <4 x i8*>* %p0
|
|
%g1 = load <4 x i8*>* %p1
|
|
%k = icmp eq <4 x i8*> %g0, %g1
|
|
;CHECK: pcmpeqd
|
|
%j = select <4 x i1> %k, <4 x i32> <i32 0, i32 1, i32 2, i32 4>, <4 x i32> <i32 9, i32 8, i32 7, i32 6>
|
|
ret <4 x i32> %j
|
|
;CHECK: ret
|
|
}
|
|
|