mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-16 14:31:59 +00:00
[ARM] check bitwidth in PerformORCombine
When simplifying a (or (and B A) (and C ~A)) to a (VBSL A B C) ensure that the bitwidth of the second operands to both ands match before comparing the negation of the values. Split the check of the value of the second operands to the ands. Move the cast and variable declaration slightly higher to make it slightly easier to follow. Bug-Id: 16700 Signed-off-by: Saleem Abdulrasool <compnerd@compnerd.org> git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@187404 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
bcbb5dacbd
commit
f7f22a64df
@ -8407,24 +8407,31 @@ static SDValue PerformORCombine(SDNode *N,
|
|||||||
unsigned SplatBitSize;
|
unsigned SplatBitSize;
|
||||||
bool HasAnyUndefs;
|
bool HasAnyUndefs;
|
||||||
|
|
||||||
|
APInt SplatBits0, SplatBits1;
|
||||||
BuildVectorSDNode *BVN0 = dyn_cast<BuildVectorSDNode>(N0->getOperand(1));
|
BuildVectorSDNode *BVN0 = dyn_cast<BuildVectorSDNode>(N0->getOperand(1));
|
||||||
APInt SplatBits0;
|
BuildVectorSDNode *BVN1 = dyn_cast<BuildVectorSDNode>(N1->getOperand(1));
|
||||||
|
// Ensure that the second operand of both ands are constants
|
||||||
if (BVN0 && BVN0->isConstantSplat(SplatBits0, SplatUndef, SplatBitSize,
|
if (BVN0 && BVN0->isConstantSplat(SplatBits0, SplatUndef, SplatBitSize,
|
||||||
HasAnyUndefs) && !HasAnyUndefs) {
|
HasAnyUndefs) && !HasAnyUndefs) {
|
||||||
BuildVectorSDNode *BVN1 = dyn_cast<BuildVectorSDNode>(N1->getOperand(1));
|
|
||||||
APInt SplatBits1;
|
|
||||||
if (BVN1 && BVN1->isConstantSplat(SplatBits1, SplatUndef, SplatBitSize,
|
if (BVN1 && BVN1->isConstantSplat(SplatBits1, SplatUndef, SplatBitSize,
|
||||||
HasAnyUndefs) && !HasAnyUndefs &&
|
HasAnyUndefs) && !HasAnyUndefs) {
|
||||||
|
// Ensure that the bit width of the constants are the same and that
|
||||||
|
// the splat arguments are logical inverses as per the pattern we
|
||||||
|
// are trying to simplify.
|
||||||
|
if (SplatBits0.getBitWidth() == SplatBits1.getBitWidth() &&
|
||||||
SplatBits0 == ~SplatBits1) {
|
SplatBits0 == ~SplatBits1) {
|
||||||
// Canonicalize the vector type to make instruction selection simpler.
|
// Canonicalize the vector type to make instruction selection
|
||||||
|
// simpler.
|
||||||
EVT CanonicalVT = VT.is128BitVector() ? MVT::v4i32 : MVT::v2i32;
|
EVT CanonicalVT = VT.is128BitVector() ? MVT::v4i32 : MVT::v2i32;
|
||||||
SDValue Result = DAG.getNode(ARMISD::VBSL, dl, CanonicalVT,
|
SDValue Result = DAG.getNode(ARMISD::VBSL, dl, CanonicalVT,
|
||||||
N0->getOperand(1), N0->getOperand(0),
|
N0->getOperand(1),
|
||||||
|
N0->getOperand(0),
|
||||||
N1->getOperand(0));
|
N1->getOperand(0));
|
||||||
return DAG.getNode(ISD::BITCAST, dl, VT, Result);
|
return DAG.getNode(ISD::BITCAST, dl, VT, Result);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
// Try to use the ARM/Thumb2 BFI (bitfield insert) instruction when
|
// Try to use the ARM/Thumb2 BFI (bitfield insert) instruction when
|
||||||
// reasonable.
|
// reasonable.
|
||||||
|
32
test/CodeGen/ARM/2013-07-29-vector-or-combine.ll
Normal file
32
test/CodeGen/ARM/2013-07-29-vector-or-combine.ll
Normal file
@ -0,0 +1,32 @@
|
|||||||
|
; RUN: llc < %s -mcpu=cortex-a8 | FileCheck %s
|
||||||
|
; ModuleID = 'bugpoint-reduced-simplified.bc'
|
||||||
|
target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:64:128-a0:0:64-n32-S64"
|
||||||
|
target triple = "armv7--linux-gnueabi"
|
||||||
|
|
||||||
|
; CHECK-LABEL: function
|
||||||
|
define void @function() {
|
||||||
|
; CHECK: cmp r0, #0
|
||||||
|
; CHECK: bxne lr
|
||||||
|
; CHECK: vmov.i32 q8, #0xff0000
|
||||||
|
entry:
|
||||||
|
br i1 undef, label %vector.body, label %for.end
|
||||||
|
|
||||||
|
; CHECK: vld1.32 {d18, d19}, [r0]
|
||||||
|
; CHECK: vand q10, q9, q8
|
||||||
|
; CHECK: vbic.i16 q9, #0xff
|
||||||
|
; CHECK: vorr q9, q9, q10
|
||||||
|
; CHECK: vst1.32 {d18, d19}, [r0]
|
||||||
|
vector.body:
|
||||||
|
%wide.load = load <4 x i32>* undef, align 4
|
||||||
|
%0 = and <4 x i32> %wide.load, <i32 -16711936, i32 -16711936, i32 -16711936, i32 -16711936>
|
||||||
|
%1 = sub <4 x i32> %wide.load, zeroinitializer
|
||||||
|
%2 = and <4 x i32> %1, <i32 16711680, i32 16711680, i32 16711680, i32 16711680>
|
||||||
|
%3 = or <4 x i32> undef, %0
|
||||||
|
%4 = or <4 x i32> %3, %2
|
||||||
|
store <4 x i32> %4, <4 x i32>* undef, align 4
|
||||||
|
br label %vector.body
|
||||||
|
|
||||||
|
for.end:
|
||||||
|
ret void
|
||||||
|
}
|
||||||
|
|
Loading…
x
Reference in New Issue
Block a user