mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-03 13:31:05 +00:00
On AVX, we can load a v8i32 at a time. The bug happens when two loads of uneven width are used.
When we load the v12i32 type, the GenWidenVectorLoads method generates two loads, v8i32 and v4i32, and attempts to use CONCAT_VECTORS to join them. CONCAT_VECTORS requires all of its operands to have the same type, so in this fix I concatenate undef values onto the smaller load to widen it to the type of the larger one. The test "widen_load-2.ll" also exposes this bug on AVX. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@147964 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
3bf052b76c
commit
c8d12eee12
@ -2329,19 +2329,37 @@ SDValue DAGTypeLegalizer::GenWidenVectorLoads(SmallVector<SDValue, 16> &LdChain,
|
|||||||
BasePtr = DAG.getNode(ISD::ADD, dl, BasePtr.getValueType(), BasePtr,
|
BasePtr = DAG.getNode(ISD::ADD, dl, BasePtr.getValueType(), BasePtr,
|
||||||
DAG.getIntPtrConstant(Increment));
|
DAG.getIntPtrConstant(Increment));
|
||||||
|
|
||||||
|
SDValue L;
|
||||||
if (LdWidth < NewVTWidth) {
|
if (LdWidth < NewVTWidth) {
|
||||||
// Our current type we are using is too large, find a better size
|
// Our current type we are using is too large, find a better size
|
||||||
NewVT = FindMemType(DAG, TLI, LdWidth, WidenVT, LdAlign, WidthDiff);
|
NewVT = FindMemType(DAG, TLI, LdWidth, WidenVT, LdAlign, WidthDiff);
|
||||||
NewVTWidth = NewVT.getSizeInBits();
|
NewVTWidth = NewVT.getSizeInBits();
|
||||||
}
|
L = DAG.getLoad(NewVT, dl, Chain, BasePtr,
|
||||||
|
|
||||||
SDValue LdOp = DAG.getLoad(NewVT, dl, Chain, BasePtr,
|
|
||||||
LD->getPointerInfo().getWithOffset(Offset),
|
LD->getPointerInfo().getWithOffset(Offset),
|
||||||
isVolatile,
|
isVolatile,
|
||||||
isNonTemporal, isInvariant,
|
isNonTemporal, isInvariant,
|
||||||
MinAlign(Align, Increment));
|
MinAlign(Align, Increment));
|
||||||
LdChain.push_back(LdOp.getValue(1));
|
LdChain.push_back(L.getValue(1));
|
||||||
LdOps.push_back(LdOp);
|
if (L->getValueType(0).isVector()) {
|
||||||
|
SmallVector<SDValue, 16> Loads;
|
||||||
|
Loads.push_back(L);
|
||||||
|
unsigned size = L->getValueSizeInBits(0);
|
||||||
|
while (size < LdOp->getValueSizeInBits(0)) {
|
||||||
|
Loads.push_back(DAG.getUNDEF(L->getValueType(0)));
|
||||||
|
size += L->getValueSizeInBits(0);
|
||||||
|
}
|
||||||
|
L = DAG.getNode(ISD::CONCAT_VECTORS, dl, LdOp->getValueType(0),
|
||||||
|
&Loads[0], Loads.size());
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
L = DAG.getLoad(NewVT, dl, Chain, BasePtr,
|
||||||
|
LD->getPointerInfo().getWithOffset(Offset), isVolatile,
|
||||||
|
isNonTemporal, isInvariant, MinAlign(Align, Increment));
|
||||||
|
LdChain.push_back(L.getValue(1));
|
||||||
|
}
|
||||||
|
|
||||||
|
LdOps.push_back(L);
|
||||||
|
|
||||||
|
|
||||||
LdWidth -= NewVTWidth;
|
LdWidth -= NewVTWidth;
|
||||||
}
|
}
|
||||||
|
12
test/CodeGen/X86/2012-01-11-split-cv.ll
Normal file
12
test/CodeGen/X86/2012-01-11-split-cv.ll
Normal file
@ -0,0 +1,12 @@
|
|||||||
|
; RUN: llc < %s -march=x86 -mcpu=corei7-avx -mattr=+avx -mtriple=i686-pc-win32 | FileCheck %s
|
||||||
|
|
||||||
|
;CHECK: add18i16
|
||||||
|
define void @add18i16(<18 x i16>* nocapture sret %ret, <18 x i16>* %bp) nounwind {
|
||||||
|
;CHECK: vmovups
|
||||||
|
%b = load <18 x i16>* %bp, align 16
|
||||||
|
%x = add <18 x i16> zeroinitializer, %b
|
||||||
|
store <18 x i16> %x, <18 x i16>* %ret, align 16
|
||||||
|
;CHECK: ret
|
||||||
|
ret void
|
||||||
|
}
|
||||||
|
|
Loading…
Reference in New Issue
Block a user