mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-04-07 01:38:26 +00:00
[DAGCombine] Fix a bug in a BUILD_VECTOR combine
When trying to convert a BUILD_VECTOR into a shuffle, we try to split a single source vector that is twice as wide as the destination vector. We can not do this when we also need the zero vector to create a blend. This fixes PR22774. Differential Revision: http://reviews.llvm.org/D8040 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@231219 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
4e942d63c0
commit
bbfda9c125
@ -11358,7 +11358,9 @@ SDValue DAGCombiner::visitBUILD_VECTOR(SDNode *N) {
|
||||
} else if (VecInT.getSizeInBits() == VT.getSizeInBits() * 2) {
|
||||
// If the input vector is too large, try to split it.
|
||||
// We don't support having two input vectors that are too large.
|
||||
if (VecIn2.getNode())
|
||||
// If the zero vector was used, we can not split the vector,
|
||||
// since we'd need 3 inputs.
|
||||
if (UsesZeroVector || VecIn2.getNode())
|
||||
return SDValue();
|
||||
|
||||
if (!TLI.isExtractSubvectorCheap(VT, VT.getVectorNumElements()))
|
||||
@ -11370,7 +11372,6 @@ SDValue DAGCombiner::visitBUILD_VECTOR(SDNode *N) {
|
||||
DAG.getConstant(VT.getVectorNumElements(), TLI.getVectorIdxTy()));
|
||||
VecIn1 = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, VT, VecIn1,
|
||||
DAG.getConstant(0, TLI.getVectorIdxTy()));
|
||||
UsesZeroVector = false;
|
||||
} else
|
||||
return SDValue();
|
||||
}
|
||||
|
20
test/CodeGen/X86/pr22774.ll
Normal file
20
test/CodeGen/X86/pr22774.ll
Normal file
@ -0,0 +1,20 @@
|
||||
; RUN: llc -mattr=avx %s -o - | FileCheck %s
|
||||
|
||||
target datalayout = "e-m:o-i64:64-f80:128-n8:16:32:64-S128"
|
||||
target triple = "x86_64-pc-linux-gnu"
|
||||
|
||||
@in = global <4 x i64> <i64 -1, i64 -1, i64 -1, i64 -1>, align 32
|
||||
@out = global <2 x i64> zeroinitializer, align 16
|
||||
|
||||
define i32 @_Z3foov() {
|
||||
entry:
|
||||
; CHECK: vmovdqa in(%rip), %ymm0
|
||||
; CHECK-NEXT: vmovq %xmm0, %xmm0
|
||||
; CHECK-NEXT: vmovdqa %xmm0, out(%rip)
|
||||
%0 = load <4 x i64>, <4 x i64>* @in, align 32
|
||||
%vecext = extractelement <4 x i64> %0, i32 0
|
||||
%vecinit = insertelement <2 x i64> undef, i64 %vecext, i32 0
|
||||
%vecinit1 = insertelement <2 x i64> %vecinit, i64 0, i32 1
|
||||
store <2 x i64> %vecinit1, <2 x i64>* @out, align 16
|
||||
ret i32 0
|
||||
}
|
Loading…
x
Reference in New Issue
Block a user