mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-02-05 14:34:55 +00:00
R600/SI: Fix crash with VSELECT
https://bugs.freedesktop.org/show_bug.cgi?id=66175 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@186616 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
ac85f3f65c
commit
4e518fd941
@ -34,6 +34,9 @@ SITargetLowering::SITargetLowering(TargetMachine &TM) :
|
|||||||
addRegisterClass(MVT::i1, &AMDGPU::SReg_64RegClass);
|
addRegisterClass(MVT::i1, &AMDGPU::SReg_64RegClass);
|
||||||
addRegisterClass(MVT::i64, &AMDGPU::SReg_64RegClass);
|
addRegisterClass(MVT::i64, &AMDGPU::SReg_64RegClass);
|
||||||
|
|
||||||
|
addRegisterClass(MVT::v2i1, &AMDGPU::VReg_64RegClass);
|
||||||
|
addRegisterClass(MVT::v4i1, &AMDGPU::VReg_128RegClass);
|
||||||
|
|
||||||
addRegisterClass(MVT::v16i8, &AMDGPU::SReg_128RegClass);
|
addRegisterClass(MVT::v16i8, &AMDGPU::SReg_128RegClass);
|
||||||
addRegisterClass(MVT::v32i8, &AMDGPU::SReg_256RegClass);
|
addRegisterClass(MVT::v32i8, &AMDGPU::SReg_256RegClass);
|
||||||
addRegisterClass(MVT::v64i8, &AMDGPU::SReg_512RegClass);
|
addRegisterClass(MVT::v64i8, &AMDGPU::SReg_512RegClass);
|
||||||
@ -72,6 +75,9 @@ SITargetLowering::SITargetLowering(TargetMachine &TM) :
|
|||||||
|
|
||||||
setOperationAction(ISD::SELECT_CC, MVT::Other, Expand);
|
setOperationAction(ISD::SELECT_CC, MVT::Other, Expand);
|
||||||
|
|
||||||
|
setOperationAction(ISD::SETCC, MVT::v2i1, Expand);
|
||||||
|
setOperationAction(ISD::SETCC, MVT::v4i1, Expand);
|
||||||
|
|
||||||
setOperationAction(ISD::SIGN_EXTEND, MVT::i64, Custom);
|
setOperationAction(ISD::SIGN_EXTEND, MVT::i64, Custom);
|
||||||
|
|
||||||
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
|
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
|
||||||
@ -318,7 +324,10 @@ MachineBasicBlock * SITargetLowering::EmitInstrWithCustomInserter(
|
|||||||
}
|
}
|
||||||
|
|
||||||
EVT SITargetLowering::getSetCCResultType(LLVMContext &, EVT VT) const {
|
EVT SITargetLowering::getSetCCResultType(LLVMContext &, EVT VT) const {
|
||||||
|
if (!VT.isVector()) {
|
||||||
return MVT::i1;
|
return MVT::i1;
|
||||||
|
}
|
||||||
|
return MVT::getVectorVT(MVT::i1, VT.getVectorNumElements());
|
||||||
}
|
}
|
||||||
|
|
||||||
MVT SITargetLowering::getScalarShiftAmountTy(EVT VT) const {
|
MVT SITargetLowering::getScalarShiftAmountTy(EVT VT) const {
|
||||||
|
@ -1487,6 +1487,9 @@ def : BitConvert <f64, i64, VReg_64>;
|
|||||||
def : BitConvert <v2f32, v2i32, VReg_64>;
|
def : BitConvert <v2f32, v2i32, VReg_64>;
|
||||||
def : BitConvert <v2i32, v2f32, VReg_64>;
|
def : BitConvert <v2i32, v2f32, VReg_64>;
|
||||||
|
|
||||||
|
def : BitConvert <v4f32, v4i32, VReg_128>;
|
||||||
|
def : BitConvert <v4i32, v4f32, VReg_128>;
|
||||||
|
|
||||||
/********** =================== **********/
|
/********** =================== **********/
|
||||||
/********** Src & Dst modifiers **********/
|
/********** Src & Dst modifiers **********/
|
||||||
/********** =================== **********/
|
/********** =================== **********/
|
||||||
|
@ -1,9 +1,14 @@
|
|||||||
;RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck --check-prefix=EG-CHECK %s
|
;RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck --check-prefix=EG-CHECK %s
|
||||||
|
;RUN: llc < %s -march=r600 -mcpu=SI | FileCheck --check-prefix=SI-CHECK %s
|
||||||
|
|
||||||
;EG-CHECK: @test_select_v2i32
|
;EG-CHECK: @test_select_v2i32
|
||||||
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
||||||
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
||||||
|
|
||||||
|
;SI-CHECK: @test_select_v2i32
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
|
||||||
define void @test_select_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in0, <2 x i32> addrspace(1)* %in1) {
|
define void @test_select_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in0, <2 x i32> addrspace(1)* %in1) {
|
||||||
entry:
|
entry:
|
||||||
%0 = load <2 x i32> addrspace(1)* %in0
|
%0 = load <2 x i32> addrspace(1)* %in0
|
||||||
@ -18,6 +23,10 @@ entry:
|
|||||||
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
||||||
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
||||||
|
|
||||||
|
;SI-CHECK: @test_select_v2f32
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
|
||||||
define void @test_select_v2f32(<2 x float> addrspace(1)* %out, <2 x float> addrspace(1)* %in0, <2 x float> addrspace(1)* %in1) {
|
define void @test_select_v2f32(<2 x float> addrspace(1)* %out, <2 x float> addrspace(1)* %in0, <2 x float> addrspace(1)* %in1) {
|
||||||
entry:
|
entry:
|
||||||
%0 = load <2 x float> addrspace(1)* %in0
|
%0 = load <2 x float> addrspace(1)* %in0
|
||||||
@ -34,6 +43,12 @@ entry:
|
|||||||
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
||||||
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
;EG-CHECK: CNDE_INT {{\*? *}}T{{[0-9]+\.[XYZW], PV\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
|
||||||
|
|
||||||
|
;SI-CHECK: @test_select_v4i32
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
;SI-CHECK: V_CNDMASK_B32_e64
|
||||||
|
|
||||||
define void @test_select_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in0, <4 x i32> addrspace(1)* %in1) {
|
define void @test_select_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in0, <4 x i32> addrspace(1)* %in1) {
|
||||||
entry:
|
entry:
|
||||||
%0 = load <4 x i32> addrspace(1)* %in0
|
%0 = load <4 x i32> addrspace(1)* %in0
|
||||||
|
Loading…
x
Reference in New Issue
Block a user