mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-12 13:30:51 +00:00
R600/SI: Optimize SI_KILL for constant operands
If the SI_KILL operand is constant, we can either clear the exec mask if the operand is negative, or do nothing otherwise.

Reviewed-by: Tom Stellard <thomas.stellard@amd.com>

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@202337 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
a5fbf24716
commit
644aecfc97
@ -1333,7 +1333,7 @@ def SI_END_CF : InstSI <
|
||||
|
||||
def SI_KILL : InstSI <
|
||||
(outs),
|
||||
(ins VReg_32:$src),
|
||||
(ins VSrc_32:$src),
|
||||
"SI_KILL $src",
|
||||
[(int_AMDGPU_kill f32:$src)]
|
||||
>;
|
||||
@ -1425,7 +1425,7 @@ def : Pat<
|
||||
|
||||
def : Pat <
|
||||
(int_AMDGPU_kilp),
|
||||
(SI_KILL (V_MOV_B32_e32 0xbf800000))
|
||||
(SI_KILL 0xbf800000)
|
||||
>;
|
||||
|
||||
/* int_SI_vs_load_input */
|
||||
|
@ -55,6 +55,7 @@
|
||||
#include "llvm/CodeGen/MachineFunctionPass.h"
|
||||
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
||||
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
||||
#include "llvm/IR/Constants.h"
|
||||
|
||||
using namespace llvm;
|
||||
|
||||
@ -294,6 +295,7 @@ void SILowerControlFlowPass::Branch(MachineInstr &MI) {
|
||||
void SILowerControlFlowPass::Kill(MachineInstr &MI) {
|
||||
MachineBasicBlock &MBB = *MI.getParent();
|
||||
DebugLoc DL = MI.getDebugLoc();
|
||||
const MachineOperand &Op = MI.getOperand(0);
|
||||
|
||||
// Kill is only allowed in pixel / geometry shaders
|
||||
assert(MBB.getParent()->getInfo<SIMachineFunctionInfo>()->ShaderType ==
|
||||
@ -301,10 +303,19 @@ void SILowerControlFlowPass::Kill(MachineInstr &MI) {
|
||||
MBB.getParent()->getInfo<SIMachineFunctionInfo>()->ShaderType ==
|
||||
ShaderType::GEOMETRY);
|
||||
|
||||
// Clear this pixel from the exec mask if the operand is negative
|
||||
// Clear this thread from the exec mask if the operand is negative
|
||||
if ((Op.isImm() || Op.isFPImm())) {
|
||||
// Constant operand: Set exec mask to 0 or do nothing
|
||||
if (Op.isImm() ? (Op.getImm() & 0x80000000) :
|
||||
Op.getFPImm()->isNegative()) {
|
||||
BuildMI(MBB, &MI, DL, TII->get(AMDGPU::S_MOV_B64), AMDGPU::EXEC)
|
||||
.addImm(0);
|
||||
}
|
||||
} else {
|
||||
BuildMI(MBB, &MI, DL, TII->get(AMDGPU::V_CMPX_LE_F32_e32), AMDGPU::VCC)
|
||||
.addImm(0)
|
||||
.addOperand(MI.getOperand(0));
|
||||
.addOperand(Op);
|
||||
}
|
||||
|
||||
MI.eraseFromParent();
|
||||
}
|
||||
|
@ -1,13 +1,17 @@
|
||||
; RUN: llc < %s -march=r600 -mcpu=verde -verify-machineinstrs | FileCheck --check-prefix=SI %s
|
||||
|
||||
; SI-LABEL: @kill_gs
|
||||
; SI: V_CMPX_LE_F32
|
||||
; SI-LABEL: @kill_gs_const
|
||||
; SI-NOT: V_CMPX_LE_F32
|
||||
; SI: S_MOV_B64 exec, 0
|
||||
|
||||
define void @kill_gs() #0 {
|
||||
define void @kill_gs_const() #0 {
|
||||
main_body:
|
||||
%0 = icmp ule i32 0, 3
|
||||
%1 = select i1 %0, float 1.000000e+00, float -1.000000e+00
|
||||
call void @llvm.AMDGPU.kill(float %1)
|
||||
%2 = icmp ule i32 3, 0
|
||||
%3 = select i1 %2, float 1.000000e+00, float -1.000000e+00
|
||||
call void @llvm.AMDGPU.kill(float %3)
|
||||
ret void
|
||||
}
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user