mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-24 08:33:39 +00:00
R600: Make cttz / ctlz cheap to speculate
Speculatively executing these operations is generally good. SI+ has instructions for cttz / ctlz for 32-bit values. Speculating is still probably better even with the expansion required for 64-bit values, although it is odd that this callback doesn't take the value size as a parameter.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@225822 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
88e1d95d4d
commit
9e495c518c
@ -471,6 +471,18 @@ bool AMDGPUTargetLowering::isLoadBitCastBeneficial(EVT LoadTy,
|
|||||||
(LScalarSize < 32));
|
(LScalarSize < 32));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// SI+ has instructions for cttz / ctlz for 32-bit values. This is probably also
|
||||||
|
// profitable with the expansion for 64-bit since it's generally good to
|
||||||
|
// speculate things.
|
||||||
|
// FIXME: These should really have the size as a parameter.
|
||||||
|
// Override reporting whether cttz is cheap to speculate on this target.
// Takes no arguments and returns true unconditionally, so the answer is the
// same regardless of the width of the value being operated on.
bool AMDGPUTargetLowering::isCheapToSpeculateCttz() const {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Override reporting whether ctlz is cheap to speculate on this target.
// Takes no arguments and returns true unconditionally, so the answer is the
// same regardless of the width of the value being operated on.
bool AMDGPUTargetLowering::isCheapToSpeculateCtlz() const {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
//===---------------------------------------------------------------------===//
|
//===---------------------------------------------------------------------===//
|
||||||
// Target Properties
|
// Target Properties
|
||||||
//===---------------------------------------------------------------------===//
|
//===---------------------------------------------------------------------===//
|
||||||
|
@ -129,6 +129,9 @@ public:
|
|||||||
EVT ExtVT) const override;
|
EVT ExtVT) const override;
|
||||||
|
|
||||||
bool isLoadBitCastBeneficial(EVT, EVT) const override;
|
bool isLoadBitCastBeneficial(EVT, EVT) const override;
|
||||||
|
bool isCheapToSpeculateCttz() const override;
|
||||||
|
bool isCheapToSpeculateCtlz() const override;
|
||||||
|
|
||||||
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
|
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
|
||||||
bool isVarArg,
|
bool isVarArg,
|
||||||
const SmallVectorImpl<ISD::OutputArg> &Outs,
|
const SmallVectorImpl<ISD::OutputArg> &Outs,
|
||||||
|
224
test/CodeGen/R600/cttz-ctlz.ll
Normal file
224
test/CodeGen/R600/cttz-ctlz.ll
Normal file
@ -0,0 +1,224 @@
|
|||||||
|
; RUN: opt -S -codegenprepare -mtriple=r600-unknown-unknown -mcpu=SI < %s | FileCheck -check-prefix=SI -check-prefix=ALL %s
|
||||||
|
|
||||||
|
|
||||||
|
; i64 ctlz behind an explicit zero test: the input is compared with 0 and the
; phi supplies 64 on the zero path. The check lines for the SI prefix expect a
; single ctlz call whose second argument is false, immediately followed by the
; return of that value.
define i64 @test1(i64 %A) {
|
||||||
|
; ALL-LABEL: @test1(
|
||||||
|
; SI: [[CTLZ:%[A-Za-z0-9]+]] = call i64 @llvm.ctlz.i64(i64 %A, i1 false)
|
||||||
|
; SI-NEXT: ret i64 [[CTLZ]]
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i64 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i64 @llvm.ctlz.i64(i64 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i64 [ %0, %cond.true ], [ 64, %entry ]
|
||||||
|
ret i64 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i32 ctlz behind an explicit zero test: the input is compared with 0 and the
; phi supplies 32 on the zero path. The check lines for the SI prefix expect a
; single ctlz call whose second argument is false, immediately followed by the
; return of that value.
define i32 @test2(i32 %A) {
|
||||||
|
; ALL-LABEL: @test2(
|
||||||
|
; SI: [[CTLZ:%[A-Za-z0-9]+]] = call i32 @llvm.ctlz.i32(i32 %A, i1 false)
|
||||||
|
; SI-NEXT: ret i32 [[CTLZ]]
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i32 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i32 @llvm.ctlz.i32(i32 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i32 [ %0, %cond.true ], [ 32, %entry ]
|
||||||
|
ret i32 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i16 ctlz behind an explicit zero test: the input is compared with 0 and the
; phi supplies 16 on the zero path. The check lines for the SI prefix expect a
; single ctlz call whose second argument is false, immediately followed by the
; return of that value.
define signext i16 @test3(i16 signext %A) {
|
||||||
|
; ALL-LABEL: @test3(
|
||||||
|
; SI: [[CTLZ:%[A-Za-z0-9]+]] = call i16 @llvm.ctlz.i16(i16 %A, i1 false)
|
||||||
|
; SI-NEXT: ret i16 [[CTLZ]]
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i16 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i16 @llvm.ctlz.i16(i16 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i16 [ %0, %cond.true ], [ 16, %entry ]
|
||||||
|
ret i16 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i64 cttz behind an explicit zero test: the input is compared with 0 and the
; phi supplies 64 on the zero path. The check lines for the SI prefix expect a
; single cttz call whose second argument is false, immediately followed by the
; return of that value.
define i64 @test1b(i64 %A) {
|
||||||
|
; ALL-LABEL: @test1b(
|
||||||
|
; SI: [[CTTZ:%[A-Za-z0-9]+]] = call i64 @llvm.cttz.i64(i64 %A, i1 false)
|
||||||
|
; SI-NEXT: ret i64 [[CTTZ]]
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i64 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i64 @llvm.cttz.i64(i64 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i64 [ %0, %cond.true ], [ 64, %entry ]
|
||||||
|
ret i64 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i32 cttz behind an explicit zero test: the input is compared with 0 and the
; phi supplies 32 on the zero path. The check lines for the SI prefix expect a
; single cttz call whose second argument is false, immediately followed by the
; return of that value.
define i32 @test2b(i32 %A) {
|
||||||
|
; ALL-LABEL: @test2b(
|
||||||
|
; SI: [[CTTZ:%[A-Za-z0-9]+]] = call i32 @llvm.cttz.i32(i32 %A, i1 false)
|
||||||
|
; SI-NEXT: ret i32 [[CTTZ]]
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i32 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i32 @llvm.cttz.i32(i32 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i32 [ %0, %cond.true ], [ 32, %entry ]
|
||||||
|
ret i32 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i16 cttz behind an explicit zero test: the input is compared with 0 and the
; phi supplies 16 on the zero path. The check lines for the SI prefix expect a
; single cttz call whose second argument is false, immediately followed by the
; return of that value.
define signext i16 @test3b(i16 signext %A) {
|
||||||
|
; ALL-LABEL: @test3b(
|
||||||
|
; SI: [[CTTZ:%[A-Za-z0-9]+]] = call i16 @llvm.cttz.i16(i16 %A, i1 false)
|
||||||
|
; SI-NEXT: ret i16 [[CTTZ]]
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i16 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i16 @llvm.cttz.i16(i16 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i16 [ %0, %cond.true ], [ 16, %entry ]
|
||||||
|
ret i16 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i64 ctlz behind an explicit zero test, but here the phi supplies 63 on the
; zero path. The check lines expect both the icmp against 0 and the ctlz call
; with i1 true to be present in the output.
; NOTE(review): presumably left untouched because 63 is not the i64 bit
; width - confirm against the CodeGenPrepare transform.
define i64 @test1c(i64 %A) {
|
||||||
|
; ALL-LABEL: @test1c(
|
||||||
|
; ALL: icmp eq i64 %A, 0
|
||||||
|
; ALL: call i64 @llvm.ctlz.i64(i64 %A, i1 true)
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i64 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i64 @llvm.ctlz.i64(i64 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i64 [ %0, %cond.true ], [ 63, %entry ]
|
||||||
|
ret i64 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
; i32 ctlz behind an explicit zero test, but here the phi supplies 31 on the
; zero path. The check lines expect both the icmp against 0 and the ctlz call
; with i1 true to be present in the output.
; NOTE(review): presumably left untouched because 31 is not the i32 bit
; width - confirm against the CodeGenPrepare transform.
define i32 @test2c(i32 %A) {
|
||||||
|
; ALL-LABEL: @test2c(
|
||||||
|
; ALL: icmp eq i32 %A, 0
|
||||||
|
; ALL: call i32 @llvm.ctlz.i32(i32 %A, i1 true)
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i32 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i32 @llvm.ctlz.i32(i32 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i32 [ %0, %cond.true ], [ 31, %entry ]
|
||||||
|
ret i32 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i16 ctlz behind an explicit zero test, but here the phi supplies 15 on the
; zero path. The check lines expect both the icmp against 0 and the ctlz call
; with i1 true to be present in the output.
; NOTE(review): presumably left untouched because 15 is not the i16 bit
; width - confirm against the CodeGenPrepare transform.
define signext i16 @test3c(i16 signext %A) {
|
||||||
|
; ALL-LABEL: @test3c(
|
||||||
|
; ALL: icmp eq i16 %A, 0
|
||||||
|
; ALL: call i16 @llvm.ctlz.i16(i16 %A, i1 true)
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i16 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i16 @llvm.ctlz.i16(i16 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i16 [ %0, %cond.true ], [ 15, %entry ]
|
||||||
|
ret i16 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i64 cttz behind an explicit zero test, but here the phi supplies 63 on the
; zero path. The check lines expect both the icmp against 0 and the cttz call
; with i1 true to be present in the output.
; NOTE(review): presumably left untouched because 63 is not the i64 bit
; width - confirm against the CodeGenPrepare transform.
define i64 @test1d(i64 %A) {
|
||||||
|
; ALL-LABEL: @test1d(
|
||||||
|
; ALL: icmp eq i64 %A, 0
|
||||||
|
; ALL: call i64 @llvm.cttz.i64(i64 %A, i1 true)
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i64 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i64 @llvm.cttz.i64(i64 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i64 [ %0, %cond.true ], [ 63, %entry ]
|
||||||
|
ret i64 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i32 cttz behind an explicit zero test, but here the phi supplies 31 on the
; zero path. The check lines expect both the icmp against 0 and the cttz call
; with i1 true to be present in the output.
; NOTE(review): presumably left untouched because 31 is not the i32 bit
; width - confirm against the CodeGenPrepare transform.
define i32 @test2d(i32 %A) {
|
||||||
|
; ALL-LABEL: @test2d(
|
||||||
|
; ALL: icmp eq i32 %A, 0
|
||||||
|
; ALL: call i32 @llvm.cttz.i32(i32 %A, i1 true)
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i32 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i32 @llvm.cttz.i32(i32 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i32 [ %0, %cond.true ], [ 31, %entry ]
|
||||||
|
ret i32 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
; i16 cttz behind an explicit zero test, but here the phi supplies 15 on the
; zero path. The check lines expect both the icmp against 0 and the cttz call
; with i1 true to be present in the output.
; NOTE(review): presumably left untouched because 15 is not the i16 bit
; width - confirm against the CodeGenPrepare transform.
define signext i16 @test3d(i16 signext %A) {
|
||||||
|
; ALL-LABEL: @test3d(
|
||||||
|
; ALL: icmp eq i16 %A, 0
|
||||||
|
; ALL: call i16 @llvm.cttz.i16(i16 %A, i1 true)
|
||||||
|
entry:
|
||||||
|
%tobool = icmp eq i16 %A, 0
|
||||||
|
br i1 %tobool, label %cond.end, label %cond.true
|
||||||
|
|
||||||
|
cond.true: ; preds = %entry
|
||||||
|
%0 = tail call i16 @llvm.cttz.i16(i16 %A, i1 true)
|
||||||
|
br label %cond.end
|
||||||
|
|
||||||
|
cond.end: ; preds = %entry, %cond.true
|
||||||
|
%cond = phi i16 [ %0, %cond.true ], [ 15, %entry ]
|
||||||
|
ret i16 %cond
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
declare i64 @llvm.ctlz.i64(i64, i1)
|
||||||
|
declare i32 @llvm.ctlz.i32(i32, i1)
|
||||||
|
declare i16 @llvm.ctlz.i16(i16, i1)
|
||||||
|
declare i64 @llvm.cttz.i64(i64, i1)
|
||||||
|
declare i32 @llvm.cttz.i32(i32, i1)
|
||||||
|
declare i16 @llvm.cttz.i16(i16, i1)
|
Loading…
x
Reference in New Issue
Block a user