mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-12 17:32:19 +00:00
e46783d5b7
This patch improves the logic added at revision 224899 (see review D6728) that teaches the backend when it is profitable to speculate calls to cttz/ctlz. The original algorithm conservatively avoided speculating more than one instruction from a basic block in a control flow graph modelling an if-statement. In particular, the only allowed instruction (excluding the terminator) was a call to cttz/ctlz. However, there are cases where we could be less conservative and still be able to speculate a call to cttz/ctlz. With this patch, CodeGenPrepare now tries to speculate a cttz/ctlz if the result is zero extended/truncated in the same basic block, and the zext/trunc instruction is "free" for the target. Added new test cases to CodeGen/X86/cttz-ctlz.ll Differential Revision: http://reviews.llvm.org/D6853 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@225274 91177308-0d34-0410-b5e6-96231b3b80d8
423 lines
13 KiB
LLVM
423 lines
13 KiB
LLVM
; Exercises the CodeGenPrepare pass on cttz/ctlz calls that are guarded by an
; explicit compare-against-zero. The same input is processed three times for
; x86_64; every invocation checks the ALL prefix plus one configuration prefix -
;   -mattr=+bmi    adds prefix BMI
;   -mattr=+lzcnt  adds prefix LZCNT
;   no -mattr      adds prefix GENERIC
; RUN: opt -S -codegenprepare -mtriple=x86_64-unknown-unknown -mattr=+bmi < %s | FileCheck %s --check-prefix=ALL --check-prefix=BMI
; RUN: opt -S -codegenprepare -mtriple=x86_64-unknown-unknown -mattr=+lzcnt < %s | FileCheck %s --check-prefix=ALL --check-prefix=LZCNT
; RUN: opt -S -codegenprepare -mtriple=x86_64-unknown-unknown < %s | FileCheck %s --check-prefix=ALL --check-prefix=GENERIC
|
|
|
|
|
|
; test1 - i64 "A == 0 ? 64 : ctlz(A)" written as a branch around the call.
; The zero arm of the phi (64) equals the bit width of the operand.
; Expectations by check prefix -
;   LZCNT    a single ctlz call with "i1 false", immediately followed by ret.
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define i64 @test1(i64 %A) {
; ALL-LABEL: @test1(
; LZCNT: [[CTLZ:%[A-Za-z0-9]+]] = call i64 @llvm.ctlz.i64(i64 %A, i1 false)
; LZCNT-NEXT: ret i64 [[CTLZ]]
; BMI: icmp eq i64 %A, 0
; BMI: call i64 @llvm.ctlz.i64(i64 %A, i1 true)
; GENERIC: icmp eq i64 %A, 0
; GENERIC: call i64 @llvm.ctlz.i64(i64 %A, i1 true)
entry:
  %tobool = icmp eq i64 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.ctlz.i64(i64 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i64 [ %0, %cond.true ], [ 64, %entry ]
  ret i64 %cond
}
|
|
|
|
|
|
; test2 - i32 variant of the guarded ctlz pattern; the phi's zero arm is 32,
; the bit width of the operand.
; Expectations by check prefix -
;   LZCNT    a single ctlz call with "i1 false", immediately followed by ret.
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define i32 @test2(i32 %A) {
; ALL-LABEL: @test2(
; LZCNT: [[CTLZ:%[A-Za-z0-9]+]] = call i32 @llvm.ctlz.i32(i32 %A, i1 false)
; LZCNT-NEXT: ret i32 [[CTLZ]]
; BMI: icmp eq i32 %A, 0
; BMI: call i32 @llvm.ctlz.i32(i32 %A, i1 true)
; GENERIC: icmp eq i32 %A, 0
; GENERIC: call i32 @llvm.ctlz.i32(i32 %A, i1 true)
entry:
  %tobool = icmp eq i32 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.ctlz.i32(i32 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i32 [ %0, %cond.true ], [ 32, %entry ]
  ret i32 %cond
}
|
|
|
|
|
|
; test3 - i16 (signext argument and result) variant of the guarded ctlz
; pattern; the phi's zero arm is 16, the bit width of the operand.
; Expectations by check prefix -
;   LZCNT    a single ctlz call with "i1 false", immediately followed by ret.
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define signext i16 @test3(i16 signext %A) {
; ALL-LABEL: @test3(
; LZCNT: [[CTLZ:%[A-Za-z0-9]+]] = call i16 @llvm.ctlz.i16(i16 %A, i1 false)
; LZCNT-NEXT: ret i16 [[CTLZ]]
; BMI: icmp eq i16 %A, 0
; BMI: call i16 @llvm.ctlz.i16(i16 %A, i1 true)
; GENERIC: icmp eq i16 %A, 0
; GENERIC: call i16 @llvm.ctlz.i16(i16 %A, i1 true)
entry:
  %tobool = icmp eq i16 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i16 @llvm.ctlz.i16(i16 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %0, %cond.true ], [ 16, %entry ]
  ret i16 %cond
}
|
|
|
|
|
|
; test1b - i64 "A == 0 ? 64 : cttz(A)" written as a branch around the call.
; The zero arm of the phi (64) equals the bit width of the operand.
; Expectations by check prefix -
;   BMI      a single cttz call with "i1 false", immediately followed by ret.
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define i64 @test1b(i64 %A) {
; ALL-LABEL: @test1b(
; LZCNT: icmp eq i64 %A, 0
; LZCNT: call i64 @llvm.cttz.i64(i64 %A, i1 true)
; BMI: [[CTTZ:%[A-Za-z0-9]+]] = call i64 @llvm.cttz.i64(i64 %A, i1 false)
; BMI-NEXT: ret i64 [[CTTZ]]
; GENERIC: icmp eq i64 %A, 0
; GENERIC: call i64 @llvm.cttz.i64(i64 %A, i1 true)
entry:
  %tobool = icmp eq i64 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.cttz.i64(i64 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i64 [ %0, %cond.true ], [ 64, %entry ]
  ret i64 %cond
}
|
|
|
|
|
|
; test2b - i32 variant of the guarded cttz pattern; the phi's zero arm is 32,
; the bit width of the operand.
; Expectations by check prefix -
;   BMI      a single cttz call with "i1 false", immediately followed by ret.
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define i32 @test2b(i32 %A) {
; ALL-LABEL: @test2b(
; LZCNT: icmp eq i32 %A, 0
; LZCNT: call i32 @llvm.cttz.i32(i32 %A, i1 true)
; BMI: [[CTTZ:%[A-Za-z0-9]+]] = call i32 @llvm.cttz.i32(i32 %A, i1 false)
; BMI-NEXT: ret i32 [[CTTZ]]
; GENERIC: icmp eq i32 %A, 0
; GENERIC: call i32 @llvm.cttz.i32(i32 %A, i1 true)
entry:
  %tobool = icmp eq i32 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.cttz.i32(i32 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i32 [ %0, %cond.true ], [ 32, %entry ]
  ret i32 %cond
}
|
|
|
|
|
|
; test3b - i16 (signext argument and result) variant of the guarded cttz
; pattern; the phi's zero arm is 16, the bit width of the operand.
; Expectations by check prefix -
;   BMI      a single cttz call with "i1 false", immediately followed by ret.
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define signext i16 @test3b(i16 signext %A) {
; ALL-LABEL: @test3b(
; LZCNT: icmp eq i16 %A, 0
; LZCNT: call i16 @llvm.cttz.i16(i16 %A, i1 true)
; BMI: [[CTTZ:%[A-Za-z0-9]+]] = call i16 @llvm.cttz.i16(i16 %A, i1 false)
; BMI-NEXT: ret i16 [[CTTZ]]
; GENERIC: icmp eq i16 %A, 0
; GENERIC: call i16 @llvm.cttz.i16(i16 %A, i1 true)
entry:
  %tobool = icmp eq i16 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i16 @llvm.cttz.i16(i16 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %0, %cond.true ], [ 16, %entry ]
  ret i16 %cond
}
|
|
|
|
|
|
; test1c - guarded i64 ctlz whose zero arm is 63 rather than the bit width.
; Every configuration (prefix ALL) expects the compare against zero and the
; "i1 true" call to remain in the output.
define i64 @test1c(i64 %A) {
; ALL-LABEL: @test1c(
; ALL: icmp eq i64 %A, 0
; ALL: call i64 @llvm.ctlz.i64(i64 %A, i1 true)
entry:
  %tobool = icmp eq i64 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.ctlz.i64(i64 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i64 [ %0, %cond.true ], [ 63, %entry ]
  ret i64 %cond
}
|
|
|
|
; test2c - guarded i32 ctlz whose zero arm is 31 rather than the bit width.
; Every configuration (prefix ALL) expects the compare against zero and the
; "i1 true" call to remain in the output.
define i32 @test2c(i32 %A) {
; ALL-LABEL: @test2c(
; ALL: icmp eq i32 %A, 0
; ALL: call i32 @llvm.ctlz.i32(i32 %A, i1 true)
entry:
  %tobool = icmp eq i32 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.ctlz.i32(i32 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i32 [ %0, %cond.true ], [ 31, %entry ]
  ret i32 %cond
}
|
|
|
|
|
|
; test3c - guarded i16 ctlz (signext argument and result) whose zero arm is
; 15 rather than the bit width.
; Every configuration (prefix ALL) expects the compare against zero and the
; "i1 true" call to remain in the output.
define signext i16 @test3c(i16 signext %A) {
; ALL-LABEL: @test3c(
; ALL: icmp eq i16 %A, 0
; ALL: call i16 @llvm.ctlz.i16(i16 %A, i1 true)
entry:
  %tobool = icmp eq i16 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i16 @llvm.ctlz.i16(i16 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %0, %cond.true ], [ 15, %entry ]
  ret i16 %cond
}
|
|
|
|
|
|
; test1d - guarded i64 cttz whose zero arm is 63 rather than the bit width.
; Every configuration (prefix ALL) expects the compare against zero and the
; "i1 true" call to remain in the output.
define i64 @test1d(i64 %A) {
; ALL-LABEL: @test1d(
; ALL: icmp eq i64 %A, 0
; ALL: call i64 @llvm.cttz.i64(i64 %A, i1 true)
entry:
  %tobool = icmp eq i64 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.cttz.i64(i64 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i64 [ %0, %cond.true ], [ 63, %entry ]
  ret i64 %cond
}
|
|
|
|
|
|
; test2d - guarded i32 cttz whose zero arm is 31 rather than the bit width.
; Every configuration (prefix ALL) expects the compare against zero and the
; "i1 true" call to remain in the output.
define i32 @test2d(i32 %A) {
; ALL-LABEL: @test2d(
; ALL: icmp eq i32 %A, 0
; ALL: call i32 @llvm.cttz.i32(i32 %A, i1 true)
entry:
  %tobool = icmp eq i32 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.cttz.i32(i32 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i32 [ %0, %cond.true ], [ 31, %entry ]
  ret i32 %cond
}
|
|
|
|
|
|
; test3d - guarded i16 cttz (signext argument and result) whose zero arm is
; 15 rather than the bit width.
; Every configuration (prefix ALL) expects the compare against zero and the
; "i1 true" call to remain in the output.
define signext i16 @test3d(i16 signext %A) {
; ALL-LABEL: @test3d(
; ALL: icmp eq i16 %A, 0
; ALL: call i16 @llvm.cttz.i16(i16 %A, i1 true)
entry:
  %tobool = icmp eq i16 %A, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i16 @llvm.cttz.i16(i16 %A, i1 true)
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %0, %cond.true ], [ 15, %entry ]
  ret i16 %cond
}
|
|
|
|
; The following tests verify that calls to cttz/ctlz are speculated even if
; basic block %cond.true has an extra zero extend/truncate which is "free"
; for the target.
|
|
|
|
; test1e - guarded i32 cttz whose result is zero-extended to i64 inside
; %cond.true before reaching the phi; the zero arm is 32, the bit width of
; the cttz operand.
; Expectations by check prefix -
;   BMI      a cttz call with "i1 false".
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define i64 @test1e(i32 %x) {
; ALL-LABEL: @test1e(
; LZCNT: icmp eq i32 %x, 0
; LZCNT: call i32 @llvm.cttz.i32(i32 %x, i1 true)
; BMI: call i32 @llvm.cttz.i32(i32 %x, i1 false)
; GENERIC: icmp eq i32 %x, 0
; GENERIC: call i32 @llvm.cttz.i32(i32 %x, i1 true)
entry:
  %tobool = icmp eq i32 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.cttz.i32(i32 %x, i1 true)
  %phitmp2 = zext i32 %0 to i64
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i64 [ %phitmp2, %cond.true ], [ 32, %entry ]
  ret i64 %cond
}
|
|
|
|
; test2e - guarded i64 cttz whose result is truncated to i32 inside
; %cond.true before reaching the phi; the zero arm is 64, the bit width of
; the cttz operand.
; Expectations by check prefix -
;   BMI      a cttz call with "i1 false".
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define i32 @test2e(i64 %x) {
; ALL-LABEL: @test2e(
; LZCNT: icmp eq i64 %x, 0
; LZCNT: call i64 @llvm.cttz.i64(i64 %x, i1 true)
; BMI: call i64 @llvm.cttz.i64(i64 %x, i1 false)
; GENERIC: icmp eq i64 %x, 0
; GENERIC: call i64 @llvm.cttz.i64(i64 %x, i1 true)
entry:
  %tobool = icmp eq i64 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.cttz.i64(i64 %x, i1 true)
  %cast = trunc i64 %0 to i32
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i32 [ %cast, %cond.true ], [ 64, %entry ]
  ret i32 %cond
}
|
|
|
|
; test3e - guarded i32 ctlz whose result is zero-extended to i64 inside
; %cond.true before reaching the phi; the zero arm is 32, the bit width of
; the ctlz operand.
; Expectations by check prefix -
;   LZCNT    a ctlz call with "i1 false".
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define i64 @test3e(i32 %x) {
; ALL-LABEL: @test3e(
; BMI: icmp eq i32 %x, 0
; BMI: call i32 @llvm.ctlz.i32(i32 %x, i1 true)
; LZCNT: call i32 @llvm.ctlz.i32(i32 %x, i1 false)
; GENERIC: icmp eq i32 %x, 0
; GENERIC: call i32 @llvm.ctlz.i32(i32 %x, i1 true)
entry:
  %tobool = icmp eq i32 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.ctlz.i32(i32 %x, i1 true)
  %phitmp2 = zext i32 %0 to i64
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i64 [ %phitmp2, %cond.true ], [ 32, %entry ]
  ret i64 %cond
}
|
|
|
|
; test4e - guarded i64 ctlz whose result is truncated to i32 inside
; %cond.true before reaching the phi; the zero arm is 64, the bit width of
; the ctlz operand.
; Expectations by check prefix -
;   LZCNT    a ctlz call with "i1 false".
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define i32 @test4e(i64 %x) {
; ALL-LABEL: @test4e(
; BMI: icmp eq i64 %x, 0
; BMI: call i64 @llvm.ctlz.i64(i64 %x, i1 true)
; LZCNT: call i64 @llvm.ctlz.i64(i64 %x, i1 false)
; GENERIC: icmp eq i64 %x, 0
; GENERIC: call i64 @llvm.ctlz.i64(i64 %x, i1 true)
entry:
  %tobool = icmp eq i64 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.ctlz.i64(i64 %x, i1 true)
  %cast = trunc i64 %0 to i32
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i32 [ %cast, %cond.true ], [ 64, %entry ]
  ret i32 %cond
}
|
|
|
|
; test5e - guarded i64 ctlz whose result is truncated to i16 inside
; %cond.true before reaching the phi; the zero arm is 64, the bit width of
; the ctlz operand.
; Expectations by check prefix -
;   LZCNT    a ctlz call with "i1 false".
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define i16 @test5e(i64 %x) {
; ALL-LABEL: @test5e(
; BMI: icmp eq i64 %x, 0
; BMI: call i64 @llvm.ctlz.i64(i64 %x, i1 true)
; LZCNT: call i64 @llvm.ctlz.i64(i64 %x, i1 false)
; GENERIC: icmp eq i64 %x, 0
; GENERIC: call i64 @llvm.ctlz.i64(i64 %x, i1 true)
entry:
  %tobool = icmp eq i64 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.ctlz.i64(i64 %x, i1 true)
  %cast = trunc i64 %0 to i16
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %cast, %cond.true ], [ 64, %entry ]
  ret i16 %cond
}
|
|
|
|
; test6e - guarded i32 ctlz whose result is truncated to i16 inside
; %cond.true before reaching the phi; the zero arm is 32, the bit width of
; the ctlz operand.
; Expectations by check prefix -
;   LZCNT    a ctlz call with "i1 false".
;   BMI      the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as BMI.
define i16 @test6e(i32 %x) {
; ALL-LABEL: @test6e(
; BMI: icmp eq i32 %x, 0
; BMI: call i32 @llvm.ctlz.i32(i32 %x, i1 true)
; LZCNT: call i32 @llvm.ctlz.i32(i32 %x, i1 false)
; GENERIC: icmp eq i32 %x, 0
; GENERIC: call i32 @llvm.ctlz.i32(i32 %x, i1 true)
entry:
  %tobool = icmp eq i32 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.ctlz.i32(i32 %x, i1 true)
  %cast = trunc i32 %0 to i16
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %cast, %cond.true ], [ 32, %entry ]
  ret i16 %cond
}
|
|
|
|
; test7e - guarded i64 cttz whose result is truncated to i16 inside
; %cond.true before reaching the phi; the zero arm is 64, the bit width of
; the cttz operand.
; Expectations by check prefix -
;   BMI      a cttz call with "i1 false".
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define i16 @test7e(i64 %x) {
; ALL-LABEL: @test7e(
; LZCNT: icmp eq i64 %x, 0
; LZCNT: call i64 @llvm.cttz.i64(i64 %x, i1 true)
; BMI: call i64 @llvm.cttz.i64(i64 %x, i1 false)
; GENERIC: icmp eq i64 %x, 0
; GENERIC: call i64 @llvm.cttz.i64(i64 %x, i1 true)
entry:
  %tobool = icmp eq i64 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i64 @llvm.cttz.i64(i64 %x, i1 true)
  %cast = trunc i64 %0 to i16
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %cast, %cond.true ], [ 64, %entry ]
  ret i16 %cond
}
|
|
|
|
; test8e - guarded i32 cttz whose result is truncated to i16 inside
; %cond.true before reaching the phi; the zero arm is 32, the bit width of
; the cttz operand.
; Expectations by check prefix -
;   BMI      a cttz call with "i1 false".
;   LZCNT    the compare against zero and the "i1 true" call both remain.
;   GENERIC  same as LZCNT.
define i16 @test8e(i32 %x) {
; ALL-LABEL: @test8e(
; LZCNT: icmp eq i32 %x, 0
; LZCNT: call i32 @llvm.cttz.i32(i32 %x, i1 true)
; BMI: call i32 @llvm.cttz.i32(i32 %x, i1 false)
; GENERIC: icmp eq i32 %x, 0
; GENERIC: call i32 @llvm.cttz.i32(i32 %x, i1 true)
entry:
  %tobool = icmp eq i32 %x, 0
  br i1 %tobool, label %cond.end, label %cond.true

cond.true:                                        ; preds = %entry
  %0 = tail call i32 @llvm.cttz.i32(i32 %x, i1 true)
  %cast = trunc i32 %0 to i16
  br label %cond.end

cond.end:                                         ; preds = %entry, %cond.true
  %cond = phi i16 [ %cast, %cond.true ], [ 32, %entry ]
  ret i16 %cond
}
|
|
|
|
|
|
; Declarations of the count-leading-zeros / count-trailing-zeros intrinsics
; called by the tests in this file, one per operand width (i64, i32, i16).
; The trailing i1 operand is the flag the tests pass as true in their input
; and expect as false wherever the call has been speculated.
declare i64 @llvm.ctlz.i64(i64, i1)
declare i32 @llvm.ctlz.i32(i32, i1)
declare i16 @llvm.ctlz.i16(i16, i1)
declare i64 @llvm.cttz.i64(i64, i1)
declare i32 @llvm.cttz.i32(i32, i1)
declare i16 @llvm.cttz.i16(i16, i1)
|