Hal Finkel b9ed50cf17 [PowerPC] [Constant Hoisting] Enable constant hoisting on PPC
Implements the various TTI functions to enable constant hoisting on PPC. The
only significant test-suite change is this:

MultiSource/Benchmarks/VersaBench/bmm/bmm - 20% speedup
(which essentially reverses the slowdown from r206120).

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@206141 91177308-0d34-0410-b5e6-96231b3b80d8
2014-04-13 23:02:40 +00:00

67 lines
1.6 KiB
LLVM

; RUN: opt -S -consthoist < %s | FileCheck %s
target datalayout = "E-m:e-i64:64-n32:64"
target triple = "powerpc64-unknown-linux-gnu"
; Here the masks are all contiguous, and should not be hoisted.
define i32 @test1() nounwind {
entry:
; CHECK-LABEL: @test1
; CHECK-NOT: bitcast i32 65535 to i32
; CHECK: and i32 undef, 65535
%conv121 = and i32 undef, 65535
br i1 undef, label %if.then152, label %if.end167
if.then152:
; CHECK: and i32 undef, 65535
%conv153 = and i32 undef, 65535
br i1 undef, label %if.end167, label %end2
if.end167:
; CHECK: and i32 {{.*}}, 32768
%shl161 = shl nuw nsw i32 %conv121, 15
%0 = load i8* undef, align 1
%conv169 = zext i8 %0 to i32
%shl170 = shl nuw nsw i32 %conv169, 7
%shl161.masked = and i32 %shl161, 32768
%conv174 = or i32 %shl170, %shl161.masked
%cmp178 = icmp ugt i32 %conv174, 32767
br i1 %cmp178, label %end1, label %end2
end1:
unreachable
end2:
unreachable
}
; Here the masks are not contiguous, and should be hoisted.
define i32 @test2() nounwind {
entry:
; CHECK-LABEL: @test2
; CHECK: bitcast i32 65531 to i32
%conv121 = and i32 undef, 65531
br i1 undef, label %if.then152, label %if.end167
if.then152:
%conv153 = and i32 undef, 65531
br i1 undef, label %if.end167, label %end2
if.end167:
; CHECK: add i32 {{.*}}, -32758
%shl161 = shl nuw nsw i32 %conv121, 15
%0 = load i8* undef, align 1
%conv169 = zext i8 %0 to i32
%shl170 = shl nuw nsw i32 %conv169, 7
%shl161.masked = and i32 %shl161, 32773
%conv174 = or i32 %shl170, %shl161.masked
%cmp178 = icmp ugt i32 %conv174, 32767
br i1 %cmp178, label %end1, label %end2
end1:
unreachable
end2:
unreachable
}