mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-02 07:32:52 +00:00
InstCombine: Turn urem to bitwise-and more often
Use isKnownToBeAPowerOfTwo in visitUrem so that we may more aggressively fold away urem instructions. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@181661 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
d84ccfaf50
commit
a8ccefc0a3
@ -1027,31 +1027,13 @@ Instruction *InstCombiner::visitURem(BinaryOperator &I) {
|
||||
if (Instruction *common = commonIRemTransforms(I))
|
||||
return common;
|
||||
|
||||
// X urem C^2 -> X and C-1
|
||||
{ const APInt *C;
|
||||
if (match(Op1, m_Power2(C)))
|
||||
return BinaryOperator::CreateAnd(Op0,
|
||||
ConstantInt::get(I.getType(), *C-1));
|
||||
}
|
||||
|
||||
// Turn A % (C << N), where C is 2^k, into A & ((C << N)-1)
|
||||
if (match(Op1, m_Shl(m_Power2(), m_Value()))) {
|
||||
// X urem Y -> X and Y-1, where Y is a power of 2,
|
||||
if (isKnownToBeAPowerOfTwo(Op1, /*OrZero*/true)) {
|
||||
Constant *N1 = Constant::getAllOnesValue(I.getType());
|
||||
Value *Add = Builder->CreateAdd(Op1, N1);
|
||||
return BinaryOperator::CreateAnd(Op0, Add);
|
||||
}
|
||||
|
||||
// urem X, (select Cond, 2^C1, 2^C2) -->
|
||||
// select Cond, (and X, C1-1), (and X, C2-1)
|
||||
// when C1&C2 are powers of two.
|
||||
{ Value *Cond; const APInt *C1, *C2;
|
||||
if (match(Op1, m_Select(m_Value(Cond), m_Power2(C1), m_Power2(C2)))) {
|
||||
Value *TrueAnd = Builder->CreateAnd(Op0, *C1-1, Op1->getName()+".t");
|
||||
Value *FalseAnd = Builder->CreateAnd(Op0, *C2-1, Op1->getName()+".f");
|
||||
return SelectInst::Create(Cond, TrueAnd, FalseAnd);
|
||||
}
|
||||
}
|
||||
|
||||
// (zext A) urem (zext B) --> zext (A urem B)
|
||||
if (ZExtInst *ZOp0 = dyn_cast<ZExtInst>(Op0))
|
||||
if (Value *ZOp1 = dyn_castZExtVal(Op1, ZOp0->getSrcTy()))
|
||||
|
@ -1,36 +1,56 @@
|
||||
; This test makes sure that these instructions are properly eliminated.
|
||||
; This test makes sure that urem instructions are properly eliminated.
|
||||
;
|
||||
; RUN: opt < %s -instcombine -S | not grep rem
|
||||
; RUN: opt < %s -instcombine -S | FileCheck %s
|
||||
; END.
|
||||
|
||||
define i32 @test1(i32 %A) {
|
||||
; CHECK: @test1
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%B = srem i32 %A, 1 ; ISA constant 0
|
||||
ret i32 %B
|
||||
}
|
||||
|
||||
define i32 @test2(i32 %A) { ; 0 % X = 0, we don't need to preserve traps
|
||||
; CHECK: @test2
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%B = srem i32 0, %A
|
||||
ret i32 %B
|
||||
}
|
||||
|
||||
define i32 @test3(i32 %A) {
|
||||
; CHECK: @test3
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i32 %A, 7
|
||||
; CHECK-NEXT: ret i32 [[AND]]
|
||||
%B = urem i32 %A, 8
|
||||
ret i32 %B
|
||||
}
|
||||
|
||||
define i1 @test3a(i32 %A) {
|
||||
; CHECK: @test3a
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i32 %A, 7
|
||||
; CHECK-NEXT: [[CMP:%.*]] = icmp ne i32 [[AND]], 0
|
||||
; CHECK-NEXT: ret i1 [[CMP]]
|
||||
%B = srem i32 %A, -8
|
||||
%C = icmp ne i32 %B, 0
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
define i32 @test4(i32 %X, i1 %C) {
|
||||
; CHECK: @test4
|
||||
; CHECK-NEXT: [[SEL:%.*]] = select i1 %C, i32 0, i32 7
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i32 [[SEL]], %X
|
||||
%V = select i1 %C, i32 1, i32 8
|
||||
%R = urem i32 %X, %V
|
||||
ret i32 %R
|
||||
}
|
||||
|
||||
define i32 @test5(i32 %X, i8 %B) {
|
||||
; CHECK: @test5
|
||||
; CHECK-NEXT: [[ZEXT:%.*]] = zext i8 %B to i32
|
||||
; CHECK-NEXT: [[SHL:%.*]] = shl nuw i32 32, [[ZEXT]]
|
||||
; CHECK-NEXT: [[ADD:%.*]] = add i32 [[SHL]], -1
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i32 [[ADD]], %X
|
||||
; CHECK-NEXT: ret i32 [[AND]]
|
||||
%shift.upgrd.1 = zext i8 %B to i32
|
||||
%Amt = shl i32 32, %shift.upgrd.1
|
||||
%V = urem i32 %X, %Amt
|
||||
@ -38,29 +58,39 @@ define i32 @test5(i32 %X, i8 %B) {
|
||||
}
|
||||
|
||||
define i32 @test6(i32 %A) {
|
||||
; CHECK: @test6
|
||||
; CHECK-NEXT: ret i32 undef
|
||||
%B = srem i32 %A, 0 ;; undef
|
||||
ret i32 %B
|
||||
}
|
||||
|
||||
define i32 @test7(i32 %A) {
|
||||
; CHECK: @test7
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%B = mul i32 %A, 8
|
||||
%C = srem i32 %B, 4
|
||||
ret i32 %C
|
||||
}
|
||||
|
||||
define i32 @test8(i32 %A) {
|
||||
; CHECK: @test8
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%B = shl i32 %A, 4
|
||||
%C = srem i32 %B, 8
|
||||
ret i32 %C
|
||||
}
|
||||
|
||||
define i32 @test9(i32 %A) {
|
||||
; CHECK: @test9
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%B = mul i32 %A, 64
|
||||
%C = urem i32 %B, 32
|
||||
ret i32 %C
|
||||
}
|
||||
|
||||
define i32 @test10(i8 %c) {
|
||||
; CHECK: @test10
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%tmp.1 = zext i8 %c to i32
|
||||
%tmp.2 = mul i32 %tmp.1, 4
|
||||
%tmp.3 = sext i32 %tmp.2 to i64
|
||||
@ -70,6 +100,8 @@ define i32 @test10(i8 %c) {
|
||||
}
|
||||
|
||||
define i32 @test11(i32 %i) {
|
||||
; CHECK: @test11
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%tmp.1 = and i32 %i, -2
|
||||
%tmp.3 = mul i32 %tmp.1, 2
|
||||
%tmp.5 = urem i32 %tmp.3, 4
|
||||
@ -77,12 +109,29 @@ define i32 @test11(i32 %i) {
|
||||
}
|
||||
|
||||
define i32 @test12(i32 %i) {
|
||||
; CHECK: @test12
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%tmp.1 = and i32 %i, -4
|
||||
%tmp.5 = srem i32 %tmp.1, 2
|
||||
ret i32 %tmp.5
|
||||
}
|
||||
|
||||
define i32 @test13(i32 %i) {
|
||||
; CHECK: @test13
|
||||
; CHECK-NEXT: ret i32 0
|
||||
%x = srem i32 %i, %i
|
||||
ret i32 %x
|
||||
}
|
||||
|
||||
define i64 @test14(i64 %x, i32 %y) {
|
||||
; CHECK: @test14
|
||||
; CHECK-NEXT: [[SHL:%.*]] = shl i32 1, %y
|
||||
; CHECK-NEXT: [[ZEXT:%.*]] = zext i32 [[SHL]] to i64
|
||||
; CHECK-NEXT: [[ADD:%.*]] = add i64 [[ZEXT]], -1
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i64 [[ADD]], %x
|
||||
; CHECK-NEXT: ret i64 [[AND]]
|
||||
%shl = shl i32 1, %y
|
||||
%zext = zext i32 %shl to i64
|
||||
%urem = urem i64 %x, %zext
|
||||
ret i64 %urem
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user