InstCombine: Turn urem to bitwise-and more often

Use isKnownToBeAPowerOfTwo in visitUrem so that we may more aggressively
fold away urem instructions.


git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@181661 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
David Majnemer 2013-05-11 09:01:28 +00:00
parent d84ccfaf50
commit a8ccefc0a3
2 changed files with 53 additions and 22 deletions

View File

@ -1027,31 +1027,13 @@ Instruction *InstCombiner::visitURem(BinaryOperator &I) {
if (Instruction *common = commonIRemTransforms(I)) if (Instruction *common = commonIRemTransforms(I))
return common; return common;
// X urem C^2 -> X and C-1 // X urem Y -> X and Y-1, where Y is a power of 2,
{ const APInt *C; if (isKnownToBeAPowerOfTwo(Op1, /*OrZero*/true)) {
if (match(Op1, m_Power2(C)))
return BinaryOperator::CreateAnd(Op0,
ConstantInt::get(I.getType(), *C-1));
}
// Turn A % (C << N), where C is 2^k, into A & ((C << N)-1)
if (match(Op1, m_Shl(m_Power2(), m_Value()))) {
Constant *N1 = Constant::getAllOnesValue(I.getType()); Constant *N1 = Constant::getAllOnesValue(I.getType());
Value *Add = Builder->CreateAdd(Op1, N1); Value *Add = Builder->CreateAdd(Op1, N1);
return BinaryOperator::CreateAnd(Op0, Add); return BinaryOperator::CreateAnd(Op0, Add);
} }
// urem X, (select Cond, 2^C1, 2^C2) -->
// select Cond, (and X, C1-1), (and X, C2-1)
// when C1&C2 are powers of two.
{ Value *Cond; const APInt *C1, *C2;
if (match(Op1, m_Select(m_Value(Cond), m_Power2(C1), m_Power2(C2)))) {
Value *TrueAnd = Builder->CreateAnd(Op0, *C1-1, Op1->getName()+".t");
Value *FalseAnd = Builder->CreateAnd(Op0, *C2-1, Op1->getName()+".f");
return SelectInst::Create(Cond, TrueAnd, FalseAnd);
}
}
// (zext A) urem (zext B) --> zext (A urem B) // (zext A) urem (zext B) --> zext (A urem B)
if (ZExtInst *ZOp0 = dyn_cast<ZExtInst>(Op0)) if (ZExtInst *ZOp0 = dyn_cast<ZExtInst>(Op0))
if (Value *ZOp1 = dyn_castZExtVal(Op1, ZOp0->getSrcTy())) if (Value *ZOp1 = dyn_castZExtVal(Op1, ZOp0->getSrcTy()))

View File

@ -1,36 +1,56 @@
; This test makes sure that these instructions are properly eliminated. ; This test makes sure that urem instructions are properly eliminated.
; ;
; RUN: opt < %s -instcombine -S | not grep rem ; RUN: opt < %s -instcombine -S | FileCheck %s
; END. ; END.
define i32 @test1(i32 %A) { define i32 @test1(i32 %A) {
; CHECK: @test1
; CHECK-NEXT: ret i32 0
%B = srem i32 %A, 1 ; ISA constant 0 %B = srem i32 %A, 1 ; ISA constant 0
ret i32 %B ret i32 %B
} }
define i32 @test2(i32 %A) { ; 0 % X = 0, we don't need to preserve traps define i32 @test2(i32 %A) { ; 0 % X = 0, we don't need to preserve traps
; CHECK: @test2
; CHECK-NEXT: ret i32 0
%B = srem i32 0, %A %B = srem i32 0, %A
ret i32 %B ret i32 %B
} }
define i32 @test3(i32 %A) { define i32 @test3(i32 %A) {
; CHECK: @test3
; CHECK-NEXT: [[AND:%.*]] = and i32 %A, 7
; CHECK-NEXT: ret i32 [[AND]]
%B = urem i32 %A, 8 %B = urem i32 %A, 8
ret i32 %B ret i32 %B
} }
define i1 @test3a(i32 %A) { define i1 @test3a(i32 %A) {
; CHECK: @test3a
; CHECK-NEXT: [[AND:%.*]] = and i32 %A, 7
; CHECK-NEXT: [[CMP:%.*]] = icmp ne i32 [[AND]], 0
; CHECK-NEXT: ret i1 [[CMP]]
%B = srem i32 %A, -8 %B = srem i32 %A, -8
%C = icmp ne i32 %B, 0 %C = icmp ne i32 %B, 0
ret i1 %C ret i1 %C
} }
define i32 @test4(i32 %X, i1 %C) { define i32 @test4(i32 %X, i1 %C) {
; CHECK: @test4
; CHECK-NEXT: [[SEL:%.*]] = select i1 %C, i32 0, i32 7
; CHECK-NEXT: [[AND:%.*]] = and i32 [[SEL]], %X
%V = select i1 %C, i32 1, i32 8 %V = select i1 %C, i32 1, i32 8
%R = urem i32 %X, %V %R = urem i32 %X, %V
ret i32 %R ret i32 %R
} }
define i32 @test5(i32 %X, i8 %B) { define i32 @test5(i32 %X, i8 %B) {
; CHECK: @test5
; CHECK-NEXT: [[ZEXT:%.*]] = zext i8 %B to i32
; CHECK-NEXT: [[SHL:%.*]] = shl nuw i32 32, [[ZEXT]]
; CHECK-NEXT: [[ADD:%.*]] = add i32 [[SHL]], -1
; CHECK-NEXT: [[AND:%.*]] = and i32 [[ADD]], %X
; CHECK-NEXT: ret i32 [[AND]]
%shift.upgrd.1 = zext i8 %B to i32 %shift.upgrd.1 = zext i8 %B to i32
%Amt = shl i32 32, %shift.upgrd.1 %Amt = shl i32 32, %shift.upgrd.1
%V = urem i32 %X, %Amt %V = urem i32 %X, %Amt
@ -38,29 +58,39 @@ define i32 @test5(i32 %X, i8 %B) {
} }
define i32 @test6(i32 %A) { define i32 @test6(i32 %A) {
; CHECK: @test6
; CHECK-NEXT: ret i32 undef
%B = srem i32 %A, 0 ;; undef %B = srem i32 %A, 0 ;; undef
ret i32 %B ret i32 %B
} }
define i32 @test7(i32 %A) { define i32 @test7(i32 %A) {
; CHECK: @test7
; CHECK-NEXT: ret i32 0
%B = mul i32 %A, 8 %B = mul i32 %A, 8
%C = srem i32 %B, 4 %C = srem i32 %B, 4
ret i32 %C ret i32 %C
} }
define i32 @test8(i32 %A) { define i32 @test8(i32 %A) {
; CHECK: @test8
; CHECK-NEXT: ret i32 0
%B = shl i32 %A, 4 %B = shl i32 %A, 4
%C = srem i32 %B, 8 %C = srem i32 %B, 8
ret i32 %C ret i32 %C
} }
define i32 @test9(i32 %A) { define i32 @test9(i32 %A) {
; CHECK: @test9
; CHECK-NEXT: ret i32 0
%B = mul i32 %A, 64 %B = mul i32 %A, 64
%C = urem i32 %B, 32 %C = urem i32 %B, 32
ret i32 %C ret i32 %C
} }
define i32 @test10(i8 %c) { define i32 @test10(i8 %c) {
; CHECK: @test10
; CHECK-NEXT: ret i32 0
%tmp.1 = zext i8 %c to i32 %tmp.1 = zext i8 %c to i32
%tmp.2 = mul i32 %tmp.1, 4 %tmp.2 = mul i32 %tmp.1, 4
%tmp.3 = sext i32 %tmp.2 to i64 %tmp.3 = sext i32 %tmp.2 to i64
@ -70,6 +100,8 @@ define i32 @test10(i8 %c) {
} }
define i32 @test11(i32 %i) { define i32 @test11(i32 %i) {
; CHECK: @test11
; CHECK-NEXT: ret i32 0
%tmp.1 = and i32 %i, -2 %tmp.1 = and i32 %i, -2
%tmp.3 = mul i32 %tmp.1, 2 %tmp.3 = mul i32 %tmp.1, 2
%tmp.5 = urem i32 %tmp.3, 4 %tmp.5 = urem i32 %tmp.3, 4
@ -77,12 +109,29 @@ define i32 @test11(i32 %i) {
} }
define i32 @test12(i32 %i) { define i32 @test12(i32 %i) {
; CHECK: @test12
; CHECK-NEXT: ret i32 0
%tmp.1 = and i32 %i, -4 %tmp.1 = and i32 %i, -4
%tmp.5 = srem i32 %tmp.1, 2 %tmp.5 = srem i32 %tmp.1, 2
ret i32 %tmp.5 ret i32 %tmp.5
} }
define i32 @test13(i32 %i) { define i32 @test13(i32 %i) {
; CHECK: @test13
; CHECK-NEXT: ret i32 0
%x = srem i32 %i, %i %x = srem i32 %i, %i
ret i32 %x ret i32 %x
} }
define i64 @test14(i64 %x, i32 %y) {
; CHECK: @test14
; CHECK-NEXT: [[SHL:%.*]] = shl i32 1, %y
; CHECK-NEXT: [[ZEXT:%.*]] = zext i32 [[SHL]] to i64
; CHECK-NEXT: [[ADD:%.*]] = add i64 [[ZEXT]], -1
; CHECK-NEXT: [[AND:%.*]] = and i64 [[ADD]], %x
; CHECK-NEXT: ret i64 [[AND]]
%shl = shl i32 1, %y
%zext = zext i32 %shl to i64
%urem = urem i64 %x, %zext
ret i64 %urem
}