mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-08-10 02:25:47 +00:00
Don't do FoldCmpLoadFromIndexedGlobal for non inbounds GEPs
This path wasn't tested before without a datalayout, so add some more tests and re-run with and without one. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@188507 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
@@ -226,8 +226,8 @@ static void ComputeUnsignedMinMaxValuesFromKnownBits(const APInt &KnownZero,
|
||||
Instruction *InstCombiner::
|
||||
FoldCmpLoadFromIndexedGlobal(GetElementPtrInst *GEP, GlobalVariable *GV,
|
||||
CmpInst &ICI, ConstantInt *AndCst) {
|
||||
// We need TD information to know the pointer size unless this is inbounds.
|
||||
if (!GEP->isInBounds() && TD == 0) return 0;
|
||||
if (!GEP->isInBounds())
|
||||
return 0;
|
||||
|
||||
Constant *Init = GV->getInitializer();
|
||||
if (!isa<ConstantArray>(Init) && !isa<ConstantDataArray>(Init))
|
||||
@@ -390,13 +390,6 @@ FoldCmpLoadFromIndexedGlobal(GetElementPtrInst *GEP, GlobalVariable *GV,
|
||||
// order the state machines in complexity of the generated code.
|
||||
Value *Idx = GEP->getOperand(2);
|
||||
|
||||
// If the index is larger than the pointer size of the target, truncate the
|
||||
// index down like the GEP would do implicitly. We don't have to do this for
|
||||
// an inbounds GEP because the index can't be out of range.
|
||||
if (!GEP->isInBounds() &&
|
||||
Idx->getType()->getPrimitiveSizeInBits() > TD->getPointerSizeInBits())
|
||||
Idx = Builder->CreateTrunc(Idx, TD->getIntPtrType(Idx->getContext()));
|
||||
|
||||
// If the comparison is only true for one or two elements, emit direct
|
||||
// comparisons.
|
||||
if (SecondTrueElement != Overdefined) {
|
||||
|
@@ -129,6 +129,33 @@ define i1 @test13(i64 %X, %S* %P) {
|
||||
; CHECK: %C = icmp eq i64 %X, -1
|
||||
}
|
||||
|
||||
define i1 @test13_i32(i32 %X, %S* %P) {
|
||||
; CHECK-LABEL: @test13_i32(
|
||||
; CHECK: %C = icmp eq i32 %X, -1
|
||||
%A = getelementptr inbounds %S* %P, i32 0, i32 1, i32 %X
|
||||
%B = getelementptr inbounds %S* %P, i32 0, i32 0
|
||||
%C = icmp eq i32* %A, %B
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
define i1 @test13_i16(i16 %X, %S* %P) {
|
||||
; CHECK-LABEL: @test13_i16(
|
||||
; CHECK: %C = icmp eq i16 %X, -1
|
||||
%A = getelementptr inbounds %S* %P, i16 0, i32 1, i16 %X
|
||||
%B = getelementptr inbounds %S* %P, i16 0, i32 0
|
||||
%C = icmp eq i32* %A, %B
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
define i1 @test13_i128(i128 %X, %S* %P) {
|
||||
; CHECK-LABEL: @test13_i128(
|
||||
; CHECK: %C = icmp eq i64 %1, -1
|
||||
%A = getelementptr inbounds %S* %P, i128 0, i32 1, i128 %X
|
||||
%B = getelementptr inbounds %S* %P, i128 0, i32 0
|
||||
%C = icmp eq i32* %A, %B
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
|
||||
@G = external global [3 x i8]
|
||||
define i8* @test14(i32 %Idx) {
|
||||
@@ -175,6 +202,33 @@ define i1 @test18(i16* %P, i32 %I) {
|
||||
; CHECK: %C = icmp slt i32 %I, 0
|
||||
}
|
||||
|
||||
; Smaller than pointer size
|
||||
define i1 @test18_i16(i16* %P, i16 %I) {
|
||||
; CHECK-LABEL: @test18_i16(
|
||||
; CHECK: %C = icmp slt i16 %I, 0
|
||||
%X = getelementptr inbounds i16* %P, i16 %I
|
||||
%C = icmp ult i16* %X, %P
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
; Same as pointer size
|
||||
define i1 @test18_i64(i16* %P, i64 %I) {
|
||||
; CHECK-LABEL: @test18_i64(
|
||||
; CHECK: %C = icmp slt i64 %I, 0
|
||||
%X = getelementptr inbounds i16* %P, i64 %I
|
||||
%C = icmp ult i16* %X, %P
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
; Larger than the pointer size
|
||||
define i1 @test18_i128(i16* %P, i128 %I) {
|
||||
; CHECK-LABEL: @test18_i128(
|
||||
; CHECK: %C = icmp slt i64 %1, 0
|
||||
%X = getelementptr inbounds i16* %P, i128 %I
|
||||
%C = icmp ult i16* %X, %P
|
||||
ret i1 %C
|
||||
}
|
||||
|
||||
define i32 @test19(i32* %P, i32 %A, i32 %B) {
|
||||
%tmp.4 = getelementptr inbounds i32* %P, i32 %A
|
||||
%tmp.9 = getelementptr inbounds i32* %P, i32 %B
|
||||
|
@@ -1,18 +1,45 @@
|
||||
; RUN: opt < %s -instcombine -S | FileCheck %s
|
||||
; RUN: opt -instcombine -S < %s | FileCheck -check-prefix=NODL %s
|
||||
; RUN: opt -instcombine -S -default-data-layout="p:32:32:32-n8:16:32:64" < %s | FileCheck -check-prefix=P32 %s
|
||||
|
||||
@G16 = internal constant [10 x i16] [i16 35, i16 82, i16 69, i16 81, i16 85,
|
||||
i16 73, i16 82, i16 69, i16 68, i16 0]
|
||||
@GD = internal constant [6 x double]
|
||||
[double -10.0, double 1.0, double 4.0, double 2.0, double -20.0, double -40.0]
|
||||
|
||||
%Foo = type { i32, i32, i32, i32 }
|
||||
|
||||
@GS = internal constant %Foo { i32 1, i32 4, i32 9, i32 14 }
|
||||
|
||||
@GStructArr = internal constant [4 x %Foo] [ %Foo { i32 1, i32 4, i32 9, i32 14 },
|
||||
%Foo { i32 5, i32 4, i32 6, i32 11 },
|
||||
%Foo { i32 6, i32 5, i32 9, i32 20 },
|
||||
%Foo { i32 12, i32 3, i32 9, i32 8 } ]
|
||||
|
||||
|
||||
define i1 @test1(i32 %X) {
|
||||
%P = getelementptr inbounds [10 x i16]* @G16, i32 0, i32 %X
|
||||
%Q = load i16* %P
|
||||
%R = icmp eq i16 %Q, 0
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test1(
|
||||
; CHECK-NEXT: %R = icmp eq i32 %X, 9
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test1(
|
||||
; NODL-NEXT: %R = icmp eq i32 %X, 9
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test1(
|
||||
; P32-NEXT: %R = icmp eq i32 %X, 9
|
||||
; P32-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test1_noinbounds(i32 %X) {
|
||||
%P = getelementptr [10 x i16]* @G16, i32 0, i32 %X
|
||||
%Q = load i16* %P
|
||||
%R = icmp eq i16 %Q, 0
|
||||
ret i1 %R
|
||||
; NODL-LABEL: @test1_noinbounds(
|
||||
; NODL-NEXT: %P = getelementptr [10 x i16]* @G16, i32 0, i32 %X
|
||||
|
||||
; P32-LABEL: @test1_noinbounds(
|
||||
; P32-NEXT: %P = getelementptr [10 x i16]* @G16, i32 0, i32 %X
|
||||
}
|
||||
|
||||
define i1 @test2(i32 %X) {
|
||||
@@ -20,9 +47,9 @@ define i1 @test2(i32 %X) {
|
||||
%Q = load i16* %P
|
||||
%R = icmp slt i16 %Q, 85
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test2(
|
||||
; CHECK-NEXT: %R = icmp ne i32 %X, 4
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test2(
|
||||
; NODL-NEXT: %R = icmp ne i32 %X, 4
|
||||
; NODL-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test3(i32 %X) {
|
||||
@@ -30,9 +57,14 @@ define i1 @test3(i32 %X) {
|
||||
%Q = load double* %P
|
||||
%R = fcmp oeq double %Q, 1.0
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test3(
|
||||
; CHECK-NEXT: %R = icmp eq i32 %X, 1
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test3(
|
||||
; NODL-NEXT: %R = icmp eq i32 %X, 1
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test3(
|
||||
; P32-NEXT: %R = icmp eq i32 %X, 1
|
||||
; P32-NEXT: ret i1 %R
|
||||
|
||||
}
|
||||
|
||||
define i1 @test4(i32 %X) {
|
||||
@@ -40,11 +72,17 @@ define i1 @test4(i32 %X) {
|
||||
%Q = load i16* %P
|
||||
%R = icmp sle i16 %Q, 73
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test4(
|
||||
; CHECK-NEXT: lshr i32 933, %X
|
||||
; CHECK-NEXT: and i32 {{.*}}, 1
|
||||
; CHECK-NEXT: %R = icmp ne i32 {{.*}}, 0
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test4(
|
||||
; NODL-NEXT: lshr i32 933, %X
|
||||
; NODL-NEXT: and i32 {{.*}}, 1
|
||||
; NODL-NEXT: %R = icmp ne i32 {{.*}}, 0
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test4(
|
||||
; P32-NEXT: lshr i32 933, %X
|
||||
; P32-NEXT: and i32 {{.*}}, 1
|
||||
; P32-NEXT: %R = icmp ne i32 {{.*}}, 0
|
||||
; P32-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test4_i16(i16 %X) {
|
||||
@@ -52,11 +90,19 @@ define i1 @test4_i16(i16 %X) {
|
||||
%Q = load i16* %P
|
||||
%R = icmp sle i16 %Q, 73
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test4_i16(
|
||||
; CHECK-NEXT: lshr i16 933, %X
|
||||
; CHECK-NEXT: and i16 {{.*}}, 1
|
||||
; CHECK-NEXT: %R = icmp ne i16 {{.*}}, 0
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
|
||||
; NODL-LABEL: @test4_i16(
|
||||
; NODL-NEXT: lshr i16 933, %X
|
||||
; NODL-NEXT: and i16 {{.*}}, 1
|
||||
; NODL-NEXT: %R = icmp ne i16 {{.*}}, 0
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test4_i16(
|
||||
; P32-NEXT: sext i16 %X to i32
|
||||
; P32-NEXT: lshr i32 933, %1
|
||||
; P32-NEXT: and i32 {{.*}}, 1
|
||||
; P32-NEXT: %R = icmp ne i32 {{.*}}, 0
|
||||
; P32-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test5(i32 %X) {
|
||||
@@ -64,11 +110,17 @@ define i1 @test5(i32 %X) {
|
||||
%Q = load i16* %P
|
||||
%R = icmp eq i16 %Q, 69
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test5(
|
||||
; CHECK-NEXT: icmp eq i32 %X, 2
|
||||
; CHECK-NEXT: icmp eq i32 %X, 7
|
||||
; CHECK-NEXT: %R = or i1
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test5(
|
||||
; NODL-NEXT: icmp eq i32 %X, 2
|
||||
; NODL-NEXT: icmp eq i32 %X, 7
|
||||
; NODL-NEXT: %R = or i1
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test5(
|
||||
; P32-NEXT: icmp eq i32 %X, 2
|
||||
; P32-NEXT: icmp eq i32 %X, 7
|
||||
; P32-NEXT: %R = or i1
|
||||
; P32-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test6(i32 %X) {
|
||||
@@ -76,10 +128,15 @@ define i1 @test6(i32 %X) {
|
||||
%Q = load double* %P
|
||||
%R = fcmp ogt double %Q, 0.0
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test6(
|
||||
; CHECK-NEXT: add i32 %X, -1
|
||||
; CHECK-NEXT: %R = icmp ult i32 {{.*}}, 3
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test6(
|
||||
; NODL-NEXT: add i32 %X, -1
|
||||
; NODL-NEXT: %R = icmp ult i32 {{.*}}, 3
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test6(
|
||||
; P32-NEXT: add i32 %X, -1
|
||||
; P32-NEXT: %R = icmp ult i32 {{.*}}, 3
|
||||
; P32-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test7(i32 %X) {
|
||||
@@ -87,10 +144,15 @@ define i1 @test7(i32 %X) {
|
||||
%Q = load double* %P
|
||||
%R = fcmp olt double %Q, 0.0
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test7(
|
||||
; CHECK-NEXT: add i32 %X, -1
|
||||
; CHECK-NEXT: %R = icmp ugt i32 {{.*}}, 2
|
||||
; CHECK-NEXT: ret i1 %R
|
||||
; NODL-LABEL: @test7(
|
||||
; NODL-NEXT: add i32 %X, -1
|
||||
; NODL-NEXT: %R = icmp ugt i32 {{.*}}, 2
|
||||
; NODL-NEXT: ret i1 %R
|
||||
|
||||
; P32-LABEL: @test7(
|
||||
; P32-NEXT: add i32 %X, -1
|
||||
; P32-NEXT: %R = icmp ugt i32 {{.*}}, 2
|
||||
; P32-NEXT: ret i1 %R
|
||||
}
|
||||
|
||||
define i1 @test8(i32 %X) {
|
||||
@@ -99,10 +161,15 @@ define i1 @test8(i32 %X) {
|
||||
%R = and i16 %Q, 3
|
||||
%S = icmp eq i16 %R, 0
|
||||
ret i1 %S
|
||||
; CHECK-LABEL: @test8(
|
||||
; CHECK-NEXT: and i32 %X, -2
|
||||
; CHECK-NEXT: icmp eq i32 {{.*}}, 8
|
||||
; CHECK-NEXT: ret i1
|
||||
; NODL-LABEL: @test8(
|
||||
; NODL-NEXT: and i32 %X, -2
|
||||
; NODL-NEXT: icmp eq i32 {{.*}}, 8
|
||||
; NODL-NEXT: ret i1
|
||||
|
||||
; P32-LABEL: @test8(
|
||||
; P32-NEXT: and i32 %X, -2
|
||||
; P32-NEXT: icmp eq i32 {{.*}}, 8
|
||||
; P32-NEXT: ret i1
|
||||
}
|
||||
|
||||
@GA = internal constant [4 x { i32, i32 } ] [
|
||||
@@ -117,8 +184,111 @@ define i1 @test9(i32 %X) {
|
||||
%Q = load i32* %P
|
||||
%R = icmp eq i32 %Q, 1
|
||||
ret i1 %R
|
||||
; CHECK-LABEL: @test9(
|
||||
; CHECK-NEXT: add i32 %X, -1
|
||||
; CHECK-NEXT: icmp ult i32 {{.*}}, 2
|
||||
; CHECK-NEXT: ret i1
|
||||
; NODL-LABEL: @test9(
|
||||
; NODL-NEXT: add i32 %X, -1
|
||||
; NODL-NEXT: icmp ult i32 {{.*}}, 2
|
||||
; NODL-NEXT: ret i1
|
||||
|
||||
; P32-LABEL: @test9(
|
||||
; P32-NEXT: add i32 %X, -1
|
||||
; P32-NEXT: icmp ult i32 {{.*}}, 2
|
||||
; P32-NEXT: ret i1
|
||||
}
|
||||
|
||||
define i1 @test10_struct(i32 %x) {
|
||||
; NODL-LABEL: @test10_struct(
|
||||
; NODL: getelementptr inbounds %Foo* @GS, i32 %x, i32 0
|
||||
|
||||
; P32-LABEL: @test10_struct(
|
||||
; P32: getelementptr inbounds %Foo* @GS, i32 %x, i32 0
|
||||
%p = getelementptr inbounds %Foo* @GS, i32 %x, i32 0
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 9
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
define i1 @test10_struct_noinbounds(i32 %x) {
|
||||
; NODL-LABEL: @test10_struct_noinbounds(
|
||||
; NODL: getelementptr %Foo* @GS, i32 %x, i32 0
|
||||
|
||||
; P32-LABEL: @test10_struct_noinbounds(
|
||||
; P32: getelementptr %Foo* @GS, i32 %x, i32 0
|
||||
%p = getelementptr %Foo* @GS, i32 %x, i32 0
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 9
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
; Test that the GEP indices are converted before we ever get here
|
||||
; Index < ptr size
|
||||
define i1 @test10_struct_i16(i16 %x){
|
||||
; NODL-LABEL: @test10_struct_i16(
|
||||
; NODL: getelementptr inbounds %Foo* @GS, i16 %x, i32 0
|
||||
|
||||
; P32-LABEL: @test10_struct_i16(
|
||||
; P32: %1 = sext i16 %x to i32
|
||||
; P32: getelementptr inbounds %Foo* @GS, i32 %1, i32 0
|
||||
%p = getelementptr inbounds %Foo* @GS, i16 %x, i32 0
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 0
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
; Test that the GEP indices are converted before we ever get here
|
||||
; Index > ptr size
|
||||
define i1 @test10_struct_i64(i64 %x){
|
||||
; NODL-LABEL: @test10_struct_i64(
|
||||
; NODL: getelementptr inbounds %Foo* @GS, i64 %x, i32 0
|
||||
|
||||
; P32-LABEL: @test10_struct_i64(
|
||||
; P32: %1 = trunc i64 %x to i32
|
||||
; P32: getelementptr inbounds %Foo* @GS, i32 %1, i32 0
|
||||
%p = getelementptr inbounds %Foo* @GS, i64 %x, i32 0
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 0
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
define i1 @test10_struct_arr(i32 %x) {
|
||||
; NODL-LABEL: @test10_struct_arr(
|
||||
; NODL-NEXT: %r = icmp ne i32 %x, 1
|
||||
; NODL-NEXT: ret i1 %r
|
||||
|
||||
; P32-LABEL: @test10_struct_arr(
|
||||
; P32-NEXT: %r = icmp ne i32 %x, 1
|
||||
; P32-NEXT: ret i1 %r
|
||||
%p = getelementptr inbounds [4 x %Foo]* @GStructArr, i32 0, i32 %x, i32 2
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 9
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
define i1 @test10_struct_arr_i16(i16 %x) {
|
||||
; NODL-LABEL: @test10_struct_arr_i16(
|
||||
; NODL-NEXT: %r = icmp ne i16 %x, 1
|
||||
; NODL-NEXT: ret i1 %r
|
||||
|
||||
; P32-LABEL: @test10_struct_arr_i16(
|
||||
; P32-NEXT: %r = icmp ne i16 %x, 1
|
||||
; P32-NEXT: ret i1 %r
|
||||
%p = getelementptr inbounds [4 x %Foo]* @GStructArr, i16 0, i16 %x, i32 2
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 9
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
define i1 @test10_struct_arr_i64(i64 %x) {
|
||||
; NODL-LABEL: @test10_struct_arr_i64(
|
||||
; NODL-NEXT: %r = icmp ne i64 %x, 1
|
||||
; NODL-NEXT: ret i1 %r
|
||||
|
||||
; P32-LABEL: @test10_struct_arr_i64(
|
||||
; P32-NEXT: trunc i64 %x to i32
|
||||
; P32-NEXT: %r = icmp ne i32 %1, 1
|
||||
; P32-NEXT: ret i1 %r
|
||||
%p = getelementptr inbounds [4 x %Foo]* @GStructArr, i64 0, i64 %x, i32 2
|
||||
%q = load i32* %p
|
||||
%r = icmp eq i32 %q, 9
|
||||
ret i1 %r
|
||||
}
|
||||
|
||||
|
Reference in New Issue
Block a user