diff --git a/test/CodeGen/X86/2006-05-11-InstrSched.ll b/test/CodeGen/X86/2006-05-11-InstrSched.ll index e9241420047..a7e060945bc 100644 --- a/test/CodeGen/X86/2006-05-11-InstrSched.ll +++ b/test/CodeGen/X86/2006-05-11-InstrSched.ll @@ -1,54 +1,55 @@ -; RUN: llvm-upgrade < %s | llvm-as | llc -march=x86 -mattr=+sse2 -stats 2>&1 |\ -; RUN: grep 'asm-printer' | grep 39 +; RUN: llvm-as < %s | llc -march=x86 -mattr=+sse2 -stats 2>&1 |\ +; RUN: grep 'asm-printer' | grep 37 target datalayout = "e-p:32:32" -void %foo(int* %mc, int* %bp, int* %ms, int* %xmb, int* %mpp, int* %tpmm, int* %ip, int* %tpim, int* %dpp, int* %tpdm, int* %bpi, int %M) { +define void @foo(i32* %mc, i32* %bp, i32* %ms, i32* %xmb, i32* %mpp, i32* %tpmm, i32* %ip, i32* %tpim, i32* %dpp, i32* %tpdm, i32* %bpi, i32 %M) { entry: - %tmp9 = setlt int %M, 5 ; [#uses=1] - br bool %tmp9, label %return, label %cond_true + %tmp9 = icmp slt i32 %M, 5 ; [#uses=1] + br i1 %tmp9, label %return, label %cond_true cond_true: ; preds = %cond_true, %entry - %indvar = phi uint [ 0, %entry ], [ %indvar.next, %cond_true ] ; [#uses=2] - %tmp. = shl uint %indvar, ubyte 2 ; [#uses=1] - %tmp.10 = add uint %tmp., 1 ; [#uses=2] - %k.0.0 = cast uint %tmp.10 to int ; [#uses=2] - %tmp31 = add int %k.0.0, -1 ; [#uses=4] - %tmp32 = getelementptr int* %mpp, int %tmp31 ; [#uses=1] - %tmp34 = cast int* %tmp32 to sbyte* ; [#uses=1] - %tmp = tail call <16 x sbyte> %llvm.x86.sse2.loadu.dq( sbyte* %tmp34 ) ; <<16 x sbyte>> [#uses=1] - %tmp42 = getelementptr int* %tpmm, int %tmp31 ; [#uses=1] - %tmp42 = cast int* %tmp42 to <4 x int>* ; <<4 x int>*> [#uses=1] - %tmp46 = load <4 x int>* %tmp42 ; <<4 x int>> [#uses=1] - %tmp54 = cast <16 x sbyte> %tmp to <4 x int> ; <<4 x int>> [#uses=1] - %tmp55 = add <4 x int> %tmp54, %tmp46 ; <<4 x int>> [#uses=2] - %tmp55 = cast <4 x int> %tmp55 to <2 x long> ; <<2 x long>> [#uses=1] - %tmp62 = getelementptr int* %ip, int %tmp31 ; [#uses=1] - %tmp65 = cast int* %tmp62 to sbyte* ; [#uses=1] - %tmp66 = tail call <16 x sbyte> %llvm.x86.sse2.loadu.dq( sbyte* %tmp65 ) ; <<16 x sbyte>> [#uses=1] - %tmp73 = getelementptr int* %tpim, int %tmp31 ; [#uses=1] - %tmp73 = cast int* %tmp73 to <4 x int>* ; <<4 x int>*> [#uses=1] - %tmp77 = load <4 x int>* %tmp73 ; <<4 x int>> [#uses=1] - %tmp87 = cast <16 x sbyte> %tmp66 to <4 x int> ; <<4 x int>> [#uses=1] - %tmp88 = add <4 x int> %tmp87, %tmp77 ; <<4 x int>> [#uses=2] - %tmp88 = cast <4 x int> %tmp88 to <2 x long> ; <<2 x long>> [#uses=1] - %tmp99 = tail call <4 x int> %llvm.x86.sse2.pcmpgt.d( <4 x int> %tmp88, <4 x int> %tmp55 ) ; <<4 x int>> [#uses=1] - %tmp99 = cast <4 x int> %tmp99 to <2 x long> ; <<2 x long>> [#uses=2] - %tmp110 = xor <2 x long> %tmp99, < long -1, long -1 > ; <<2 x long>> [#uses=1] - %tmp111 = and <2 x long> %tmp110, %tmp55 ; <<2 x long>> [#uses=1] - %tmp121 = and <2 x long> %tmp99, %tmp88 ; <<2 x long>> [#uses=1] - %tmp131 = or <2 x long> %tmp121, %tmp111 ; <<2 x long>> [#uses=1] - %tmp137 = getelementptr int* %mc, uint %tmp.10 ; [#uses=1] - %tmp137 = cast int* %tmp137 to <2 x long>* ; <<2 x long>*> [#uses=1] - store <2 x long> %tmp131, <2 x long>* %tmp137 - %tmp147 = add int %k.0.0, 8 ; [#uses=1] - %tmp = setgt int %tmp147, %M ; [#uses=1] - %indvar.next = add uint %indvar, 1 ; [#uses=1] - br bool %tmp, label %return, label %cond_true + %indvar = phi i32 [ 0, %entry ], [ %indvar.next, %cond_true ] ; [#uses=2] + %tmp. = shl i32 %indvar, 2 ; [#uses=1] + %tmp.10 = add i32 %tmp., 1 ; [#uses=2] + %k.0.0 = bitcast i32 %tmp.10 to i32 ; [#uses=2] + %tmp31 = add i32 %k.0.0, -1 ; [#uses=4] + %tmp32 = getelementptr i32* %mpp, i32 %tmp31 ; [#uses=1] + %tmp34 = bitcast i32* %tmp32 to i8* ; [#uses=1] + %tmp = tail call <16 x i8> @llvm.x86.sse2.loadu.dq( i8* %tmp34 ) ; <<16 x i8>> [#uses=1] + %tmp42 = getelementptr i32* %tpmm, i32 %tmp31 ; [#uses=1] + %tmp42.upgrd.1 = bitcast i32* %tmp42 to <4 x i32>* ; <<4 x i32>*> [#uses=1] + %tmp46 = load <4 x i32>* %tmp42.upgrd.1 ; <<4 x i32>> [#uses=1] + %tmp54 = bitcast <16 x i8> %tmp to <4 x i32> ; <<4 x i32>> [#uses=1] + %tmp55 = add <4 x i32> %tmp54, %tmp46 ; <<4 x i32>> [#uses=2] + %tmp55.upgrd.2 = bitcast <4 x i32> %tmp55 to <2 x i64> ; <<2 x i64>> [#uses=1] + %tmp62 = getelementptr i32* %ip, i32 %tmp31 ; [#uses=1] + %tmp65 = bitcast i32* %tmp62 to i8* ; [#uses=1] + %tmp66 = tail call <16 x i8> @llvm.x86.sse2.loadu.dq( i8* %tmp65 ) ; <<16 x i8>> [#uses=1] + %tmp73 = getelementptr i32* %tpim, i32 %tmp31 ; [#uses=1] + %tmp73.upgrd.3 = bitcast i32* %tmp73 to <4 x i32>* ; <<4 x i32>*> [#uses=1] + %tmp77 = load <4 x i32>* %tmp73.upgrd.3 ; <<4 x i32>> [#uses=1] + %tmp87 = bitcast <16 x i8> %tmp66 to <4 x i32> ; <<4 x i32>> [#uses=1] + %tmp88 = add <4 x i32> %tmp87, %tmp77 ; <<4 x i32>> [#uses=2] + %tmp88.upgrd.4 = bitcast <4 x i32> %tmp88 to <2 x i64> ; <<2 x i64>> [#uses=1] + %tmp99 = tail call <4 x i32> @llvm.x86.sse2.pcmpgt.d( <4 x i32> %tmp88, <4 x i32> %tmp55 ) ; <<4 x i32>> [#uses=1] + %tmp99.upgrd.5 = bitcast <4 x i32> %tmp99 to <2 x i64> ; <<2 x i64>> [#uses=2] + %tmp110 = xor <2 x i64> %tmp99.upgrd.5, < i64 -1, i64 -1 > ; <<2 x i64>> [#uses=1] + %tmp111 = and <2 x i64> %tmp110, %tmp55.upgrd.2 ; <<2 x i64>> [#uses=1] + %tmp121 = and <2 x i64> %tmp99.upgrd.5, %tmp88.upgrd.4 ; <<2 x i64>> [#uses=1] + %tmp131 = or <2 x i64> %tmp121, %tmp111 ; <<2 x i64>> [#uses=1] + %gep.upgrd.6 = zext i32 %tmp.10 to i64 ; [#uses=1] + %tmp137 = getelementptr i32* %mc, i64 %gep.upgrd.6 ; [#uses=1] + %tmp137.upgrd.7 = bitcast i32* %tmp137 to <2 x i64>* ; <<2 x i64>*> [#uses=1] + store <2 x i64> %tmp131, <2 x i64>* %tmp137.upgrd.7 + %tmp147 = add i32 %k.0.0, 8 ; [#uses=1] + %tmp.upgrd.8 = icmp sgt i32 %tmp147, %M ; [#uses=1] + %indvar.next = add i32 %indvar, 1 ; [#uses=1] + br i1 %tmp.upgrd.8, label %return, label %cond_true return: ; preds = %cond_true, %entry ret void } -declare <16 x sbyte> %llvm.x86.sse2.loadu.dq(sbyte*) +declare <16 x i8> @llvm.x86.sse2.loadu.dq(i8*) -declare <4 x int> %llvm.x86.sse2.pcmpgt.d(<4 x int>, <4 x int>) +declare <4 x i32> @llvm.x86.sse2.pcmpgt.d(<4 x i32>, <4 x i32>)