2011-02-10 23:38:10 +00:00
|
|
|
; RUN: opt < %s -loop-simplify -loop-rotate -instcombine -indvars -S -verify-loop-info -verify-dom-info > %t
|
2009-06-27 21:30:38 +00:00
|
|
|
; RUN: not grep sext %t
|
Convert all tests using TCL-style quoting to use shell-style quoting.
This was done through the aid of a terrible Perl creation. I will not
paste any of the horrors here. Suffice to say, it required multiple
staged rounds of replacements, state carried between, and a few
nested-construct-parsing hacks that I'm not proud of. It happens, by
luck, to be able to deal with all the TCL-quoting patterns in evidence
in the LLVM test suite.
If anyone is maintaining large out-of-tree test trees, feel free to poke
me and I'll send you the steps I used to convert things, as well as
answer any painful questions etc. IRC works best for this type of thing
I find.
Once converted, switch the LLVM lit config to use ShTests the same as
Clang. In addition to being able to delete large amounts of Python code
from 'lit', this will also simplify the entire test suite and some of
lit's architecture.
Finally, the test suite runs 33% faster on Linux now. ;]
For my 16-hardware-thread (2x 4-core xeon e5520): 36s -> 24s
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@159525 91177308-0d34-0410-b5e6-96231b3b80d8
2012-07-02 12:47:22 +00:00
|
|
|
; RUN: grep "phi i64" %t | count 1
|
2009-06-27 21:30:38 +00:00
|
|
|
|
|
|
|
; Loopsimplify should be able to merge the two loop exits
|
|
|
|
; into one, so that loop rotate can rotate the loop, so
|
|
|
|
; that indvars can promote the induction variable to i64
|
|
|
|
; without needing casts.
|
|
|
|
|
2011-10-12 22:24:17 +00:00
|
|
|
; Data layout: little-endian ("e"), 64-bit pointers ("p:64:64:64"), and native
; integer widths of 32 and 64 bits ("n32:64").
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n32:64"
|
2009-06-27 21:30:38 +00:00
|
|
|
|
|
|
|
; @t: a loop with an i32 counter (%hiPart.0) and two exits that both branch to
; %bb3. The counter is sign-extended to i64 twice per iteration to index the
; %pTmp1 and %peakWeight arrays. The RUN lines check that after the pass
; pipeline no sext remains and exactly one "phi i64" is present.
define float @t(float* %pTmp1, float* %peakWeight, i32 %bandEdgeIndex) nounwind {
|
|
|
|
entry:
|
|
|
|
; Initial value of the %peakCount.0 accumulator is peakWeight[0].
%t0 = load float* %peakWeight, align 4 ; <float> [#uses=1]
|
|
|
|
br label %bb1
|
|
|
|
|
|
|
|
; Loop body / latch: reached only from %bb2, branches back to header %bb1.
bb: ; preds = %bb2
|
|
|
|
; First sign extension of the i32 counter (the test expects it to disappear).
%t1 = sext i32 %hiPart.0 to i64 ; <i64> [#uses=1]
|
|
|
|
%t2 = getelementptr float* %pTmp1, i64 %t1 ; <float*> [#uses=1]
|
|
|
|
%t3 = load float* %t2, align 4 ; <float> [#uses=1]
|
|
|
|
; distERBhi += pTmp1[hiPart]
%t4 = fadd float %t3, %distERBhi.0 ; <float> [#uses=1]
|
|
|
|
; Increment of the i32 counter; feeds both the header phi and the sext below.
%t5 = add i32 %hiPart.0, 1 ; <i32> [#uses=2]
|
|
|
|
; Second sign extension, this time of the incremented counter.
%t6 = sext i32 %t5 to i64 ; <i64> [#uses=1]
|
|
|
|
%t7 = getelementptr float* %peakWeight, i64 %t6 ; <float*> [#uses=1]
|
|
|
|
%t8 = load float* %t7, align 4 ; <float> [#uses=1]
|
|
|
|
; peakCount += peakWeight[hiPart + 1]
%t9 = fadd float %t8, %peakCount.0 ; <float> [#uses=1]
|
|
|
|
br label %bb1
|
|
|
|
|
|
|
|
; Loop header: merges the values from %entry with those produced by %bb.
bb1: ; preds = %bb, %entry
|
|
|
|
%peakCount.0 = phi float [ %t0, %entry ], [ %t9, %bb ] ; <float> [#uses=2]
|
|
|
|
; i32 counter, starting at 0 and advanced by 1 per iteration via %t5.
%hiPart.0 = phi i32 [ 0, %entry ], [ %t5, %bb ] ; <i32> [#uses=3]
|
|
|
|
%distERBhi.0 = phi float [ 0.000000e+00, %entry ], [ %t4, %bb ] ; <float> [#uses=3]
|
|
|
|
; First loop exit: leave when distERBhi >= 2.5 or the comparison is unordered
; (fcmp uge is also true when an operand is NaN).
%t10 = fcmp uge float %distERBhi.0, 2.500000e+00 ; <i1> [#uses=1]
|
|
|
|
br i1 %t10, label %bb3, label %bb2
|
|
|
|
|
|
|
|
; Second loop exit test: continue only while bandEdgeIndex - 1 > hiPart (signed).
bb2: ; preds = %bb1
|
|
|
|
%t11 = add i32 %bandEdgeIndex, -1 ; <i32> [#uses=1]
|
|
|
|
%t12 = icmp sgt i32 %t11, %hiPart.0 ; <i1> [#uses=1]
|
|
|
|
br i1 %t12, label %bb, label %bb3
|
|
|
|
|
|
|
|
; Common exit block shared by both loop exits; returns peakCount / distERBhi.
bb3: ; preds = %bb2, %bb1
|
|
|
|
%t13 = fdiv float %peakCount.0, %distERBhi.0 ; <float> [#uses=1]
|
|
|
|
ret float %t13
|
|
|
|
}
|