mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-16 11:30:51 +00:00
26e46f2283
Summary: When computing branch weights in BPI, we used to disallow branches with weight 0. This is a minor nuisance, because a branch with weight 0 is different to "don't have information". In the context of instrumentation, it may mean "never executed", in the context of sampling, it means "never or seldom executed". In allowing 0 weight branches, I ran into issues with the switch expansion code in selection DAG. It is currently hardwired to not handle branches with weight 0. To maintain the current behaviour, I changed it to use 1 when it finds 0, but perhaps the algorithm needs changes to tolerate branches with weight zero. Reviewers: hansw Subscribers: llvm-commits Differential Revision: http://reviews.llvm.org/D9533 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@236617 91177308-0d34-0410-b5e6-96231b3b80d8
244 lines
10 KiB
LLVM
244 lines
10 KiB
LLVM
; RUN: opt < %s -sample-profile -sample-profile-file=%S/Inputs/propagate.prof | opt -analyze -branch-prob | FileCheck %s
|
|
|
|
; Original C++ code for this test case:
|
|
;
|
|
; #include <stdio.h>
|
|
;
|
|
; long foo(int x, int y, long N) {
|
|
; if (x < y) {
|
|
; return y - x;
|
|
; } else {
|
|
; for (long i = 0; i < N; i++) {
|
|
; if (i > N / 3)
|
|
; x--;
|
|
; if (i > N / 4) {
|
|
; y++;
|
|
; x += 3;
|
|
; } else {
|
|
; for (unsigned j = 0; j < i; j++) {
|
|
; x += j;
|
|
; y -= 3;
|
|
; }
|
|
; }
|
|
; }
|
|
; }
|
|
; return y * x;
|
|
; }
|
|
;
|
|
; int main() {
|
|
; int x = 5678;
|
|
; int y = 1234;
|
|
; long N = 999999;
|
|
; printf("foo(%d, %d, %ld) = %ld\n", x, y, N, foo(x, y, N));
|
|
; return 0;
|
|
; }
|
|
|
|
; ModuleID = 'propagate.cc'
|
|
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
|
|
target triple = "x86_64-unknown-linux-gnu"
|
|
|
|
@.str = private unnamed_addr constant [24 x i8] c"foo(%d, %d, %ld) = %ld\0A\00", align 1
|
|
|
|
; Function Attrs: nounwind uwtable
|
|
define i64 @_Z3fooiil(i32 %x, i32 %y, i64 %N) #0 {
|
|
entry:
|
|
%retval = alloca i64, align 8
|
|
%x.addr = alloca i32, align 4
|
|
%y.addr = alloca i32, align 4
|
|
%N.addr = alloca i64, align 8
|
|
%i = alloca i64, align 8
|
|
%j = alloca i32, align 4
|
|
store i32 %x, i32* %x.addr, align 4
|
|
store i32 %y, i32* %y.addr, align 4
|
|
store i64 %N, i64* %N.addr, align 8
|
|
%0 = load i32, i32* %x.addr, align 4, !dbg !11
|
|
%1 = load i32, i32* %y.addr, align 4, !dbg !11
|
|
%cmp = icmp slt i32 %0, %1, !dbg !11
|
|
br i1 %cmp, label %if.then, label %if.else, !dbg !11
|
|
|
|
if.then: ; preds = %entry
|
|
%2 = load i32, i32* %y.addr, align 4, !dbg !13
|
|
%3 = load i32, i32* %x.addr, align 4, !dbg !13
|
|
%sub = sub nsw i32 %2, %3, !dbg !13
|
|
%conv = sext i32 %sub to i64, !dbg !13
|
|
store i64 %conv, i64* %retval, !dbg !13
|
|
br label %return, !dbg !13
|
|
|
|
if.else: ; preds = %entry
|
|
store i64 0, i64* %i, align 8, !dbg !15
|
|
br label %for.cond, !dbg !15
|
|
|
|
for.cond: ; preds = %for.inc16, %if.else
|
|
%4 = load i64, i64* %i, align 8, !dbg !15
|
|
%5 = load i64, i64* %N.addr, align 8, !dbg !15
|
|
%cmp1 = icmp slt i64 %4, %5, !dbg !15
|
|
br i1 %cmp1, label %for.body, label %for.end18, !dbg !15
|
|
; CHECK: edge for.cond -> for.body probability is 10 / 10 = 100% [HOT edge]
|
|
; CHECK: edge for.cond -> for.end18 probability is 0 / 10 = 0%
|
|
|
|
for.body: ; preds = %for.cond
|
|
%6 = load i64, i64* %i, align 8, !dbg !18
|
|
%7 = load i64, i64* %N.addr, align 8, !dbg !18
|
|
%div = sdiv i64 %7, 3, !dbg !18
|
|
%cmp2 = icmp sgt i64 %6, %div, !dbg !18
|
|
br i1 %cmp2, label %if.then3, label %if.end, !dbg !18
|
|
; CHECK: edge for.body -> if.then3 probability is 1 / 5 = 20%
|
|
; CHECK: edge for.body -> if.end probability is 4 / 5 = 80%
|
|
|
|
if.then3: ; preds = %for.body
|
|
%8 = load i32, i32* %x.addr, align 4, !dbg !21
|
|
%dec = add nsw i32 %8, -1, !dbg !21
|
|
store i32 %dec, i32* %x.addr, align 4, !dbg !21
|
|
br label %if.end, !dbg !21
|
|
|
|
if.end: ; preds = %if.then3, %for.body
|
|
%9 = load i64, i64* %i, align 8, !dbg !22
|
|
%10 = load i64, i64* %N.addr, align 8, !dbg !22
|
|
%div4 = sdiv i64 %10, 4, !dbg !22
|
|
%cmp5 = icmp sgt i64 %9, %div4, !dbg !22
|
|
br i1 %cmp5, label %if.then6, label %if.else7, !dbg !22
|
|
; CHECK: edge if.end -> if.then6 probability is 3 / 6342 = 0.0473037%
|
|
; CHECK: edge if.end -> if.else7 probability is 6339 / 6342 = 99.9527% [HOT edge]
|
|
|
|
if.then6: ; preds = %if.end
|
|
%11 = load i32, i32* %y.addr, align 4, !dbg !24
|
|
%inc = add nsw i32 %11, 1, !dbg !24
|
|
store i32 %inc, i32* %y.addr, align 4, !dbg !24
|
|
%12 = load i32, i32* %x.addr, align 4, !dbg !26
|
|
%add = add nsw i32 %12, 3, !dbg !26
|
|
store i32 %add, i32* %x.addr, align 4, !dbg !26
|
|
br label %if.end15, !dbg !27
|
|
|
|
if.else7: ; preds = %if.end
|
|
store i32 0, i32* %j, align 4, !dbg !28
|
|
br label %for.cond8, !dbg !28
|
|
|
|
for.cond8: ; preds = %for.inc, %if.else7
|
|
%13 = load i32, i32* %j, align 4, !dbg !28
|
|
%conv9 = zext i32 %13 to i64, !dbg !28
|
|
%14 = load i64, i64* %i, align 8, !dbg !28
|
|
%cmp10 = icmp slt i64 %conv9, %14, !dbg !28
|
|
br i1 %cmp10, label %for.body11, label %for.end, !dbg !28
|
|
; CHECK: edge for.cond8 -> for.body11 probability is 16191 / 16191 = 100% [HOT edge]
|
|
; CHECK: edge for.cond8 -> for.end probability is 0 / 16191 = 0%
|
|
|
|
for.body11: ; preds = %for.cond8
|
|
%15 = load i32, i32* %j, align 4, !dbg !31
|
|
%16 = load i32, i32* %x.addr, align 4, !dbg !31
|
|
%add12 = add i32 %16, %15, !dbg !31
|
|
store i32 %add12, i32* %x.addr, align 4, !dbg !31
|
|
%17 = load i32, i32* %y.addr, align 4, !dbg !33
|
|
%sub13 = sub nsw i32 %17, 3, !dbg !33
|
|
store i32 %sub13, i32* %y.addr, align 4, !dbg !33
|
|
br label %for.inc, !dbg !34
|
|
|
|
for.inc: ; preds = %for.body11
|
|
%18 = load i32, i32* %j, align 4, !dbg !28
|
|
%inc14 = add i32 %18, 1, !dbg !28
|
|
store i32 %inc14, i32* %j, align 4, !dbg !28
|
|
br label %for.cond8, !dbg !28
|
|
|
|
for.end: ; preds = %for.cond8
|
|
br label %if.end15
|
|
|
|
if.end15: ; preds = %for.end, %if.then6
|
|
br label %for.inc16, !dbg !35
|
|
|
|
for.inc16: ; preds = %if.end15
|
|
%19 = load i64, i64* %i, align 8, !dbg !15
|
|
%inc17 = add nsw i64 %19, 1, !dbg !15
|
|
store i64 %inc17, i64* %i, align 8, !dbg !15
|
|
br label %for.cond, !dbg !15
|
|
|
|
for.end18: ; preds = %for.cond
|
|
br label %if.end19
|
|
|
|
if.end19: ; preds = %for.end18
|
|
%20 = load i32, i32* %y.addr, align 4, !dbg !36
|
|
%21 = load i32, i32* %x.addr, align 4, !dbg !36
|
|
%mul = mul nsw i32 %20, %21, !dbg !36
|
|
%conv20 = sext i32 %mul to i64, !dbg !36
|
|
store i64 %conv20, i64* %retval, !dbg !36
|
|
br label %return, !dbg !36
|
|
|
|
return: ; preds = %if.end19, %if.then
|
|
%22 = load i64, i64* %retval, !dbg !37
|
|
ret i64 %22, !dbg !37
|
|
}
|
|
|
|
; Function Attrs: uwtable
|
|
define i32 @main() #1 {
|
|
entry:
|
|
%retval = alloca i32, align 4
|
|
%x = alloca i32, align 4
|
|
%y = alloca i32, align 4
|
|
%N = alloca i64, align 8
|
|
store i32 0, i32* %retval
|
|
store i32 5678, i32* %x, align 4, !dbg !38
|
|
store i32 1234, i32* %y, align 4, !dbg !39
|
|
store i64 999999, i64* %N, align 8, !dbg !40
|
|
%0 = load i32, i32* %x, align 4, !dbg !41
|
|
%1 = load i32, i32* %y, align 4, !dbg !41
|
|
%2 = load i64, i64* %N, align 8, !dbg !41
|
|
%3 = load i32, i32* %x, align 4, !dbg !41
|
|
%4 = load i32, i32* %y, align 4, !dbg !41
|
|
%5 = load i64, i64* %N, align 8, !dbg !41
|
|
%call = call i64 @_Z3fooiil(i32 %3, i32 %4, i64 %5), !dbg !41
|
|
%call1 = call i32 (i8*, ...) @printf(i8* getelementptr inbounds ([24 x i8], [24 x i8]* @.str, i32 0, i32 0), i32 %0, i32 %1, i64 %2, i64 %call), !dbg !41
|
|
ret i32 0, !dbg !42
|
|
}
|
|
|
|
declare i32 @printf(i8*, ...) #2
|
|
|
|
attributes #0 = { nounwind uwtable "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }
|
|
attributes #1 = { uwtable "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }
|
|
attributes #2 = { "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }
|
|
|
|
!llvm.dbg.cu = !{!0}
|
|
!llvm.module.flags = !{!8, !9}
|
|
!llvm.ident = !{!10}
|
|
|
|
!0 = !DICompileUnit(language: DW_LANG_C_plus_plus, producer: "clang version 3.5 ", isOptimized: false, emissionKind: 0, file: !1, enums: !2, retainedTypes: !2, subprograms: !3, globals: !2, imports: !2)
|
|
!1 = !DIFile(filename: "propagate.cc", directory: ".")
|
|
!2 = !{}
|
|
!3 = !{!4, !7}
|
|
!4 = !DISubprogram(name: "foo", line: 3, isLocal: false, isDefinition: true, virtualIndex: 6, flags: DIFlagPrototyped, isOptimized: false, scopeLine: 3, file: !1, scope: !5, type: !6, function: i64 (i32, i32, i64)* @_Z3fooiil, variables: !2)
|
|
!5 = !DIFile(filename: "propagate.cc", directory: ".")
|
|
!6 = !DISubroutineType(types: !{null})
|
|
!7 = !DISubprogram(name: "main", line: 24, isLocal: false, isDefinition: true, virtualIndex: 6, flags: DIFlagPrototyped, isOptimized: false, scopeLine: 24, file: !1, scope: !5, type: !6, function: i32 ()* @main, variables: !2)
|
|
!8 = !{i32 2, !"Dwarf Version", i32 4}
|
|
!9 = !{i32 1, !"Debug Info Version", i32 3}
|
|
!10 = !{!"clang version 3.5 "}
|
|
!11 = !DILocation(line: 4, scope: !12)
|
|
!12 = distinct !DILexicalBlock(line: 4, column: 0, file: !1, scope: !4)
|
|
!13 = !DILocation(line: 5, scope: !14)
|
|
!14 = distinct !DILexicalBlock(line: 4, column: 0, file: !1, scope: !12)
|
|
!15 = !DILocation(line: 7, scope: !16)
|
|
!16 = distinct !DILexicalBlock(line: 7, column: 0, file: !1, scope: !17)
|
|
!17 = distinct !DILexicalBlock(line: 6, column: 0, file: !1, scope: !12)
|
|
!18 = !DILocation(line: 8, scope: !19)
|
|
!19 = distinct !DILexicalBlock(line: 8, column: 0, file: !1, scope: !20)
|
|
!20 = distinct !DILexicalBlock(line: 7, column: 0, file: !1, scope: !16)
|
|
!21 = !DILocation(line: 9, scope: !19)
|
|
!22 = !DILocation(line: 10, scope: !23)
|
|
!23 = distinct !DILexicalBlock(line: 10, column: 0, file: !1, scope: !20)
|
|
!24 = !DILocation(line: 11, scope: !25)
|
|
!25 = distinct !DILexicalBlock(line: 10, column: 0, file: !1, scope: !23)
|
|
!26 = !DILocation(line: 12, scope: !25)
|
|
!27 = !DILocation(line: 13, scope: !25)
|
|
!28 = !DILocation(line: 14, scope: !29)
|
|
!29 = distinct !DILexicalBlock(line: 14, column: 0, file: !1, scope: !30)
|
|
!30 = distinct !DILexicalBlock(line: 13, column: 0, file: !1, scope: !23)
|
|
!31 = !DILocation(line: 15, scope: !32)
|
|
!32 = distinct !DILexicalBlock(line: 14, column: 0, file: !1, scope: !29)
|
|
!33 = !DILocation(line: 16, scope: !32)
|
|
!34 = !DILocation(line: 17, scope: !32)
|
|
!35 = !DILocation(line: 19, scope: !20)
|
|
!36 = !DILocation(line: 21, scope: !4)
|
|
!37 = !DILocation(line: 22, scope: !4)
|
|
!38 = !DILocation(line: 25, scope: !7)
|
|
!39 = !DILocation(line: 26, scope: !7)
|
|
!40 = !DILocation(line: 27, scope: !7)
|
|
!41 = !DILocation(line: 28, scope: !7)
|
|
!42 = !DILocation(line: 29, scope: !7)
|