This patch was split from https://reviews.llvm.org/D102246 ([SampleFDO] New hierarchical discriminator for Flow Sensitive SampleFDO). It mainly covers the ProfileData part of that change: the compiler loads an FS profile when such a profile is detected. For an extbinary-format profile, the create_llvm_prof tool adds a flag to the profile summary section. For profiles in other formats, users need to pass an internal option (-profile-isfs) to tell the compiler that the profile uses FS discriminators. This patch also simplifies the bit API used by FS discriminators. Differential Revision: https://reviews.llvm.org/D103041
231 lines
12 KiB
LLVM
231 lines
12 KiB
LLVM
; Test driver: the module is run through the sample-profile pass and the
; resulting branch probabilities are printed by a second opt invocation and
; verified with FileCheck. Two pipelines are exercised against the same
; expectations:
;   1. the profile Inputs/fsafdo.extbinary.afdo, with no extra option;
;   2. the profile Inputs/fsafdo.prof, with -profile-isfs passed explicitly.
; RUN: opt < %s -sample-profile -sample-profile-file=%S/Inputs/fsafdo.extbinary.afdo | opt -analyze -branch-prob -enable-new-pm=0 | FileCheck %s
; RUN: opt < %s -sample-profile -profile-isfs -sample-profile-file=%S/Inputs/fsafdo.prof | opt -analyze -branch-prob -enable-new-pm=0 | FileCheck %s

target triple = "x86_64-unknown-linux-gnu"

; Module-level global; it is not referenced by the functions defined below.
@sum = dso_local local_unnamed_addr global i32 0, align 4

; Helpers called from @foo. Only their declarations are present in this file.
declare i32 @bar(i32 %i) #0
declare void @work(i32 %i) #2

; @foo: a loop that runs 48 times (%j.012 counts from 0 until %inc11 == 48).
; Each iteration contains four copies of the same sequence, in blocks with no
; suffix and with suffixes .1, .2 and .3:
;   - call @bar and test bit 0 of the result; if set, call @work(2 * result)
;   - test the low two bits of the result; if non-zero, call @work(3 * result)
; All four copies carry the same !dbg attachments (!32, !33, !35 ... !44), so
; their instructions map to identical source locations.
; NOTE(review): presumably the copies come from unrolling the inner loop of
; unroll.c; confirm against the original source.
;
; The FileCheck expectation lines below follow the terminator whose outgoing
; edges they describe and must stay in block order.
define dso_local void @foo() #0 !dbg !29 {
; CHECK: Printing analysis {{.*}} for function 'foo':

entry:
  br label %for.cond1.preheader, !dbg !30
; CHECK: edge entry -> for.cond1.preheader probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

; Loop header and first copy of the body.
for.cond1.preheader:
  %j.012 = phi i32 [ 0, %entry ], [ %inc11, %if.end9.3 ]
  %mul = mul nuw nsw i32 %j.012, 48
  %call = tail call i32 @bar(i32 %mul), !dbg !32
  %0 = and i32 %call, 1, !dbg !33
  %tobool.not = icmp eq i32 %0, 0, !dbg !33
  br i1 %tobool.not, label %if.end, label %if.then, !dbg !35
; CHECK: edge for.cond1.preheader -> if.end probability is 0x3f6262b8 / 0x80000000 = 49.52%
; CHECK: edge for.cond1.preheader -> if.then probability is 0x409d9d48 / 0x80000000 = 50.48%

if.then:
  %mul4 = shl nsw i32 %call, 1, !dbg !36
  tail call void @work(i32 %mul4), !dbg !37
  br label %if.end, !dbg !38
; CHECK: edge if.then -> if.end probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

if.end:
  %1 = and i32 %call, 3, !dbg !39
  %tobool6.not = icmp eq i32 %1, 0, !dbg !39
  br i1 %tobool6.not, label %if.end9, label %if.then7, !dbg !40
; CHECK: edge if.end -> if.end9 probability is 0x22c6bac3 / 0x80000000 = 27.17%
; CHECK: edge if.end -> if.then7 probability is 0x5d39453d / 0x80000000 = 72.83%

if.then7:
  %mul8 = mul nsw i32 %call, 3, !dbg !41
  tail call void @work(i32 %mul8), !dbg !42
  br label %if.end9, !dbg !43
; CHECK: edge if.then7 -> if.end9 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

; Second copy of the body (suffix .1).
if.end9:
  %add.1 = or i32 %mul, 1, !dbg !44
  %call.1 = tail call i32 @bar(i32 %add.1), !dbg !32
  %2 = and i32 %call.1, 1, !dbg !33
  %tobool.not.1 = icmp eq i32 %2, 0, !dbg !33
  br i1 %tobool.not.1, label %if.end.1, label %if.then.1, !dbg !35
; CHECK: edge if.end9 -> if.end.1 probability is 0x3f6262b8 / 0x80000000 = 49.52%
; CHECK: edge if.end9 -> if.then.1 probability is 0x409d9d48 / 0x80000000 = 50.48%

; Loop exit; reached only from if.end9.3.
for.end12:
  ret void, !dbg !45

if.then.1:
  %mul4.1 = shl nsw i32 %call.1, 1, !dbg !36
  tail call void @work(i32 %mul4.1), !dbg !37
  br label %if.end.1, !dbg !38
; CHECK: edge if.then.1 -> if.end.1 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

if.end.1:
  %3 = and i32 %call.1, 3, !dbg !39
  %tobool6.not.1 = icmp eq i32 %3, 0, !dbg !39
  br i1 %tobool6.not.1, label %if.end9.1, label %if.then7.1, !dbg !40
; CHECK: edge if.end.1 -> if.end9.1 probability is 0x22c6bac3 / 0x80000000 = 27.17%
; CHECK: edge if.end.1 -> if.then7.1 probability is 0x5d39453d / 0x80000000 = 72.83%

if.then7.1:
  %mul8.1 = mul nsw i32 %call.1, 3, !dbg !41
  tail call void @work(i32 %mul8.1), !dbg !42
  br label %if.end9.1, !dbg !43
; CHECK: edge if.then7.1 -> if.end9.1 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

; Third copy of the body (suffix .2).
if.end9.1:
  %add.2 = or i32 %mul, 2, !dbg !44
  %call.2 = tail call i32 @bar(i32 %add.2), !dbg !32
  %4 = and i32 %call.2, 1, !dbg !33
  %tobool.not.2 = icmp eq i32 %4, 0, !dbg !33
  br i1 %tobool.not.2, label %if.end.2, label %if.then.2, !dbg !35
; CHECK: edge if.end9.1 -> if.end.2 probability is 0x3f6262b8 / 0x80000000 = 49.52%
; CHECK: edge if.end9.1 -> if.then.2 probability is 0x409d9d48 / 0x80000000 = 50.48%

if.then.2:
  %mul4.2 = shl nsw i32 %call.2, 1, !dbg !36
  tail call void @work(i32 %mul4.2), !dbg !37
  br label %if.end.2, !dbg !38
; CHECK: edge if.then.2 -> if.end.2 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

if.end.2:
  %5 = and i32 %call.2, 3, !dbg !39
  %tobool6.not.2 = icmp eq i32 %5, 0, !dbg !39
  br i1 %tobool6.not.2, label %if.end9.2, label %if.then7.2, !dbg !40
; CHECK: edge if.end.2 -> if.end9.2 probability is 0x22c6bac3 / 0x80000000 = 27.17%
; CHECK: edge if.end.2 -> if.then7.2 probability is 0x5d39453d / 0x80000000 = 72.83%

if.then7.2:
  %mul8.2 = mul nsw i32 %call.2, 3, !dbg !41
  tail call void @work(i32 %mul8.2), !dbg !42
  br label %if.end9.2, !dbg !43
; CHECK: edge if.then7.2 -> if.end9.2 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

; Fourth copy of the body (suffix .3).
if.end9.2:
  %add.3 = or i32 %mul, 3, !dbg !44
  %call.3 = tail call i32 @bar(i32 %add.3), !dbg !32
  %6 = and i32 %call.3, 1, !dbg !33
  %tobool.not.3 = icmp eq i32 %6, 0, !dbg !33
  br i1 %tobool.not.3, label %if.end.3, label %if.then.3, !dbg !35
; CHECK: edge if.end9.2 -> if.end.3 probability is 0x3f6262b8 / 0x80000000 = 49.52%
; CHECK: edge if.end9.2 -> if.then.3 probability is 0x409d9d48 / 0x80000000 = 50.48%

if.then.3:
  %mul4.3 = shl nsw i32 %call.3, 1, !dbg !36
  tail call void @work(i32 %mul4.3), !dbg !37
  br label %if.end.3, !dbg !38
; CHECK: edge if.then.3 -> if.end.3 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

if.end.3:
  %7 = and i32 %call.3, 3, !dbg !39
  %tobool6.not.3 = icmp eq i32 %7, 0, !dbg !39
  br i1 %tobool6.not.3, label %if.end9.3, label %if.then7.3, !dbg !40
; CHECK: edge if.end.3 -> if.end9.3 probability is 0x22c6bac3 / 0x80000000 = 27.17%
; CHECK: edge if.end.3 -> if.then7.3 probability is 0x5d39453d / 0x80000000 = 72.83%

if.then7.3:
  %mul8.3 = mul nsw i32 %call.3, 3, !dbg !41
  tail call void @work(i32 %mul8.3), !dbg !42
  br label %if.end9.3, !dbg !43
; CHECK: edge if.then7.3 -> if.end9.3 probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

; Loop latch: bump the counter and either exit or take the back edge.
if.end9.3:
  %inc11 = add nuw nsw i32 %j.012, 1, !dbg !46
  %exitcond.not = icmp eq i32 %inc11, 48, !dbg !48
  br i1 %exitcond.not, label %for.end12, label %for.cond1.preheader, !dbg !30, !llvm.loop !49
; CHECK: edge if.end9.3 -> for.end12 probability is 0x00834dd9 / 0x80000000 = 0.40%
; CHECK: edge if.end9.3 -> for.cond1.preheader probability is 0x7f7cb227 / 0x80000000 = 99.60% [HOT edge]
}

; @main: calls @foo 10000000 times (%i.03 counts from 0 until %inc equals
; 10000000) and then returns 0. No FileCheck expectations are attached to this
; function.
define dso_local i32 @main() #3 !dbg !52 {
entry:
  br label %for.body, !dbg !53

; Single-block loop: the body is also the latch.
for.body:
  %i.03 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  tail call void @foo(), !dbg !55
  %inc = add nuw nsw i32 %i.03, 1, !dbg !56
  %exitcond.not = icmp eq i32 %inc, 10000000, !dbg !58
  br i1 %exitcond.not, label %for.end, label %for.body, !dbg !53, !llvm.loop !60

for.end:
  ret i32 0, !dbg !63
}

; Attribute groups. #0 (used by @foo and @bar) is the only group carrying
; "use-sample-profile". #1 is not referenced by anything in this file.
attributes #0 = { noinline nounwind uwtable "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "unsafe-fp-math"="false" "use-soft-float"="false" "use-sample-profile"}
attributes #1 = { argmemonly nounwind willreturn }
attributes #2 = { nofree noinline norecurse nounwind uwtable "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #3 = { nounwind uwtable "disable-tail-calls"="false" "frame-pointer"="none" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "unsafe-fp-math"="false" "use-soft-float"="false" }

; Named metadata: the compile unit and the module flags.
!llvm.dbg.cu = !{!0}
!llvm.module.flags = !{!3, !4, !5}

; Compile unit (line tables only, debugInfoForProfiling enabled) and flags.
!0 = distinct !DICompileUnit(language: DW_LANG_C99, file: !1, isOptimized: true, runtimeVersion: 0, emissionKind: LineTablesOnly, enums: !2, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None)
!1 = !DIFile(filename: "unroll.c", directory: "a/")
!2 = !{}
!3 = !{i32 7, !"Dwarf Version", i32 4}
!4 = !{i32 2, !"Debug Info Version", i32 3}
!5 = !{i32 1, !"wchar_size", i32 4}

; Debug info for "bar" plus TBAA nodes (!11-!14). None of !7-!18 is attached
; to an instruction in this file, where @bar is only declared.
!7 = distinct !DISubprogram(name: "bar", scope: !1, file: !1, line: 3, type: !8, scopeLine: 3, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
!8 = !DISubroutineType(types: !2)
!9 = !DILocation(line: 4, column: 3, scope: !7)
!10 = !DILocation(line: 5, column: 5, scope: !7)
!11 = !{!12, !12, i64 0}
!12 = !{!"int", !13, i64 0}
!13 = !{!"omnipotent char", !14, i64 0}
!14 = !{!"Simple C/C++ TBAA"}
!15 = !DILocation(line: 6, column: 10, scope: !7)
!16 = !DILocation(line: 7, column: 1, scope: !7)
!17 = !DILocation(line: 6, column: 3, scope: !18)
!18 = !DILexicalBlockFile(scope: !7, file: !1, discriminator: 1)

; Debug info for "work". None of !19-!28 is attached to an instruction in
; this file, where @work is only declared.
!19 = distinct !DISubprogram(name: "work", scope: !1, file: !1, line: 10, type: !8, scopeLine: 10, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
!20 = !DILocation(line: 11, column: 7, scope: !19)
!21 = !DILocation(line: 11, column: 11, scope: !22)
!22 = !DILexicalBlockFile(scope: !19, file: !1, discriminator: 1)
!23 = !DILocation(line: 11, column: 11, scope: !24)
!24 = !DILexicalBlockFile(scope: !19, file: !1, discriminator: 2)
!25 = !DILocation(line: 11, column: 7, scope: !26)
!26 = !DILexicalBlockFile(scope: !19, file: !1, discriminator: 3)
!27 = !DILocation(line: 0, scope: !22)
!28 = !DILocation(line: 15, column: 1, scope: !19)

; Debug info for @foo. Scopes !31, !34 and !47 are DILexicalBlockFile nodes
; carrying discriminators 2, 1 and 3; !49 is the loop ID of the loop in @foo.
!29 = distinct !DISubprogram(name: "foo", scope: !1, file: !1, line: 17, type: !8, scopeLine: 17, flags: DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
!30 = !DILocation(line: 19, column: 3, scope: !31)
!31 = !DILexicalBlockFile(scope: !29, file: !1, discriminator: 2)
!32 = !DILocation(line: 21, column: 16, scope: !31)
!33 = !DILocation(line: 22, column: 14, scope: !34)
!34 = !DILexicalBlockFile(scope: !29, file: !1, discriminator: 1)
!35 = !DILocation(line: 22, column: 11, scope: !31)
!36 = !DILocation(line: 23, column: 16, scope: !29)
!37 = !DILocation(line: 23, column: 9, scope: !34)
!38 = !DILocation(line: 23, column: 9, scope: !31)
!39 = !DILocation(line: 24, column: 14, scope: !34)
!40 = !DILocation(line: 24, column: 11, scope: !31)
!41 = !DILocation(line: 25, column: 16, scope: !29)
!42 = !DILocation(line: 25, column: 9, scope: !34)
!43 = !DILocation(line: 25, column: 9, scope: !31)
!44 = !DILocation(line: 21, column: 21, scope: !34)
!45 = !DILocation(line: 27, column: 1, scope: !29)
!46 = !DILocation(line: 19, column: 24, scope: !47)
!47 = !DILexicalBlockFile(scope: !29, file: !1, discriminator: 3)
!48 = !DILocation(line: 19, column: 17, scope: !34)
!49 = distinct !{!49, !50, !51}
!50 = !DILocation(line: 19, column: 3, scope: !29)
!51 = !DILocation(line: 26, column: 3, scope: !29)

; Debug info for @main; !60 is the loop ID of the loop in @main.
!52 = distinct !DISubprogram(name: "main", scope: !1, file: !1, line: 29, type: !8, scopeLine: 29, flags: DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
!53 = !DILocation(line: 31, column: 3, scope: !54)
!54 = !DILexicalBlockFile(scope: !52, file: !1, discriminator: 2)
!55 = !DILocation(line: 32, column: 5, scope: !52)
!56 = !DILocation(line: 31, column: 30, scope: !57)
!57 = !DILexicalBlockFile(scope: !52, file: !1, discriminator: 3)
!58 = !DILocation(line: 31, column: 17, scope: !59)
!59 = !DILexicalBlockFile(scope: !52, file: !1, discriminator: 1)
!60 = distinct !{!60, !61, !62}
!61 = !DILocation(line: 31, column: 3, scope: !52)
!62 = !DILocation(line: 33, column: 3, scope: !52)
!63 = !DILocation(line: 34, column: 1, scope: !52)