[llvm] [CSSPGO] Return error_code for missing probe profile (PR #102085)
Lei Wang via llvm-commits
llvm-commits at lists.llvm.org
Fri Aug 9 20:30:16 PDT 2024
https://github.com/wlei-llvm updated https://github.com/llvm/llvm-project/pull/102085
>From e73b151d06ccc9a478b80a624b6df65abfb5368b Mon Sep 17 00:00:00 2001
From: wlei <wlei at fb.com>
Date: Mon, 5 Aug 2024 17:06:18 -0700
Subject: [PATCH 1/3] [CSSPGO] Return error_code for missing probe profile
---
.../Utils/SampleProfileLoaderBaseImpl.h | 14 +-
.../Inputs/pseudo-probe-missing-probe.prof | 13 +
.../pseudo-probe-missing-probe.ll | 327 ++++++++++++++++++
3 files changed, 341 insertions(+), 13 deletions(-)
create mode 100644 llvm/test/Transforms/SampleProfile/Inputs/pseudo-probe-missing-probe.prof
create mode 100644 llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
diff --git a/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h b/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h
index 32bf7b8c96be3d..114159ab524bfe 100644
--- a/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h
+++ b/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h
@@ -449,9 +449,6 @@ SampleProfileLoaderBaseImpl<BT>::getInstWeightImpl(const InstructionT &Inst) {
return R;
}
-// Here use error_code to represent: 1) The dangling probe. 2) Ignore the weight
-// of non-probe instruction. So if all instructions of the BB give error_code,
-// tell the inference algorithm to infer the BB weight.
template <typename BT>
ErrorOr<uint64_t>
SampleProfileLoaderBaseImpl<BT>::getProbeWeight(const InstructionT &Inst) {
@@ -464,17 +461,8 @@ SampleProfileLoaderBaseImpl<BT>::getProbeWeight(const InstructionT &Inst) {
return std::error_code();
const FunctionSamples *FS = findFunctionSamples(Inst);
- // If none of the instruction has FunctionSample, we choose to return zero
- // value sample to indicate the BB is cold. This could happen when the
- // instruction is from inlinee and no profile data is found.
- // FIXME: This should not be affected by the source drift issue as 1) if the
- // newly added function is top-level inliner, it won't match the CFG checksum
- // in the function profile or 2) if it's the inlinee, the inlinee should have
- // a profile, otherwise it wouldn't be inlined. For non-probe based profile,
- // we can improve it by adding a switch for profile-sample-block-accurate for
- // block level counts in the future.
if (!FS)
- return 0;
+ return std::error_code();
auto R = FS->findSamplesAt(Probe->Id, Probe->Discriminator);
if (R) {
diff --git a/llvm/test/Transforms/SampleProfile/Inputs/pseudo-probe-missing-probe.prof b/llvm/test/Transforms/SampleProfile/Inputs/pseudo-probe-missing-probe.prof
new file mode 100644
index 00000000000000..cc50d6a2fad2b9
--- /dev/null
+++ b/llvm/test/Transforms/SampleProfile/Inputs/pseudo-probe-missing-probe.prof
@@ -0,0 +1,13 @@
+main:89650:0
+ 1: 0
+ 2: 16724
+ 3: 16724
+ 4: 14342
+ 5: 15026 bar:15026
+ 6: 1882
+ 8: 16724
+ 9: 0
+ !CFGChecksum: 563091374530180
+bar:15026:15026
+ 1: 15026
+ !CFGChecksum: 4294967295
diff --git a/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll b/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
new file mode 100644
index 00000000000000..23d322c5cc99f5
--- /dev/null
+++ b/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
@@ -0,0 +1,327 @@
+; RUN: opt < %s -passes=sample-profile --overwrite-existing-weights -sample-profile-file=%S/Inputs/pseudo-probe-missing-probe.prof | opt -passes='print<branch-prob>' -disable-output 2>&1 | FileCheck %s
+
+; CHECK: edge %while.body -> %if.then probability is 0x7212005e / 0x80000000 = 89.12% [HOT edge]
+; CHECK: edge %while.body -> %if.else probability is 0x0dedffa2 / 0x80000000 = 10.88%
+
+; CHECK-NOT: edge %while.body -> %if.then probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]
+; CHECK-NOT: edge %while.body -> %if.else probability is 0x00000000 / 0x80000000 = 0.00%
+
+target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
+target triple = "x86_64-unknown-linux-gnu"
+
+ at x = dso_local global i32 0, align 4, !dbg !0
+
+; Function Attrs: noinline nounwind uwtable
+define dso_local void @bar(i32 noundef %i) #0 !dbg !47 !prof !52 {
+entry:
+ #dbg_value(i32 %i, !51, !DIExpression(), !53)
+ call void @llvm.pseudoprobe(i64 -2012135647395072713, i64 1, i32 0, i64 -1), !dbg !54
+ %0 = load volatile i32, ptr @x, align 4, !dbg !54, !tbaa !55
+ %add = add nsw i32 %0, 5, !dbg !54
+ store volatile i32 %add, ptr @x, align 4, !dbg !54, !tbaa !55
+ ret void, !dbg !59
+}
+
+; Function Attrs: nounwind uwtable
+define dso_local void @baz(i32 noundef %i) #1 !dbg !60 !prof !63 {
+entry:
+ #dbg_value(i32 %i, !62, !DIExpression(), !64)
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 1, i32 0, i64 -1), !dbg !65
+ %rem = srem i32 %i, 100, !dbg !67
+ %tobool = icmp ne i32 %rem, 0, !dbg !67
+ br i1 %tobool, label %if.then, label %if.end, !dbg !68
+
+if.then: ; preds = %entry
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 2, i32 0, i64 -1), !dbg !69
+ %0 = load volatile i32, ptr @x, align 4, !dbg !69, !tbaa !55
+ %inc = add nsw i32 %0, 1, !dbg !69
+ store volatile i32 %inc, ptr @x, align 4, !dbg !69, !tbaa !55
+ br label %if.end, !dbg !70
+
+if.end: ; preds = %if.then, %entry
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 3, i32 0, i64 -1), !dbg !71
+ %1 = load volatile i32, ptr @x, align 4, !dbg !71, !tbaa !55
+ %add = add nsw i32 %1, 2, !dbg !71
+ store volatile i32 %add, ptr @x, align 4, !dbg !71, !tbaa !55
+ %rem1 = srem i32 %i, 2, !dbg !72
+ %tobool2 = icmp ne i32 %rem1, 0, !dbg !72
+ br i1 %tobool2, label %if.then3, label %if.else, !dbg !74
+
+if.then3: ; preds = %if.end
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 4, i32 0, i64 -1), !dbg !75
+ %2 = load volatile i32, ptr @x, align 4, !dbg !75, !tbaa !55
+ %inc4 = add nsw i32 %2, 1, !dbg !75
+ store volatile i32 %inc4, ptr @x, align 4, !dbg !75, !tbaa !55
+ br label %if.end11, !dbg !76
+
+if.else: ; preds = %if.end
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 5, i32 0, i64 -1), !dbg !77
+ %rem5 = srem i32 %i, 3, !dbg !79
+ %tobool6 = icmp ne i32 %rem5, 0, !dbg !79
+ br i1 %tobool6, label %if.then7, label %if.else9, !dbg !80
+
+if.then7: ; preds = %if.else
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 6, i32 0, i64 -1), !dbg !81
+ %3 = load volatile i32, ptr @x, align 4, !dbg !81, !tbaa !55
+ %add8 = add nsw i32 %3, 2, !dbg !81
+ store volatile i32 %add8, ptr @x, align 4, !dbg !81, !tbaa !55
+ br label %if.end11, !dbg !82
+
+if.else9: ; preds = %if.else
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 7, i32 0, i64 -1), !dbg !83
+ %4 = load volatile i32, ptr @x, align 4, !dbg !83, !tbaa !55
+ %dec = add nsw i32 %4, -1, !dbg !83
+ store volatile i32 %dec, ptr @x, align 4, !dbg !83, !tbaa !55
+ br label %if.end11
+
+if.end11: ; preds = %if.then7, %if.else9, %if.then3
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 9, i32 0, i64 -1), !dbg !84
+ ret void, !dbg !84
+}
+
+; Function Attrs: nounwind uwtable
+define dso_local i32 @main() #1 !dbg !85 !prof !90 {
+entry:
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 1, i32 0, i64 -1), !dbg !91
+ #dbg_value(i32 0, !89, !DIExpression(), !92)
+ br label %while.cond, !dbg !93
+
+while.cond: ; preds = %if.end, %entry
+ %i.0 = phi i32 [ 0, %entry ], [ %inc, %if.end ], !dbg !92
+ #dbg_value(i32 %i.0, !89, !DIExpression(), !92)
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 2, i32 0, i64 -1), !dbg !94
+ %inc = add nsw i32 %i.0, 1, !dbg !94
+ #dbg_value(i32 %inc, !89, !DIExpression(), !92)
+ %cmp = icmp slt i32 %i.0, 160000000, !dbg !95
+ br i1 %cmp, label %while.body, label %while.end, !dbg !93, !prof !96
+
+while.body: ; preds = %while.cond
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 3, i32 0, i64 -1), !dbg !97
+ %rem = srem i32 %inc, 10, !dbg !100
+ %tobool = icmp ne i32 %rem, 0, !dbg !100
+ br i1 %tobool, label %if.then, label %if.else, !dbg !101, !prof !102
+
+if.then: ; preds = %while.body
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 4, i32 0, i64 -1), !dbg !103
+ call void @bar(i32 noundef %inc), !dbg !104, !prof !106
+ br label %if.end, !dbg !107
+
+if.else: ; preds = %while.body
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 6, i32 0, i64 -1), !dbg !108
+ #dbg_value(i32 %inc, !62, !DIExpression(), !109)
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 1, i32 0, i64 -1), !dbg !112
+ %rem.i = srem i32 %inc, 100, !dbg !113
+ %tobool.i = icmp ne i32 %rem.i, 0, !dbg !113
+ br i1 %tobool.i, label %if.then.i, label %if.end.i, !dbg !114, !prof !115
+
+if.then.i: ; preds = %if.else
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 2, i32 0, i64 -1), !dbg !116
+ %0 = load volatile i32, ptr @x, align 4, !dbg !116, !tbaa !55
+ %inc.i = add nsw i32 %0, 1, !dbg !116
+ store volatile i32 %inc.i, ptr @x, align 4, !dbg !116, !tbaa !55
+ br label %if.end.i, !dbg !117
+
+if.end.i: ; preds = %if.then.i, %if.else
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 3, i32 0, i64 -1), !dbg !118
+ %1 = load volatile i32, ptr @x, align 4, !dbg !118, !tbaa !55
+ %add.i = add nsw i32 %1, 2, !dbg !118
+ store volatile i32 %add.i, ptr @x, align 4, !dbg !118, !tbaa !55
+ %rem1.i = srem i32 %inc, 2, !dbg !119
+ %tobool2.i = icmp ne i32 %rem1.i, 0, !dbg !119
+ br i1 %tobool2.i, label %if.then3.i, label %if.else.i, !dbg !120, !prof !121
+
+if.then3.i: ; preds = %if.end.i
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 4, i32 0, i64 -1), !dbg !122
+ %2 = load volatile i32, ptr @x, align 4, !dbg !122, !tbaa !55
+ %inc4.i = add nsw i32 %2, 1, !dbg !122
+ store volatile i32 %inc4.i, ptr @x, align 4, !dbg !122, !tbaa !55
+ br label %baz.exit, !dbg !123
+
+if.else.i: ; preds = %if.end.i
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 5, i32 0, i64 -1), !dbg !124
+ %rem5.i = srem i32 %inc, 3, !dbg !125
+ %tobool6.i = icmp ne i32 %rem5.i, 0, !dbg !125
+ br i1 %tobool6.i, label %if.then7.i, label %if.else9.i, !dbg !126, !prof !127
+
+if.then7.i: ; preds = %if.else.i
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 6, i32 0, i64 -1), !dbg !128
+ %3 = load volatile i32, ptr @x, align 4, !dbg !128, !tbaa !55
+ %add8.i = add nsw i32 %3, 2, !dbg !128
+ store volatile i32 %add8.i, ptr @x, align 4, !dbg !128, !tbaa !55
+ br label %baz.exit, !dbg !129
+
+if.else9.i: ; preds = %if.else.i
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 7, i32 0, i64 -1), !dbg !130
+ %4 = load volatile i32, ptr @x, align 4, !dbg !130, !tbaa !55
+ %dec.i = add nsw i32 %4, -1, !dbg !130
+ store volatile i32 %dec.i, ptr @x, align 4, !dbg !130, !tbaa !55
+ br label %baz.exit
+
+baz.exit: ; preds = %if.then3.i, %if.then7.i, %if.else9.i
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 9, i32 0, i64 -1), !dbg !131
+ br label %if.end
+
+if.end: ; preds = %baz.exit, %if.then
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 8, i32 0, i64 -1), !dbg !93
+ br label %while.cond, !dbg !93, !llvm.loop !132
+
+while.end: ; preds = %while.cond
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 9, i32 0, i64 -1), !dbg !135
+ ret i32 0, !dbg !135
+}
+
+; Function Attrs: mustprogress nocallback nofree nosync nounwind willreturn memory(argmem: readwrite)
+declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #2
+
+; Function Attrs: mustprogress nocallback nofree nosync nounwind willreturn memory(argmem: readwrite)
+declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #2
+
+; Function Attrs: mustprogress nocallback nofree nosync nounwind willreturn memory(inaccessiblemem: readwrite)
+declare void @llvm.pseudoprobe(i64, i64, i32, i64) #3
+
+attributes #0 = { noinline nounwind uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
+attributes #1 = { nounwind uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
+attributes #2 = { mustprogress nocallback nofree nosync nounwind willreturn memory(argmem: readwrite) }
+attributes #3 = { mustprogress nocallback nofree nosync nounwind willreturn memory(inaccessiblemem: readwrite) }
+
+!llvm.dbg.cu = !{!2}
+!llvm.module.flags = !{!7, !8, !9, !10, !11, !12, !13, !14}
+!llvm.ident = !{!43}
+!llvm.pseudo_probe_desc = !{!44, !45, !46}
+
+!0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
+!1 = distinct !DIGlobalVariable(name: "x", scope: !2, file: !3, line: 1, type: !5, isLocal: false, isDefinition: true)
+!2 = distinct !DICompileUnit(language: DW_LANG_C11, file: !3, producer: "clang version 20.0.0", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, nameTableKind: None)
+!3 = !DIFile(filename: "test.c", directory: "/home/", checksumkind: CSK_MD5, checksum: "b67c15e928f76c51702a59639dbebb4c")
+!4 = !{!0}
+!5 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !6)
+!6 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
+!7 = !{i32 7, !"Dwarf Version", i32 5}
+!8 = !{i32 2, !"Debug Info Version", i32 3}
+!9 = !{i32 1, !"wchar_size", i32 4}
+!10 = !{i32 8, !"PIC Level", i32 2}
+!11 = !{i32 7, !"PIE Level", i32 2}
+!12 = !{i32 7, !"uwtable", i32 2}
+!13 = !{i32 7, !"debug-info-assignment-tracking", i1 true}
+!14 = !{i32 1, !"ProfileSummary", !15}
+!15 = !{!16, !17, !18, !19, !20, !21, !22, !23, !24, !25}
+!16 = !{!"ProfileFormat", !"SampleProfile"}
+!17 = !{!"TotalCount", i64 105360}
+!18 = !{!"MaxCount", i64 16724}
+!19 = !{!"MaxInternalCount", i64 0}
+!20 = !{!"MaxFunctionCount", i64 15026}
+!21 = !{!"NumCounts", i64 14}
+!22 = !{!"NumFunctions", i64 2}
+!23 = !{!"IsPartialProfile", i64 0}
+!24 = !{!"PartialProfileRatio", double 0.000000e+00}
+!25 = !{!"DetailedSummary", !26}
+!26 = !{!27, !28, !29, !30, !31, !32, !33, !34, !35, !36, !37, !38, !39, !40, !41, !42}
+!27 = !{i32 10000, i64 16724, i32 3}
+!28 = !{i32 100000, i64 16724, i32 3}
+!29 = !{i32 200000, i64 16724, i32 3}
+!30 = !{i32 300000, i64 16724, i32 3}
+!31 = !{i32 400000, i64 16724, i32 3}
+!32 = !{i32 500000, i64 15026, i32 5}
+!33 = !{i32 600000, i64 15026, i32 5}
+!34 = !{i32 700000, i64 15026, i32 5}
+!35 = !{i32 800000, i64 14342, i32 6}
+!36 = !{i32 900000, i64 1882, i32 8}
+!37 = !{i32 950000, i64 1872, i32 10}
+!38 = !{i32 990000, i64 1550, i32 12}
+!39 = !{i32 999000, i64 1550, i32 12}
+!40 = !{i32 999900, i64 1550, i32 12}
+!41 = !{i32 999990, i64 1550, i32 12}
+!42 = !{i32 999999, i64 1550, i32 12}
+!43 = !{!"clang version 20.0.0"}
+!44 = !{i64 -2012135647395072713, i64 4294967295, !"bar"}
+!45 = !{i64 7546896869197086323, i64 191430930410, !"baz"}
+!46 = !{i64 -2624081020897602054, i64 563091374530180, !"main"}
+!47 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 3, type: !48, scopeLine: 3, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !50)
+!48 = !DISubroutineType(types: !49)
+!49 = !{null, !6}
+!50 = !{!51}
+!51 = !DILocalVariable(name: "i", arg: 1, scope: !47, file: !3, line: 3, type: !6)
+!52 = !{!"function_entry_count", i64 15026}
+!53 = !DILocation(line: 0, scope: !47)
+!54 = !DILocation(line: 4, column: 5, scope: !47)
+!55 = !{!56, !56, i64 0}
+!56 = !{!"int", !57, i64 0}
+!57 = !{!"omnipotent char", !58, i64 0}
+!58 = !{!"Simple C/C++ TBAA"}
+!59 = !DILocation(line: 8, column: 1, scope: !47)
+!60 = distinct !DISubprogram(name: "baz", scope: !3, file: !3, line: 10, type: !48, scopeLine: 10, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !61)
+!61 = !{!62}
+!62 = !DILocalVariable(name: "i", arg: 1, scope: !60, file: !3, line: 10, type: !6)
+!63 = !{!"function_entry_count", i64 -1}
+!64 = !DILocation(line: 0, scope: !60)
+!65 = !DILocation(line: 11, column: 6, scope: !66)
+!66 = distinct !DILexicalBlock(scope: !60, file: !3, line: 11, column: 6)
+!67 = !DILocation(line: 11, column: 7, scope: !66)
+!68 = !DILocation(line: 11, column: 6, scope: !60)
+!69 = !DILocation(line: 12, column: 6, scope: !66)
+!70 = !DILocation(line: 12, column: 5, scope: !66)
+!71 = !DILocation(line: 14, column: 5, scope: !60)
+!72 = !DILocation(line: 15, column: 9, scope: !73)
+!73 = distinct !DILexicalBlock(scope: !60, file: !3, line: 15, column: 7)
+!74 = !DILocation(line: 15, column: 7, scope: !60)
+!75 = !DILocation(line: 16, column: 7, scope: !73)
+!76 = !DILocation(line: 16, column: 6, scope: !73)
+!77 = !DILocation(line: 17, column: 12, scope: !78)
+!78 = distinct !DILexicalBlock(scope: !73, file: !3, line: 17, column: 12)
+!79 = !DILocation(line: 17, column: 14, scope: !78)
+!80 = !DILocation(line: 17, column: 12, scope: !73)
+!81 = !DILocation(line: 18, column: 7, scope: !78)
+!82 = !DILocation(line: 18, column: 6, scope: !78)
+!83 = !DILocation(line: 20, column: 7, scope: !78)
+!84 = !DILocation(line: 21, column: 1, scope: !60)
+!85 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 23, type: !86, scopeLine: 23, flags: DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !88)
+!86 = !DISubroutineType(types: !87)
+!87 = !{!6}
+!88 = !{!89}
+!89 = !DILocalVariable(name: "i", scope: !85, file: !3, line: 24, type: !6)
+!90 = !{!"function_entry_count", i64 1}
+!91 = !DILocation(line: 24, column: 7, scope: !85)
+!92 = !DILocation(line: 0, scope: !85)
+!93 = !DILocation(line: 25, column: 3, scope: !85)
+!94 = !DILocation(line: 25, column: 11, scope: !85)
+!95 = !DILocation(line: 25, column: 14, scope: !85)
+!96 = !{!"branch_weights", i32 16724, i32 1}
+!97 = !DILocation(line: 26, column: 8, scope: !98)
+!98 = distinct !DILexicalBlock(scope: !99, file: !3, line: 26, column: 8)
+!99 = distinct !DILexicalBlock(scope: !85, file: !3, line: 25, column: 30)
+!100 = !DILocation(line: 26, column: 10, scope: !98)
+!101 = !DILocation(line: 26, column: 8, scope: !99)
+!102 = !{!"branch_weights", i32 14852, i32 1872}
+!103 = !DILocation(line: 27, column: 10, scope: !98)
+!104 = !DILocation(line: 27, column: 6, scope: !105)
+!105 = !DILexicalBlockFile(scope: !98, file: !3, discriminator: 455082031)
+!106 = !{!"branch_weights", i32 14852}
+!107 = !DILocation(line: 27, column: 6, scope: !98)
+!108 = !DILocation(line: 29, column: 10, scope: !98)
+!109 = !DILocation(line: 0, scope: !60, inlinedAt: !110)
+!110 = distinct !DILocation(line: 29, column: 6, scope: !111)
+!111 = !DILexicalBlockFile(scope: !98, file: !3, discriminator: 455082047)
+!112 = !DILocation(line: 11, column: 6, scope: !66, inlinedAt: !110)
+!113 = !DILocation(line: 11, column: 7, scope: !66, inlinedAt: !110)
+!114 = !DILocation(line: 11, column: 6, scope: !60, inlinedAt: !110)
+!115 = !{!"branch_weights", i32 1736, i32 136}
+!116 = !DILocation(line: 12, column: 6, scope: !66, inlinedAt: !110)
+!117 = !DILocation(line: 12, column: 5, scope: !66, inlinedAt: !110)
+!118 = !DILocation(line: 14, column: 5, scope: !60, inlinedAt: !110)
+!119 = !DILocation(line: 15, column: 9, scope: !73, inlinedAt: !110)
+!120 = !DILocation(line: 15, column: 7, scope: !60, inlinedAt: !110)
+!121 = !{!"branch_weights", i32 0, i32 1872}
+!122 = !DILocation(line: 16, column: 7, scope: !73, inlinedAt: !110)
+!123 = !DILocation(line: 16, column: 6, scope: !73, inlinedAt: !110)
+!124 = !DILocation(line: 17, column: 12, scope: !78, inlinedAt: !110)
+!125 = !DILocation(line: 17, column: 14, scope: !78, inlinedAt: !110)
+!126 = !DILocation(line: 17, column: 12, scope: !73, inlinedAt: !110)
+!127 = !{!"branch_weights", i32 936, i32 936}
+!128 = !DILocation(line: 18, column: 7, scope: !78, inlinedAt: !110)
+!129 = !DILocation(line: 18, column: 6, scope: !78, inlinedAt: !110)
+!130 = !DILocation(line: 20, column: 7, scope: !78, inlinedAt: !110)
+!131 = !DILocation(line: 21, column: 1, scope: !60, inlinedAt: !110)
+!132 = distinct !{!132, !93, !133, !134}
+!133 = !DILocation(line: 30, column: 3, scope: !85)
+!134 = !{!"llvm.loop.mustprogress"}
+!135 = !DILocation(line: 31, column: 3, scope: !85)
>From d9e89c68dacc0d2f16d420fa9a8eab08617eec38 Mon Sep 17 00:00:00 2001
From: wlei <wlei at fb.com>
Date: Mon, 5 Aug 2024 21:14:40 -0700
Subject: [PATCH 2/3] addressing comment
---
.../Transforms/Utils/SampleProfileLoaderBaseImpl.h | 7 ++++++-
.../SampleProfile/pseudo-probe-missing-probe.ll | 11 +++++------
2 files changed, 11 insertions(+), 7 deletions(-)
diff --git a/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h b/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h
index 114159ab524bfe..5132dca7c6a22b 100644
--- a/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h
+++ b/llvm/include/llvm/Transforms/Utils/SampleProfileLoaderBaseImpl.h
@@ -461,8 +461,13 @@ SampleProfileLoaderBaseImpl<BT>::getProbeWeight(const InstructionT &Inst) {
return std::error_code();
const FunctionSamples *FS = findFunctionSamples(Inst);
- if (!FS)
+ if (!FS) {
+ // If we can't find the function samples for a probe, it could be due to the
+ // probe is later optimized away or the inlining context is mismatced. We
+ // treat it as unknown, leaving it to profile inference instead of forcing a
+ // zero count.
return std::error_code();
+ }
auto R = FS->findSamplesAt(Probe->Id, Probe->Discriminator);
if (R) {
diff --git a/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll b/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
index 23d322c5cc99f5..6681e46aa739c3 100644
--- a/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
+++ b/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
@@ -1,10 +1,9 @@
-; RUN: opt < %s -passes=sample-profile --overwrite-existing-weights -sample-profile-file=%S/Inputs/pseudo-probe-missing-probe.prof | opt -passes='print<branch-prob>' -disable-output 2>&1 | FileCheck %s
+; RUN: opt < %s -passes=sample-profile --overwrite-existing-weights -sample-profile-file=%S/Inputs/pseudo-probe-missing-probe.prof -S | FileCheck %s
-; CHECK: edge %while.body -> %if.then probability is 0x7212005e / 0x80000000 = 89.12% [HOT edge]
-; CHECK: edge %while.body -> %if.else probability is 0x0dedffa2 / 0x80000000 = 10.88%
-
-; CHECK-NOT: edge %while.body -> %if.then probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]
-; CHECK-NOT: edge %while.body -> %if.else probability is 0x00000000 / 0x80000000 = 0.00%
+; CHECK: br i1 %tobool, label %if.then, label %if.else, !dbg ![[#]], !prof ![[#PROF:]]
+; CHECK: [[#PROF]] = !{!"branch_weights", i32 14904, i32 1820}
+; Verify the else branch is not set to a zero count
+; CHECK-NOT: [[#PROF]] = !{!"branch_weights", i32 16724, i32 0}
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"
>From a679e61406b2673f849ebb9ce77cd07f6ea4d8f7 Mon Sep 17 00:00:00 2001
From: wlei <wlei at fb.com>
Date: Fri, 9 Aug 2024 20:29:20 -0700
Subject: [PATCH 3/3] remove the profile metadata in test
---
.../pseudo-probe-missing-probe.ll | 457 +++++++-----------
1 file changed, 187 insertions(+), 270 deletions(-)
diff --git a/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll b/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
index 6681e46aa739c3..3d559f2fb0159a 100644
--- a/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
+++ b/llvm/test/Transforms/SampleProfile/pseudo-probe-missing-probe.ll
@@ -1,197 +1,160 @@
-; RUN: opt < %s -passes=sample-profile --overwrite-existing-weights -sample-profile-file=%S/Inputs/pseudo-probe-missing-probe.prof -S | FileCheck %s
+; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/pseudo-probe-missing-probe.prof -S | FileCheck %s
-; CHECK: br i1 %tobool, label %if.then, label %if.else, !dbg ![[#]], !prof ![[#PROF:]]
-; CHECK: [[#PROF]] = !{!"branch_weights", i32 14904, i32 1820}
+; CHECK: br i1 %tobool.not.i, label %if.end.i, label %if.then.i, !dbg ![[#]], !prof ![[#PROF:]]
+
+; CHECK: [[#PROF]] = !{!"branch_weights", i32 918, i32 918}
; Verify the else branch is not set to a zero count
-; CHECK-NOT: [[#PROF]] = !{!"branch_weights", i32 16724, i32 0}
+; CHECK-NOT: [[#PROF]] = !{!"branch_weights", i32 1698, i32 0}
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"
@x = dso_local global i32 0, align 4, !dbg !0
-; Function Attrs: noinline nounwind uwtable
-define dso_local void @bar(i32 noundef %i) #0 !dbg !47 !prof !52 {
+; Function Attrs: nofree noinline norecurse nounwind memory(readwrite, argmem: none) uwtable
+define dso_local void @bar(i32 %i) local_unnamed_addr #0 !dbg !18 {
entry:
- #dbg_value(i32 %i, !51, !DIExpression(), !53)
- call void @llvm.pseudoprobe(i64 -2012135647395072713, i64 1, i32 0, i64 -1), !dbg !54
- %0 = load volatile i32, ptr @x, align 4, !dbg !54, !tbaa !55
- %add = add nsw i32 %0, 5, !dbg !54
- store volatile i32 %add, ptr @x, align 4, !dbg !54, !tbaa !55
- ret void, !dbg !59
+ #dbg_value(i32 poison, !22, !DIExpression(), !23)
+ call void @llvm.pseudoprobe(i64 -2012135647395072713, i64 1, i32 0, i64 -1), !dbg !24
+ %0 = load volatile i32, ptr @x, align 4, !dbg !24, !tbaa !25
+ %add = add nsw i32 %0, 5, !dbg !24
+ store volatile i32 %add, ptr @x, align 4, !dbg !24, !tbaa !25
+ ret void, !dbg !29
}
-; Function Attrs: nounwind uwtable
-define dso_local void @baz(i32 noundef %i) #1 !dbg !60 !prof !63 {
+; Function Attrs: nofree norecurse nounwind memory(readwrite, argmem: none) uwtable
+define dso_local void @baz(i32 noundef %i) local_unnamed_addr #1 !dbg !30 {
entry:
- #dbg_value(i32 %i, !62, !DIExpression(), !64)
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 1, i32 0, i64 -1), !dbg !65
- %rem = srem i32 %i, 100, !dbg !67
- %tobool = icmp ne i32 %rem, 0, !dbg !67
- br i1 %tobool, label %if.then, label %if.end, !dbg !68
+ #dbg_value(i32 %i, !32, !DIExpression(), !33)
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 1, i32 0, i64 -1), !dbg !34
+ %rem = srem i32 %i, 100, !dbg !36
+ %tobool.not = icmp eq i32 %rem, 0, !dbg !36
+ br i1 %tobool.not, label %if.end, label %if.then, !dbg !37
if.then: ; preds = %entry
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 2, i32 0, i64 -1), !dbg !69
- %0 = load volatile i32, ptr @x, align 4, !dbg !69, !tbaa !55
- %inc = add nsw i32 %0, 1, !dbg !69
- store volatile i32 %inc, ptr @x, align 4, !dbg !69, !tbaa !55
- br label %if.end, !dbg !70
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 2, i32 0, i64 -1), !dbg !38
+ %0 = load volatile i32, ptr @x, align 4, !dbg !38, !tbaa !25
+ %inc = add nsw i32 %0, 1, !dbg !38
+ store volatile i32 %inc, ptr @x, align 4, !dbg !38, !tbaa !25
+ br label %if.end, !dbg !39
if.end: ; preds = %if.then, %entry
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 3, i32 0, i64 -1), !dbg !71
- %1 = load volatile i32, ptr @x, align 4, !dbg !71, !tbaa !55
- %add = add nsw i32 %1, 2, !dbg !71
- store volatile i32 %add, ptr @x, align 4, !dbg !71, !tbaa !55
- %rem1 = srem i32 %i, 2, !dbg !72
- %tobool2 = icmp ne i32 %rem1, 0, !dbg !72
- br i1 %tobool2, label %if.then3, label %if.else, !dbg !74
-
-if.then3: ; preds = %if.end
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 4, i32 0, i64 -1), !dbg !75
- %2 = load volatile i32, ptr @x, align 4, !dbg !75, !tbaa !55
- %inc4 = add nsw i32 %2, 1, !dbg !75
- store volatile i32 %inc4, ptr @x, align 4, !dbg !75, !tbaa !55
- br label %if.end11, !dbg !76
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 3, i32 0, i64 -1), !dbg !40
+ %1 = load volatile i32, ptr @x, align 4, !dbg !40, !tbaa !25
+ %add = add nsw i32 %1, 2, !dbg !40
+ store volatile i32 %add, ptr @x, align 4, !dbg !40, !tbaa !25
+ %2 = and i32 %i, 1, !dbg !41
+ %tobool2.not = icmp eq i32 %2, 0, !dbg !41
+ br i1 %tobool2.not, label %if.else, label %if.end11, !dbg !43
if.else: ; preds = %if.end
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 5, i32 0, i64 -1), !dbg !77
- %rem5 = srem i32 %i, 3, !dbg !79
- %tobool6 = icmp ne i32 %rem5, 0, !dbg !79
- br i1 %tobool6, label %if.then7, label %if.else9, !dbg !80
-
-if.then7: ; preds = %if.else
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 6, i32 0, i64 -1), !dbg !81
- %3 = load volatile i32, ptr @x, align 4, !dbg !81, !tbaa !55
- %add8 = add nsw i32 %3, 2, !dbg !81
- store volatile i32 %add8, ptr @x, align 4, !dbg !81, !tbaa !55
- br label %if.end11, !dbg !82
-
-if.else9: ; preds = %if.else
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 7, i32 0, i64 -1), !dbg !83
- %4 = load volatile i32, ptr @x, align 4, !dbg !83, !tbaa !55
- %dec = add nsw i32 %4, -1, !dbg !83
- store volatile i32 %dec, ptr @x, align 4, !dbg !83, !tbaa !55
- br label %if.end11
-
-if.end11: ; preds = %if.then7, %if.else9, %if.then3
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 9, i32 0, i64 -1), !dbg !84
- ret void, !dbg !84
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 5, i32 0, i64 -1), !dbg !44
+ %rem5 = srem i32 %i, 3, !dbg !46
+ %tobool6.not = icmp eq i32 %rem5, 0, !dbg !46
+ %spec.select = select i1 %tobool6.not, i32 -1, i32 2, !dbg !47
+ br label %if.end11, !dbg !47
+
+if.end11: ; preds = %if.else, %if.end
+ %.sink14 = phi i32 [ 1, %if.end ], [ %spec.select, %if.else ]
+ %3 = load volatile i32, ptr @x, align 4, !dbg !48, !tbaa !25
+ %add8 = add nsw i32 %3, %.sink14, !dbg !48
+ store volatile i32 %add8, ptr @x, align 4, !dbg !48, !tbaa !25
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 9, i32 0, i64 -1), !dbg !49
+ ret void, !dbg !49
}
-; Function Attrs: nounwind uwtable
-define dso_local i32 @main() #1 !dbg !85 !prof !90 {
+; Function Attrs: nofree norecurse nounwind uwtable
+define dso_local noundef i32 @main() local_unnamed_addr #2 !dbg !50 {
entry:
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 1, i32 0, i64 -1), !dbg !91
- #dbg_value(i32 0, !89, !DIExpression(), !92)
- br label %while.cond, !dbg !93
-
-while.cond: ; preds = %if.end, %entry
- %i.0 = phi i32 [ 0, %entry ], [ %inc, %if.end ], !dbg !92
- #dbg_value(i32 %i.0, !89, !DIExpression(), !92)
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 2, i32 0, i64 -1), !dbg !94
- %inc = add nsw i32 %i.0, 1, !dbg !94
- #dbg_value(i32 %inc, !89, !DIExpression(), !92)
- %cmp = icmp slt i32 %i.0, 160000000, !dbg !95
- br i1 %cmp, label %while.body, label %while.end, !dbg !93, !prof !96
-
-while.body: ; preds = %while.cond
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 3, i32 0, i64 -1), !dbg !97
- %rem = srem i32 %inc, 10, !dbg !100
- %tobool = icmp ne i32 %rem, 0, !dbg !100
- br i1 %tobool, label %if.then, label %if.else, !dbg !101, !prof !102
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 1, i32 0, i64 -1), !dbg !55
+ #dbg_value(i32 0, !54, !DIExpression(), !56)
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 2, i32 0, i64 -1), !dbg !57
+ br label %while.body, !dbg !58
+
+while.body: ; preds = %entry, %if.end
+ %inc7 = phi i32 [ 1, %entry ], [ %inc, %if.end ]
+ %i.06 = phi i32 [ 0, %entry ], [ %inc7, %if.end ]
+ #dbg_value(i32 %i.06, !54, !DIExpression(), !56)
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 3, i32 0, i64 -1), !dbg !59
+ %rem = urem i32 %inc7, 10, !dbg !62
+ %tobool.not = icmp eq i32 %rem, 0, !dbg !62
+ br i1 %tobool.not, label %if.else, label %if.then, !dbg !63
if.then: ; preds = %while.body
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 4, i32 0, i64 -1), !dbg !103
- call void @bar(i32 noundef %inc), !dbg !104, !prof !106
- br label %if.end, !dbg !107
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 4, i32 0, i64 -1), !dbg !64
+ tail call void @bar(i32 poison), !dbg !65
+ br label %if.end, !dbg !67
if.else: ; preds = %while.body
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 6, i32 0, i64 -1), !dbg !108
- #dbg_value(i32 %inc, !62, !DIExpression(), !109)
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 1, i32 0, i64 -1), !dbg !112
- %rem.i = srem i32 %inc, 100, !dbg !113
- %tobool.i = icmp ne i32 %rem.i, 0, !dbg !113
- br i1 %tobool.i, label %if.then.i, label %if.end.i, !dbg !114, !prof !115
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 6, i32 0, i64 -1), !dbg !68
+ #dbg_value(i32 %inc7, !32, !DIExpression(), !69)
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 1, i32 0, i64 -1), !dbg !72
+ %rem.i4 = urem i32 %inc7, 100, !dbg !73
+ %tobool.not.i = icmp eq i32 %rem.i4, 0, !dbg !73
+ br i1 %tobool.not.i, label %if.end.i, label %if.then.i, !dbg !74
if.then.i: ; preds = %if.else
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 2, i32 0, i64 -1), !dbg !116
- %0 = load volatile i32, ptr @x, align 4, !dbg !116, !tbaa !55
- %inc.i = add nsw i32 %0, 1, !dbg !116
- store volatile i32 %inc.i, ptr @x, align 4, !dbg !116, !tbaa !55
- br label %if.end.i, !dbg !117
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 2, i32 0, i64 -1), !dbg !75
+ %0 = load volatile i32, ptr @x, align 4, !dbg !75, !tbaa !25
+ %inc.i = add nsw i32 %0, 1, !dbg !75
+ store volatile i32 %inc.i, ptr @x, align 4, !dbg !75, !tbaa !25
+ br label %if.end.i, !dbg !76
if.end.i: ; preds = %if.then.i, %if.else
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 3, i32 0, i64 -1), !dbg !118
- %1 = load volatile i32, ptr @x, align 4, !dbg !118, !tbaa !55
- %add.i = add nsw i32 %1, 2, !dbg !118
- store volatile i32 %add.i, ptr @x, align 4, !dbg !118, !tbaa !55
- %rem1.i = srem i32 %inc, 2, !dbg !119
- %tobool2.i = icmp ne i32 %rem1.i, 0, !dbg !119
- br i1 %tobool2.i, label %if.then3.i, label %if.else.i, !dbg !120, !prof !121
-
-if.then3.i: ; preds = %if.end.i
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 4, i32 0, i64 -1), !dbg !122
- %2 = load volatile i32, ptr @x, align 4, !dbg !122, !tbaa !55
- %inc4.i = add nsw i32 %2, 1, !dbg !122
- store volatile i32 %inc4.i, ptr @x, align 4, !dbg !122, !tbaa !55
- br label %baz.exit, !dbg !123
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 3, i32 0, i64 -1), !dbg !77
+ %1 = load volatile i32, ptr @x, align 4, !dbg !77, !tbaa !25
+ %add.i = add nsw i32 %1, 2, !dbg !77
+ store volatile i32 %add.i, ptr @x, align 4, !dbg !77, !tbaa !25
+ %2 = and i32 %i.06, 1, !dbg !78
+ %tobool2.not.i.not = icmp eq i32 %2, 0, !dbg !78
+ br i1 %tobool2.not.i.not, label %baz.exit, label %if.else.i, !dbg !79
if.else.i: ; preds = %if.end.i
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 5, i32 0, i64 -1), !dbg !124
- %rem5.i = srem i32 %inc, 3, !dbg !125
- %tobool6.i = icmp ne i32 %rem5.i, 0, !dbg !125
- br i1 %tobool6.i, label %if.then7.i, label %if.else9.i, !dbg !126, !prof !127
-
-if.then7.i: ; preds = %if.else.i
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 6, i32 0, i64 -1), !dbg !128
- %3 = load volatile i32, ptr @x, align 4, !dbg !128, !tbaa !55
- %add8.i = add nsw i32 %3, 2, !dbg !128
- store volatile i32 %add8.i, ptr @x, align 4, !dbg !128, !tbaa !55
- br label %baz.exit, !dbg !129
-
-if.else9.i: ; preds = %if.else.i
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 7, i32 0, i64 -1), !dbg !130
- %4 = load volatile i32, ptr @x, align 4, !dbg !130, !tbaa !55
- %dec.i = add nsw i32 %4, -1, !dbg !130
- store volatile i32 %dec.i, ptr @x, align 4, !dbg !130, !tbaa !55
- br label %baz.exit
-
-baz.exit: ; preds = %if.then3.i, %if.then7.i, %if.else9.i
- call void @llvm.pseudoprobe(i64 7546896869197086323, i64 9, i32 0, i64 -1), !dbg !131
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 5, i32 0, i64 -1), !dbg !80
+ %rem5.i5 = urem i32 %inc7, 3, !dbg !81
+ %tobool6.not.i = icmp eq i32 %rem5.i5, 0, !dbg !81
+ %spec.select.i = select i1 %tobool6.not.i, i32 -1, i32 2, !dbg !82
+ br label %baz.exit, !dbg !82
+
+baz.exit: ; preds = %if.end.i, %if.else.i
+ %.sink14.i = phi i32 [ 1, %if.end.i ], [ %spec.select.i, %if.else.i ]
+ %3 = load volatile i32, ptr @x, align 4, !dbg !83, !tbaa !25
+ %add8.i = add nsw i32 %3, %.sink14.i, !dbg !83
+ store volatile i32 %add8.i, ptr @x, align 4, !dbg !83, !tbaa !25
+ call void @llvm.pseudoprobe(i64 7546896869197086323, i64 9, i32 0, i64 -1), !dbg !84
br label %if.end
if.end: ; preds = %baz.exit, %if.then
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 8, i32 0, i64 -1), !dbg !93
- br label %while.cond, !dbg !93, !llvm.loop !132
-
-while.end: ; preds = %while.cond
- call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 9, i32 0, i64 -1), !dbg !135
- ret i32 0, !dbg !135
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 8, i32 0, i64 -1), !dbg !58
+ #dbg_value(i32 %inc7, !54, !DIExpression(), !56)
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 2, i32 0, i64 -1), !dbg !57
+ %inc = add nuw nsw i32 %inc7, 1, !dbg !57
+ #dbg_value(i32 %inc, !54, !DIExpression(), !56)
+ %exitcond.not = icmp eq i32 %inc, 160000001, !dbg !85
+ br i1 %exitcond.not, label %while.end, label %while.body, !dbg !58, !llvm.loop !86
+
+while.end: ; preds = %if.end
+ call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 9, i32 0, i64 -1), !dbg !89
+ ret i32 0, !dbg !89
}
-; Function Attrs: mustprogress nocallback nofree nosync nounwind willreturn memory(argmem: readwrite)
-declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #2
-
-; Function Attrs: mustprogress nocallback nofree nosync nounwind willreturn memory(argmem: readwrite)
-declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #2
-
; Function Attrs: mustprogress nocallback nofree nosync nounwind willreturn memory(inaccessiblemem: readwrite)
declare void @llvm.pseudoprobe(i64, i64, i32, i64) #3
-attributes #0 = { noinline nounwind uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
-attributes #1 = { nounwind uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
-attributes #2 = { mustprogress nocallback nofree nosync nounwind willreturn memory(argmem: readwrite) }
+attributes #0 = { nofree noinline norecurse nounwind memory(readwrite, argmem: none) uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
+attributes #1 = { nofree norecurse nounwind memory(readwrite, argmem: none) uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
+attributes #2 = { nofree norecurse nounwind uwtable "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cmov,+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile"}
attributes #3 = { mustprogress nocallback nofree nosync nounwind willreturn memory(inaccessiblemem: readwrite) }
!llvm.dbg.cu = !{!2}
-!llvm.module.flags = !{!7, !8, !9, !10, !11, !12, !13, !14}
-!llvm.ident = !{!43}
-!llvm.pseudo_probe_desc = !{!44, !45, !46}
+!llvm.module.flags = !{!7, !8, !9, !10, !11, !12, !13}
+!llvm.ident = !{!14}
+!llvm.pseudo_probe_desc = !{!15, !16, !17}
!0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
!1 = distinct !DIGlobalVariable(name: "x", scope: !2, file: !3, line: 1, type: !5, isLocal: false, isDefinition: true)
!2 = distinct !DICompileUnit(language: DW_LANG_C11, file: !3, producer: "clang version 20.0.0", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, nameTableKind: None)
-!3 = !DIFile(filename: "test.c", directory: "/home/", checksumkind: CSK_MD5, checksum: "b67c15e928f76c51702a59639dbebb4c")
+!3 = !DIFile(filename: "test.c", directory: "/home", checksumkind: CSK_MD5, checksum: "b67c15e928f76c51702a59639dbebb4c")
!4 = !{!0}
!5 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !6)
!6 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
@@ -202,125 +165,79 @@ attributes #3 = { mustprogress nocallback nofree nosync nounwind willreturn memo
!11 = !{i32 7, !"PIE Level", i32 2}
!12 = !{i32 7, !"uwtable", i32 2}
!13 = !{i32 7, !"debug-info-assignment-tracking", i1 true}
-!14 = !{i32 1, !"ProfileSummary", !15}
-!15 = !{!16, !17, !18, !19, !20, !21, !22, !23, !24, !25}
-!16 = !{!"ProfileFormat", !"SampleProfile"}
-!17 = !{!"TotalCount", i64 105360}
-!18 = !{!"MaxCount", i64 16724}
-!19 = !{!"MaxInternalCount", i64 0}
-!20 = !{!"MaxFunctionCount", i64 15026}
-!21 = !{!"NumCounts", i64 14}
-!22 = !{!"NumFunctions", i64 2}
-!23 = !{!"IsPartialProfile", i64 0}
-!24 = !{!"PartialProfileRatio", double 0.000000e+00}
-!25 = !{!"DetailedSummary", !26}
-!26 = !{!27, !28, !29, !30, !31, !32, !33, !34, !35, !36, !37, !38, !39, !40, !41, !42}
-!27 = !{i32 10000, i64 16724, i32 3}
-!28 = !{i32 100000, i64 16724, i32 3}
-!29 = !{i32 200000, i64 16724, i32 3}
-!30 = !{i32 300000, i64 16724, i32 3}
-!31 = !{i32 400000, i64 16724, i32 3}
-!32 = !{i32 500000, i64 15026, i32 5}
-!33 = !{i32 600000, i64 15026, i32 5}
-!34 = !{i32 700000, i64 15026, i32 5}
-!35 = !{i32 800000, i64 14342, i32 6}
-!36 = !{i32 900000, i64 1882, i32 8}
-!37 = !{i32 950000, i64 1872, i32 10}
-!38 = !{i32 990000, i64 1550, i32 12}
-!39 = !{i32 999000, i64 1550, i32 12}
-!40 = !{i32 999900, i64 1550, i32 12}
-!41 = !{i32 999990, i64 1550, i32 12}
-!42 = !{i32 999999, i64 1550, i32 12}
-!43 = !{!"clang version 20.0.0"}
-!44 = !{i64 -2012135647395072713, i64 4294967295, !"bar"}
-!45 = !{i64 7546896869197086323, i64 191430930410, !"baz"}
-!46 = !{i64 -2624081020897602054, i64 563091374530180, !"main"}
-!47 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 3, type: !48, scopeLine: 3, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !50)
-!48 = !DISubroutineType(types: !49)
-!49 = !{null, !6}
-!50 = !{!51}
-!51 = !DILocalVariable(name: "i", arg: 1, scope: !47, file: !3, line: 3, type: !6)
-!52 = !{!"function_entry_count", i64 15026}
-!53 = !DILocation(line: 0, scope: !47)
-!54 = !DILocation(line: 4, column: 5, scope: !47)
-!55 = !{!56, !56, i64 0}
-!56 = !{!"int", !57, i64 0}
-!57 = !{!"omnipotent char", !58, i64 0}
-!58 = !{!"Simple C/C++ TBAA"}
-!59 = !DILocation(line: 8, column: 1, scope: !47)
-!60 = distinct !DISubprogram(name: "baz", scope: !3, file: !3, line: 10, type: !48, scopeLine: 10, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !61)
-!61 = !{!62}
-!62 = !DILocalVariable(name: "i", arg: 1, scope: !60, file: !3, line: 10, type: !6)
-!63 = !{!"function_entry_count", i64 -1}
-!64 = !DILocation(line: 0, scope: !60)
-!65 = !DILocation(line: 11, column: 6, scope: !66)
-!66 = distinct !DILexicalBlock(scope: !60, file: !3, line: 11, column: 6)
-!67 = !DILocation(line: 11, column: 7, scope: !66)
-!68 = !DILocation(line: 11, column: 6, scope: !60)
-!69 = !DILocation(line: 12, column: 6, scope: !66)
-!70 = !DILocation(line: 12, column: 5, scope: !66)
-!71 = !DILocation(line: 14, column: 5, scope: !60)
-!72 = !DILocation(line: 15, column: 9, scope: !73)
-!73 = distinct !DILexicalBlock(scope: !60, file: !3, line: 15, column: 7)
-!74 = !DILocation(line: 15, column: 7, scope: !60)
-!75 = !DILocation(line: 16, column: 7, scope: !73)
-!76 = !DILocation(line: 16, column: 6, scope: !73)
-!77 = !DILocation(line: 17, column: 12, scope: !78)
-!78 = distinct !DILexicalBlock(scope: !73, file: !3, line: 17, column: 12)
-!79 = !DILocation(line: 17, column: 14, scope: !78)
-!80 = !DILocation(line: 17, column: 12, scope: !73)
-!81 = !DILocation(line: 18, column: 7, scope: !78)
-!82 = !DILocation(line: 18, column: 6, scope: !78)
-!83 = !DILocation(line: 20, column: 7, scope: !78)
-!84 = !DILocation(line: 21, column: 1, scope: !60)
-!85 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 23, type: !86, scopeLine: 23, flags: DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !88)
-!86 = !DISubroutineType(types: !87)
-!87 = !{!6}
-!88 = !{!89}
-!89 = !DILocalVariable(name: "i", scope: !85, file: !3, line: 24, type: !6)
-!90 = !{!"function_entry_count", i64 1}
-!91 = !DILocation(line: 24, column: 7, scope: !85)
-!92 = !DILocation(line: 0, scope: !85)
-!93 = !DILocation(line: 25, column: 3, scope: !85)
-!94 = !DILocation(line: 25, column: 11, scope: !85)
-!95 = !DILocation(line: 25, column: 14, scope: !85)
-!96 = !{!"branch_weights", i32 16724, i32 1}
-!97 = !DILocation(line: 26, column: 8, scope: !98)
-!98 = distinct !DILexicalBlock(scope: !99, file: !3, line: 26, column: 8)
-!99 = distinct !DILexicalBlock(scope: !85, file: !3, line: 25, column: 30)
-!100 = !DILocation(line: 26, column: 10, scope: !98)
-!101 = !DILocation(line: 26, column: 8, scope: !99)
-!102 = !{!"branch_weights", i32 14852, i32 1872}
-!103 = !DILocation(line: 27, column: 10, scope: !98)
-!104 = !DILocation(line: 27, column: 6, scope: !105)
-!105 = !DILexicalBlockFile(scope: !98, file: !3, discriminator: 455082031)
-!106 = !{!"branch_weights", i32 14852}
-!107 = !DILocation(line: 27, column: 6, scope: !98)
-!108 = !DILocation(line: 29, column: 10, scope: !98)
-!109 = !DILocation(line: 0, scope: !60, inlinedAt: !110)
-!110 = distinct !DILocation(line: 29, column: 6, scope: !111)
-!111 = !DILexicalBlockFile(scope: !98, file: !3, discriminator: 455082047)
-!112 = !DILocation(line: 11, column: 6, scope: !66, inlinedAt: !110)
-!113 = !DILocation(line: 11, column: 7, scope: !66, inlinedAt: !110)
-!114 = !DILocation(line: 11, column: 6, scope: !60, inlinedAt: !110)
-!115 = !{!"branch_weights", i32 1736, i32 136}
-!116 = !DILocation(line: 12, column: 6, scope: !66, inlinedAt: !110)
-!117 = !DILocation(line: 12, column: 5, scope: !66, inlinedAt: !110)
-!118 = !DILocation(line: 14, column: 5, scope: !60, inlinedAt: !110)
-!119 = !DILocation(line: 15, column: 9, scope: !73, inlinedAt: !110)
-!120 = !DILocation(line: 15, column: 7, scope: !60, inlinedAt: !110)
-!121 = !{!"branch_weights", i32 0, i32 1872}
-!122 = !DILocation(line: 16, column: 7, scope: !73, inlinedAt: !110)
-!123 = !DILocation(line: 16, column: 6, scope: !73, inlinedAt: !110)
-!124 = !DILocation(line: 17, column: 12, scope: !78, inlinedAt: !110)
-!125 = !DILocation(line: 17, column: 14, scope: !78, inlinedAt: !110)
-!126 = !DILocation(line: 17, column: 12, scope: !73, inlinedAt: !110)
-!127 = !{!"branch_weights", i32 936, i32 936}
-!128 = !DILocation(line: 18, column: 7, scope: !78, inlinedAt: !110)
-!129 = !DILocation(line: 18, column: 6, scope: !78, inlinedAt: !110)
-!130 = !DILocation(line: 20, column: 7, scope: !78, inlinedAt: !110)
-!131 = !DILocation(line: 21, column: 1, scope: !60, inlinedAt: !110)
-!132 = distinct !{!132, !93, !133, !134}
-!133 = !DILocation(line: 30, column: 3, scope: !85)
-!134 = !{!"llvm.loop.mustprogress"}
-!135 = !DILocation(line: 31, column: 3, scope: !85)
+!14 = !{!"clang version 20.0.0"}
+!15 = !{i64 -2012135647395072713, i64 4294967295, !"bar"}
+!16 = !{i64 7546896869197086323, i64 191430930410, !"baz"}
+!17 = !{i64 -2624081020897602054, i64 563091374530180, !"main"}
+!18 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 3, type: !19, scopeLine: 3, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !21)
+!19 = !DISubroutineType(types: !20)
+!20 = !{null, !6}
+!21 = !{!22}
+!22 = !DILocalVariable(name: "i", arg: 1, scope: !18, file: !3, line: 3, type: !6)
+!23 = !DILocation(line: 0, scope: !18)
+!24 = !DILocation(line: 4, column: 5, scope: !18)
+!25 = !{!26, !26, i64 0}
+!26 = !{!"int", !27, i64 0}
+!27 = !{!"omnipotent char", !28, i64 0}
+!28 = !{!"Simple C/C++ TBAA"}
+!29 = !DILocation(line: 8, column: 1, scope: !18)
+!30 = distinct !DISubprogram(name: "baz", scope: !3, file: !3, line: 10, type: !19, scopeLine: 10, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !31)
+!31 = !{!32}
+!32 = !DILocalVariable(name: "i", arg: 1, scope: !30, file: !3, line: 10, type: !6)
+!33 = !DILocation(line: 0, scope: !30)
+!34 = !DILocation(line: 11, column: 6, scope: !35)
+!35 = distinct !DILexicalBlock(scope: !30, file: !3, line: 11, column: 6)
+!36 = !DILocation(line: 11, column: 7, scope: !35)
+!37 = !DILocation(line: 11, column: 6, scope: !30)
+!38 = !DILocation(line: 12, column: 6, scope: !35)
+!39 = !DILocation(line: 12, column: 5, scope: !35)
+!40 = !DILocation(line: 14, column: 5, scope: !30)
+!41 = !DILocation(line: 15, column: 9, scope: !42)
+!42 = distinct !DILexicalBlock(scope: !30, file: !3, line: 15, column: 7)
+!43 = !DILocation(line: 15, column: 7, scope: !30)
+!44 = !DILocation(line: 17, column: 12, scope: !45)
+!45 = distinct !DILexicalBlock(scope: !42, file: !3, line: 17, column: 12)
+!46 = !DILocation(line: 17, column: 14, scope: !45)
+!47 = !DILocation(line: 17, column: 12, scope: !42)
+!48 = !DILocation(line: 0, scope: !42)
+!49 = !DILocation(line: 21, column: 1, scope: !30)
+!50 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 23, type: !51, scopeLine: 23, flags: DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !53)
+!51 = !DISubroutineType(types: !52)
+!52 = !{!6}
+!53 = !{!54}
+!54 = !DILocalVariable(name: "i", scope: !50, file: !3, line: 24, type: !6)
+!55 = !DILocation(line: 24, column: 7, scope: !50)
+!56 = !DILocation(line: 0, scope: !50)
+!57 = !DILocation(line: 25, column: 11, scope: !50)
+!58 = !DILocation(line: 25, column: 3, scope: !50)
+!59 = !DILocation(line: 26, column: 8, scope: !60)
+!60 = distinct !DILexicalBlock(scope: !61, file: !3, line: 26, column: 8)
+!61 = distinct !DILexicalBlock(scope: !50, file: !3, line: 25, column: 30)
+!62 = !DILocation(line: 26, column: 10, scope: !60)
+!63 = !DILocation(line: 26, column: 8, scope: !61)
+!64 = !DILocation(line: 27, column: 10, scope: !60)
+!65 = !DILocation(line: 27, column: 6, scope: !66)
+!66 = !DILexicalBlockFile(scope: !60, file: !3, discriminator: 455082031)
+!67 = !DILocation(line: 27, column: 6, scope: !60)
+!68 = !DILocation(line: 29, column: 10, scope: !60)
+!69 = !DILocation(line: 0, scope: !30, inlinedAt: !70)
+!70 = distinct !DILocation(line: 29, column: 6, scope: !71)
+!71 = !DILexicalBlockFile(scope: !60, file: !3, discriminator: 455082047)
+!72 = !DILocation(line: 11, column: 6, scope: !35, inlinedAt: !70)
+!73 = !DILocation(line: 11, column: 7, scope: !35, inlinedAt: !70)
+!74 = !DILocation(line: 11, column: 6, scope: !30, inlinedAt: !70)
+!75 = !DILocation(line: 12, column: 6, scope: !35, inlinedAt: !70)
+!76 = !DILocation(line: 12, column: 5, scope: !35, inlinedAt: !70)
+!77 = !DILocation(line: 14, column: 5, scope: !30, inlinedAt: !70)
+!78 = !DILocation(line: 15, column: 9, scope: !42, inlinedAt: !70)
+!79 = !DILocation(line: 15, column: 7, scope: !30, inlinedAt: !70)
+!80 = !DILocation(line: 17, column: 12, scope: !45, inlinedAt: !70)
+!81 = !DILocation(line: 17, column: 14, scope: !45, inlinedAt: !70)
+!82 = !DILocation(line: 17, column: 12, scope: !42, inlinedAt: !70)
+!83 = !DILocation(line: 0, scope: !42, inlinedAt: !70)
+!84 = !DILocation(line: 21, column: 1, scope: !30, inlinedAt: !70)
+!85 = !DILocation(line: 25, column: 14, scope: !50)
+!86 = distinct !{!86, !58, !87, !88}
+!87 = !DILocation(line: 30, column: 3, scope: !50)
+!88 = !{!"llvm.loop.mustprogress"}
+!89 = !DILocation(line: 31, column: 3, scope: !50)
More information about the llvm-commits
mailing list