[llvm] [MemProf] Refactor backedge computation and invoke earlier (PR #128226)
via llvm-commits
llvm-commits at lists.llvm.org
Fri Feb 21 12:48:28 PST 2025
llvmbot wrote:
<!--LLVM PR SUMMARY COMMENT-->
@llvm/pr-subscribers-llvm-transforms
Author: Teresa Johnson (teresajohnson)
<details>
<summary>Changes</summary>
Invoke the backedge computation (refactored as a new method) at the end
of the graph construction, instead of at the start of cloning. That
makes more logical sense, and it also makes it easier to look at the
results in the postbuild dot graph with a follow on change to display
those differently.
---
Full diff: https://github.com/llvm/llvm-project/pull/128226.diff
1 Files Affected:
- (modified) llvm/lib/Transforms/IPO/MemProfContextDisambiguation.cpp (+29-15)
``````````diff
diff --git a/llvm/lib/Transforms/IPO/MemProfContextDisambiguation.cpp b/llvm/lib/Transforms/IPO/MemProfContextDisambiguation.cpp
index 8bfbb2c348459..705806b98f8da 100644
--- a/llvm/lib/Transforms/IPO/MemProfContextDisambiguation.cpp
+++ b/llvm/lib/Transforms/IPO/MemProfContextDisambiguation.cpp
@@ -530,6 +530,9 @@ class CallsiteContextGraph {
/// multiple different callee target functions.
void handleCallsitesWithMultipleTargets();
+ /// Mark backedges via the standard DFS based backedge algorithm.
+ void markBackedges();
+
// Try to partition calls on the given node (already placed into the AllCalls
// array) by callee function, creating new copies of Node as needed to hold
// calls with different callees, and moving the callee edges appropriately.
@@ -740,6 +743,7 @@ class CallsiteContextGraph {
void moveCalleeEdgeToNewCaller(const std::shared_ptr<ContextEdge> &Edge,
ContextNode *NewCaller);
+ /// Recursive helper for marking backedges via DFS.
void markBackedges(ContextNode *Node, DenseSet<const ContextNode *> &Visited,
DenseSet<const ContextNode *> &CurrentStack);
@@ -2108,6 +2112,8 @@ ModuleCallsiteContextGraph::ModuleCallsiteContextGraph(
handleCallsitesWithMultipleTargets();
+ markBackedges();
+
// Strip off remaining callsite metadata, no longer needed.
for (auto &FuncEntry : FuncToCallsWithMetadata)
for (auto &Call : FuncEntry.second)
@@ -2204,6 +2210,8 @@ IndexCallsiteContextGraph::IndexCallsiteContextGraph(
updateStackNodes();
handleCallsitesWithMultipleTargets();
+
+ markBackedges();
}
template <typename DerivedCCG, typename FuncTy, typename CallTy>
@@ -3405,6 +3413,27 @@ void CallsiteContextGraph<DerivedCCG, FuncTy, CallTy>::
// This is the standard DFS based backedge discovery algorithm.
template <typename DerivedCCG, typename FuncTy, typename CallTy>
+void CallsiteContextGraph<DerivedCCG, FuncTy, CallTy>::markBackedges() {
+ // If we are cloning recursive contexts, find and mark backedges from all root
+ // callers, using the typical DFS based backedge analysis.
+ if (!CloneRecursiveContexts)
+ return;
+ DenseSet<const ContextNode *> Visited;
+ DenseSet<const ContextNode *> CurrentStack;
+ for (auto &Entry : NonAllocationCallToContextNodeMap) {
+ auto *Node = Entry.second;
+ if (Node->isRemoved())
+ continue;
+ // It is a root if it doesn't have callers.
+ if (!Node->CallerEdges.empty())
+ continue;
+ markBackedges(Node, Visited, CurrentStack);
+ assert(CurrentStack.empty());
+ }
+}
+
+// Recursive helper for above markBackedges method.
+template <typename DerivedCCG, typename FuncTy, typename CallTy>
void CallsiteContextGraph<DerivedCCG, FuncTy, CallTy>::markBackedges(
ContextNode *Node, DenseSet<const ContextNode *> &Visited,
DenseSet<const ContextNode *> &CurrentStack) {
@@ -3429,22 +3458,7 @@ void CallsiteContextGraph<DerivedCCG, FuncTy, CallTy>::markBackedges(
template <typename DerivedCCG, typename FuncTy, typename CallTy>
void CallsiteContextGraph<DerivedCCG, FuncTy, CallTy>::identifyClones() {
- // If we are cloning recursive contexts, find and mark backedges from all root
- // callers, using the typical DFS based backedge analysis.
DenseSet<const ContextNode *> Visited;
- if (CloneRecursiveContexts) {
- DenseSet<const ContextNode *> CurrentStack;
- for (auto &Entry : NonAllocationCallToContextNodeMap) {
- auto *Node = Entry.second;
- if (Node->isRemoved())
- continue;
- // It is a root if it doesn't have callers.
- if (!Node->CallerEdges.empty())
- continue;
- markBackedges(Node, Visited, CurrentStack);
- assert(CurrentStack.empty());
- }
- }
for (auto &Entry : AllocationCallToContextNodeMap) {
Visited.clear();
identifyClones(Entry.second, Visited, Entry.second->getContextIds());
``````````
</details>
https://github.com/llvm/llvm-project/pull/128226
More information about the llvm-commits
mailing list