[MachineOutliner] Efficient Implementation of MachineOutliner::findCandidates() (#90260)

This reduce the time complexity of the main loop of `findCandidates()` method from $O(n^2)$ to $O(n \log n)$. For small $n$, the modification does not regress the build time, but it helps significantly when $n$ is large. For one application, this reduces the runtime of the main loop from 120 seconds to 28 seconds. This is the first commit for an enhanced version of machine outliner -- see [RFC](https://discourse.llvm.org/t/rfc-enhanced-machine-outliner-part-1-fulllto-part-2-thinlto-nolto-to-come/78732).
author: Xuan Zhang <144393379+xuanzh-meta@users.noreply.github.com> 2024-06-03 10:41:49 -0400
committer: GitHub <noreply@github.com> 2024-06-03 07:41:49 -0700
commit: 16c925ab5fd3d677792ce6575f81774c64b87cec (patch)
tree: d7d6c0f10e41260a5033fbe59911d6b71e7ea23c /llvm/lib/CodeGen/MachineOutliner.cpp
parent: 138856292235e4c805f2616b56ac09be5017f355 (diff)
download: llvm-16c925ab5fd3d677792ce6575f81774c64b87cec.zip
llvm-16c925ab5fd3d677792ce6575f81774c64b87cec.tar.gz
llvm-16c925ab5fd3d677792ce6575f81774c64b87cec.tar.bz2
1 files changed, 11 insertions, 10 deletions
diff --git a/llvm/lib/CodeGen/MachineOutliner.cpp b/llvm/lib/CodeGen/MachineOutliner.cpp
index f174dd8..626e577 100644
--- a/llvm/lib/CodeGen/MachineOutliner.cpp
+++ b/llvm/lib/CodeGen/MachineOutliner.cpp
@@ -584,7 +584,7 @@ void MachineOutliner::findCandidates(
   LLVM_DEBUG(dbgs() << "*** Discarding overlapping candidates *** \n");
   LLVM_DEBUG(
       dbgs() << "Searching for overlaps in all repeated sequences...\n");
-  for (const SuffixTree::RepeatedSubstring &RS : ST) {
+  for (SuffixTree::RepeatedSubstring &RS : ST) {
     CandidatesForRepeatedSeq.clear();
     unsigned StringLen = RS.Length;
     LLVM_DEBUG(dbgs() << "  Sequence length: " << StringLen << "\n");
@@ -593,6 +593,9 @@ void MachineOutliner::findCandidates(
     unsigned NumDiscarded = 0;
     unsigned NumKept = 0;
 #endif
+    // Sort the start indices so that we can efficiently check if candidates
+    // overlap with the ones we've already found for this sequence.
+    llvm::sort(RS.StartIndices);
     for (const unsigned &StartIdx : RS.StartIndices) {
       // Trick: Discard some candidates that would be incompatible with the
       // ones we've already found for this sequence. This will save us some
@@ -616,17 +619,15 @@ void MachineOutliner::findCandidates(
       // * End before the other starts
       // * Start after the other ends
       unsigned EndIdx = StartIdx + StringLen - 1;
-      auto FirstOverlap = find_if(
-          CandidatesForRepeatedSeq, [StartIdx, EndIdx](const Candidate &C) {
-            return EndIdx >= C.getStartIdx() && StartIdx <= C.getEndIdx();
-          });
-      if (FirstOverlap != CandidatesForRepeatedSeq.end()) {
+      if (!CandidatesForRepeatedSeq.empty() &&
+          StartIdx <= CandidatesForRepeatedSeq.back().getEndIdx()) {
 #ifndef NDEBUG
         ++NumDiscarded;
-        LLVM_DEBUG(dbgs() << "    .. DISCARD candidate @ [" << StartIdx
-                          << ", " << EndIdx << "]; overlaps with candidate @ ["
-                          << FirstOverlap->getStartIdx() << ", "
-                          << FirstOverlap->getEndIdx() << "]\n");
+        LLVM_DEBUG(dbgs() << "    .. DISCARD candidate @ [" << StartIdx << ", "
+                          << EndIdx << "]; overlaps with candidate @ ["
+                          << CandidatesForRepeatedSeq.back().getStartIdx()
+                          << ", " << CandidatesForRepeatedSeq.back().getEndIdx()
+                          << "]\n");
 #endif
         continue;
       }
author	Xuan Zhang <144393379+xuanzh-meta@users.noreply.github.com>	2024-06-03 10:41:49 -0400
committer	GitHub <noreply@github.com>	2024-06-03 07:41:49 -0700
commit	16c925ab5fd3d677792ce6575f81774c64b87cec (patch)
tree	d7d6c0f10e41260a5033fbe59911d6b71e7ea23c /llvm/lib/CodeGen/MachineOutliner.cpp
parent	138856292235e4c805f2616b56ac09be5017f355 (diff)
download	llvm-16c925ab5fd3d677792ce6575f81774c64b87cec.zip llvm-16c925ab5fd3d677792ce6575f81774c64b87cec.tar.gz llvm-16c925ab5fd3d677792ce6575f81774c64b87cec.tar.bz2