Bug 1959074 - Use a less-obviously-quadratic-time innermost-loop finder for loop unrolling. r=iain.

The MIR loop unroller in bug 1950284 uses a somewhat simplistic algorithm for finding innermost loops (for unrolling). This commit changes it to use the scheme shown at the end of BacktrackingAllocator::init(). This both simplifies the code and avoids the need to compare every loop in a function against every other loop in that function, in order to establish which ones are innermost. It thereby removes a potential quadratic cost. Differential Revision: https://phabricator.services.mozilla.com/D248931
2025-05-12 18:58:59 +00:00
parent 851a4124e0
commit af5578e3c5
1 changed files with 44 additions and 74 deletions
--- a/js/src/jit/UnrollLoops.cpp
+++ b/js/src/jit/UnrollLoops.cpp
@@ -1689,18 +1689,45 @@ bool FindInitialCandidates(MIRGraph& graph,
  // Find initial candidate loops, and place them in `initialCandidates`.
  MOZ_ASSERT(initialCandidates.empty());

-  // TODO: possibly use a linear-time algorithm to find innermost loops, as
-  // BackTrackingAllocator.cpp does, rather than the scheme below.
-  // See bug 1959074.
+  // First, using a single scan over the blocks, find blocks that are the
+  // headers of innermost loops.  This uses the same logic to find innermost
+  // loops as BacktrackingAllocator::init.
+  //
+  // The general idea is: we traverse the entire graph in RPO order, but ignore
+  // all blocks except loop headers and loop backedge blocks.  At a header we
+  // make a note of the backedge block it points at.  Because the loops are
+  // properly nested, this means that we will ignore backedges for
+  // non-innermost loops, and, so, when we do come to a block that matches
+  // `backedge`, we know we've identified an innermost loop.
+  //
+  // At the same time, release-assert that the blocks are numbered
+  // sequentially.  We need this for the loop-non-overlapping check below.
+  mozilla::Vector<MBasicBlock*, 128, SystemAllocPolicy> initialHeaders;
+  {
+    MBasicBlock* backedge = nullptr;
+    uint32_t expectedNextId = 0;
+    for (auto rpoIter(graph.rpoBegin()), rpoIterEnd(graph.rpoEnd());
+         rpoIter != rpoIterEnd; ++rpoIter) {
+      MBasicBlock* block = *rpoIter;
+      MOZ_RELEASE_ASSERT(block->id() == expectedNextId);
+      expectedNextId++;

-  // Collect up the loops in the function.  The iteration order doesn't matter
-  // here, but we have to choose something.
-  for (auto rpoIter(graph.rpoBegin()), rpoIterEnd(graph.rpoEnd());
-       rpoIter != rpoIterEnd; ++rpoIter) {
-    MBasicBlock* header = *rpoIter;
-    if (!header->isLoopHeader()) {
-      continue;
+      if (block->isLoopHeader()) {
+        backedge = block->backedge();
+      }
+      if (block == backedge) {
+        if (!initialHeaders.append(block->loopHeaderOfBackedge())) {
+          return false;
+        }
+      }
    }
+  }
+
+  // Now use MarkLoopBlocks to check each potential loop in more detail, and,
+  // for each non-empty, non-OSR one, create an entry in initialCandidates for
+  // it.
+  for (MBasicBlock* header : initialHeaders) {
+    MOZ_ASSERT(header->isLoopHeader());

    bool hasOsrEntry;
    size_t numBlocks = MarkLoopBlocks(graph, header, &hasOsrEntry);
@@ -1720,77 +1747,20 @@ bool FindInitialCandidates(MIRGraph& graph,
    }
  }

-  // Sort the loops by size (in blocks).
-  std::sort(initialCandidates.begin(), initialCandidates.end(),
-            [](const InitialCandidate& cand1, const InitialCandidate& cand2) {
-              return cand1.numBlocks < cand2.numBlocks;
-            });
-
-  // Remove non-innermost candidates from consideration.  We expect
-  // `initialCandidates` to describe contiguous, properly nested candidates.
-  // For each loop in `initialCandidates`, scan forwards in the vector and mark
-  // as invalid, any subsequent loops that contain it.
-  for (size_t i = 0; i < initialCandidates.length(); i++) {
-    const InitialCandidate& candI = initialCandidates[i];
-    MOZ_ASSERT(candI.numBlocks > 0);
-
-    for (size_t j = i + 1; j < initialCandidates.length(); j++) {
-      InitialCandidate& candJ = initialCandidates[j];
-      MOZ_ASSERT(candJ.numBlocks > 0);
-      // Because sorted by size:
-      MOZ_ASSERT(candI.numBlocks <= candJ.numBlocks);
-      if (!candJ.valid) {
-        // Already invalidated
-        continue;
-      }
-
-      // Determine relationship of I vs J.  Either non-overlapping, or I is
-      // completely contained inside J.  In which case invalidate J.
-      MOZ_ASSERT(candI.numBlocks > 0);
-      if (candI.header->id() + candI.numBlocks <= candJ.header->id()) {
-        continue;  // no overlap
-      }
-      if (candJ.header->id() + candJ.numBlocks <= candI.header->id()) {
-        continue;  // no overlap
-      }
-      // "I is completely contained within J"
-      MOZ_ASSERT(candJ.header->id() <= candI.header->id());
-      MOZ_ASSERT(candI.header->id() + candI.numBlocks <=
-                 candJ.header->id() + candJ.numBlocks);
-      // and they aren't identical
-      MOZ_ASSERT(candI.header->id() != candJ.header->id() ||
-                 candI.numBlocks != candJ.numBlocks);
-      candJ.valid = false;
-    }
-  }
-
-  // Slide the valid ones to the start of the vector and sort by starting block
-  // ID.  This makes it easy to verify that the cands are non-overlapping.
-  {
-    size_t wr = 0;
-    size_t rd;
-    for (rd = 0; rd < initialCandidates.length(); rd++) {
-      if (initialCandidates[rd].valid) {
-        initialCandidates[wr++] = initialCandidates[rd];
-      }
-    }
-    while (wr < rd) {
-      initialCandidates.popBack();
-      wr++;
-    }
-  }
-
  // Sort the loops by header ID.
  std::sort(initialCandidates.begin(), initialCandidates.end(),
            [](const InitialCandidate& cand1, const InitialCandidate& cand2) {
              return cand1.header->id() < cand2.header->id();
            });

-  // Now we can conveniently assert non-overlappingness.
+  // Now we can conveniently assert non-overlappingness.  Note that this
+  // depends on the property that each loop is a sequential sequence of block
+  // IDs, as we release-asserted above.  Presence of an overlap might indicate
+  // that a non-innermost loop made it this far.
  for (size_t i = 1; i < initialCandidates.length(); i++) {
-    MOZ_ASSERT(initialCandidates[i - 1].header->id() +
-                   initialCandidates[i - 1].numBlocks <=
-               initialCandidates[i].header->id());
+    MOZ_RELEASE_ASSERT(initialCandidates[i - 1].header->id() +
+                       initialCandidates[i - 1].numBlocks <=
+                       initialCandidates[i].header->id());
  }

  // Heuristics: calculate a "score" for each loop, indicating our desire to