Merging r205738:

------------------------------------------------------------------------
r205738 | atrick | 2014-04-07 17:29:22 -0400 (Mon, 07 Apr 2014) | 16 lines

Put a limit on ScheduleDAGSDNodes::ClusterNeighboringLoads to avoid blowing up compile time.

Fixes PR16365 - Extremely slow compilation in -O1 and -O2.

The SD scheduler has a quadratic implementation of load clustering which absolutely blows up compile time for large blocks with constant pool loads.

The MI scheduler has a better implementation of load clustering. However, we have not done the work yet to completely eliminate the SD scheduler. Some benchmarks still seem to benefit from early load clustering, although maybe by chance.

As an intermediate term fix, I just put a nice limit on the number of DAG users to search before finding a match. With this limit there are no binary differences in the LLVM test suite, and the PR16365 test case does not suffer any compile time impact from this routine.
------------------------------------------------------------------------

llvm-svn: 205808
author: Tom Stellard <thomas.stellard@amd.com> 2014-04-08 21:47:17 +0000
committer: Tom Stellard <thomas.stellard@amd.com> 2014-04-08 21:47:17 +0000
commit: dcd1b1bd76510caa18700ff6cea045cc5f409108 (patch)
tree: 3b070e476b67819a095f3ae06a6d2e14e9278a3d
parent: 67415166176bc52ced5461c3f6cc083e069dc777 (diff)
download: llvm-dcd1b1bd76510caa18700ff6cea045cc5f409108.zip
llvm-dcd1b1bd76510caa18700ff6cea045cc5f409108.tar.gz
llvm-dcd1b1bd76510caa18700ff6cea045cc5f409108.tar.bz2
1 file changed, 6 insertions, 1 deletion
diff --git a/llvm/lib/CodeGen/SelectionDAG/ScheduleDAGSDNodes.cpp b/llvm/lib/CodeGen/SelectionDAG/ScheduleDAGSDNodes.cpp
index 054e3dd..c1893c9 100644
--- a/llvm/lib/CodeGen/SelectionDAG/ScheduleDAGSDNodes.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/ScheduleDAGSDNodes.cpp
@@ -219,8 +219,11 @@ void ScheduleDAGSDNodes::ClusterNeighboringLoads(SDNode *Node) {
   DenseMap<long long, SDNode*> O2SMap;  // Map from offset to SDNode.
   bool Cluster = false;
   SDNode *Base = Node;
+  // This algorithm requires a reasonably low use count before finding a match
+  // to avoid uselessly blowing up compile time in large blocks.
+  unsigned UseCount = 0;
   for (SDNode::use_iterator I = Chain->use_begin(), E = Chain->use_end();
-       I != E; ++I) {
+       I != E && UseCount < 100; ++I, ++UseCount) {
     SDNode *User = *I;
     if (User == Node || !Visited.insert(User))
       continue;
@@ -237,6 +240,8 @@ void ScheduleDAGSDNodes::ClusterNeighboringLoads(SDNode *Node) {
     if (Offset2 < Offset1)
       Base = User;
     Cluster = true;
+    // Reset UseCount to allow more matches.
+    UseCount = 0;
   }
 
   if (!Cluster)
author	Tom Stellard <thomas.stellard@amd.com>	2014-04-08 21:47:17 +0000
committer	Tom Stellard <thomas.stellard@amd.com>	2014-04-08 21:47:17 +0000
commit	dcd1b1bd76510caa18700ff6cea045cc5f409108 (patch)
tree	3b070e476b67819a095f3ae06a6d2e14e9278a3d
parent	67415166176bc52ced5461c3f6cc083e069dc777 (diff)
download	llvm-dcd1b1bd76510caa18700ff6cea045cc5f409108.zip llvm-dcd1b1bd76510caa18700ff6cea045cc5f409108.tar.gz llvm-dcd1b1bd76510caa18700ff6cea045cc5f409108.tar.bz2