aboutsummaryrefslogtreecommitdiff
path: root/llvm/lib/Target/CellSPU/SPUTargetMachine.cpp
diff options
context:
space:
mode:
authorKalle Raiskila <kalle.raiskila@nokia.com>2011-01-11 09:07:54 +0000
committerKalle Raiskila <kalle.raiskila@nokia.com>2011-01-11 09:07:54 +0000
commitbe9ad1e63183133c2b51d38b2d6ffe5fdaf93de9 (patch)
treed2ef5fc4e00d53261babd0fb5965b558e29d924e /llvm/lib/Target/CellSPU/SPUTargetMachine.cpp
parent23bf3bafb71107523987b59ef1b206987401a8d1 (diff)
downloadllvm-be9ad1e63183133c2b51d38b2d6ffe5fdaf93de9.zip
llvm-be9ad1e63183133c2b51d38b2d6ffe5fdaf93de9.tar.gz
llvm-be9ad1e63183133c2b51d38b2d6ffe5fdaf93de9.tar.bz2
Add a "nop filler" pass to SPU.
Filling no-ops is done just before emitting of assembly, when the instruction stream is final. No-ops are inserted to align the instructions so the dual-issue of the pipeline is utilized. This speeds up generated code with a minimum of 1% on a select set of algorithms. This pass may be redundant if the instruction scheduler and all subsequent passes that modify the instruction stream (prolog+epilog inserter, register scavenger, are there others?) are made aware of the instruction alignments. llvm-svn: 123226
Diffstat (limited to 'llvm/lib/Target/CellSPU/SPUTargetMachine.cpp')
-rw-r--r--llvm/lib/Target/CellSPU/SPUTargetMachine.cpp9
1 files changed, 9 insertions, 0 deletions
diff --git a/llvm/lib/Target/CellSPU/SPUTargetMachine.cpp b/llvm/lib/Target/CellSPU/SPUTargetMachine.cpp
index 3423c69..3ed7361 100644
--- a/llvm/lib/Target/CellSPU/SPUTargetMachine.cpp
+++ b/llvm/lib/Target/CellSPU/SPUTargetMachine.cpp
@@ -59,3 +59,12 @@ bool SPUTargetMachine::addInstSelector(PassManagerBase &PM,
PM.add(createSPUISelDag(*this));
return false;
}
+
+// passes to run just before printing the assembly
+bool SPUTargetMachine::
+addPreEmitPass(PassManagerBase &PM, CodeGenOpt::Level OptLevel)
+{
+ //align instructions with nops/lnops for dual issue
+ PM.add(createSPUNopFillerPass(*this));
+ return true;
+}