TailRecursionElimination.cpp revision 3fc6ef1bb96d9a3194cef667a2d3cbc94e3fb189
//===- TailRecursionElimination.cpp - Eliminate Tail Calls ----------------===//
//
// This file implements tail recursion elimination.
//
// Caveats: The algorithm implemented is trivially simple.  There are several
// improvements that could be made:
//
//  1. If the function has any alloca instructions, these instructions will not
//     remain in the entry block of the function.  Doing this requires analysis
//     to prove that the alloca is not reachable by the recursively invoked
//     function call.
//  2. Tail recursion is only performed if the call immediately precedes the
//     return instruction.  Would it be useful to generalize this somehow?
//  3. TRE is only performed if the function returns void or if the return
//     returns the result returned by the call.  It is possible, but unlikely,
//     that the return returns something else (like constant 0), and can still
//     be TRE'd.  It can be TRE'd if ALL OTHER return instructions in the
//     function return the exact same value.
//
//===----------------------------------------------------------------------===//
212240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
223fc6ef1bb96d9a3194cef667a2d3cbc94e3fb189Chris Lattner#include "llvm/Transforms/Scalar.h"
232240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner#include "llvm/DerivedTypes.h"
242240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner#include "llvm/Function.h"
252240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner#include "llvm/Instructions.h"
262240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner#include "llvm/Pass.h"
272240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner#include "Support/Statistic.h"
282240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
292240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattnernamespace {
302240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  Statistic<> NumEliminated("tailcallelim", "Number of tail calls removed");
312240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
322240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  struct TailCallElim : public FunctionPass {
332240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner    virtual bool runOnFunction(Function &F);
342240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  };
352240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  RegisterOpt<TailCallElim> X("tailcallelim", "Tail Call Elimination");
362240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner}
372240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
383fc6ef1bb96d9a3194cef667a2d3cbc94e3fb189Chris LattnerFunctionPass *createTailCallEliminationPass() { return new TailCallElim(); }
393fc6ef1bb96d9a3194cef667a2d3cbc94e3fb189Chris Lattner
402240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
412240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattnerbool TailCallElim::runOnFunction(Function &F) {
422240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  // If this function is a varargs function, we won't be able to PHI the args
432240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  // right, so don't even try to convert it...
442240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  if (F.getFunctionType()->isVarArg()) return false;
452240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
462240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  BasicBlock *OldEntry = 0;
472240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  std::vector<PHINode*> ArgumentPHIs;
482240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  bool MadeChange = false;
492240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
502240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  // Loop over the function, looking for any returning blocks...
512240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  for (Function::iterator BB = F.begin(), E = F.end(); BB != E; ++BB)
522240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner    if (ReturnInst *Ret = dyn_cast<ReturnInst>(BB->getTerminator()))
532240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner      if (Ret != BB->begin())
542240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner        if (CallInst *CI = dyn_cast<CallInst>(Ret->getPrev()))
552240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner          // Make sure the tail call is to the current function, and that the
562240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner          // return either returns void or returns the value computed by the
572240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner          // call.
582240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner          if (CI->getCalledFunction() == &F &&
592240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              (Ret->getNumOperands() == 0 || Ret->getReturnValue() == CI)) {
602240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            // Ohh, it looks like we found a tail call, is this the first?
612240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            if (!OldEntry) {
622240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // Ok, so this is the first tail call we have found in this
632240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // function.  Insert a new entry block into the function, allowing
642240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // us to branch back to the old entry block.
652240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              OldEntry = &F.getEntryNode();
662240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              BasicBlock *NewEntry = new BasicBlock("tailrecurse", OldEntry);
672240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              NewEntry->getInstList().push_back(new BranchInst(OldEntry));
682240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
692240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // Now that we have created a new block, which jumps to the entry
702240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // block, insert a PHI node for each argument of the function.
712240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // For now, we initialize each PHI to only have the real arguments
722240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              // which are passed in.
732240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              Instruction *InsertPos = OldEntry->begin();
742240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              for (Function::aiterator I = F.abegin(), E = F.aend(); I!=E; ++I){
752240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner                PHINode *PN = new PHINode(I->getType(), I->getName()+".tr",
762240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner                                          InsertPos);
772240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner                PN->addIncoming(I, NewEntry);
782240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner                ArgumentPHIs.push_back(PN);
792240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              }
802240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            }
812240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
822240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            // Ok, now that we know we have a pseudo-entry block WITH all of the
832240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            // required PHI nodes, add entries into the PHI node for the actual
842240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            // parameters passed into the tail-recursive call.
852240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            for (unsigned i = 0, e = CI->getNumOperands()-1; i != e; ++i)
862240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner              ArgumentPHIs[i]->addIncoming(CI->getOperand(i+1), BB);
872240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
882240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            // Now that all of the PHI nodes are in place, remove the call and
892240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            // ret instructions, replacing them with an unconditional branch.
902240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            new BranchInst(OldEntry, CI);
912240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            BB->getInstList().pop_back();  // Remove return.
922240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            BB->getInstList().pop_back();  // Remove call.
932240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            MadeChange = true;
942240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner            NumEliminated++;
952240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner          }
962240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
972240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner  return MadeChange;
982240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner}
992240d2b3f7b9f5835868c83ce78d125d1b65212bChris Lattner
100