1 //===- LowerSetJmp.cpp - Code pertaining to lowering set/long jumps -------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file implements the lowering of setjmp and longjmp to use the 11 // LLVM invoke and unwind instructions as necessary. 12 // 13 // Lowering of longjmp is fairly trivial. We replace the call with a 14 // call to the LLVM library function "__llvm_sjljeh_throw_longjmp()". 15 // This unwinds the stack for us calling all of the destructors for 16 // objects allocated on the stack. 17 // 18 // At a setjmp call, the basic block is split and the setjmp removed. 19 // The calls in a function that have a setjmp are converted to invoke 20 // where the except part checks to see if it's a longjmp exception and, 21 // if so, if it's handled in the function. If it is, then it gets the 22 // value returned by the longjmp and goes to where the basic block was 23 // split. Invoke instructions are handled in a similar fashion with the 24 // original except block being executed if it isn't a longjmp except 25 // that is handled by that function. 26 // 27 //===----------------------------------------------------------------------===// 28 29 //===----------------------------------------------------------------------===// 30 // FIXME: This pass doesn't deal with PHI statements just yet. That is, 31 // we expect this to occur before SSAification is done. This would seem 32 // to make sense, but in general, it might be a good idea to make this 33 // pass invokable via the "opt" command at will. 34 //===----------------------------------------------------------------------===// 35 36 #define DEBUG_TYPE "lowersetjmp" 37 #include "llvm/Transforms/IPO.h" 38 #include "llvm/Constants.h" 39 #include "llvm/DerivedTypes.h" 40 #include "llvm/Instructions.h" 41 #include "llvm/Intrinsics.h" 42 #include "llvm/LLVMContext.h" 43 #include "llvm/Module.h" 44 #include "llvm/Pass.h" 45 #include "llvm/Support/CallSite.h" 46 #include "llvm/Support/CFG.h" 47 #include "llvm/Support/InstVisitor.h" 48 #include "llvm/Transforms/Utils/Local.h" 49 #include "llvm/ADT/DepthFirstIterator.h" 50 #include "llvm/ADT/Statistic.h" 51 #include <map> 52 using namespace llvm; 53 54 STATISTIC(LongJmpsTransformed, "Number of longjmps transformed"); 55 STATISTIC(SetJmpsTransformed , "Number of setjmps transformed"); 56 STATISTIC(CallsTransformed , "Number of calls invokified"); 57 STATISTIC(InvokesTransformed , "Number of invokes modified"); 58 59 namespace { 60 //===--------------------------------------------------------------------===// 61 // LowerSetJmp pass implementation. 62 class LowerSetJmp : public ModulePass, public InstVisitor<LowerSetJmp> { 63 // LLVM library functions... 64 Constant *InitSJMap; // __llvm_sjljeh_init_setjmpmap 65 Constant *DestroySJMap; // __llvm_sjljeh_destroy_setjmpmap 66 Constant *AddSJToMap; // __llvm_sjljeh_add_setjmp_to_map 67 Constant *ThrowLongJmp; // __llvm_sjljeh_throw_longjmp 68 Constant *TryCatchLJ; // __llvm_sjljeh_try_catching_longjmp_exception 69 Constant *IsLJException; // __llvm_sjljeh_is_longjmp_exception 70 Constant *GetLJValue; // __llvm_sjljeh_get_longjmp_value 71 72 typedef std::pair<SwitchInst*, CallInst*> SwitchValuePair; 73 74 // Keep track of those basic blocks reachable via a depth-first search of 75 // the CFG from a setjmp call. We only need to transform those "call" and 76 // "invoke" instructions that are reachable from the setjmp call site. 77 std::set<BasicBlock*> DFSBlocks; 78 79 // The setjmp map is going to hold information about which setjmps 80 // were called (each setjmp gets its own number) and with which 81 // buffer it was called. 82 std::map<Function*, AllocaInst*> SJMap; 83 84 // The rethrow basic block map holds the basic block to branch to if 85 // the exception isn't handled in the current function and needs to 86 // be rethrown. 87 std::map<const Function*, BasicBlock*> RethrowBBMap; 88 89 // The preliminary basic block map holds a basic block that grabs the 90 // exception and determines if it's handled by the current function. 91 std::map<const Function*, BasicBlock*> PrelimBBMap; 92 93 // The switch/value map holds a switch inst/call inst pair. The 94 // switch inst controls which handler (if any) gets called and the 95 // value is the value returned to that handler by the call to 96 // __llvm_sjljeh_get_longjmp_value. 97 std::map<const Function*, SwitchValuePair> SwitchValMap; 98 99 // A map of which setjmps we've seen so far in a function. 100 std::map<const Function*, unsigned> SetJmpIDMap; 101 102 AllocaInst* GetSetJmpMap(Function* Func); 103 BasicBlock* GetRethrowBB(Function* Func); 104 SwitchValuePair GetSJSwitch(Function* Func, BasicBlock* Rethrow); 105 106 void TransformLongJmpCall(CallInst* Inst); 107 void TransformSetJmpCall(CallInst* Inst); 108 109 bool IsTransformableFunction(StringRef Name); 110 public: 111 static char ID; // Pass identification, replacement for typeid 112 LowerSetJmp() : ModulePass(ID) { 113 initializeLowerSetJmpPass(*PassRegistry::getPassRegistry()); 114 } 115 116 void visitCallInst(CallInst& CI); 117 void visitInvokeInst(InvokeInst& II); 118 void visitReturnInst(ReturnInst& RI); 119 void visitUnwindInst(UnwindInst& UI); 120 121 bool runOnModule(Module& M); 122 bool doInitialization(Module& M); 123 }; 124 } // end anonymous namespace 125 126 char LowerSetJmp::ID = 0; 127 INITIALIZE_PASS(LowerSetJmp, "lowersetjmp", "Lower Set Jump", false, false) 128 129 // run - Run the transformation on the program. We grab the function 130 // prototypes for longjmp and setjmp. If they are used in the program, 131 // then we can go directly to the places they're at and transform them. 132 bool LowerSetJmp::runOnModule(Module& M) { 133 bool Changed = false; 134 135 // These are what the functions are called. 136 Function* SetJmp = M.getFunction("llvm.setjmp"); 137 Function* LongJmp = M.getFunction("llvm.longjmp"); 138 139 // This program doesn't have longjmp and setjmp calls. 140 if ((!LongJmp || LongJmp->use_empty()) && 141 (!SetJmp || SetJmp->use_empty())) return false; 142 143 // Initialize some values and functions we'll need to transform the 144 // setjmp/longjmp functions. 145 doInitialization(M); 146 147 if (SetJmp) { 148 for (Value::use_iterator B = SetJmp->use_begin(), E = SetJmp->use_end(); 149 B != E; ++B) { 150 BasicBlock* BB = cast<Instruction>(*B)->getParent(); 151 for (df_ext_iterator<BasicBlock*> I = df_ext_begin(BB, DFSBlocks), 152 E = df_ext_end(BB, DFSBlocks); I != E; ++I) 153 /* empty */; 154 } 155 156 while (!SetJmp->use_empty()) { 157 assert(isa<CallInst>(SetJmp->use_back()) && 158 "User of setjmp intrinsic not a call?"); 159 TransformSetJmpCall(cast<CallInst>(SetJmp->use_back())); 160 Changed = true; 161 } 162 } 163 164 if (LongJmp) 165 while (!LongJmp->use_empty()) { 166 assert(isa<CallInst>(LongJmp->use_back()) && 167 "User of longjmp intrinsic not a call?"); 168 TransformLongJmpCall(cast<CallInst>(LongJmp->use_back())); 169 Changed = true; 170 } 171 172 // Now go through the affected functions and convert calls and invokes 173 // to new invokes... 174 for (std::map<Function*, AllocaInst*>::iterator 175 B = SJMap.begin(), E = SJMap.end(); B != E; ++B) { 176 Function* F = B->first; 177 for (Function::iterator BB = F->begin(), BE = F->end(); BB != BE; ++BB) 178 for (BasicBlock::iterator IB = BB->begin(), IE = BB->end(); IB != IE; ) { 179 visit(*IB++); 180 if (IB != BB->end() && IB->getParent() != BB) 181 break; // The next instruction got moved to a different block! 182 } 183 } 184 185 DFSBlocks.clear(); 186 SJMap.clear(); 187 RethrowBBMap.clear(); 188 PrelimBBMap.clear(); 189 SwitchValMap.clear(); 190 SetJmpIDMap.clear(); 191 192 return Changed; 193 } 194 195 // doInitialization - For the lower long/setjmp pass, this ensures that a 196 // module contains a declaration for the intrisic functions we are going 197 // to call to convert longjmp and setjmp calls. 198 // 199 // This function is always successful, unless it isn't. 200 bool LowerSetJmp::doInitialization(Module& M) 201 { 202 Type *SBPTy = Type::getInt8PtrTy(M.getContext()); 203 Type *SBPPTy = PointerType::getUnqual(SBPTy); 204 205 // N.B. See llvm/runtime/GCCLibraries/libexception/SJLJ-Exception.h for 206 // a description of the following library functions. 207 208 // void __llvm_sjljeh_init_setjmpmap(void**) 209 InitSJMap = M.getOrInsertFunction("__llvm_sjljeh_init_setjmpmap", 210 Type::getVoidTy(M.getContext()), 211 SBPPTy, (Type *)0); 212 // void __llvm_sjljeh_destroy_setjmpmap(void**) 213 DestroySJMap = M.getOrInsertFunction("__llvm_sjljeh_destroy_setjmpmap", 214 Type::getVoidTy(M.getContext()), 215 SBPPTy, (Type *)0); 216 217 // void __llvm_sjljeh_add_setjmp_to_map(void**, void*, unsigned) 218 AddSJToMap = M.getOrInsertFunction("__llvm_sjljeh_add_setjmp_to_map", 219 Type::getVoidTy(M.getContext()), 220 SBPPTy, SBPTy, 221 Type::getInt32Ty(M.getContext()), 222 (Type *)0); 223 224 // void __llvm_sjljeh_throw_longjmp(int*, int) 225 ThrowLongJmp = M.getOrInsertFunction("__llvm_sjljeh_throw_longjmp", 226 Type::getVoidTy(M.getContext()), SBPTy, 227 Type::getInt32Ty(M.getContext()), 228 (Type *)0); 229 230 // unsigned __llvm_sjljeh_try_catching_longjmp_exception(void **) 231 TryCatchLJ = 232 M.getOrInsertFunction("__llvm_sjljeh_try_catching_longjmp_exception", 233 Type::getInt32Ty(M.getContext()), SBPPTy, (Type *)0); 234 235 // bool __llvm_sjljeh_is_longjmp_exception() 236 IsLJException = M.getOrInsertFunction("__llvm_sjljeh_is_longjmp_exception", 237 Type::getInt1Ty(M.getContext()), 238 (Type *)0); 239 240 // int __llvm_sjljeh_get_longjmp_value() 241 GetLJValue = M.getOrInsertFunction("__llvm_sjljeh_get_longjmp_value", 242 Type::getInt32Ty(M.getContext()), 243 (Type *)0); 244 return true; 245 } 246 247 // IsTransformableFunction - Return true if the function name isn't one 248 // of the ones we don't want transformed. Currently, don't transform any 249 // "llvm.{setjmp,longjmp}" functions and none of the setjmp/longjmp error 250 // handling functions (beginning with __llvm_sjljeh_...they don't throw 251 // exceptions). 252 bool LowerSetJmp::IsTransformableFunction(StringRef Name) { 253 return !Name.startswith("__llvm_sjljeh_"); 254 } 255 256 // TransformLongJmpCall - Transform a longjmp call into a call to the 257 // internal __llvm_sjljeh_throw_longjmp function. It then takes care of 258 // throwing the exception for us. 259 void LowerSetJmp::TransformLongJmpCall(CallInst* Inst) 260 { 261 Type* SBPTy = Type::getInt8PtrTy(Inst->getContext()); 262 263 // Create the call to "__llvm_sjljeh_throw_longjmp". This takes the 264 // same parameters as "longjmp", except that the buffer is cast to a 265 // char*. It returns "void", so it doesn't need to replace any of 266 // Inst's uses and doesn't get a name. 267 CastInst* CI = 268 new BitCastInst(Inst->getArgOperand(0), SBPTy, "LJBuf", Inst); 269 Value *Args[] = { CI, Inst->getArgOperand(1) }; 270 CallInst::Create(ThrowLongJmp, Args, "", Inst); 271 272 SwitchValuePair& SVP = SwitchValMap[Inst->getParent()->getParent()]; 273 274 // If the function has a setjmp call in it (they are transformed first) 275 // we should branch to the basic block that determines if this longjmp 276 // is applicable here. Otherwise, issue an unwind. 277 if (SVP.first) 278 BranchInst::Create(SVP.first->getParent(), Inst); 279 else 280 new UnwindInst(Inst->getContext(), Inst); 281 282 // Remove all insts after the branch/unwind inst. Go from back to front to 283 // avoid replaceAllUsesWith if possible. 284 BasicBlock *BB = Inst->getParent(); 285 Instruction *Removed; 286 do { 287 Removed = &BB->back(); 288 // If the removed instructions have any users, replace them now. 289 if (!Removed->use_empty()) 290 Removed->replaceAllUsesWith(UndefValue::get(Removed->getType())); 291 Removed->eraseFromParent(); 292 } while (Removed != Inst); 293 294 ++LongJmpsTransformed; 295 } 296 297 // GetSetJmpMap - Retrieve (create and initialize, if necessary) the 298 // setjmp map. This map is going to hold information about which setjmps 299 // were called (each setjmp gets its own number) and with which buffer it 300 // was called. There can be only one! 301 AllocaInst* LowerSetJmp::GetSetJmpMap(Function* Func) 302 { 303 if (SJMap[Func]) return SJMap[Func]; 304 305 // Insert the setjmp map initialization before the first instruction in 306 // the function. 307 Instruction* Inst = Func->getEntryBlock().begin(); 308 assert(Inst && "Couldn't find even ONE instruction in entry block!"); 309 310 // Fill in the alloca and call to initialize the SJ map. 311 Type *SBPTy = 312 Type::getInt8PtrTy(Func->getContext()); 313 AllocaInst* Map = new AllocaInst(SBPTy, 0, "SJMap", Inst); 314 CallInst::Create(InitSJMap, Map, "", Inst); 315 return SJMap[Func] = Map; 316 } 317 318 // GetRethrowBB - Only one rethrow basic block is needed per function. 319 // If this is a longjmp exception but not handled in this block, this BB 320 // performs the rethrow. 321 BasicBlock* LowerSetJmp::GetRethrowBB(Function* Func) 322 { 323 if (RethrowBBMap[Func]) return RethrowBBMap[Func]; 324 325 // The basic block we're going to jump to if we need to rethrow the 326 // exception. 327 BasicBlock* Rethrow = 328 BasicBlock::Create(Func->getContext(), "RethrowExcept", Func); 329 330 // Fill in the "Rethrow" BB with a call to rethrow the exception. This 331 // is the last instruction in the BB since at this point the runtime 332 // should exit this function and go to the next function. 333 new UnwindInst(Func->getContext(), Rethrow); 334 return RethrowBBMap[Func] = Rethrow; 335 } 336 337 // GetSJSwitch - Return the switch statement that controls which handler 338 // (if any) gets called and the value returned to that handler. 339 LowerSetJmp::SwitchValuePair LowerSetJmp::GetSJSwitch(Function* Func, 340 BasicBlock* Rethrow) 341 { 342 if (SwitchValMap[Func].first) return SwitchValMap[Func]; 343 344 BasicBlock* LongJmpPre = 345 BasicBlock::Create(Func->getContext(), "LongJmpBlkPre", Func); 346 347 // Keep track of the preliminary basic block for some of the other 348 // transformations. 349 PrelimBBMap[Func] = LongJmpPre; 350 351 // Grab the exception. 352 CallInst* Cond = CallInst::Create(IsLJException, "IsLJExcept", LongJmpPre); 353 354 // The "decision basic block" gets the number associated with the 355 // setjmp call returning to switch on and the value returned by 356 // longjmp. 357 BasicBlock* DecisionBB = 358 BasicBlock::Create(Func->getContext(), "LJDecisionBB", Func); 359 360 BranchInst::Create(DecisionBB, Rethrow, Cond, LongJmpPre); 361 362 // Fill in the "decision" basic block. 363 CallInst* LJVal = CallInst::Create(GetLJValue, "LJVal", DecisionBB); 364 CallInst* SJNum = CallInst::Create(TryCatchLJ, GetSetJmpMap(Func), "SJNum", 365 DecisionBB); 366 367 SwitchInst* SI = SwitchInst::Create(SJNum, Rethrow, 0, DecisionBB); 368 return SwitchValMap[Func] = SwitchValuePair(SI, LJVal); 369 } 370 371 // TransformSetJmpCall - The setjmp call is a bit trickier to transform. 372 // We're going to convert all setjmp calls to nops. Then all "call" and 373 // "invoke" instructions in the function are converted to "invoke" where 374 // the "except" branch is used when returning from a longjmp call. 375 void LowerSetJmp::TransformSetJmpCall(CallInst* Inst) 376 { 377 BasicBlock* ABlock = Inst->getParent(); 378 Function* Func = ABlock->getParent(); 379 380 // Add this setjmp to the setjmp map. 381 Type* SBPTy = 382 Type::getInt8PtrTy(Inst->getContext()); 383 CastInst* BufPtr = 384 new BitCastInst(Inst->getArgOperand(0), SBPTy, "SBJmpBuf", Inst); 385 Value *Args[] = { 386 GetSetJmpMap(Func), BufPtr, 387 ConstantInt::get(Type::getInt32Ty(Inst->getContext()), SetJmpIDMap[Func]++) 388 }; 389 CallInst::Create(AddSJToMap, Args, "", Inst); 390 391 // We are guaranteed that there are no values live across basic blocks 392 // (because we are "not in SSA form" yet), but there can still be values live 393 // in basic blocks. Because of this, splitting the setjmp block can cause 394 // values above the setjmp to not dominate uses which are after the setjmp 395 // call. For all of these occasions, we must spill the value to the stack. 396 // 397 std::set<Instruction*> InstrsAfterCall; 398 399 // The call is probably very close to the end of the basic block, for the 400 // common usage pattern of: 'if (setjmp(...))', so keep track of the 401 // instructions after the call. 402 for (BasicBlock::iterator I = ++BasicBlock::iterator(Inst), E = ABlock->end(); 403 I != E; ++I) 404 InstrsAfterCall.insert(I); 405 406 for (BasicBlock::iterator II = ABlock->begin(); 407 II != BasicBlock::iterator(Inst); ++II) 408 // Loop over all of the uses of instruction. If any of them are after the 409 // call, "spill" the value to the stack. 410 for (Value::use_iterator UI = II->use_begin(), E = II->use_end(); 411 UI != E; ++UI) { 412 User *U = *UI; 413 if (cast<Instruction>(U)->getParent() != ABlock || 414 InstrsAfterCall.count(cast<Instruction>(U))) { 415 DemoteRegToStack(*II); 416 break; 417 } 418 } 419 InstrsAfterCall.clear(); 420 421 // Change the setjmp call into a branch statement. We'll remove the 422 // setjmp call in a little bit. No worries. 423 BasicBlock* SetJmpContBlock = ABlock->splitBasicBlock(Inst); 424 assert(SetJmpContBlock && "Couldn't split setjmp BB!!"); 425 426 SetJmpContBlock->setName(ABlock->getName()+"SetJmpCont"); 427 428 // Add the SetJmpContBlock to the set of blocks reachable from a setjmp. 429 DFSBlocks.insert(SetJmpContBlock); 430 431 // This PHI node will be in the new block created from the 432 // splitBasicBlock call. 433 PHINode* PHI = PHINode::Create(Type::getInt32Ty(Inst->getContext()), 2, 434 "SetJmpReturn", Inst); 435 436 // Coming from a call to setjmp, the return is 0. 437 PHI->addIncoming(Constant::getNullValue(Type::getInt32Ty(Inst->getContext())), 438 ABlock); 439 440 // Add the case for this setjmp's number... 441 SwitchValuePair SVP = GetSJSwitch(Func, GetRethrowBB(Func)); 442 SVP.first->addCase(ConstantInt::get(Type::getInt32Ty(Inst->getContext()), 443 SetJmpIDMap[Func] - 1), 444 SetJmpContBlock); 445 446 // Value coming from the handling of the exception. 447 PHI->addIncoming(SVP.second, SVP.second->getParent()); 448 449 // Replace all uses of this instruction with the PHI node created by 450 // the eradication of setjmp. 451 Inst->replaceAllUsesWith(PHI); 452 Inst->eraseFromParent(); 453 454 ++SetJmpsTransformed; 455 } 456 457 // visitCallInst - This converts all LLVM call instructions into invoke 458 // instructions. The except part of the invoke goes to the "LongJmpBlkPre" 459 // that grabs the exception and proceeds to determine if it's a longjmp 460 // exception or not. 461 void LowerSetJmp::visitCallInst(CallInst& CI) 462 { 463 if (CI.getCalledFunction()) 464 if (!IsTransformableFunction(CI.getCalledFunction()->getName()) || 465 CI.getCalledFunction()->isIntrinsic()) return; 466 467 BasicBlock* OldBB = CI.getParent(); 468 469 // If not reachable from a setjmp call, don't transform. 470 if (!DFSBlocks.count(OldBB)) return; 471 472 BasicBlock* NewBB = OldBB->splitBasicBlock(CI); 473 assert(NewBB && "Couldn't split BB of \"call\" instruction!!"); 474 DFSBlocks.insert(NewBB); 475 NewBB->setName("Call2Invoke"); 476 477 Function* Func = OldBB->getParent(); 478 479 // Construct the new "invoke" instruction. 480 TerminatorInst* Term = OldBB->getTerminator(); 481 CallSite CS(&CI); 482 std::vector<Value*> Params(CS.arg_begin(), CS.arg_end()); 483 InvokeInst* II = 484 InvokeInst::Create(CI.getCalledValue(), NewBB, PrelimBBMap[Func], 485 Params, CI.getName(), Term); 486 II->setCallingConv(CI.getCallingConv()); 487 II->setAttributes(CI.getAttributes()); 488 489 // Replace the old call inst with the invoke inst and remove the call. 490 CI.replaceAllUsesWith(II); 491 CI.eraseFromParent(); 492 493 // The old terminator is useless now that we have the invoke inst. 494 Term->eraseFromParent(); 495 ++CallsTransformed; 496 } 497 498 // visitInvokeInst - Converting the "invoke" instruction is fairly 499 // straight-forward. The old exception part is replaced by a query asking 500 // if this is a longjmp exception. If it is, then it goes to the longjmp 501 // exception blocks. Otherwise, control is passed the old exception. 502 void LowerSetJmp::visitInvokeInst(InvokeInst& II) 503 { 504 if (II.getCalledFunction()) 505 if (!IsTransformableFunction(II.getCalledFunction()->getName()) || 506 II.getCalledFunction()->isIntrinsic()) return; 507 508 BasicBlock* BB = II.getParent(); 509 510 // If not reachable from a setjmp call, don't transform. 511 if (!DFSBlocks.count(BB)) return; 512 513 BasicBlock* ExceptBB = II.getUnwindDest(); 514 515 Function* Func = BB->getParent(); 516 BasicBlock* NewExceptBB = BasicBlock::Create(II.getContext(), 517 "InvokeExcept", Func); 518 519 // If this is a longjmp exception, then branch to the preliminary BB of 520 // the longjmp exception handling. Otherwise, go to the old exception. 521 CallInst* IsLJExcept = CallInst::Create(IsLJException, "IsLJExcept", 522 NewExceptBB); 523 524 BranchInst::Create(PrelimBBMap[Func], ExceptBB, IsLJExcept, NewExceptBB); 525 526 II.setUnwindDest(NewExceptBB); 527 ++InvokesTransformed; 528 } 529 530 // visitReturnInst - We want to destroy the setjmp map upon exit from the 531 // function. 532 void LowerSetJmp::visitReturnInst(ReturnInst &RI) { 533 Function* Func = RI.getParent()->getParent(); 534 CallInst::Create(DestroySJMap, GetSetJmpMap(Func), "", &RI); 535 } 536 537 // visitUnwindInst - We want to destroy the setjmp map upon exit from the 538 // function. 539 void LowerSetJmp::visitUnwindInst(UnwindInst &UI) { 540 Function* Func = UI.getParent()->getParent(); 541 CallInst::Create(DestroySJMap, GetSetJmpMap(Func), "", &UI); 542 } 543 544 ModulePass *llvm::createLowerSetJmpPass() { 545 return new LowerSetJmp(); 546 } 547 548